diff --git "a/metrics.json" "b/metrics.json" new file mode 100644--- /dev/null +++ "b/metrics.json" @@ -0,0 +1,6144 @@ +{"num_parameters": 108882432, "trainable_parameters": 108882432, "step": 0} +{"train_info/time_between_train_steps": 2.626723051071167, "step": 0} +{"info/global_step": 1, "train_info/time_within_train_step": 4.597600698471069, "step": 1} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 4412.87744140625, "train_info/memory_reserved": 4642.0, "train_info/memory_max_reserved": 4642.0, "_timestamp": 1746286011, "_runtime": 33}, "step": 1} +{"logs": {"train/loss": 10.3429, "train/learning_rate": 2e-06, "train/epoch": 0.0, "_timestamp": 1746286011, "_runtime": 33}, "step": 1} +{"train_info/time_between_train_steps": 0.03618049621582031, "step": 1} +{"info/global_step": 2, "train_info/time_within_train_step": 2.462554931640625, "step": 2} +{"train_info/time_between_train_steps": 0.003852367401123047, "step": 2} +{"info/global_step": 3, "train_info/time_within_train_step": 2.5017359256744385, "step": 3} +{"train_info/time_between_train_steps": 0.004141807556152344, "step": 3} +{"info/global_step": 4, "train_info/time_within_train_step": 2.5884695053100586, "step": 4} +{"train_info/time_between_train_steps": 0.004038572311401367, "step": 4} +{"info/global_step": 5, "train_info/time_within_train_step": 2.6397485733032227, "step": 5} +{"train_info/time_between_train_steps": 0.00394439697265625, "step": 5} +{"info/global_step": 6, "train_info/time_within_train_step": 2.6759400367736816, "step": 6} +{"train_info/time_between_train_steps": 0.0039021968841552734, "step": 6} +{"info/global_step": 7, "train_info/time_within_train_step": 2.6823246479034424, "step": 7} +{"train_info/time_between_train_steps": 0.0039670467376708984, "step": 7} +{"info/global_step": 8, "train_info/time_within_train_step": 2.6862590312957764, "step": 8} +{"train_info/time_between_train_steps": 0.003899812698364258, "step": 8} +{"info/global_step": 9, "train_info/time_within_train_step": 2.6874840259552, "step": 9} +{"train_info/time_between_train_steps": 0.004126787185668945, "step": 9} +{"info/global_step": 10, "train_info/time_within_train_step": 2.6911332607269287, "step": 10} +{"train_info/time_between_train_steps": 0.0042591094970703125, "step": 10} +{"info/global_step": 11, "train_info/time_within_train_step": 2.689183235168457, "step": 11} +{"train_info/time_between_train_steps": 0.004075288772583008, "step": 11} +{"info/global_step": 12, "train_info/time_within_train_step": 2.691103935241699, "step": 12} +{"train_info/time_between_train_steps": 0.0041081905364990234, "step": 12} +{"info/global_step": 13, "train_info/time_within_train_step": 2.6940817832946777, "step": 13} +{"train_info/time_between_train_steps": 0.004172801971435547, "step": 13} +{"info/global_step": 14, "train_info/time_within_train_step": 2.692338466644287, "step": 14} +{"train_info/time_between_train_steps": 0.004104137420654297, "step": 14} +{"info/global_step": 15, "train_info/time_within_train_step": 2.692690849304199, "step": 15} +{"train_info/time_between_train_steps": 0.004250288009643555, "step": 15} +{"info/global_step": 16, "train_info/time_within_train_step": 2.6936864852905273, "step": 16} +{"train_info/time_between_train_steps": 0.004152059555053711, "step": 16} +{"info/global_step": 17, "train_info/time_within_train_step": 2.695035219192505, "step": 17} +{"train_info/time_between_train_steps": 0.0042743682861328125, "step": 17} +{"info/global_step": 18, "train_info/time_within_train_step": 2.694998264312744, "step": 18} +{"train_info/time_between_train_steps": 0.004660367965698242, "step": 18} +{"info/global_step": 19, "train_info/time_within_train_step": 2.6937267780303955, "step": 19} +{"train_info/time_between_train_steps": 0.004026174545288086, "step": 19} +{"info/global_step": 20, "train_info/time_within_train_step": 2.6929643154144287, "step": 20} +{"train_info/time_between_train_steps": 0.004086732864379883, "step": 20} +{"info/global_step": 21, "train_info/time_within_train_step": 2.6938247680664062, "step": 21} +{"train_info/time_between_train_steps": 0.004019737243652344, "step": 21} +{"info/global_step": 22, "train_info/time_within_train_step": 2.694256067276001, "step": 22} +{"train_info/time_between_train_steps": 0.0040972232818603516, "step": 22} +{"info/global_step": 23, "train_info/time_within_train_step": 2.694798707962036, "step": 23} +{"train_info/time_between_train_steps": 0.00412297248840332, "step": 23} +{"info/global_step": 24, "train_info/time_within_train_step": 2.6948959827423096, "step": 24} +{"train_info/time_between_train_steps": 0.004129171371459961, "step": 24} +{"info/global_step": 25, "train_info/time_within_train_step": 2.7027716636657715, "step": 25} +{"train_info/time_between_train_steps": 0.004180192947387695, "step": 25} +{"info/global_step": 26, "train_info/time_within_train_step": 2.695613384246826, "step": 26} +{"train_info/time_between_train_steps": 0.004084587097167969, "step": 26} +{"info/global_step": 27, "train_info/time_within_train_step": 2.6973044872283936, "step": 27} +{"train_info/time_between_train_steps": 0.004054069519042969, "step": 27} +{"info/global_step": 28, "train_info/time_within_train_step": 2.6948578357696533, "step": 28} +{"train_info/time_between_train_steps": 0.004002809524536133, "step": 28} +{"info/global_step": 29, "train_info/time_within_train_step": 2.6960513591766357, "step": 29} +{"train_info/time_between_train_steps": 0.0041539669036865234, "step": 29} +{"info/global_step": 30, "train_info/time_within_train_step": 2.6970412731170654, "step": 30} +{"train_info/time_between_train_steps": 0.0040895938873291016, "step": 30} +{"info/global_step": 31, "train_info/time_within_train_step": 2.6956701278686523, "step": 31} +{"train_info/time_between_train_steps": 0.003968238830566406, "step": 31} +{"info/global_step": 32, "train_info/time_within_train_step": 2.6971657276153564, "step": 32} +{"train_info/time_between_train_steps": 0.003943920135498047, "step": 32} +{"info/global_step": 33, "train_info/time_within_train_step": 2.695720672607422, "step": 33} +{"train_info/time_between_train_steps": 0.003964662551879883, "step": 33} +{"info/global_step": 34, "train_info/time_within_train_step": 2.6974973678588867, "step": 34} +{"train_info/time_between_train_steps": 0.0040798187255859375, "step": 34} +{"info/global_step": 35, "train_info/time_within_train_step": 2.6964848041534424, "step": 35} +{"train_info/time_between_train_steps": 0.0040509700775146484, "step": 35} +{"info/global_step": 36, "train_info/time_within_train_step": 2.6965324878692627, "step": 36} +{"train_info/time_between_train_steps": 0.003936290740966797, "step": 36} +{"info/global_step": 37, "train_info/time_within_train_step": 2.6966805458068848, "step": 37} +{"train_info/time_between_train_steps": 0.0040073394775390625, "step": 37} +{"info/global_step": 38, "train_info/time_within_train_step": 2.698275327682495, "step": 38} +{"train_info/time_between_train_steps": 0.004039287567138672, "step": 38} +{"info/global_step": 39, "train_info/time_within_train_step": 2.698680877685547, "step": 39} +{"train_info/time_between_train_steps": 0.003976583480834961, "step": 39} +{"info/global_step": 40, "train_info/time_within_train_step": 2.6996264457702637, "step": 40} +{"train_info/time_between_train_steps": 0.0041162967681884766, "step": 40} +{"info/global_step": 41, "train_info/time_within_train_step": 2.6988260746002197, "step": 41} +{"train_info/time_between_train_steps": 0.004037618637084961, "step": 41} +{"info/global_step": 42, "train_info/time_within_train_step": 3.0784823894500732, "step": 42} +{"train_info/time_between_train_steps": 0.0037713050842285156, "step": 42} +{"info/global_step": 43, "train_info/time_within_train_step": 2.697226047515869, "step": 43} +{"train_info/time_between_train_steps": 0.0037279129028320312, "step": 43} +{"info/global_step": 44, "train_info/time_within_train_step": 2.6973724365234375, "step": 44} +{"train_info/time_between_train_steps": 0.0037202835083007812, "step": 44} +{"info/global_step": 45, "train_info/time_within_train_step": 2.694927453994751, "step": 45} +{"train_info/time_between_train_steps": 0.003791332244873047, "step": 45} +{"info/global_step": 46, "train_info/time_within_train_step": 2.69455885887146, "step": 46} +{"train_info/time_between_train_steps": 0.003766298294067383, "step": 46} +{"info/global_step": 47, "train_info/time_within_train_step": 2.7145802974700928, "step": 47} +{"train_info/time_between_train_steps": 0.0037391185760498047, "step": 47} +{"info/global_step": 48, "train_info/time_within_train_step": 2.6942429542541504, "step": 48} +{"train_info/time_between_train_steps": 0.0038008689880371094, "step": 48} +{"info/global_step": 49, "train_info/time_within_train_step": 2.6943981647491455, "step": 49} +{"train_info/time_between_train_steps": 0.0038526058197021484, "step": 49} +{"info/global_step": 50, "train_info/time_within_train_step": 2.6944804191589355, "step": 50} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 5466.0, "train_info/memory_max_reserved": 5466.0, "_timestamp": 1746286146, "_runtime": 168}, "step": 50} +{"logs": {"train/loss": 8.5826, "train/learning_rate": 9.999999999999999e-05, "train/epoch": 0.02, "_timestamp": 1746286146, "_runtime": 168}, "step": 50} +{"train_info/time_between_train_steps": 0.0258791446685791, "step": 50} +{"info/global_step": 51, "train_info/time_within_train_step": 2.6939589977264404, "step": 51} +{"train_info/time_between_train_steps": 0.003957986831665039, "step": 51} +{"info/global_step": 52, "train_info/time_within_train_step": 2.696467876434326, "step": 52} +{"train_info/time_between_train_steps": 0.003823995590209961, "step": 52} +{"info/global_step": 53, "train_info/time_within_train_step": 2.6974258422851562, "step": 53} +{"train_info/time_between_train_steps": 0.003908872604370117, "step": 53} +{"info/global_step": 54, "train_info/time_within_train_step": 2.6960861682891846, "step": 54} +{"train_info/time_between_train_steps": 0.0038890838623046875, "step": 54} +{"info/global_step": 55, "train_info/time_within_train_step": 2.697305202484131, "step": 55} +{"train_info/time_between_train_steps": 0.003773212432861328, "step": 55} +{"info/global_step": 56, "train_info/time_within_train_step": 2.696592330932617, "step": 56} +{"train_info/time_between_train_steps": 0.003908872604370117, "step": 56} +{"info/global_step": 57, "train_info/time_within_train_step": 2.696945905685425, "step": 57} +{"train_info/time_between_train_steps": 0.004067420959472656, "step": 57} +{"info/global_step": 58, "train_info/time_within_train_step": 2.6971163749694824, "step": 58} +{"train_info/time_between_train_steps": 0.0040891170501708984, "step": 58} +{"info/global_step": 59, "train_info/time_within_train_step": 2.6981558799743652, "step": 59} +{"train_info/time_between_train_steps": 0.0041425228118896484, "step": 59} +{"info/global_step": 60, "train_info/time_within_train_step": 2.6965575218200684, "step": 60} +{"train_info/time_between_train_steps": 0.003975391387939453, "step": 60} +{"info/global_step": 61, "train_info/time_within_train_step": 2.69683575630188, "step": 61} +{"train_info/time_between_train_steps": 0.004027366638183594, "step": 61} +{"info/global_step": 62, "train_info/time_within_train_step": 2.698867082595825, "step": 62} +{"train_info/time_between_train_steps": 0.004077434539794922, "step": 62} +{"info/global_step": 63, "train_info/time_within_train_step": 2.876469373703003, "step": 63} +{"train_info/time_between_train_steps": 0.003793001174926758, "step": 63} +{"info/global_step": 64, "train_info/time_within_train_step": 2.696782350540161, "step": 64} +{"train_info/time_between_train_steps": 0.0038673877716064453, "step": 64} +{"info/global_step": 65, "train_info/time_within_train_step": 2.7285943031311035, "step": 65} +{"train_info/time_between_train_steps": 0.0037674903869628906, "step": 65} +{"info/global_step": 66, "train_info/time_within_train_step": 2.950040102005005, "step": 66} +{"train_info/time_between_train_steps": 0.0038061141967773438, "step": 66} +{"info/global_step": 67, "train_info/time_within_train_step": 2.780561685562134, "step": 67} +{"train_info/time_between_train_steps": 0.003815174102783203, "step": 67} +{"info/global_step": 68, "train_info/time_within_train_step": 2.7026872634887695, "step": 68} +{"train_info/time_between_train_steps": 0.003793001174926758, "step": 68} +{"info/global_step": 69, "train_info/time_within_train_step": 2.697599411010742, "step": 69} +{"train_info/time_between_train_steps": 0.0037860870361328125, "step": 69} +{"info/global_step": 70, "train_info/time_within_train_step": 2.698197841644287, "step": 70} +{"train_info/time_between_train_steps": 0.0038225650787353516, "step": 70} +{"info/global_step": 71, "train_info/time_within_train_step": 2.7035558223724365, "step": 71} +{"train_info/time_between_train_steps": 0.0037560462951660156, "step": 71} +{"info/global_step": 72, "train_info/time_within_train_step": 2.697897434234619, "step": 72} +{"train_info/time_between_train_steps": 0.003789186477661133, "step": 72} +{"info/global_step": 73, "train_info/time_within_train_step": 2.698354959487915, "step": 73} +{"train_info/time_between_train_steps": 0.0037994384765625, "step": 73} +{"info/global_step": 74, "train_info/time_within_train_step": 2.7021279335021973, "step": 74} +{"train_info/time_between_train_steps": 0.003740072250366211, "step": 74} +{"info/global_step": 75, "train_info/time_within_train_step": 2.717054843902588, "step": 75} +{"train_info/time_between_train_steps": 0.003807544708251953, "step": 75} +{"info/global_step": 76, "train_info/time_within_train_step": 2.7026431560516357, "step": 76} +{"train_info/time_between_train_steps": 0.0037882328033447266, "step": 76} +{"info/global_step": 77, "train_info/time_within_train_step": 2.7027993202209473, "step": 77} +{"train_info/time_between_train_steps": 0.0038406848907470703, "step": 77} +{"info/global_step": 78, "train_info/time_within_train_step": 2.6968812942504883, "step": 78} +{"train_info/time_between_train_steps": 0.003887176513671875, "step": 78} +{"info/global_step": 79, "train_info/time_within_train_step": 2.698570966720581, "step": 79} +{"train_info/time_between_train_steps": 0.0038912296295166016, "step": 79} +{"info/global_step": 80, "train_info/time_within_train_step": 2.698380947113037, "step": 80} +{"train_info/time_between_train_steps": 0.003961801528930664, "step": 80} +{"info/global_step": 81, "train_info/time_within_train_step": 2.698392868041992, "step": 81} +{"train_info/time_between_train_steps": 0.004052639007568359, "step": 81} +{"info/global_step": 82, "train_info/time_within_train_step": 2.708785057067871, "step": 82} +{"train_info/time_between_train_steps": 0.00404047966003418, "step": 82} +{"info/global_step": 83, "train_info/time_within_train_step": 2.700000762939453, "step": 83} +{"train_info/time_between_train_steps": 0.003996372222900391, "step": 83} +{"info/global_step": 84, "train_info/time_within_train_step": 2.8716771602630615, "step": 84} +{"train_info/time_between_train_steps": 0.0039980411529541016, "step": 84} +{"info/global_step": 85, "train_info/time_within_train_step": 2.953153133392334, "step": 85} +{"train_info/time_between_train_steps": 0.003971576690673828, "step": 85} +{"info/global_step": 86, "train_info/time_within_train_step": 2.7012393474578857, "step": 86} +{"train_info/time_between_train_steps": 0.004042863845825195, "step": 86} +{"info/global_step": 87, "train_info/time_within_train_step": 2.698364019393921, "step": 87} +{"train_info/time_between_train_steps": 0.004556179046630859, "step": 87} +{"info/global_step": 88, "train_info/time_within_train_step": 2.6990532875061035, "step": 88} +{"train_info/time_between_train_steps": 0.0040738582611083984, "step": 88} +{"info/global_step": 89, "train_info/time_within_train_step": 2.704359292984009, "step": 89} +{"train_info/time_between_train_steps": 0.004021167755126953, "step": 89} +{"info/global_step": 90, "train_info/time_within_train_step": 2.9196250438690186, "step": 90} +{"train_info/time_between_train_steps": 0.004029035568237305, "step": 90} +{"info/global_step": 91, "train_info/time_within_train_step": 2.889819622039795, "step": 91} +{"train_info/time_between_train_steps": 0.004070758819580078, "step": 91} +{"info/global_step": 92, "train_info/time_within_train_step": 2.7119853496551514, "step": 92} +{"train_info/time_between_train_steps": 0.0039217472076416016, "step": 92} +{"info/global_step": 93, "train_info/time_within_train_step": 2.7050371170043945, "step": 93} +{"train_info/time_between_train_steps": 0.00397491455078125, "step": 93} +{"info/global_step": 94, "train_info/time_within_train_step": 3.119417190551758, "step": 94} +{"train_info/time_between_train_steps": 0.003770112991333008, "step": 94} +{"info/global_step": 95, "train_info/time_within_train_step": 2.6966893672943115, "step": 95} +{"train_info/time_between_train_steps": 0.003648042678833008, "step": 95} +{"info/global_step": 96, "train_info/time_within_train_step": 2.6990628242492676, "step": 96} +{"train_info/time_between_train_steps": 0.0036439895629882812, "step": 96} +{"info/global_step": 97, "train_info/time_within_train_step": 2.69742751121521, "step": 97} +{"train_info/time_between_train_steps": 0.0036628246307373047, "step": 97} +{"info/global_step": 98, "train_info/time_within_train_step": 2.726517915725708, "step": 98} +{"train_info/time_between_train_steps": 0.0036499500274658203, "step": 98} +{"info/global_step": 99, "train_info/time_within_train_step": 3.004136085510254, "step": 99} +{"train_info/time_between_train_steps": 0.003676176071166992, "step": 99} +{"info/global_step": 100, "train_info/time_within_train_step": 2.8678529262542725, "step": 100} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 5466.0, "train_info/memory_max_reserved": 5466.0, "_timestamp": 1746286287, "_runtime": 309}, "step": 100} +{"logs": {"train/loss": 7.3152, "train/learning_rate": 0.00019999999999999998, "train/epoch": 0.03, "_timestamp": 1746286287, "_runtime": 309}, "step": 100} +{"train_info/time_between_train_steps": 19.150439739227295, "step": 100} +{"info/global_step": 101, "train_info/time_within_train_step": 2.488243818283081, "step": 101} +{"train_info/time_between_train_steps": 0.0036890506744384766, "step": 101} +{"info/global_step": 102, "train_info/time_within_train_step": 2.476057291030884, "step": 102} +{"train_info/time_between_train_steps": 0.003670215606689453, "step": 102} +{"info/global_step": 103, "train_info/time_within_train_step": 2.642223596572876, "step": 103} +{"train_info/time_between_train_steps": 0.003774881362915039, "step": 103} +{"info/global_step": 104, "train_info/time_within_train_step": 2.6972732543945312, "step": 104} +{"train_info/time_between_train_steps": 0.003641843795776367, "step": 104} +{"info/global_step": 105, "train_info/time_within_train_step": 2.6947107315063477, "step": 105} +{"train_info/time_between_train_steps": 0.003609180450439453, "step": 105} +{"info/global_step": 106, "train_info/time_within_train_step": 2.6975274085998535, "step": 106} +{"train_info/time_between_train_steps": 0.0037517547607421875, "step": 106} +{"info/global_step": 107, "train_info/time_within_train_step": 2.695176601409912, "step": 107} +{"train_info/time_between_train_steps": 0.003695249557495117, "step": 107} +{"info/global_step": 108, "train_info/time_within_train_step": 2.69584321975708, "step": 108} +{"train_info/time_between_train_steps": 0.003603219985961914, "step": 108} +{"info/global_step": 109, "train_info/time_within_train_step": 2.6978721618652344, "step": 109} +{"train_info/time_between_train_steps": 0.0037200450897216797, "step": 109} +{"info/global_step": 110, "train_info/time_within_train_step": 2.8837203979492188, "step": 110} +{"train_info/time_between_train_steps": 0.003637552261352539, "step": 110} +{"info/global_step": 111, "train_info/time_within_train_step": 2.6998131275177, "step": 111} +{"train_info/time_between_train_steps": 0.0036635398864746094, "step": 111} +{"info/global_step": 112, "train_info/time_within_train_step": 2.746694803237915, "step": 112} +{"train_info/time_between_train_steps": 0.0036880970001220703, "step": 112} +{"info/global_step": 113, "train_info/time_within_train_step": 2.9409191608428955, "step": 113} +{"train_info/time_between_train_steps": 0.0038285255432128906, "step": 113} +{"info/global_step": 114, "train_info/time_within_train_step": 3.05031681060791, "step": 114} +{"train_info/time_between_train_steps": 0.0036668777465820312, "step": 114} +{"info/global_step": 115, "train_info/time_within_train_step": 3.005021095275879, "step": 115} +{"train_info/time_between_train_steps": 0.0037069320678710938, "step": 115} +{"info/global_step": 116, "train_info/time_within_train_step": 2.709369659423828, "step": 116} +{"train_info/time_between_train_steps": 0.0037012100219726562, "step": 116} +{"info/global_step": 117, "train_info/time_within_train_step": 2.698776960372925, "step": 117} +{"train_info/time_between_train_steps": 0.004498481750488281, "step": 117} +{"info/global_step": 118, "train_info/time_within_train_step": 2.6980843544006348, "step": 118} +{"train_info/time_between_train_steps": 0.0036954879760742188, "step": 118} +{"info/global_step": 119, "train_info/time_within_train_step": 2.700178861618042, "step": 119} +{"train_info/time_between_train_steps": 0.0037147998809814453, "step": 119} +{"info/global_step": 120, "train_info/time_within_train_step": 2.9185099601745605, "step": 120} +{"train_info/time_between_train_steps": 0.0038499832153320312, "step": 120} +{"info/global_step": 121, "train_info/time_within_train_step": 3.0709524154663086, "step": 121} +{"train_info/time_between_train_steps": 0.003843545913696289, "step": 121} +{"info/global_step": 122, "train_info/time_within_train_step": 2.80683970451355, "step": 122} +{"train_info/time_between_train_steps": 0.0036542415618896484, "step": 122} +{"info/global_step": 123, "train_info/time_within_train_step": 2.699954032897949, "step": 123} +{"train_info/time_between_train_steps": 0.003773212432861328, "step": 123} +{"info/global_step": 124, "train_info/time_within_train_step": 2.7890872955322266, "step": 124} +{"train_info/time_between_train_steps": 0.0038568973541259766, "step": 124} +{"info/global_step": 125, "train_info/time_within_train_step": 2.848677158355713, "step": 125} +{"train_info/time_between_train_steps": 0.13263583183288574, "step": 125} +{"info/global_step": 126, "train_info/time_within_train_step": 2.7153711318969727, "step": 126} +{"train_info/time_between_train_steps": 0.004012107849121094, "step": 126} +{"info/global_step": 127, "train_info/time_within_train_step": 2.7492778301239014, "step": 127} +{"train_info/time_between_train_steps": 0.0039594173431396484, "step": 127} +{"info/global_step": 128, "train_info/time_within_train_step": 2.8733115196228027, "step": 128} +{"train_info/time_between_train_steps": 0.003863811492919922, "step": 128} +{"info/global_step": 129, "train_info/time_within_train_step": 2.8515918254852295, "step": 129} +{"train_info/time_between_train_steps": 0.00396728515625, "step": 129} +{"info/global_step": 130, "train_info/time_within_train_step": 2.7619400024414062, "step": 130} +{"train_info/time_between_train_steps": 0.0038881301879882812, "step": 130} +{"info/global_step": 131, "train_info/time_within_train_step": 2.757040500640869, "step": 131} +{"train_info/time_between_train_steps": 0.003991127014160156, "step": 131} +{"info/global_step": 132, "train_info/time_within_train_step": 2.8269870281219482, "step": 132} +{"train_info/time_between_train_steps": 0.00400233268737793, "step": 132} +{"info/global_step": 133, "train_info/time_within_train_step": 2.7821223735809326, "step": 133} +{"train_info/time_between_train_steps": 0.004294395446777344, "step": 133} +{"info/global_step": 134, "train_info/time_within_train_step": 2.7509195804595947, "step": 134} +{"train_info/time_between_train_steps": 0.0043261051177978516, "step": 134} +{"info/global_step": 135, "train_info/time_within_train_step": 2.6992290019989014, "step": 135} +{"train_info/time_between_train_steps": 0.004296064376831055, "step": 135} +{"info/global_step": 136, "train_info/time_within_train_step": 2.699530601501465, "step": 136} +{"train_info/time_between_train_steps": 0.004373073577880859, "step": 136} +{"info/global_step": 137, "train_info/time_within_train_step": 2.712951183319092, "step": 137} +{"train_info/time_between_train_steps": 0.004425048828125, "step": 137} +{"info/global_step": 138, "train_info/time_within_train_step": 2.8095993995666504, "step": 138} +{"train_info/time_between_train_steps": 0.00416874885559082, "step": 138} +{"info/global_step": 139, "train_info/time_within_train_step": 2.975980758666992, "step": 139} +{"train_info/time_between_train_steps": 0.004235982894897461, "step": 139} +{"info/global_step": 140, "train_info/time_within_train_step": 2.781244993209839, "step": 140} +{"train_info/time_between_train_steps": 0.004120349884033203, "step": 140} +{"info/global_step": 141, "train_info/time_within_train_step": 2.7005386352539062, "step": 141} +{"train_info/time_between_train_steps": 0.0041124820709228516, "step": 141} +{"info/global_step": 142, "train_info/time_within_train_step": 2.7012267112731934, "step": 142} +{"train_info/time_between_train_steps": 0.00416874885559082, "step": 142} +{"info/global_step": 143, "train_info/time_within_train_step": 2.727733612060547, "step": 143} +{"train_info/time_between_train_steps": 0.00409388542175293, "step": 143} +{"info/global_step": 144, "train_info/time_within_train_step": 2.9208760261535645, "step": 144} +{"train_info/time_between_train_steps": 0.004239559173583984, "step": 144} +{"info/global_step": 145, "train_info/time_within_train_step": 2.800560712814331, "step": 145} +{"train_info/time_between_train_steps": 0.004196882247924805, "step": 145} +{"info/global_step": 146, "train_info/time_within_train_step": 2.7241146564483643, "step": 146} +{"train_info/time_between_train_steps": 0.003995656967163086, "step": 146} +{"info/global_step": 147, "train_info/time_within_train_step": 2.698925733566284, "step": 147} +{"train_info/time_between_train_steps": 0.004250288009643555, "step": 147} +{"info/global_step": 148, "train_info/time_within_train_step": 2.74423885345459, "step": 148} +{"train_info/time_between_train_steps": 0.003924131393432617, "step": 148} +{"info/global_step": 149, "train_info/time_within_train_step": 2.8140528202056885, "step": 149} +{"train_info/time_between_train_steps": 0.004076719284057617, "step": 149} +{"info/global_step": 150, "train_info/time_within_train_step": 2.744945764541626, "step": 150} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 5466.0, "train_info/memory_max_reserved": 5466.0, "_timestamp": 1746286450, "_runtime": 472}, "step": 150} +{"logs": {"train/loss": 6.9421, "train/learning_rate": 0.0003, "train/epoch": 0.05, "_timestamp": 1746286450, "_runtime": 472}, "step": 150} +{"train_info/time_between_train_steps": 0.03634524345397949, "step": 150} +{"info/global_step": 151, "train_info/time_within_train_step": 2.6990199089050293, "step": 151} +{"train_info/time_between_train_steps": 0.003919124603271484, "step": 151} +{"info/global_step": 152, "train_info/time_within_train_step": 2.7954633235931396, "step": 152} +{"train_info/time_between_train_steps": 0.003927946090698242, "step": 152} +{"info/global_step": 153, "train_info/time_within_train_step": 2.857931613922119, "step": 153} +{"train_info/time_between_train_steps": 0.0038521289825439453, "step": 153} +{"info/global_step": 154, "train_info/time_within_train_step": 2.7285757064819336, "step": 154} +{"train_info/time_between_train_steps": 0.003887653350830078, "step": 154} +{"info/global_step": 155, "train_info/time_within_train_step": 2.7318081855773926, "step": 155} +{"train_info/time_between_train_steps": 0.00400996208190918, "step": 155} +{"info/global_step": 156, "train_info/time_within_train_step": 2.863605499267578, "step": 156} +{"train_info/time_between_train_steps": 0.003910541534423828, "step": 156} +{"info/global_step": 157, "train_info/time_within_train_step": 2.8030033111572266, "step": 157} +{"train_info/time_between_train_steps": 0.0038928985595703125, "step": 157} +{"info/global_step": 158, "train_info/time_within_train_step": 2.7442314624786377, "step": 158} +{"train_info/time_between_train_steps": 0.0039806365966796875, "step": 158} +{"info/global_step": 159, "train_info/time_within_train_step": 2.7386372089385986, "step": 159} +{"train_info/time_between_train_steps": 0.0038597583770751953, "step": 159} +{"info/global_step": 160, "train_info/time_within_train_step": 2.833493232727051, "step": 160} +{"train_info/time_between_train_steps": 0.0038797855377197266, "step": 160} +{"info/global_step": 161, "train_info/time_within_train_step": 2.767465591430664, "step": 161} +{"train_info/time_between_train_steps": 0.003936052322387695, "step": 161} +{"info/global_step": 162, "train_info/time_within_train_step": 2.7326200008392334, "step": 162} +{"train_info/time_between_train_steps": 0.003935337066650391, "step": 162} +{"info/global_step": 163, "train_info/time_within_train_step": 2.7192816734313965, "step": 163} +{"train_info/time_between_train_steps": 0.003838062286376953, "step": 163} +{"info/global_step": 164, "train_info/time_within_train_step": 2.697006940841675, "step": 164} +{"train_info/time_between_train_steps": 0.003975868225097656, "step": 164} +{"info/global_step": 165, "train_info/time_within_train_step": 2.7612950801849365, "step": 165} +{"train_info/time_between_train_steps": 0.0039882659912109375, "step": 165} +{"info/global_step": 166, "train_info/time_within_train_step": 2.8803839683532715, "step": 166} +{"train_info/time_between_train_steps": 0.0038330554962158203, "step": 166} +{"info/global_step": 167, "train_info/time_within_train_step": 2.7668616771698, "step": 167} +{"train_info/time_between_train_steps": 0.0039021968841552734, "step": 167} +{"info/global_step": 168, "train_info/time_within_train_step": 2.6975889205932617, "step": 168} +{"train_info/time_between_train_steps": 0.0038383007049560547, "step": 168} +{"info/global_step": 169, "train_info/time_within_train_step": 2.6966536045074463, "step": 169} +{"train_info/time_between_train_steps": 0.0037717819213867188, "step": 169} +{"info/global_step": 170, "train_info/time_within_train_step": 3.0676727294921875, "step": 170} +{"train_info/time_between_train_steps": 0.0036377906799316406, "step": 170} +{"info/global_step": 171, "train_info/time_within_train_step": 2.6993815898895264, "step": 171} +{"train_info/time_between_train_steps": 0.0036978721618652344, "step": 171} +{"info/global_step": 172, "train_info/time_within_train_step": 2.7855522632598877, "step": 172} +{"train_info/time_between_train_steps": 0.003641843795776367, "step": 172} +{"info/global_step": 173, "train_info/time_within_train_step": 2.780839443206787, "step": 173} +{"train_info/time_between_train_steps": 0.003638744354248047, "step": 173} +{"info/global_step": 174, "train_info/time_within_train_step": 2.7297327518463135, "step": 174} +{"train_info/time_between_train_steps": 0.0038933753967285156, "step": 174} +{"info/global_step": 175, "train_info/time_within_train_step": 2.7747626304626465, "step": 175} +{"train_info/time_between_train_steps": 0.003767251968383789, "step": 175} +{"info/global_step": 176, "train_info/time_within_train_step": 2.7711994647979736, "step": 176} +{"train_info/time_between_train_steps": 0.0038149356842041016, "step": 176} +{"info/global_step": 177, "train_info/time_within_train_step": 2.7273497581481934, "step": 177} +{"train_info/time_between_train_steps": 0.0038077831268310547, "step": 177} +{"info/global_step": 178, "train_info/time_within_train_step": 2.7628366947174072, "step": 178} +{"train_info/time_between_train_steps": 0.0036542415618896484, "step": 178} +{"info/global_step": 179, "train_info/time_within_train_step": 2.7572438716888428, "step": 179} +{"train_info/time_between_train_steps": 0.00360870361328125, "step": 179} +{"info/global_step": 180, "train_info/time_within_train_step": 2.744797945022583, "step": 180} +{"train_info/time_between_train_steps": 0.003634929656982422, "step": 180} +{"info/global_step": 181, "train_info/time_within_train_step": 2.749931812286377, "step": 181} +{"train_info/time_between_train_steps": 0.003584146499633789, "step": 181} +{"info/global_step": 182, "train_info/time_within_train_step": 2.797987461090088, "step": 182} +{"train_info/time_between_train_steps": 0.0036468505859375, "step": 182} +{"info/global_step": 183, "train_info/time_within_train_step": 2.721759796142578, "step": 183} +{"train_info/time_between_train_steps": 0.003619670867919922, "step": 183} +{"info/global_step": 184, "train_info/time_within_train_step": 2.7562992572784424, "step": 184} +{"train_info/time_between_train_steps": 0.0037603378295898438, "step": 184} +{"info/global_step": 185, "train_info/time_within_train_step": 2.9103033542633057, "step": 185} +{"train_info/time_between_train_steps": 0.003749847412109375, "step": 185} +{"info/global_step": 186, "train_info/time_within_train_step": 2.7556560039520264, "step": 186} +{"train_info/time_between_train_steps": 0.0036656856536865234, "step": 186} +{"info/global_step": 187, "train_info/time_within_train_step": 2.717447519302368, "step": 187} +{"train_info/time_between_train_steps": 0.0036840438842773438, "step": 187} +{"info/global_step": 188, "train_info/time_within_train_step": 2.826569080352783, "step": 188} +{"train_info/time_between_train_steps": 0.0036470890045166016, "step": 188} +{"info/global_step": 189, "train_info/time_within_train_step": 2.7152531147003174, "step": 189} +{"train_info/time_between_train_steps": 0.0036444664001464844, "step": 189} +{"info/global_step": 190, "train_info/time_within_train_step": 2.796049118041992, "step": 190} +{"train_info/time_between_train_steps": 0.0036249160766601562, "step": 190} +{"info/global_step": 191, "train_info/time_within_train_step": 2.7622556686401367, "step": 191} +{"train_info/time_between_train_steps": 0.0036377906799316406, "step": 191} +{"info/global_step": 192, "train_info/time_within_train_step": 2.7464442253112793, "step": 192} +{"train_info/time_between_train_steps": 0.0035741329193115234, "step": 192} +{"info/global_step": 193, "train_info/time_within_train_step": 2.734790086746216, "step": 193} +{"train_info/time_between_train_steps": 0.0035789012908935547, "step": 193} +{"info/global_step": 194, "train_info/time_within_train_step": 2.7025723457336426, "step": 194} +{"train_info/time_between_train_steps": 0.003818035125732422, "step": 194} +{"info/global_step": 195, "train_info/time_within_train_step": 2.698683500289917, "step": 195} +{"train_info/time_between_train_steps": 0.003727436065673828, "step": 195} +{"info/global_step": 196, "train_info/time_within_train_step": 2.7334437370300293, "step": 196} +{"train_info/time_between_train_steps": 0.0037157535552978516, "step": 196} +{"info/global_step": 197, "train_info/time_within_train_step": 2.8600614070892334, "step": 197} +{"train_info/time_between_train_steps": 0.003751516342163086, "step": 197} +{"info/global_step": 198, "train_info/time_within_train_step": 2.7281336784362793, "step": 198} +{"train_info/time_between_train_steps": 0.003760099411010742, "step": 198} +{"info/global_step": 199, "train_info/time_within_train_step": 2.7471044063568115, "step": 199} +{"train_info/time_between_train_steps": 0.003736734390258789, "step": 199} +{"info/global_step": 200, "train_info/time_within_train_step": 2.8117024898529053, "step": 200} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 5466.0, "train_info/memory_max_reserved": 5466.0, "_timestamp": 1746286592, "_runtime": 614}, "step": 200} +{"logs": {"train/loss": 6.6538, "train/learning_rate": 0.00039999999999999996, "train/epoch": 0.07, "_timestamp": 1746286592, "_runtime": 614}, "step": 200} +{"train_info/time_between_train_steps": 14.566604614257812, "step": 200} +{"info/global_step": 201, "train_info/time_within_train_step": 2.4837982654571533, "step": 201} +{"train_info/time_between_train_steps": 0.003654956817626953, "step": 201} +{"info/global_step": 202, "train_info/time_within_train_step": 2.514986753463745, "step": 202} +{"train_info/time_between_train_steps": 0.003683328628540039, "step": 202} +{"info/global_step": 203, "train_info/time_within_train_step": 2.694354772567749, "step": 203} +{"train_info/time_between_train_steps": 0.004146575927734375, "step": 203} +{"info/global_step": 204, "train_info/time_within_train_step": 2.6944122314453125, "step": 204} +{"train_info/time_between_train_steps": 0.0037834644317626953, "step": 204} +{"info/global_step": 205, "train_info/time_within_train_step": 2.71390700340271, "step": 205} +{"train_info/time_between_train_steps": 0.003737211227416992, "step": 205} +{"info/global_step": 206, "train_info/time_within_train_step": 2.6959142684936523, "step": 206} +{"train_info/time_between_train_steps": 0.003796815872192383, "step": 206} +{"info/global_step": 207, "train_info/time_within_train_step": 2.7034008502960205, "step": 207} +{"train_info/time_between_train_steps": 0.0037653446197509766, "step": 207} +{"info/global_step": 208, "train_info/time_within_train_step": 2.970137357711792, "step": 208} +{"train_info/time_between_train_steps": 0.0037336349487304688, "step": 208} +{"info/global_step": 209, "train_info/time_within_train_step": 3.0340054035186768, "step": 209} +{"train_info/time_between_train_steps": 0.0036749839782714844, "step": 209} +{"info/global_step": 210, "train_info/time_within_train_step": 3.0926153659820557, "step": 210} +{"train_info/time_between_train_steps": 0.0036575794219970703, "step": 210} +{"info/global_step": 211, "train_info/time_within_train_step": 2.7265777587890625, "step": 211} +{"train_info/time_between_train_steps": 0.003661632537841797, "step": 211} +{"info/global_step": 212, "train_info/time_within_train_step": 2.6961257457733154, "step": 212} +{"train_info/time_between_train_steps": 0.003643035888671875, "step": 212} +{"info/global_step": 213, "train_info/time_within_train_step": 2.6993863582611084, "step": 213} +{"train_info/time_between_train_steps": 0.003743410110473633, "step": 213} +{"info/global_step": 214, "train_info/time_within_train_step": 2.699185848236084, "step": 214} +{"train_info/time_between_train_steps": 0.0036160945892333984, "step": 214} +{"info/global_step": 215, "train_info/time_within_train_step": 2.8756213188171387, "step": 215} +{"train_info/time_between_train_steps": 0.0037696361541748047, "step": 215} +{"info/global_step": 216, "train_info/time_within_train_step": 3.071660280227661, "step": 216} +{"train_info/time_between_train_steps": 0.0037994384765625, "step": 216} +{"info/global_step": 217, "train_info/time_within_train_step": 2.8015708923339844, "step": 217} +{"train_info/time_between_train_steps": 0.003593921661376953, "step": 217} +{"info/global_step": 218, "train_info/time_within_train_step": 2.7122297286987305, "step": 218} +{"train_info/time_between_train_steps": 0.003782033920288086, "step": 218} +{"info/global_step": 219, "train_info/time_within_train_step": 2.7702126502990723, "step": 219} +{"train_info/time_between_train_steps": 0.003615140914916992, "step": 219} +{"info/global_step": 220, "train_info/time_within_train_step": 2.9091830253601074, "step": 220} +{"train_info/time_between_train_steps": 0.0040950775146484375, "step": 220} +{"info/global_step": 221, "train_info/time_within_train_step": 2.720188617706299, "step": 221} +{"train_info/time_between_train_steps": 0.003812074661254883, "step": 221} +{"info/global_step": 222, "train_info/time_within_train_step": 2.7002856731414795, "step": 222} +{"train_info/time_between_train_steps": 0.0037987232208251953, "step": 222} +{"info/global_step": 223, "train_info/time_within_train_step": 2.829129934310913, "step": 223} +{"train_info/time_between_train_steps": 0.0038001537322998047, "step": 223} +{"info/global_step": 224, "train_info/time_within_train_step": 3.0159199237823486, "step": 224} +{"train_info/time_between_train_steps": 0.003912210464477539, "step": 224} +{"info/global_step": 225, "train_info/time_within_train_step": 3.0022804737091064, "step": 225} +{"train_info/time_between_train_steps": 0.0038459300994873047, "step": 225} +{"info/global_step": 226, "train_info/time_within_train_step": 2.697053909301758, "step": 226} +{"train_info/time_between_train_steps": 0.0039942264556884766, "step": 226} +{"info/global_step": 227, "train_info/time_within_train_step": 2.6957950592041016, "step": 227} +{"train_info/time_between_train_steps": 0.0038695335388183594, "step": 227} +{"info/global_step": 228, "train_info/time_within_train_step": 2.6955628395080566, "step": 228} +{"train_info/time_between_train_steps": 0.0038352012634277344, "step": 228} +{"info/global_step": 229, "train_info/time_within_train_step": 2.6985392570495605, "step": 229} +{"train_info/time_between_train_steps": 0.004053592681884766, "step": 229} +{"info/global_step": 230, "train_info/time_within_train_step": 2.7009241580963135, "step": 230} +{"train_info/time_between_train_steps": 0.003786325454711914, "step": 230} +{"info/global_step": 231, "train_info/time_within_train_step": 2.7048227787017822, "step": 231} +{"train_info/time_between_train_steps": 0.004014730453491211, "step": 231} +{"info/global_step": 232, "train_info/time_within_train_step": 2.710700750350952, "step": 232} +{"train_info/time_between_train_steps": 0.0035834312438964844, "step": 232} +{"info/global_step": 233, "train_info/time_within_train_step": 2.9620285034179688, "step": 233} +{"train_info/time_between_train_steps": 0.0036165714263916016, "step": 233} +{"info/global_step": 234, "train_info/time_within_train_step": 2.9072048664093018, "step": 234} +{"train_info/time_between_train_steps": 0.003788471221923828, "step": 234} +{"info/global_step": 235, "train_info/time_within_train_step": 2.695117950439453, "step": 235} +{"train_info/time_between_train_steps": 0.003688812255859375, "step": 235} +{"info/global_step": 236, "train_info/time_within_train_step": 2.695749044418335, "step": 236} +{"train_info/time_between_train_steps": 0.003789663314819336, "step": 236} +{"info/global_step": 237, "train_info/time_within_train_step": 2.695443630218506, "step": 237} +{"train_info/time_between_train_steps": 0.003487110137939453, "step": 237} +{"info/global_step": 238, "train_info/time_within_train_step": 2.695727586746216, "step": 238} +{"train_info/time_between_train_steps": 0.003701925277709961, "step": 238} +{"info/global_step": 239, "train_info/time_within_train_step": 2.73580265045166, "step": 239} +{"train_info/time_between_train_steps": 0.0037992000579833984, "step": 239} +{"info/global_step": 240, "train_info/time_within_train_step": 3.091503620147705, "step": 240} +{"train_info/time_between_train_steps": 0.0037088394165039062, "step": 240} +{"info/global_step": 241, "train_info/time_within_train_step": 2.924288272857666, "step": 241} +{"train_info/time_between_train_steps": 0.003795623779296875, "step": 241} +{"info/global_step": 242, "train_info/time_within_train_step": 2.7142038345336914, "step": 242} +{"train_info/time_between_train_steps": 0.003720998764038086, "step": 242} +{"info/global_step": 243, "train_info/time_within_train_step": 2.7551488876342773, "step": 243} +{"train_info/time_between_train_steps": 0.003769397735595703, "step": 243} +{"info/global_step": 244, "train_info/time_within_train_step": 2.8334403038024902, "step": 244} +{"train_info/time_between_train_steps": 0.0037717819213867188, "step": 244} +{"info/global_step": 245, "train_info/time_within_train_step": 2.761902332305908, "step": 245} +{"train_info/time_between_train_steps": 0.0040225982666015625, "step": 245} +{"info/global_step": 246, "train_info/time_within_train_step": 2.731365919113159, "step": 246} +{"train_info/time_between_train_steps": 0.003997802734375, "step": 246} +{"info/global_step": 247, "train_info/time_within_train_step": 2.848649263381958, "step": 247} +{"train_info/time_between_train_steps": 0.0037164688110351562, "step": 247} +{"info/global_step": 248, "train_info/time_within_train_step": 2.8654823303222656, "step": 248} +{"train_info/time_between_train_steps": 0.0037131309509277344, "step": 248} +{"info/global_step": 249, "train_info/time_within_train_step": 2.789954423904419, "step": 249} +{"train_info/time_between_train_steps": 0.003590822219848633, "step": 249} +{"info/global_step": 250, "train_info/time_within_train_step": 3.474637985229492, "step": 250} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 5466.0, "train_info/memory_max_reserved": 5466.0, "_timestamp": 1746286750, "_runtime": 772}, "step": 250} +{"logs": {"train/loss": 6.3931, "train/learning_rate": 0.0005, "train/epoch": 0.08, "_timestamp": 1746286750, "_runtime": 772}, "step": 250} +{"train_info/time_between_train_steps": 0.1428844928741455, "step": 250} +{"info/global_step": 251, "train_info/time_within_train_step": 2.694899320602417, "step": 251} +{"train_info/time_between_train_steps": 0.003553628921508789, "step": 251} +{"info/global_step": 252, "train_info/time_within_train_step": 2.6945183277130127, "step": 252} +{"train_info/time_between_train_steps": 0.003538370132446289, "step": 252} +{"info/global_step": 253, "train_info/time_within_train_step": 2.6959245204925537, "step": 253} +{"train_info/time_between_train_steps": 0.003626108169555664, "step": 253} +{"info/global_step": 254, "train_info/time_within_train_step": 2.6966629028320312, "step": 254} +{"train_info/time_between_train_steps": 0.0036363601684570312, "step": 254} +{"info/global_step": 255, "train_info/time_within_train_step": 2.6961851119995117, "step": 255} +{"train_info/time_between_train_steps": 0.0036580562591552734, "step": 255} +{"info/global_step": 256, "train_info/time_within_train_step": 2.695672035217285, "step": 256} +{"train_info/time_between_train_steps": 0.003671884536743164, "step": 256} +{"info/global_step": 257, "train_info/time_within_train_step": 2.7820324897766113, "step": 257} +{"train_info/time_between_train_steps": 0.0036973953247070312, "step": 257} +{"info/global_step": 258, "train_info/time_within_train_step": 2.945784091949463, "step": 258} +{"train_info/time_between_train_steps": 0.003646373748779297, "step": 258} +{"info/global_step": 259, "train_info/time_within_train_step": 2.9825704097747803, "step": 259} +{"train_info/time_between_train_steps": 0.0034914016723632812, "step": 259} +{"info/global_step": 260, "train_info/time_within_train_step": 2.7063443660736084, "step": 260} +{"train_info/time_between_train_steps": 0.0035490989685058594, "step": 260} +{"info/global_step": 261, "train_info/time_within_train_step": 2.694995641708374, "step": 261} +{"train_info/time_between_train_steps": 0.0035359859466552734, "step": 261} +{"info/global_step": 262, "train_info/time_within_train_step": 2.69403338432312, "step": 262} +{"train_info/time_between_train_steps": 0.003537416458129883, "step": 262} +{"info/global_step": 263, "train_info/time_within_train_step": 2.697720766067505, "step": 263} +{"train_info/time_between_train_steps": 0.0036711692810058594, "step": 263} +{"info/global_step": 264, "train_info/time_within_train_step": 2.9300029277801514, "step": 264} +{"train_info/time_between_train_steps": 0.003645181655883789, "step": 264} +{"info/global_step": 265, "train_info/time_within_train_step": 2.872939348220825, "step": 265} +{"train_info/time_between_train_steps": 0.0035665035247802734, "step": 265} +{"info/global_step": 266, "train_info/time_within_train_step": 2.715043544769287, "step": 266} +{"train_info/time_between_train_steps": 0.003707408905029297, "step": 266} +{"info/global_step": 267, "train_info/time_within_train_step": 2.721343994140625, "step": 267} +{"train_info/time_between_train_steps": 0.0037147998809814453, "step": 267} +{"info/global_step": 268, "train_info/time_within_train_step": 2.8798446655273438, "step": 268} +{"train_info/time_between_train_steps": 0.0037555694580078125, "step": 268} +{"info/global_step": 269, "train_info/time_within_train_step": 2.810026168823242, "step": 269} +{"train_info/time_between_train_steps": 0.0037140846252441406, "step": 269} +{"info/global_step": 270, "train_info/time_within_train_step": 2.7491016387939453, "step": 270} +{"train_info/time_between_train_steps": 0.0036852359771728516, "step": 270} +{"info/global_step": 271, "train_info/time_within_train_step": 2.743985652923584, "step": 271} +{"train_info/time_between_train_steps": 0.0037131309509277344, "step": 271} +{"info/global_step": 272, "train_info/time_within_train_step": 2.830648422241211, "step": 272} +{"train_info/time_between_train_steps": 0.0035474300384521484, "step": 272} +{"info/global_step": 273, "train_info/time_within_train_step": 2.7230098247528076, "step": 273} +{"train_info/time_between_train_steps": 0.0035409927368164062, "step": 273} +{"info/global_step": 274, "train_info/time_within_train_step": 2.757760524749756, "step": 274} +{"train_info/time_between_train_steps": 0.0035915374755859375, "step": 274} +{"info/global_step": 275, "train_info/time_within_train_step": 2.8456153869628906, "step": 275} +{"train_info/time_between_train_steps": 0.0036149024963378906, "step": 275} +{"info/global_step": 276, "train_info/time_within_train_step": 2.7821433544158936, "step": 276} +{"train_info/time_between_train_steps": 0.0036351680755615234, "step": 276} +{"info/global_step": 277, "train_info/time_within_train_step": 2.7343900203704834, "step": 277} +{"train_info/time_between_train_steps": 0.003602266311645508, "step": 277} +{"info/global_step": 278, "train_info/time_within_train_step": 2.7619264125823975, "step": 278} +{"train_info/time_between_train_steps": 0.0035974979400634766, "step": 278} +{"info/global_step": 279, "train_info/time_within_train_step": 2.783827304840088, "step": 279} +{"train_info/time_between_train_steps": 0.0035567283630371094, "step": 279} +{"info/global_step": 280, "train_info/time_within_train_step": 2.778989315032959, "step": 280} +{"train_info/time_between_train_steps": 0.0035326480865478516, "step": 280} +{"info/global_step": 281, "train_info/time_within_train_step": 2.919947862625122, "step": 281} +{"train_info/time_between_train_steps": 0.0036706924438476562, "step": 281} +{"info/global_step": 282, "train_info/time_within_train_step": 2.709603786468506, "step": 282} +{"train_info/time_between_train_steps": 0.0036766529083251953, "step": 282} +{"info/global_step": 283, "train_info/time_within_train_step": 2.6961851119995117, "step": 283} +{"train_info/time_between_train_steps": 0.0035715103149414062, "step": 283} +{"info/global_step": 284, "train_info/time_within_train_step": 2.697864532470703, "step": 284} +{"train_info/time_between_train_steps": 0.004346609115600586, "step": 284} +{"info/global_step": 285, "train_info/time_within_train_step": 2.835587739944458, "step": 285} +{"train_info/time_between_train_steps": 0.0035736560821533203, "step": 285} +{"info/global_step": 286, "train_info/time_within_train_step": 3.0007848739624023, "step": 286} +{"train_info/time_between_train_steps": 0.0035109519958496094, "step": 286} +{"info/global_step": 287, "train_info/time_within_train_step": 2.762946844100952, "step": 287} +{"train_info/time_between_train_steps": 0.003541707992553711, "step": 287} +{"info/global_step": 288, "train_info/time_within_train_step": 2.6965885162353516, "step": 288} +{"train_info/time_between_train_steps": 0.0036182403564453125, "step": 288} +{"info/global_step": 289, "train_info/time_within_train_step": 2.798398017883301, "step": 289} +{"train_info/time_between_train_steps": 0.0038869380950927734, "step": 289} +{"info/global_step": 290, "train_info/time_within_train_step": 2.8529293537139893, "step": 290} +{"train_info/time_between_train_steps": 0.0035848617553710938, "step": 290} +{"info/global_step": 291, "train_info/time_within_train_step": 2.7059645652770996, "step": 291} +{"train_info/time_between_train_steps": 0.003821849822998047, "step": 291} +{"info/global_step": 292, "train_info/time_within_train_step": 2.69670033454895, "step": 292} +{"train_info/time_between_train_steps": 0.0038695335388183594, "step": 292} +{"info/global_step": 293, "train_info/time_within_train_step": 2.701622247695923, "step": 293} +{"train_info/time_between_train_steps": 0.003569364547729492, "step": 293} +{"info/global_step": 294, "train_info/time_within_train_step": 2.877699136734009, "step": 294} +{"train_info/time_between_train_steps": 0.0035741329193115234, "step": 294} +{"info/global_step": 295, "train_info/time_within_train_step": 2.843026876449585, "step": 295} +{"train_info/time_between_train_steps": 0.0034942626953125, "step": 295} +{"info/global_step": 296, "train_info/time_within_train_step": 2.7205235958099365, "step": 296} +{"train_info/time_between_train_steps": 0.003587484359741211, "step": 296} +{"info/global_step": 297, "train_info/time_within_train_step": 2.75012469291687, "step": 297} +{"train_info/time_between_train_steps": 0.003586292266845703, "step": 297} +{"info/global_step": 298, "train_info/time_within_train_step": 2.8196768760681152, "step": 298} +{"train_info/time_between_train_steps": 0.003599405288696289, "step": 298} +{"info/global_step": 299, "train_info/time_within_train_step": 2.739973783493042, "step": 299} +{"train_info/time_between_train_steps": 0.0039789676666259766, "step": 299} +{"info/global_step": 300, "train_info/time_within_train_step": 2.7840425968170166, "step": 300} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 5466.0, "train_info/memory_max_reserved": 5466.0, "_timestamp": 1746286892, "_runtime": 914}, "step": 300} +{"logs": {"train/loss": 6.2315, "train/learning_rate": 0.0006, "train/epoch": 0.1, "_timestamp": 1746286892, "_runtime": 914}, "step": 300} +{"train_info/time_between_train_steps": 15.262081384658813, "step": 300} +{"info/global_step": 301, "train_info/time_within_train_step": 2.4867868423461914, "step": 301} +{"train_info/time_between_train_steps": 0.0040590763092041016, "step": 301} +{"info/global_step": 302, "train_info/time_within_train_step": 2.536252737045288, "step": 302} +{"train_info/time_between_train_steps": 0.004149675369262695, "step": 302} +{"info/global_step": 303, "train_info/time_within_train_step": 2.6907925605773926, "step": 303} +{"train_info/time_between_train_steps": 0.0035338401794433594, "step": 303} +{"info/global_step": 304, "train_info/time_within_train_step": 2.6910488605499268, "step": 304} +{"train_info/time_between_train_steps": 0.0036270618438720703, "step": 304} +{"info/global_step": 305, "train_info/time_within_train_step": 2.9212300777435303, "step": 305} +{"train_info/time_between_train_steps": 0.0036385059356689453, "step": 305} +{"info/global_step": 306, "train_info/time_within_train_step": 2.6980998516082764, "step": 306} +{"train_info/time_between_train_steps": 0.0035521984100341797, "step": 306} +{"info/global_step": 307, "train_info/time_within_train_step": 2.6958248615264893, "step": 307} +{"train_info/time_between_train_steps": 0.0039010047912597656, "step": 307} +{"info/global_step": 308, "train_info/time_within_train_step": 2.6973326206207275, "step": 308} +{"train_info/time_between_train_steps": 0.0037565231323242188, "step": 308} +{"info/global_step": 309, "train_info/time_within_train_step": 3.1201093196868896, "step": 309} +{"train_info/time_between_train_steps": 0.0035915374755859375, "step": 309} +{"info/global_step": 310, "train_info/time_within_train_step": 3.1608667373657227, "step": 310} +{"train_info/time_between_train_steps": 0.0037114620208740234, "step": 310} +{"info/global_step": 311, "train_info/time_within_train_step": 3.1082541942596436, "step": 311} +{"train_info/time_between_train_steps": 0.0036513805389404297, "step": 311} +{"info/global_step": 312, "train_info/time_within_train_step": 2.7311787605285645, "step": 312} +{"train_info/time_between_train_steps": 0.0035521984100341797, "step": 312} +{"info/global_step": 313, "train_info/time_within_train_step": 2.816948175430298, "step": 313} +{"train_info/time_between_train_steps": 0.00359344482421875, "step": 313} +{"info/global_step": 314, "train_info/time_within_train_step": 2.697272539138794, "step": 314} +{"train_info/time_between_train_steps": 0.0037946701049804688, "step": 314} +{"info/global_step": 315, "train_info/time_within_train_step": 2.6973235607147217, "step": 315} +{"train_info/time_between_train_steps": 0.0035316944122314453, "step": 315} +{"info/global_step": 316, "train_info/time_within_train_step": 2.6966512203216553, "step": 316} +{"train_info/time_between_train_steps": 0.003725290298461914, "step": 316} +{"info/global_step": 317, "train_info/time_within_train_step": 2.777855157852173, "step": 317} +{"train_info/time_between_train_steps": 0.003744840621948242, "step": 317} +{"info/global_step": 318, "train_info/time_within_train_step": 2.960890531539917, "step": 318} +{"train_info/time_between_train_steps": 0.003986835479736328, "step": 318} +{"info/global_step": 319, "train_info/time_within_train_step": 2.9544894695281982, "step": 319} +{"train_info/time_between_train_steps": 0.003788471221923828, "step": 319} +{"info/global_step": 320, "train_info/time_within_train_step": 2.709397554397583, "step": 320} +{"train_info/time_between_train_steps": 0.003904104232788086, "step": 320} +{"info/global_step": 321, "train_info/time_within_train_step": 2.700254201889038, "step": 321} +{"train_info/time_between_train_steps": 0.004782438278198242, "step": 321} +{"info/global_step": 322, "train_info/time_within_train_step": 2.700669527053833, "step": 322} +{"train_info/time_between_train_steps": 0.0038912296295166016, "step": 322} +{"info/global_step": 323, "train_info/time_within_train_step": 2.7488315105438232, "step": 323} +{"train_info/time_between_train_steps": 0.004033327102661133, "step": 323} +{"info/global_step": 324, "train_info/time_within_train_step": 2.8650736808776855, "step": 324} +{"train_info/time_between_train_steps": 0.0036537647247314453, "step": 324} +{"info/global_step": 325, "train_info/time_within_train_step": 2.709012031555176, "step": 325} +{"train_info/time_between_train_steps": 0.003603219985961914, "step": 325} +{"info/global_step": 326, "train_info/time_within_train_step": 2.7186622619628906, "step": 326} +{"train_info/time_between_train_steps": 0.0036263465881347656, "step": 326} +{"info/global_step": 327, "train_info/time_within_train_step": 2.8797237873077393, "step": 327} +{"train_info/time_between_train_steps": 0.0035233497619628906, "step": 327} +{"info/global_step": 328, "train_info/time_within_train_step": 2.7452428340911865, "step": 328} +{"train_info/time_between_train_steps": 0.003645658493041992, "step": 328} +{"info/global_step": 329, "train_info/time_within_train_step": 2.696532964706421, "step": 329} +{"train_info/time_between_train_steps": 0.0036079883575439453, "step": 329} +{"info/global_step": 330, "train_info/time_within_train_step": 2.8599298000335693, "step": 330} +{"train_info/time_between_train_steps": 0.0036232471466064453, "step": 330} +{"info/global_step": 331, "train_info/time_within_train_step": 2.9558265209198, "step": 331} +{"train_info/time_between_train_steps": 0.003626108169555664, "step": 331} +{"info/global_step": 332, "train_info/time_within_train_step": 2.831658363342285, "step": 332} +{"train_info/time_between_train_steps": 0.0036542415618896484, "step": 332} +{"info/global_step": 333, "train_info/time_within_train_step": 2.7784154415130615, "step": 333} +{"train_info/time_between_train_steps": 0.003543853759765625, "step": 333} +{"info/global_step": 334, "train_info/time_within_train_step": 2.769537925720215, "step": 334} +{"train_info/time_between_train_steps": 0.004021644592285156, "step": 334} +{"info/global_step": 335, "train_info/time_within_train_step": 2.7895278930664062, "step": 335} +{"train_info/time_between_train_steps": 0.0036230087280273438, "step": 335} +{"info/global_step": 336, "train_info/time_within_train_step": 2.7545411586761475, "step": 336} +{"train_info/time_between_train_steps": 0.003603696823120117, "step": 336} +{"info/global_step": 337, "train_info/time_within_train_step": 2.8498191833496094, "step": 337} +{"train_info/time_between_train_steps": 0.003637075424194336, "step": 337} +{"info/global_step": 338, "train_info/time_within_train_step": 2.8984313011169434, "step": 338} +{"train_info/time_between_train_steps": 0.0035953521728515625, "step": 338} +{"info/global_step": 339, "train_info/time_within_train_step": 2.809544563293457, "step": 339} +{"train_info/time_between_train_steps": 0.0035979747772216797, "step": 339} +{"info/global_step": 340, "train_info/time_within_train_step": 2.762521266937256, "step": 340} +{"train_info/time_between_train_steps": 0.0036292076110839844, "step": 340} +{"info/global_step": 341, "train_info/time_within_train_step": 2.8104746341705322, "step": 341} +{"train_info/time_between_train_steps": 0.0035126209259033203, "step": 341} +{"info/global_step": 342, "train_info/time_within_train_step": 2.763529062271118, "step": 342} +{"train_info/time_between_train_steps": 0.0036497116088867188, "step": 342} +{"info/global_step": 343, "train_info/time_within_train_step": 2.7300431728363037, "step": 343} +{"train_info/time_between_train_steps": 0.003604412078857422, "step": 343} +{"info/global_step": 344, "train_info/time_within_train_step": 2.7249131202697754, "step": 344} +{"train_info/time_between_train_steps": 0.0035898685455322266, "step": 344} +{"info/global_step": 345, "train_info/time_within_train_step": 2.826775312423706, "step": 345} +{"train_info/time_between_train_steps": 0.00406646728515625, "step": 345} +{"info/global_step": 346, "train_info/time_within_train_step": 2.811835527420044, "step": 346} +{"train_info/time_between_train_steps": 0.004181623458862305, "step": 346} +{"info/global_step": 347, "train_info/time_within_train_step": 2.819768190383911, "step": 347} +{"train_info/time_between_train_steps": 0.004171133041381836, "step": 347} +{"info/global_step": 348, "train_info/time_within_train_step": 2.7375450134277344, "step": 348} +{"train_info/time_between_train_steps": 0.004098176956176758, "step": 348} +{"info/global_step": 349, "train_info/time_within_train_step": 2.8924450874328613, "step": 349} +{"train_info/time_between_train_steps": 0.00403904914855957, "step": 349} +{"info/global_step": 350, "train_info/time_within_train_step": 2.929445266723633, "step": 350} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 5466.0, "train_info/memory_max_reserved": 5466.0, "_timestamp": 1746287053, "_runtime": 1075}, "step": 350} +{"logs": {"train/loss": 6.0946, "train/learning_rate": 0.0005888888888888889, "train/epoch": 0.12, "_timestamp": 1746287053, "_runtime": 1075}, "step": 350} +{"train_info/time_between_train_steps": 0.027364730834960938, "step": 350} +{"info/global_step": 351, "train_info/time_within_train_step": 2.791156530380249, "step": 351} +{"train_info/time_between_train_steps": 0.003946542739868164, "step": 351} +{"info/global_step": 352, "train_info/time_within_train_step": 2.7710416316986084, "step": 352} +{"train_info/time_between_train_steps": 0.004031181335449219, "step": 352} +{"info/global_step": 353, "train_info/time_within_train_step": 2.7507479190826416, "step": 353} +{"train_info/time_between_train_steps": 0.004225015640258789, "step": 353} +{"info/global_step": 354, "train_info/time_within_train_step": 2.726674795150757, "step": 354} +{"train_info/time_between_train_steps": 0.004082679748535156, "step": 354} +{"info/global_step": 355, "train_info/time_within_train_step": 2.7561819553375244, "step": 355} +{"train_info/time_between_train_steps": 0.003995418548583984, "step": 355} +{"info/global_step": 356, "train_info/time_within_train_step": 2.7394859790802, "step": 356} +{"train_info/time_between_train_steps": 0.004229545593261719, "step": 356} +{"info/global_step": 357, "train_info/time_within_train_step": 2.789090871810913, "step": 357} +{"train_info/time_between_train_steps": 0.004011631011962891, "step": 357} +{"info/global_step": 358, "train_info/time_within_train_step": 2.7403404712677, "step": 358} +{"train_info/time_between_train_steps": 0.003987550735473633, "step": 358} +{"info/global_step": 359, "train_info/time_within_train_step": 2.779557228088379, "step": 359} +{"train_info/time_between_train_steps": 0.0039861202239990234, "step": 359} +{"info/global_step": 360, "train_info/time_within_train_step": 2.7660045623779297, "step": 360} +{"train_info/time_between_train_steps": 0.0043125152587890625, "step": 360} +{"info/global_step": 361, "train_info/time_within_train_step": 2.857433795928955, "step": 361} +{"train_info/time_between_train_steps": 0.004107475280761719, "step": 361} +{"info/global_step": 362, "train_info/time_within_train_step": 2.7844526767730713, "step": 362} +{"train_info/time_between_train_steps": 0.004166841506958008, "step": 362} +{"info/global_step": 363, "train_info/time_within_train_step": 2.734858989715576, "step": 363} +{"train_info/time_between_train_steps": 0.004077434539794922, "step": 363} +{"info/global_step": 364, "train_info/time_within_train_step": 2.7419252395629883, "step": 364} +{"train_info/time_between_train_steps": 0.0040111541748046875, "step": 364} +{"info/global_step": 365, "train_info/time_within_train_step": 2.7656710147857666, "step": 365} +{"train_info/time_between_train_steps": 0.004016399383544922, "step": 365} +{"info/global_step": 366, "train_info/time_within_train_step": 2.7891476154327393, "step": 366} +{"train_info/time_between_train_steps": 0.003997087478637695, "step": 366} +{"info/global_step": 367, "train_info/time_within_train_step": 2.7515206336975098, "step": 367} +{"train_info/time_between_train_steps": 0.00395512580871582, "step": 367} +{"info/global_step": 368, "train_info/time_within_train_step": 2.780703067779541, "step": 368} +{"train_info/time_between_train_steps": 0.0039806365966796875, "step": 368} +{"info/global_step": 369, "train_info/time_within_train_step": 2.743117094039917, "step": 369} +{"train_info/time_between_train_steps": 0.004015684127807617, "step": 369} +{"info/global_step": 370, "train_info/time_within_train_step": 2.7540924549102783, "step": 370} +{"train_info/time_between_train_steps": 0.003941059112548828, "step": 370} +{"info/global_step": 371, "train_info/time_within_train_step": 2.8181185722351074, "step": 371} +{"train_info/time_between_train_steps": 0.004069805145263672, "step": 371} +{"info/global_step": 372, "train_info/time_within_train_step": 2.769003391265869, "step": 372} +{"train_info/time_between_train_steps": 0.004003286361694336, "step": 372} +{"info/global_step": 373, "train_info/time_within_train_step": 2.7346668243408203, "step": 373} +{"train_info/time_between_train_steps": 0.0040090084075927734, "step": 373} +{"info/global_step": 374, "train_info/time_within_train_step": 2.8408846855163574, "step": 374} +{"train_info/time_between_train_steps": 0.003921031951904297, "step": 374} +{"info/global_step": 375, "train_info/time_within_train_step": 2.778165578842163, "step": 375} +{"train_info/time_between_train_steps": 0.17935490608215332, "step": 375} +{"info/global_step": 376, "train_info/time_within_train_step": 2.6967599391937256, "step": 376} +{"train_info/time_between_train_steps": 0.0037631988525390625, "step": 376} +{"info/global_step": 377, "train_info/time_within_train_step": 2.708643674850464, "step": 377} +{"train_info/time_between_train_steps": 0.0037806034088134766, "step": 377} +{"info/global_step": 378, "train_info/time_within_train_step": 2.742311716079712, "step": 378} +{"train_info/time_between_train_steps": 0.003721475601196289, "step": 378} +{"info/global_step": 379, "train_info/time_within_train_step": 2.734464406967163, "step": 379} +{"train_info/time_between_train_steps": 0.0037589073181152344, "step": 379} +{"info/global_step": 380, "train_info/time_within_train_step": 2.7660155296325684, "step": 380} +{"train_info/time_between_train_steps": 0.0037412643432617188, "step": 380} +{"info/global_step": 381, "train_info/time_within_train_step": 2.752246379852295, "step": 381} +{"train_info/time_between_train_steps": 0.0037076473236083984, "step": 381} +{"info/global_step": 382, "train_info/time_within_train_step": 2.8644492626190186, "step": 382} +{"train_info/time_between_train_steps": 0.003823518753051758, "step": 382} +{"info/global_step": 383, "train_info/time_within_train_step": 2.785780191421509, "step": 383} +{"train_info/time_between_train_steps": 0.00484776496887207, "step": 383} +{"info/global_step": 384, "train_info/time_within_train_step": 2.7507567405700684, "step": 384} +{"train_info/time_between_train_steps": 0.0036954879760742188, "step": 384} +{"info/global_step": 385, "train_info/time_within_train_step": 2.7327401638031006, "step": 385} +{"train_info/time_between_train_steps": 0.0036592483520507812, "step": 385} +{"info/global_step": 386, "train_info/time_within_train_step": 2.769678831100464, "step": 386} +{"train_info/time_between_train_steps": 0.0037603378295898438, "step": 386} +{"info/global_step": 387, "train_info/time_within_train_step": 2.796584367752075, "step": 387} +{"train_info/time_between_train_steps": 0.0037238597869873047, "step": 387} +{"info/global_step": 388, "train_info/time_within_train_step": 2.7281503677368164, "step": 388} +{"train_info/time_between_train_steps": 0.0037059783935546875, "step": 388} +{"info/global_step": 389, "train_info/time_within_train_step": 2.7376508712768555, "step": 389} +{"train_info/time_between_train_steps": 0.003721952438354492, "step": 389} +{"info/global_step": 390, "train_info/time_within_train_step": 2.714829921722412, "step": 390} +{"train_info/time_between_train_steps": 0.0037267208099365234, "step": 390} +{"info/global_step": 391, "train_info/time_within_train_step": 3.081367254257202, "step": 391} +{"train_info/time_between_train_steps": 0.0035970211029052734, "step": 391} +{"info/global_step": 392, "train_info/time_within_train_step": 2.699054479598999, "step": 392} +{"train_info/time_between_train_steps": 0.003844022750854492, "step": 392} +{"info/global_step": 393, "train_info/time_within_train_step": 2.853426933288574, "step": 393} +{"train_info/time_between_train_steps": 0.0036134719848632812, "step": 393} +{"info/global_step": 394, "train_info/time_within_train_step": 2.95725154876709, "step": 394} +{"train_info/time_between_train_steps": 0.003621339797973633, "step": 394} +{"info/global_step": 395, "train_info/time_within_train_step": 2.727769374847412, "step": 395} +{"train_info/time_between_train_steps": 0.0037178993225097656, "step": 395} +{"info/global_step": 396, "train_info/time_within_train_step": 2.696920871734619, "step": 396} +{"train_info/time_between_train_steps": 0.003552675247192383, "step": 396} +{"info/global_step": 397, "train_info/time_within_train_step": 2.6966636180877686, "step": 397} +{"train_info/time_between_train_steps": 0.003658294677734375, "step": 397} +{"info/global_step": 398, "train_info/time_within_train_step": 2.82025408744812, "step": 398} +{"train_info/time_between_train_steps": 0.0035626888275146484, "step": 398} +{"info/global_step": 399, "train_info/time_within_train_step": 2.8407387733459473, "step": 399} +{"train_info/time_between_train_steps": 0.003651857376098633, "step": 399} +{"info/global_step": 400, "train_info/time_within_train_step": 2.7233805656433105, "step": 400} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 5466.0, "train_info/memory_max_reserved": 5466.0, "_timestamp": 1746287194, "_runtime": 1216}, "step": 400} +{"logs": {"train/loss": 5.9525, "train/learning_rate": 0.0005777777777777776, "train/epoch": 0.13, "_timestamp": 1746287194, "_runtime": 1216}, "step": 400} +{"train_info/time_between_train_steps": 14.049201011657715, "step": 400} +{"info/global_step": 401, "train_info/time_within_train_step": 2.4931554794311523, "step": 401} +{"train_info/time_between_train_steps": 0.0038290023803710938, "step": 401} +{"info/global_step": 402, "train_info/time_within_train_step": 2.5113613605499268, "step": 402} +{"train_info/time_between_train_steps": 0.004088401794433594, "step": 402} +{"info/global_step": 403, "train_info/time_within_train_step": 2.691070795059204, "step": 403} +{"train_info/time_between_train_steps": 0.004024982452392578, "step": 403} +{"info/global_step": 404, "train_info/time_within_train_step": 2.69429612159729, "step": 404} +{"train_info/time_between_train_steps": 0.004099130630493164, "step": 404} +{"info/global_step": 405, "train_info/time_within_train_step": 2.7226974964141846, "step": 405} +{"train_info/time_between_train_steps": 0.0042455196380615234, "step": 405} +{"info/global_step": 406, "train_info/time_within_train_step": 2.697216033935547, "step": 406} +{"train_info/time_between_train_steps": 0.00426030158996582, "step": 406} +{"info/global_step": 407, "train_info/time_within_train_step": 2.698214530944824, "step": 407} +{"train_info/time_between_train_steps": 0.004194498062133789, "step": 407} +{"info/global_step": 408, "train_info/time_within_train_step": 3.007866382598877, "step": 408} +{"train_info/time_between_train_steps": 0.00415492057800293, "step": 408} +{"info/global_step": 409, "train_info/time_within_train_step": 3.0681991577148438, "step": 409} +{"train_info/time_between_train_steps": 0.0041544437408447266, "step": 409} +{"info/global_step": 410, "train_info/time_within_train_step": 3.0896999835968018, "step": 410} +{"train_info/time_between_train_steps": 0.004715919494628906, "step": 410} +{"info/global_step": 411, "train_info/time_within_train_step": 2.7373297214508057, "step": 411} +{"train_info/time_between_train_steps": 0.004274845123291016, "step": 411} +{"info/global_step": 412, "train_info/time_within_train_step": 2.69844651222229, "step": 412} +{"train_info/time_between_train_steps": 0.004167795181274414, "step": 412} +{"info/global_step": 413, "train_info/time_within_train_step": 2.6991827487945557, "step": 413} +{"train_info/time_between_train_steps": 0.004166603088378906, "step": 413} +{"info/global_step": 414, "train_info/time_within_train_step": 2.69984769821167, "step": 414} +{"train_info/time_between_train_steps": 0.004099130630493164, "step": 414} +{"info/global_step": 415, "train_info/time_within_train_step": 2.712846517562866, "step": 415} +{"train_info/time_between_train_steps": 0.004151344299316406, "step": 415} +{"info/global_step": 416, "train_info/time_within_train_step": 2.8210840225219727, "step": 416} +{"train_info/time_between_train_steps": 0.0039670467376708984, "step": 416} +{"info/global_step": 417, "train_info/time_within_train_step": 3.0381243228912354, "step": 417} +{"train_info/time_between_train_steps": 0.003926992416381836, "step": 417} +{"info/global_step": 418, "train_info/time_within_train_step": 2.760370969772339, "step": 418} +{"train_info/time_between_train_steps": 0.00411534309387207, "step": 418} +{"info/global_step": 419, "train_info/time_within_train_step": 2.698472261428833, "step": 419} +{"train_info/time_between_train_steps": 0.004134178161621094, "step": 419} +{"info/global_step": 420, "train_info/time_within_train_step": 2.697465658187866, "step": 420} +{"train_info/time_between_train_steps": 0.004830121994018555, "step": 420} +{"info/global_step": 421, "train_info/time_within_train_step": 2.759981870651245, "step": 421} +{"train_info/time_between_train_steps": 0.004070281982421875, "step": 421} +{"info/global_step": 422, "train_info/time_within_train_step": 2.917091131210327, "step": 422} +{"train_info/time_between_train_steps": 0.0040547847747802734, "step": 422} +{"info/global_step": 423, "train_info/time_within_train_step": 2.7941157817840576, "step": 423} +{"train_info/time_between_train_steps": 0.004053354263305664, "step": 423} +{"info/global_step": 424, "train_info/time_within_train_step": 2.729663610458374, "step": 424} +{"train_info/time_between_train_steps": 0.004025936126708984, "step": 424} +{"info/global_step": 425, "train_info/time_within_train_step": 2.8319694995880127, "step": 425} +{"train_info/time_between_train_steps": 0.0040662288665771484, "step": 425} +{"info/global_step": 426, "train_info/time_within_train_step": 2.7982068061828613, "step": 426} +{"train_info/time_between_train_steps": 0.004181623458862305, "step": 426} +{"info/global_step": 427, "train_info/time_within_train_step": 2.7107796669006348, "step": 427} +{"train_info/time_between_train_steps": 0.003882169723510742, "step": 427} +{"info/global_step": 428, "train_info/time_within_train_step": 2.710038423538208, "step": 428} +{"train_info/time_between_train_steps": 0.00406646728515625, "step": 428} +{"info/global_step": 429, "train_info/time_within_train_step": 2.7768349647521973, "step": 429} +{"train_info/time_between_train_steps": 0.003972768783569336, "step": 429} +{"info/global_step": 430, "train_info/time_within_train_step": 2.8436734676361084, "step": 430} +{"train_info/time_between_train_steps": 0.004026174545288086, "step": 430} +{"info/global_step": 431, "train_info/time_within_train_step": 2.708185911178589, "step": 431} +{"train_info/time_between_train_steps": 0.0040209293365478516, "step": 431} +{"info/global_step": 432, "train_info/time_within_train_step": 2.7597811222076416, "step": 432} +{"train_info/time_between_train_steps": 0.0042362213134765625, "step": 432} +{"info/global_step": 433, "train_info/time_within_train_step": 2.9146792888641357, "step": 433} +{"train_info/time_between_train_steps": 0.0039637088775634766, "step": 433} +{"info/global_step": 434, "train_info/time_within_train_step": 2.8206639289855957, "step": 434} +{"train_info/time_between_train_steps": 0.003972530364990234, "step": 434} +{"info/global_step": 435, "train_info/time_within_train_step": 2.7947239875793457, "step": 435} +{"train_info/time_between_train_steps": 0.004026174545288086, "step": 435} +{"info/global_step": 436, "train_info/time_within_train_step": 2.786731719970703, "step": 436} +{"train_info/time_between_train_steps": 0.004075288772583008, "step": 436} +{"info/global_step": 437, "train_info/time_within_train_step": 2.7932870388031006, "step": 437} +{"train_info/time_between_train_steps": 0.004024028778076172, "step": 437} +{"info/global_step": 438, "train_info/time_within_train_step": 2.9058477878570557, "step": 438} +{"train_info/time_between_train_steps": 0.0037856101989746094, "step": 438} +{"info/global_step": 439, "train_info/time_within_train_step": 2.7214300632476807, "step": 439} +{"train_info/time_between_train_steps": 0.0038747787475585938, "step": 439} +{"info/global_step": 440, "train_info/time_within_train_step": 2.7917227745056152, "step": 440} +{"train_info/time_between_train_steps": 0.004743337631225586, "step": 440} +{"info/global_step": 441, "train_info/time_within_train_step": 2.9155361652374268, "step": 441} +{"train_info/time_between_train_steps": 0.003798246383666992, "step": 441} +{"info/global_step": 442, "train_info/time_within_train_step": 2.8064098358154297, "step": 442} +{"train_info/time_between_train_steps": 0.003835916519165039, "step": 442} +{"info/global_step": 443, "train_info/time_within_train_step": 2.7332074642181396, "step": 443} +{"train_info/time_between_train_steps": 0.003995180130004883, "step": 443} +{"info/global_step": 444, "train_info/time_within_train_step": 2.78437876701355, "step": 444} +{"train_info/time_between_train_steps": 0.0076406002044677734, "step": 444} +{"info/global_step": 445, "train_info/time_within_train_step": 2.802609920501709, "step": 445} +{"train_info/time_between_train_steps": 0.0037920475006103516, "step": 445} +{"info/global_step": 446, "train_info/time_within_train_step": 3.098980665206909, "step": 446} +{"train_info/time_between_train_steps": 0.0033407211303710938, "step": 446} +{"info/global_step": 447, "train_info/time_within_train_step": 2.6952097415924072, "step": 447} +{"train_info/time_between_train_steps": 0.0034782886505126953, "step": 447} +{"info/global_step": 448, "train_info/time_within_train_step": 2.696855306625366, "step": 448} +{"train_info/time_between_train_steps": 0.003340482711791992, "step": 448} +{"info/global_step": 449, "train_info/time_within_train_step": 2.7154831886291504, "step": 449} +{"train_info/time_between_train_steps": 0.0033135414123535156, "step": 449} +{"info/global_step": 450, "train_info/time_within_train_step": 2.8905527591705322, "step": 450} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 5466.0, "train_info/memory_max_reserved": 5466.0, "_timestamp": 1746287350, "_runtime": 1372}, "step": 450} +{"logs": {"train/loss": 5.8624, "train/learning_rate": 0.0005666666666666666, "train/epoch": 0.15, "_timestamp": 1746287350, "_runtime": 1372}, "step": 450} +{"train_info/time_between_train_steps": 0.11729574203491211, "step": 450} +{"info/global_step": 451, "train_info/time_within_train_step": 2.7835633754730225, "step": 451} +{"train_info/time_between_train_steps": 0.0033648014068603516, "step": 451} +{"info/global_step": 452, "train_info/time_within_train_step": 2.7305867671966553, "step": 452} +{"train_info/time_between_train_steps": 0.0034248828887939453, "step": 452} +{"info/global_step": 453, "train_info/time_within_train_step": 2.7375545501708984, "step": 453} +{"train_info/time_between_train_steps": 0.003541707992553711, "step": 453} +{"info/global_step": 454, "train_info/time_within_train_step": 2.8315865993499756, "step": 454} +{"train_info/time_between_train_steps": 0.0036122798919677734, "step": 454} +{"info/global_step": 455, "train_info/time_within_train_step": 2.8591396808624268, "step": 455} +{"train_info/time_between_train_steps": 0.003609895706176758, "step": 455} +{"info/global_step": 456, "train_info/time_within_train_step": 2.7803449630737305, "step": 456} +{"train_info/time_between_train_steps": 0.0037848949432373047, "step": 456} +{"info/global_step": 457, "train_info/time_within_train_step": 2.734501600265503, "step": 457} +{"train_info/time_between_train_steps": 0.003833770751953125, "step": 457} +{"info/global_step": 458, "train_info/time_within_train_step": 2.748260736465454, "step": 458} +{"train_info/time_between_train_steps": 0.0037026405334472656, "step": 458} +{"info/global_step": 459, "train_info/time_within_train_step": 2.81874942779541, "step": 459} +{"train_info/time_between_train_steps": 0.003529071807861328, "step": 459} +{"info/global_step": 460, "train_info/time_within_train_step": 2.7772371768951416, "step": 460} +{"train_info/time_between_train_steps": 0.0035495758056640625, "step": 460} +{"info/global_step": 461, "train_info/time_within_train_step": 2.732879400253296, "step": 461} +{"train_info/time_between_train_steps": 0.0035202503204345703, "step": 461} +{"info/global_step": 462, "train_info/time_within_train_step": 2.802913188934326, "step": 462} +{"train_info/time_between_train_steps": 0.003468036651611328, "step": 462} +{"info/global_step": 463, "train_info/time_within_train_step": 2.7031736373901367, "step": 463} +{"train_info/time_between_train_steps": 0.003476858139038086, "step": 463} +{"info/global_step": 464, "train_info/time_within_train_step": 2.6941142082214355, "step": 464} +{"train_info/time_between_train_steps": 0.0034656524658203125, "step": 464} +{"info/global_step": 465, "train_info/time_within_train_step": 2.6940512657165527, "step": 465} +{"train_info/time_between_train_steps": 0.003561258316040039, "step": 465} +{"info/global_step": 466, "train_info/time_within_train_step": 2.694983959197998, "step": 466} +{"train_info/time_between_train_steps": 0.0034630298614501953, "step": 466} +{"info/global_step": 467, "train_info/time_within_train_step": 2.6950464248657227, "step": 467} +{"train_info/time_between_train_steps": 0.0034639835357666016, "step": 467} +{"info/global_step": 468, "train_info/time_within_train_step": 2.695814847946167, "step": 468} +{"train_info/time_between_train_steps": 0.0034933090209960938, "step": 468} +{"info/global_step": 469, "train_info/time_within_train_step": 2.6949830055236816, "step": 469} +{"train_info/time_between_train_steps": 0.00353240966796875, "step": 469} +{"info/global_step": 470, "train_info/time_within_train_step": 2.69671630859375, "step": 470} +{"train_info/time_between_train_steps": 0.003541231155395508, "step": 470} +{"info/global_step": 471, "train_info/time_within_train_step": 2.695315361022949, "step": 471} +{"train_info/time_between_train_steps": 0.003464221954345703, "step": 471} +{"info/global_step": 472, "train_info/time_within_train_step": 2.6963391304016113, "step": 472} +{"train_info/time_between_train_steps": 0.0034902095794677734, "step": 472} +{"info/global_step": 473, "train_info/time_within_train_step": 2.6959118843078613, "step": 473} +{"train_info/time_between_train_steps": 0.0034716129302978516, "step": 473} +{"info/global_step": 474, "train_info/time_within_train_step": 2.6957967281341553, "step": 474} +{"train_info/time_between_train_steps": 0.003492116928100586, "step": 474} +{"info/global_step": 475, "train_info/time_within_train_step": 2.767418384552002, "step": 475} +{"train_info/time_between_train_steps": 0.0034949779510498047, "step": 475} +{"info/global_step": 476, "train_info/time_within_train_step": 2.890841484069824, "step": 476} +{"train_info/time_between_train_steps": 0.003504514694213867, "step": 476} +{"info/global_step": 477, "train_info/time_within_train_step": 2.8484339714050293, "step": 477} +{"train_info/time_between_train_steps": 0.0034554004669189453, "step": 477} +{"info/global_step": 478, "train_info/time_within_train_step": 2.695486068725586, "step": 478} +{"train_info/time_between_train_steps": 0.003529787063598633, "step": 478} +{"info/global_step": 479, "train_info/time_within_train_step": 2.6972837448120117, "step": 479} +{"train_info/time_between_train_steps": 0.0038404464721679688, "step": 479} +{"info/global_step": 480, "train_info/time_within_train_step": 2.697922706604004, "step": 480} +{"train_info/time_between_train_steps": 0.0036668777465820312, "step": 480} +{"info/global_step": 481, "train_info/time_within_train_step": 2.696869134902954, "step": 481} +{"train_info/time_between_train_steps": 0.0037260055541992188, "step": 481} +{"info/global_step": 482, "train_info/time_within_train_step": 2.828604221343994, "step": 482} +{"train_info/time_between_train_steps": 0.0034780502319335938, "step": 482} +{"info/global_step": 483, "train_info/time_within_train_step": 2.953800916671753, "step": 483} +{"train_info/time_between_train_steps": 0.0034894943237304688, "step": 483} +{"info/global_step": 484, "train_info/time_within_train_step": 2.737882375717163, "step": 484} +{"train_info/time_between_train_steps": 0.0034897327423095703, "step": 484} +{"info/global_step": 485, "train_info/time_within_train_step": 2.697348117828369, "step": 485} +{"train_info/time_between_train_steps": 0.0034990310668945312, "step": 485} +{"info/global_step": 486, "train_info/time_within_train_step": 2.778604030609131, "step": 486} +{"train_info/time_between_train_steps": 0.00351715087890625, "step": 486} +{"info/global_step": 487, "train_info/time_within_train_step": 3.0795812606811523, "step": 487} +{"train_info/time_between_train_steps": 0.0032935142517089844, "step": 487} +{"info/global_step": 488, "train_info/time_within_train_step": 2.6963794231414795, "step": 488} +{"train_info/time_between_train_steps": 0.003401041030883789, "step": 488} +{"info/global_step": 489, "train_info/time_within_train_step": 2.6952481269836426, "step": 489} +{"train_info/time_between_train_steps": 0.0033867359161376953, "step": 489} +{"info/global_step": 490, "train_info/time_within_train_step": 2.6967766284942627, "step": 490} +{"train_info/time_between_train_steps": 0.0034537315368652344, "step": 490} +{"info/global_step": 491, "train_info/time_within_train_step": 2.697312116622925, "step": 491} +{"train_info/time_between_train_steps": 0.0033731460571289062, "step": 491} +{"info/global_step": 492, "train_info/time_within_train_step": 2.697537899017334, "step": 492} +{"train_info/time_between_train_steps": 0.003300189971923828, "step": 492} +{"info/global_step": 493, "train_info/time_within_train_step": 2.716102361679077, "step": 493} +{"train_info/time_between_train_steps": 0.0036025047302246094, "step": 493} +{"info/global_step": 494, "train_info/time_within_train_step": 2.892422676086426, "step": 494} +{"train_info/time_between_train_steps": 0.003342866897583008, "step": 494} +{"info/global_step": 495, "train_info/time_within_train_step": 2.9727256298065186, "step": 495} +{"train_info/time_between_train_steps": 0.0034589767456054688, "step": 495} +{"info/global_step": 496, "train_info/time_within_train_step": 2.716315507888794, "step": 496} +{"train_info/time_between_train_steps": 0.003369569778442383, "step": 496} +{"info/global_step": 497, "train_info/time_within_train_step": 2.6978070735931396, "step": 497} +{"train_info/time_between_train_steps": 0.0033118724822998047, "step": 497} +{"info/global_step": 498, "train_info/time_within_train_step": 2.6951115131378174, "step": 498} +{"train_info/time_between_train_steps": 0.003312826156616211, "step": 498} +{"info/global_step": 499, "train_info/time_within_train_step": 2.6952786445617676, "step": 499} +{"train_info/time_between_train_steps": 0.003297090530395508, "step": 499} +{"info/global_step": 500, "train_info/time_within_train_step": 3.227508306503296, "step": 500} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 5466.0, "train_info/memory_max_reserved": 5466.0, "_timestamp": 1746287494, "_runtime": 1516}, "step": 500} +{"logs": {"train/loss": 5.7829, "train/learning_rate": 0.0005555555555555556, "train/epoch": 0.17, "_timestamp": 1746287494, "_runtime": 1516}, "step": 500} +{"train_info/time_between_train_steps": 14.146849870681763, "step": 500} +{"info/global_step": 501, "train_info/time_within_train_step": 2.4920132160186768, "step": 501} +{"train_info/time_between_train_steps": 0.0033507347106933594, "step": 501} +{"info/global_step": 502, "train_info/time_within_train_step": 2.513633966445923, "step": 502} +{"train_info/time_between_train_steps": 0.003323078155517578, "step": 502} +{"info/global_step": 503, "train_info/time_within_train_step": 2.68761944770813, "step": 503} +{"train_info/time_between_train_steps": 0.0033049583435058594, "step": 503} +{"info/global_step": 504, "train_info/time_within_train_step": 2.690019130706787, "step": 504} +{"train_info/time_between_train_steps": 0.003278970718383789, "step": 504} +{"info/global_step": 505, "train_info/time_within_train_step": 2.690350294113159, "step": 505} +{"train_info/time_between_train_steps": 0.0033550262451171875, "step": 505} +{"info/global_step": 506, "train_info/time_within_train_step": 2.692779779434204, "step": 506} +{"train_info/time_between_train_steps": 0.003274679183959961, "step": 506} +{"info/global_step": 507, "train_info/time_within_train_step": 2.6931190490722656, "step": 507} +{"train_info/time_between_train_steps": 0.0033054351806640625, "step": 507} +{"info/global_step": 508, "train_info/time_within_train_step": 2.9449901580810547, "step": 508} +{"train_info/time_between_train_steps": 0.0033016204833984375, "step": 508} +{"info/global_step": 509, "train_info/time_within_train_step": 3.107529640197754, "step": 509} +{"train_info/time_between_train_steps": 0.0032966136932373047, "step": 509} +{"info/global_step": 510, "train_info/time_within_train_step": 3.0402047634124756, "step": 510} +{"train_info/time_between_train_steps": 0.0033254623413085938, "step": 510} +{"info/global_step": 511, "train_info/time_within_train_step": 2.712599754333496, "step": 511} +{"train_info/time_between_train_steps": 0.0032510757446289062, "step": 511} +{"info/global_step": 512, "train_info/time_within_train_step": 2.6945724487304688, "step": 512} +{"train_info/time_between_train_steps": 0.003352642059326172, "step": 512} +{"info/global_step": 513, "train_info/time_within_train_step": 2.6934826374053955, "step": 513} +{"train_info/time_between_train_steps": 0.0032427310943603516, "step": 513} +{"info/global_step": 514, "train_info/time_within_train_step": 2.69472074508667, "step": 514} +{"train_info/time_between_train_steps": 0.0032701492309570312, "step": 514} +{"info/global_step": 515, "train_info/time_within_train_step": 2.756654739379883, "step": 515} +{"train_info/time_between_train_steps": 0.0032601356506347656, "step": 515} +{"info/global_step": 516, "train_info/time_within_train_step": 2.9507670402526855, "step": 516} +{"train_info/time_between_train_steps": 0.003305196762084961, "step": 516} +{"info/global_step": 517, "train_info/time_within_train_step": 2.9633333683013916, "step": 517} +{"train_info/time_between_train_steps": 0.0032584667205810547, "step": 517} +{"info/global_step": 518, "train_info/time_within_train_step": 2.700289487838745, "step": 518} +{"train_info/time_between_train_steps": 0.003298521041870117, "step": 518} +{"info/global_step": 519, "train_info/time_within_train_step": 2.6959824562072754, "step": 519} +{"train_info/time_between_train_steps": 0.0032913684844970703, "step": 519} +{"info/global_step": 520, "train_info/time_within_train_step": 2.6947145462036133, "step": 520} +{"train_info/time_between_train_steps": 0.0032203197479248047, "step": 520} +{"info/global_step": 521, "train_info/time_within_train_step": 2.725538492202759, "step": 521} +{"train_info/time_between_train_steps": 0.0033066272735595703, "step": 521} +{"info/global_step": 522, "train_info/time_within_train_step": 2.868415355682373, "step": 522} +{"train_info/time_between_train_steps": 0.003309488296508789, "step": 522} +{"info/global_step": 523, "train_info/time_within_train_step": 2.7810661792755127, "step": 523} +{"train_info/time_between_train_steps": 0.0033516883850097656, "step": 523} +{"info/global_step": 524, "train_info/time_within_train_step": 2.780224084854126, "step": 524} +{"train_info/time_between_train_steps": 0.003318309783935547, "step": 524} +{"info/global_step": 525, "train_info/time_within_train_step": 2.7680349349975586, "step": 525} +{"train_info/time_between_train_steps": 0.0033767223358154297, "step": 525} +{"info/global_step": 526, "train_info/time_within_train_step": 2.843621015548706, "step": 526} +{"train_info/time_between_train_steps": 0.003326416015625, "step": 526} +{"info/global_step": 527, "train_info/time_within_train_step": 2.906672716140747, "step": 527} +{"train_info/time_between_train_steps": 0.003259420394897461, "step": 527} +{"info/global_step": 528, "train_info/time_within_train_step": 2.8340084552764893, "step": 528} +{"train_info/time_between_train_steps": 0.0033981800079345703, "step": 528} +{"info/global_step": 529, "train_info/time_within_train_step": 2.7428460121154785, "step": 529} +{"train_info/time_between_train_steps": 0.003362417221069336, "step": 529} +{"info/global_step": 530, "train_info/time_within_train_step": 2.6988236904144287, "step": 530} +{"train_info/time_between_train_steps": 0.0033769607543945312, "step": 530} +{"info/global_step": 531, "train_info/time_within_train_step": 2.857898712158203, "step": 531} +{"train_info/time_between_train_steps": 0.00331878662109375, "step": 531} +{"info/global_step": 532, "train_info/time_within_train_step": 2.9428722858428955, "step": 532} +{"train_info/time_between_train_steps": 0.003281831741333008, "step": 532} +{"info/global_step": 533, "train_info/time_within_train_step": 2.8822386264801025, "step": 533} +{"train_info/time_between_train_steps": 0.0035169124603271484, "step": 533} +{"info/global_step": 534, "train_info/time_within_train_step": 2.754117965698242, "step": 534} +{"train_info/time_between_train_steps": 0.003448486328125, "step": 534} +{"info/global_step": 535, "train_info/time_within_train_step": 2.8798749446868896, "step": 535} +{"train_info/time_between_train_steps": 0.003386259078979492, "step": 535} +{"info/global_step": 536, "train_info/time_within_train_step": 2.839069366455078, "step": 536} +{"train_info/time_between_train_steps": 0.003587961196899414, "step": 536} +{"info/global_step": 537, "train_info/time_within_train_step": 2.8764476776123047, "step": 537} +{"train_info/time_between_train_steps": 0.003554105758666992, "step": 537} +{"info/global_step": 538, "train_info/time_within_train_step": 2.7310242652893066, "step": 538} +{"train_info/time_between_train_steps": 0.003901243209838867, "step": 538} +{"info/global_step": 539, "train_info/time_within_train_step": 2.796124219894409, "step": 539} +{"train_info/time_between_train_steps": 0.003572225570678711, "step": 539} +{"info/global_step": 540, "train_info/time_within_train_step": 2.9276459217071533, "step": 540} +{"train_info/time_between_train_steps": 0.003341197967529297, "step": 540} +{"info/global_step": 541, "train_info/time_within_train_step": 2.8117411136627197, "step": 541} +{"train_info/time_between_train_steps": 0.0033795833587646484, "step": 541} +{"info/global_step": 542, "train_info/time_within_train_step": 2.748950719833374, "step": 542} +{"train_info/time_between_train_steps": 0.0033500194549560547, "step": 542} +{"info/global_step": 543, "train_info/time_within_train_step": 2.7932333946228027, "step": 543} +{"train_info/time_between_train_steps": 0.003412008285522461, "step": 543} +{"info/global_step": 544, "train_info/time_within_train_step": 2.8200058937072754, "step": 544} +{"train_info/time_between_train_steps": 0.0036668777465820312, "step": 544} +{"info/global_step": 545, "train_info/time_within_train_step": 2.7818057537078857, "step": 545} +{"train_info/time_between_train_steps": 0.003370046615600586, "step": 545} +{"info/global_step": 546, "train_info/time_within_train_step": 2.778756856918335, "step": 546} +{"train_info/time_between_train_steps": 0.0033538341522216797, "step": 546} +{"info/global_step": 547, "train_info/time_within_train_step": 2.7187492847442627, "step": 547} +{"train_info/time_between_train_steps": 0.0033905506134033203, "step": 547} +{"info/global_step": 548, "train_info/time_within_train_step": 2.7754459381103516, "step": 548} +{"train_info/time_between_train_steps": 0.0037565231323242188, "step": 548} +{"info/global_step": 549, "train_info/time_within_train_step": 2.7987961769104004, "step": 549} +{"train_info/time_between_train_steps": 0.0034317970275878906, "step": 549} +{"info/global_step": 550, "train_info/time_within_train_step": 2.8349034786224365, "step": 550} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 5466.0, "train_info/memory_max_reserved": 5466.0, "_timestamp": 1746287650, "_runtime": 1672}, "step": 550} +{"logs": {"train/loss": 5.7077, "train/learning_rate": 0.0005444444444444444, "train/epoch": 0.18, "_timestamp": 1746287650, "_runtime": 1672}, "step": 550} +{"train_info/time_between_train_steps": 0.027584314346313477, "step": 550} +{"info/global_step": 551, "train_info/time_within_train_step": 2.772981882095337, "step": 551} +{"train_info/time_between_train_steps": 0.003313779830932617, "step": 551} +{"info/global_step": 552, "train_info/time_within_train_step": 2.755167007446289, "step": 552} +{"train_info/time_between_train_steps": 0.003428936004638672, "step": 552} +{"info/global_step": 553, "train_info/time_within_train_step": 2.8119261264801025, "step": 553} +{"train_info/time_between_train_steps": 0.003366231918334961, "step": 553} +{"info/global_step": 554, "train_info/time_within_train_step": 2.8222815990448, "step": 554} +{"train_info/time_between_train_steps": 0.003401517868041992, "step": 554} +{"info/global_step": 555, "train_info/time_within_train_step": 2.833782911300659, "step": 555} +{"train_info/time_between_train_steps": 0.003325223922729492, "step": 555} +{"info/global_step": 556, "train_info/time_within_train_step": 2.750060558319092, "step": 556} +{"train_info/time_between_train_steps": 0.0032629966735839844, "step": 556} +{"info/global_step": 557, "train_info/time_within_train_step": 2.783278703689575, "step": 557} +{"train_info/time_between_train_steps": 0.0033392906188964844, "step": 557} +{"info/global_step": 558, "train_info/time_within_train_step": 2.901731014251709, "step": 558} +{"train_info/time_between_train_steps": 0.003300905227661133, "step": 558} +{"info/global_step": 559, "train_info/time_within_train_step": 2.797994375228882, "step": 559} +{"train_info/time_between_train_steps": 0.0033376216888427734, "step": 559} +{"info/global_step": 560, "train_info/time_within_train_step": 2.7286267280578613, "step": 560} +{"train_info/time_between_train_steps": 0.003374338150024414, "step": 560} +{"info/global_step": 561, "train_info/time_within_train_step": 2.7312629222869873, "step": 561} +{"train_info/time_between_train_steps": 0.003265857696533203, "step": 561} +{"info/global_step": 562, "train_info/time_within_train_step": 2.7741870880126953, "step": 562} +{"train_info/time_between_train_steps": 0.003324270248413086, "step": 562} +{"info/global_step": 563, "train_info/time_within_train_step": 2.824958086013794, "step": 563} +{"train_info/time_between_train_steps": 0.0033957958221435547, "step": 563} +{"info/global_step": 564, "train_info/time_within_train_step": 2.740938901901245, "step": 564} +{"train_info/time_between_train_steps": 0.003337383270263672, "step": 564} +{"info/global_step": 565, "train_info/time_within_train_step": 2.7714195251464844, "step": 565} +{"train_info/time_between_train_steps": 0.003536701202392578, "step": 565} +{"info/global_step": 566, "train_info/time_within_train_step": 2.742366075515747, "step": 566} +{"train_info/time_between_train_steps": 0.0034177303314208984, "step": 566} +{"info/global_step": 567, "train_info/time_within_train_step": 2.7211711406707764, "step": 567} +{"train_info/time_between_train_steps": 0.0033473968505859375, "step": 567} +{"info/global_step": 568, "train_info/time_within_train_step": 2.760103702545166, "step": 568} +{"train_info/time_between_train_steps": 0.0033397674560546875, "step": 568} +{"info/global_step": 569, "train_info/time_within_train_step": 2.801616668701172, "step": 569} +{"train_info/time_between_train_steps": 0.003262758255004883, "step": 569} +{"info/global_step": 570, "train_info/time_within_train_step": 2.7565979957580566, "step": 570} +{"train_info/time_between_train_steps": 0.0034935474395751953, "step": 570} +{"info/global_step": 571, "train_info/time_within_train_step": 2.72148060798645, "step": 571} +{"train_info/time_between_train_steps": 0.003275156021118164, "step": 571} +{"info/global_step": 572, "train_info/time_within_train_step": 2.789806842803955, "step": 572} +{"train_info/time_between_train_steps": 0.0032804012298583984, "step": 572} +{"info/global_step": 573, "train_info/time_within_train_step": 2.801029682159424, "step": 573} +{"train_info/time_between_train_steps": 0.003309965133666992, "step": 573} +{"info/global_step": 574, "train_info/time_within_train_step": 2.7302870750427246, "step": 574} +{"train_info/time_between_train_steps": 0.0033605098724365234, "step": 574} +{"info/global_step": 575, "train_info/time_within_train_step": 2.7460269927978516, "step": 575} +{"train_info/time_between_train_steps": 0.0033254623413085938, "step": 575} +{"info/global_step": 576, "train_info/time_within_train_step": 2.802793502807617, "step": 576} +{"train_info/time_between_train_steps": 0.0033180713653564453, "step": 576} +{"info/global_step": 577, "train_info/time_within_train_step": 2.700502872467041, "step": 577} +{"train_info/time_between_train_steps": 0.0032935142517089844, "step": 577} +{"info/global_step": 578, "train_info/time_within_train_step": 2.752462148666382, "step": 578} +{"train_info/time_between_train_steps": 0.003329753875732422, "step": 578} +{"info/global_step": 579, "train_info/time_within_train_step": 2.7873551845550537, "step": 579} +{"train_info/time_between_train_steps": 0.003339529037475586, "step": 579} +{"info/global_step": 580, "train_info/time_within_train_step": 2.7369041442871094, "step": 580} +{"train_info/time_between_train_steps": 0.003302335739135742, "step": 580} +{"info/global_step": 581, "train_info/time_within_train_step": 2.831705093383789, "step": 581} +{"train_info/time_between_train_steps": 0.0034499168395996094, "step": 581} +{"info/global_step": 582, "train_info/time_within_train_step": 2.7496166229248047, "step": 582} +{"train_info/time_between_train_steps": 0.003335714340209961, "step": 582} +{"info/global_step": 583, "train_info/time_within_train_step": 2.751155138015747, "step": 583} +{"train_info/time_between_train_steps": 0.003286600112915039, "step": 583} +{"info/global_step": 584, "train_info/time_within_train_step": 2.8404321670532227, "step": 584} +{"train_info/time_between_train_steps": 0.0033113956451416016, "step": 584} +{"info/global_step": 585, "train_info/time_within_train_step": 2.7061123847961426, "step": 585} +{"train_info/time_between_train_steps": 0.0032329559326171875, "step": 585} +{"info/global_step": 586, "train_info/time_within_train_step": 2.6953773498535156, "step": 586} +{"train_info/time_between_train_steps": 0.003314495086669922, "step": 586} +{"info/global_step": 587, "train_info/time_within_train_step": 2.7854831218719482, "step": 587} +{"train_info/time_between_train_steps": 0.0033507347106933594, "step": 587} +{"info/global_step": 588, "train_info/time_within_train_step": 2.882199287414551, "step": 588} +{"train_info/time_between_train_steps": 0.0032911300659179688, "step": 588} +{"info/global_step": 589, "train_info/time_within_train_step": 2.7943155765533447, "step": 589} +{"train_info/time_between_train_steps": 0.003309965133666992, "step": 589} +{"info/global_step": 590, "train_info/time_within_train_step": 2.7133045196533203, "step": 590} +{"train_info/time_between_train_steps": 0.0032448768615722656, "step": 590} +{"info/global_step": 591, "train_info/time_within_train_step": 2.7463152408599854, "step": 591} +{"train_info/time_between_train_steps": 0.003348827362060547, "step": 591} +{"info/global_step": 592, "train_info/time_within_train_step": 2.863079786300659, "step": 592} +{"train_info/time_between_train_steps": 0.0033333301544189453, "step": 592} +{"info/global_step": 593, "train_info/time_within_train_step": 2.7543723583221436, "step": 593} +{"train_info/time_between_train_steps": 0.0033104419708251953, "step": 593} +{"info/global_step": 594, "train_info/time_within_train_step": 2.695045232772827, "step": 594} +{"train_info/time_between_train_steps": 0.0032339096069335938, "step": 594} +{"info/global_step": 595, "train_info/time_within_train_step": 2.6964564323425293, "step": 595} +{"train_info/time_between_train_steps": 0.0032737255096435547, "step": 595} +{"info/global_step": 596, "train_info/time_within_train_step": 2.697014808654785, "step": 596} +{"train_info/time_between_train_steps": 0.0033295154571533203, "step": 596} +{"info/global_step": 597, "train_info/time_within_train_step": 2.852935791015625, "step": 597} +{"train_info/time_between_train_steps": 0.0034339427947998047, "step": 597} +{"info/global_step": 598, "train_info/time_within_train_step": 2.8643107414245605, "step": 598} +{"train_info/time_between_train_steps": 0.003298521041870117, "step": 598} +{"info/global_step": 599, "train_info/time_within_train_step": 2.747802972793579, "step": 599} +{"train_info/time_between_train_steps": 0.003261089324951172, "step": 599} +{"info/global_step": 600, "train_info/time_within_train_step": 2.7185776233673096, "step": 600} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 5466.0, "train_info/memory_max_reserved": 5466.0, "_timestamp": 1746287791, "_runtime": 1813}, "step": 600} +{"logs": {"train/loss": 5.6411, "train/learning_rate": 0.0005333333333333333, "train/epoch": 0.2, "_timestamp": 1746287791, "_runtime": 1813}, "step": 600} +{"train_info/time_between_train_steps": 13.722306966781616, "step": 600} +{"info/global_step": 601, "train_info/time_within_train_step": 2.484534502029419, "step": 601} +{"train_info/time_between_train_steps": 0.003435373306274414, "step": 601} +{"info/global_step": 602, "train_info/time_within_train_step": 2.534651279449463, "step": 602} +{"train_info/time_between_train_steps": 0.003818511962890625, "step": 602} +{"info/global_step": 603, "train_info/time_within_train_step": 2.6927590370178223, "step": 603} +{"train_info/time_between_train_steps": 0.0035064220428466797, "step": 603} +{"info/global_step": 604, "train_info/time_within_train_step": 2.6939871311187744, "step": 604} +{"train_info/time_between_train_steps": 0.006857156753540039, "step": 604} +{"info/global_step": 605, "train_info/time_within_train_step": 2.6946873664855957, "step": 605} +{"train_info/time_between_train_steps": 0.0034148693084716797, "step": 605} +{"info/global_step": 606, "train_info/time_within_train_step": 2.6970343589782715, "step": 606} +{"train_info/time_between_train_steps": 0.0036427974700927734, "step": 606} +{"info/global_step": 607, "train_info/time_within_train_step": 2.697998523712158, "step": 607} +{"train_info/time_between_train_steps": 0.003582000732421875, "step": 607} +{"info/global_step": 608, "train_info/time_within_train_step": 2.9646785259246826, "step": 608} +{"train_info/time_between_train_steps": 0.0036172866821289062, "step": 608} +{"info/global_step": 609, "train_info/time_within_train_step": 3.064209222793579, "step": 609} +{"train_info/time_between_train_steps": 0.003701448440551758, "step": 609} +{"info/global_step": 610, "train_info/time_within_train_step": 2.862887382507324, "step": 610} +{"train_info/time_between_train_steps": 0.0037043094635009766, "step": 610} +{"info/global_step": 611, "train_info/time_within_train_step": 2.699949264526367, "step": 611} +{"train_info/time_between_train_steps": 0.0036478042602539062, "step": 611} +{"info/global_step": 612, "train_info/time_within_train_step": 2.6946842670440674, "step": 612} +{"train_info/time_between_train_steps": 0.0036106109619140625, "step": 612} +{"info/global_step": 613, "train_info/time_within_train_step": 2.6955771446228027, "step": 613} +{"train_info/time_between_train_steps": 0.004296541213989258, "step": 613} +{"info/global_step": 614, "train_info/time_within_train_step": 2.69766902923584, "step": 614} +{"train_info/time_between_train_steps": 0.0037925243377685547, "step": 614} +{"info/global_step": 615, "train_info/time_within_train_step": 2.6966052055358887, "step": 615} +{"train_info/time_between_train_steps": 0.0036194324493408203, "step": 615} +{"info/global_step": 616, "train_info/time_within_train_step": 2.7069857120513916, "step": 616} +{"train_info/time_between_train_steps": 0.0036344528198242188, "step": 616} +{"info/global_step": 617, "train_info/time_within_train_step": 2.6978135108947754, "step": 617} +{"train_info/time_between_train_steps": 0.0036547183990478516, "step": 617} +{"info/global_step": 618, "train_info/time_within_train_step": 2.899230718612671, "step": 618} +{"train_info/time_between_train_steps": 0.0033495426177978516, "step": 618} +{"info/global_step": 619, "train_info/time_within_train_step": 2.6972317695617676, "step": 619} +{"train_info/time_between_train_steps": 0.0033478736877441406, "step": 619} +{"info/global_step": 620, "train_info/time_within_train_step": 2.698150157928467, "step": 620} +{"train_info/time_between_train_steps": 0.0034706592559814453, "step": 620} +{"info/global_step": 621, "train_info/time_within_train_step": 2.6978859901428223, "step": 621} +{"train_info/time_between_train_steps": 0.0033326148986816406, "step": 621} +{"info/global_step": 622, "train_info/time_within_train_step": 2.6972813606262207, "step": 622} +{"train_info/time_between_train_steps": 0.0033838748931884766, "step": 622} +{"info/global_step": 623, "train_info/time_within_train_step": 2.825739622116089, "step": 623} +{"train_info/time_between_train_steps": 0.0034170150756835938, "step": 623} +{"info/global_step": 624, "train_info/time_within_train_step": 3.0473265647888184, "step": 624} +{"train_info/time_between_train_steps": 0.0033304691314697266, "step": 624} +{"info/global_step": 625, "train_info/time_within_train_step": 2.8622279167175293, "step": 625} +{"train_info/time_between_train_steps": 0.003348112106323242, "step": 625} +{"info/global_step": 626, "train_info/time_within_train_step": 2.696817636489868, "step": 626} +{"train_info/time_between_train_steps": 0.0033142566680908203, "step": 626} +{"info/global_step": 627, "train_info/time_within_train_step": 2.6968133449554443, "step": 627} +{"train_info/time_between_train_steps": 0.0033218860626220703, "step": 627} +{"info/global_step": 628, "train_info/time_within_train_step": 2.7362570762634277, "step": 628} +{"train_info/time_between_train_steps": 0.003339529037475586, "step": 628} +{"info/global_step": 629, "train_info/time_within_train_step": 2.9902050495147705, "step": 629} +{"train_info/time_between_train_steps": 0.0034856796264648438, "step": 629} +{"info/global_step": 630, "train_info/time_within_train_step": 2.95418381690979, "step": 630} +{"train_info/time_between_train_steps": 0.0033102035522460938, "step": 630} +{"info/global_step": 631, "train_info/time_within_train_step": 2.7289602756500244, "step": 631} +{"train_info/time_between_train_steps": 0.003362894058227539, "step": 631} +{"info/global_step": 632, "train_info/time_within_train_step": 2.7041261196136475, "step": 632} +{"train_info/time_between_train_steps": 0.0033621788024902344, "step": 632} +{"info/global_step": 633, "train_info/time_within_train_step": 2.8741238117218018, "step": 633} +{"train_info/time_between_train_steps": 0.003376483917236328, "step": 633} +{"info/global_step": 634, "train_info/time_within_train_step": 3.0168275833129883, "step": 634} +{"train_info/time_between_train_steps": 0.003543376922607422, "step": 634} +{"info/global_step": 635, "train_info/time_within_train_step": 2.8035967350006104, "step": 635} +{"train_info/time_between_train_steps": 0.0033867359161376953, "step": 635} +{"info/global_step": 636, "train_info/time_within_train_step": 2.714155912399292, "step": 636} +{"train_info/time_between_train_steps": 0.0033876895904541016, "step": 636} +{"info/global_step": 637, "train_info/time_within_train_step": 2.85737681388855, "step": 637} +{"train_info/time_between_train_steps": 0.003461599349975586, "step": 637} +{"info/global_step": 638, "train_info/time_within_train_step": 2.9152984619140625, "step": 638} +{"train_info/time_between_train_steps": 0.003532886505126953, "step": 638} +{"info/global_step": 639, "train_info/time_within_train_step": 2.762057065963745, "step": 639} +{"train_info/time_between_train_steps": 0.003482818603515625, "step": 639} +{"info/global_step": 640, "train_info/time_within_train_step": 2.71504282951355, "step": 640} +{"train_info/time_between_train_steps": 0.0034410953521728516, "step": 640} +{"info/global_step": 641, "train_info/time_within_train_step": 2.8540656566619873, "step": 641} +{"train_info/time_between_train_steps": 0.0034034252166748047, "step": 641} +{"info/global_step": 642, "train_info/time_within_train_step": 2.9646928310394287, "step": 642} +{"train_info/time_between_train_steps": 0.003560781478881836, "step": 642} +{"info/global_step": 643, "train_info/time_within_train_step": 2.8826892375946045, "step": 643} +{"train_info/time_between_train_steps": 0.003488779067993164, "step": 643} +{"info/global_step": 644, "train_info/time_within_train_step": 2.7850992679595947, "step": 644} +{"train_info/time_between_train_steps": 0.003387928009033203, "step": 644} +{"info/global_step": 645, "train_info/time_within_train_step": 2.7734029293060303, "step": 645} +{"train_info/time_between_train_steps": 0.003361940383911133, "step": 645} +{"info/global_step": 646, "train_info/time_within_train_step": 2.8164658546447754, "step": 646} +{"train_info/time_between_train_steps": 0.003358125686645508, "step": 646} +{"info/global_step": 647, "train_info/time_within_train_step": 2.8843789100646973, "step": 647} +{"train_info/time_between_train_steps": 0.0033431053161621094, "step": 647} +{"info/global_step": 648, "train_info/time_within_train_step": 2.832167625427246, "step": 648} +{"train_info/time_between_train_steps": 0.0033795833587646484, "step": 648} +{"info/global_step": 649, "train_info/time_within_train_step": 2.735698938369751, "step": 649} +{"train_info/time_between_train_steps": 0.003394603729248047, "step": 649} +{"info/global_step": 650, "train_info/time_within_train_step": 2.7595596313476562, "step": 650} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 5466.0, "train_info/memory_max_reserved": 5466.0, "_timestamp": 1746287949, "_runtime": 1971}, "step": 650} +{"logs": {"train/loss": 5.5967, "train/learning_rate": 0.0005222222222222222, "train/epoch": 0.22, "_timestamp": 1746287949, "_runtime": 1971}, "step": 650} +{"train_info/time_between_train_steps": 0.04271435737609863, "step": 650} +{"info/global_step": 651, "train_info/time_within_train_step": 2.8394436836242676, "step": 651} +{"train_info/time_between_train_steps": 0.0034134387969970703, "step": 651} +{"info/global_step": 652, "train_info/time_within_train_step": 2.844925880432129, "step": 652} +{"train_info/time_between_train_steps": 0.003344297409057617, "step": 652} +{"info/global_step": 653, "train_info/time_within_train_step": 2.8121206760406494, "step": 653} +{"train_info/time_between_train_steps": 0.003484964370727539, "step": 653} +{"info/global_step": 654, "train_info/time_within_train_step": 2.797683000564575, "step": 654} +{"train_info/time_between_train_steps": 0.003451108932495117, "step": 654} +{"info/global_step": 655, "train_info/time_within_train_step": 2.857003927230835, "step": 655} +{"train_info/time_between_train_steps": 0.0034215450286865234, "step": 655} +{"info/global_step": 656, "train_info/time_within_train_step": 2.79036545753479, "step": 656} +{"train_info/time_between_train_steps": 0.0033631324768066406, "step": 656} +{"info/global_step": 657, "train_info/time_within_train_step": 2.8681790828704834, "step": 657} +{"train_info/time_between_train_steps": 0.0033936500549316406, "step": 657} +{"info/global_step": 658, "train_info/time_within_train_step": 2.8317923545837402, "step": 658} +{"train_info/time_between_train_steps": 0.003322124481201172, "step": 658} +{"info/global_step": 659, "train_info/time_within_train_step": 2.8129019737243652, "step": 659} +{"train_info/time_between_train_steps": 0.0034606456756591797, "step": 659} +{"info/global_step": 660, "train_info/time_within_train_step": 2.768965005874634, "step": 660} +{"train_info/time_between_train_steps": 0.003515005111694336, "step": 660} +{"info/global_step": 661, "train_info/time_within_train_step": 2.856511354446411, "step": 661} +{"train_info/time_between_train_steps": 0.0036470890045166016, "step": 661} +{"info/global_step": 662, "train_info/time_within_train_step": 2.7848474979400635, "step": 662} +{"train_info/time_between_train_steps": 0.003687620162963867, "step": 662} +{"info/global_step": 663, "train_info/time_within_train_step": 2.7347843647003174, "step": 663} +{"train_info/time_between_train_steps": 0.0035829544067382812, "step": 663} +{"info/global_step": 664, "train_info/time_within_train_step": 2.813878297805786, "step": 664} +{"train_info/time_between_train_steps": 0.0037610530853271484, "step": 664} +{"info/global_step": 665, "train_info/time_within_train_step": 2.8380134105682373, "step": 665} +{"train_info/time_between_train_steps": 0.0036804676055908203, "step": 665} +{"info/global_step": 666, "train_info/time_within_train_step": 2.6987857818603516, "step": 666} +{"train_info/time_between_train_steps": 0.003694772720336914, "step": 666} +{"info/global_step": 667, "train_info/time_within_train_step": 2.6951780319213867, "step": 667} +{"train_info/time_between_train_steps": 0.0036563873291015625, "step": 667} +{"info/global_step": 668, "train_info/time_within_train_step": 2.6938374042510986, "step": 668} +{"train_info/time_between_train_steps": 0.0035080909729003906, "step": 668} +{"info/global_step": 669, "train_info/time_within_train_step": 2.764042377471924, "step": 669} +{"train_info/time_between_train_steps": 0.0035941600799560547, "step": 669} +{"info/global_step": 670, "train_info/time_within_train_step": 2.6948392391204834, "step": 670} +{"train_info/time_between_train_steps": 0.0035233497619628906, "step": 670} +{"info/global_step": 671, "train_info/time_within_train_step": 2.6961145401000977, "step": 671} +{"train_info/time_between_train_steps": 0.0035123825073242188, "step": 671} +{"info/global_step": 672, "train_info/time_within_train_step": 2.6964733600616455, "step": 672} +{"train_info/time_between_train_steps": 0.003535747528076172, "step": 672} +{"info/global_step": 673, "train_info/time_within_train_step": 2.696878433227539, "step": 673} +{"train_info/time_between_train_steps": 0.003509998321533203, "step": 673} +{"info/global_step": 674, "train_info/time_within_train_step": 2.694211721420288, "step": 674} +{"train_info/time_between_train_steps": 0.0035958290100097656, "step": 674} +{"info/global_step": 675, "train_info/time_within_train_step": 2.6972851753234863, "step": 675} +{"train_info/time_between_train_steps": 0.0035619735717773438, "step": 675} +{"info/global_step": 676, "train_info/time_within_train_step": 2.697235107421875, "step": 676} +{"train_info/time_between_train_steps": 0.003589630126953125, "step": 676} +{"info/global_step": 677, "train_info/time_within_train_step": 2.6960110664367676, "step": 677} +{"train_info/time_between_train_steps": 0.0035631656646728516, "step": 677} +{"info/global_step": 678, "train_info/time_within_train_step": 2.699396848678589, "step": 678} +{"train_info/time_between_train_steps": 0.0034945011138916016, "step": 678} +{"info/global_step": 679, "train_info/time_within_train_step": 2.697502613067627, "step": 679} +{"train_info/time_between_train_steps": 0.0035114288330078125, "step": 679} +{"info/global_step": 680, "train_info/time_within_train_step": 2.6980741024017334, "step": 680} +{"train_info/time_between_train_steps": 0.003503561019897461, "step": 680} +{"info/global_step": 681, "train_info/time_within_train_step": 2.697939872741699, "step": 681} +{"train_info/time_between_train_steps": 0.003496408462524414, "step": 681} +{"info/global_step": 682, "train_info/time_within_train_step": 2.6951754093170166, "step": 682} +{"train_info/time_between_train_steps": 0.003512859344482422, "step": 682} +{"info/global_step": 683, "train_info/time_within_train_step": 2.695305824279785, "step": 683} +{"train_info/time_between_train_steps": 0.003509044647216797, "step": 683} +{"info/global_step": 684, "train_info/time_within_train_step": 2.6944499015808105, "step": 684} +{"train_info/time_between_train_steps": 0.0036630630493164062, "step": 684} +{"info/global_step": 685, "train_info/time_within_train_step": 2.695133924484253, "step": 685} +{"train_info/time_between_train_steps": 0.0035707950592041016, "step": 685} +{"info/global_step": 686, "train_info/time_within_train_step": 2.6960337162017822, "step": 686} +{"train_info/time_between_train_steps": 0.003626585006713867, "step": 686} +{"info/global_step": 687, "train_info/time_within_train_step": 2.6968278884887695, "step": 687} +{"train_info/time_between_train_steps": 0.0036585330963134766, "step": 687} +{"info/global_step": 688, "train_info/time_within_train_step": 2.6975646018981934, "step": 688} +{"train_info/time_between_train_steps": 0.003592967987060547, "step": 688} +{"info/global_step": 689, "train_info/time_within_train_step": 2.6968870162963867, "step": 689} +{"train_info/time_between_train_steps": 0.003466367721557617, "step": 689} +{"info/global_step": 690, "train_info/time_within_train_step": 2.69834041595459, "step": 690} +{"train_info/time_between_train_steps": 0.0036149024963378906, "step": 690} +{"info/global_step": 691, "train_info/time_within_train_step": 2.698134660720825, "step": 691} +{"train_info/time_between_train_steps": 0.003509521484375, "step": 691} +{"info/global_step": 692, "train_info/time_within_train_step": 2.7242352962493896, "step": 692} +{"train_info/time_between_train_steps": 0.003559112548828125, "step": 692} +{"info/global_step": 693, "train_info/time_within_train_step": 2.6983470916748047, "step": 693} +{"train_info/time_between_train_steps": 0.0036122798919677734, "step": 693} +{"info/global_step": 694, "train_info/time_within_train_step": 2.696309804916382, "step": 694} +{"train_info/time_between_train_steps": 0.0035119056701660156, "step": 694} +{"info/global_step": 695, "train_info/time_within_train_step": 2.698840379714966, "step": 695} +{"train_info/time_between_train_steps": 0.0035915374755859375, "step": 695} +{"info/global_step": 696, "train_info/time_within_train_step": 2.697244644165039, "step": 696} +{"train_info/time_between_train_steps": 0.0035524368286132812, "step": 696} +{"info/global_step": 697, "train_info/time_within_train_step": 2.698317050933838, "step": 697} +{"train_info/time_between_train_steps": 0.0035746097564697266, "step": 697} +{"info/global_step": 698, "train_info/time_within_train_step": 2.7342381477355957, "step": 698} +{"train_info/time_between_train_steps": 0.003512144088745117, "step": 698} +{"info/global_step": 699, "train_info/time_within_train_step": 3.0137441158294678, "step": 699} +{"train_info/time_between_train_steps": 0.003742694854736328, "step": 699} +{"info/global_step": 700, "train_info/time_within_train_step": 2.7244956493377686, "step": 700} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 5466.0, "train_info/memory_max_reserved": 5466.0, "_timestamp": 1746288097, "_runtime": 2119}, "step": 700} +{"logs": {"train/loss": 5.5408, "train/learning_rate": 0.0005111111111111111, "train/epoch": 0.23, "_timestamp": 1746288097, "_runtime": 2119}, "step": 700} +{"train_info/time_between_train_steps": 31.540311574935913, "step": 700} +{"info/global_step": 701, "train_info/time_within_train_step": 2.4754014015197754, "step": 701} +{"train_info/time_between_train_steps": 0.003471851348876953, "step": 701} +{"info/global_step": 702, "train_info/time_within_train_step": 2.479337453842163, "step": 702} +{"train_info/time_between_train_steps": 0.0035009384155273438, "step": 702} +{"info/global_step": 703, "train_info/time_within_train_step": 2.6634488105773926, "step": 703} +{"train_info/time_between_train_steps": 0.0035228729248046875, "step": 703} +{"info/global_step": 704, "train_info/time_within_train_step": 2.6885106563568115, "step": 704} +{"train_info/time_between_train_steps": 0.0034914016723632812, "step": 704} +{"info/global_step": 705, "train_info/time_within_train_step": 2.690291166305542, "step": 705} +{"train_info/time_between_train_steps": 0.0035114288330078125, "step": 705} +{"info/global_step": 706, "train_info/time_within_train_step": 2.692396402359009, "step": 706} +{"train_info/time_between_train_steps": 0.003424406051635742, "step": 706} +{"info/global_step": 707, "train_info/time_within_train_step": 2.6940455436706543, "step": 707} +{"train_info/time_between_train_steps": 0.003667116165161133, "step": 707} +{"info/global_step": 708, "train_info/time_within_train_step": 2.696380615234375, "step": 708} +{"train_info/time_between_train_steps": 0.0034694671630859375, "step": 708} +{"info/global_step": 709, "train_info/time_within_train_step": 2.7860677242279053, "step": 709} +{"train_info/time_between_train_steps": 0.0034770965576171875, "step": 709} +{"info/global_step": 710, "train_info/time_within_train_step": 2.9676527976989746, "step": 710} +{"train_info/time_between_train_steps": 0.0035550594329833984, "step": 710} +{"info/global_step": 711, "train_info/time_within_train_step": 3.1565377712249756, "step": 711} +{"train_info/time_between_train_steps": 0.0034933090209960938, "step": 711} +{"info/global_step": 712, "train_info/time_within_train_step": 2.884394645690918, "step": 712} +{"train_info/time_between_train_steps": 0.003511190414428711, "step": 712} +{"info/global_step": 713, "train_info/time_within_train_step": 2.6976912021636963, "step": 713} +{"train_info/time_between_train_steps": 0.003428220748901367, "step": 713} +{"info/global_step": 714, "train_info/time_within_train_step": 2.697897434234619, "step": 714} +{"train_info/time_between_train_steps": 0.0034940242767333984, "step": 714} +{"info/global_step": 715, "train_info/time_within_train_step": 2.6996095180511475, "step": 715} +{"train_info/time_between_train_steps": 0.00672602653503418, "step": 715} +{"info/global_step": 716, "train_info/time_within_train_step": 2.6967601776123047, "step": 716} +{"train_info/time_between_train_steps": 0.0035517215728759766, "step": 716} +{"info/global_step": 717, "train_info/time_within_train_step": 2.697397470474243, "step": 717} +{"train_info/time_between_train_steps": 0.003553628921508789, "step": 717} +{"info/global_step": 718, "train_info/time_within_train_step": 2.695929527282715, "step": 718} +{"train_info/time_between_train_steps": 0.0034651756286621094, "step": 718} +{"info/global_step": 719, "train_info/time_within_train_step": 2.774653673171997, "step": 719} +{"train_info/time_between_train_steps": 0.003341197967529297, "step": 719} +{"info/global_step": 720, "train_info/time_within_train_step": 2.696197748184204, "step": 720} +{"train_info/time_between_train_steps": 0.0034339427947998047, "step": 720} +{"info/global_step": 721, "train_info/time_within_train_step": 2.8085129261016846, "step": 721} +{"train_info/time_between_train_steps": 0.003439188003540039, "step": 721} +{"info/global_step": 722, "train_info/time_within_train_step": 2.6971869468688965, "step": 722} +{"train_info/time_between_train_steps": 0.003398418426513672, "step": 722} +{"info/global_step": 723, "train_info/time_within_train_step": 2.6974430084228516, "step": 723} +{"train_info/time_between_train_steps": 0.0034966468811035156, "step": 723} +{"info/global_step": 724, "train_info/time_within_train_step": 2.6980154514312744, "step": 724} +{"train_info/time_between_train_steps": 0.003739595413208008, "step": 724} +{"info/global_step": 725, "train_info/time_within_train_step": 2.6986641883850098, "step": 725} +{"train_info/time_between_train_steps": 0.0034182071685791016, "step": 725} +{"info/global_step": 726, "train_info/time_within_train_step": 2.6987810134887695, "step": 726} +{"train_info/time_between_train_steps": 0.0034461021423339844, "step": 726} +{"info/global_step": 727, "train_info/time_within_train_step": 2.779154062271118, "step": 727} +{"train_info/time_between_train_steps": 0.003995418548583984, "step": 727} +{"info/global_step": 728, "train_info/time_within_train_step": 2.960738182067871, "step": 728} +{"train_info/time_between_train_steps": 0.0035386085510253906, "step": 728} +{"info/global_step": 729, "train_info/time_within_train_step": 2.952425241470337, "step": 729} +{"train_info/time_between_train_steps": 0.0037496089935302734, "step": 729} +{"info/global_step": 730, "train_info/time_within_train_step": 2.6979548931121826, "step": 730} +{"train_info/time_between_train_steps": 0.0034301280975341797, "step": 730} +{"info/global_step": 731, "train_info/time_within_train_step": 2.6957457065582275, "step": 731} +{"train_info/time_between_train_steps": 0.003506898880004883, "step": 731} +{"info/global_step": 732, "train_info/time_within_train_step": 2.696370840072632, "step": 732} +{"train_info/time_between_train_steps": 0.00336456298828125, "step": 732} +{"info/global_step": 733, "train_info/time_within_train_step": 2.6972761154174805, "step": 733} +{"train_info/time_between_train_steps": 0.003358602523803711, "step": 733} +{"info/global_step": 734, "train_info/time_within_train_step": 2.6966452598571777, "step": 734} +{"train_info/time_between_train_steps": 0.0035779476165771484, "step": 734} +{"info/global_step": 735, "train_info/time_within_train_step": 2.6973183155059814, "step": 735} +{"train_info/time_between_train_steps": 0.0033490657806396484, "step": 735} +{"info/global_step": 736, "train_info/time_within_train_step": 2.6973342895507812, "step": 736} +{"train_info/time_between_train_steps": 0.0035049915313720703, "step": 736} +{"info/global_step": 737, "train_info/time_within_train_step": 2.696057081222534, "step": 737} +{"train_info/time_between_train_steps": 0.003407001495361328, "step": 737} +{"info/global_step": 738, "train_info/time_within_train_step": 2.6974411010742188, "step": 738} +{"train_info/time_between_train_steps": 0.003622293472290039, "step": 738} +{"info/global_step": 739, "train_info/time_within_train_step": 2.6982007026672363, "step": 739} +{"train_info/time_between_train_steps": 0.0038564205169677734, "step": 739} +{"info/global_step": 740, "train_info/time_within_train_step": 2.696453332901001, "step": 740} +{"train_info/time_between_train_steps": 0.003777027130126953, "step": 740} +{"info/global_step": 741, "train_info/time_within_train_step": 2.6972522735595703, "step": 741} +{"train_info/time_between_train_steps": 0.0035326480865478516, "step": 741} +{"info/global_step": 742, "train_info/time_within_train_step": 2.747069835662842, "step": 742} +{"train_info/time_between_train_steps": 0.0036280155181884766, "step": 742} +{"info/global_step": 743, "train_info/time_within_train_step": 2.8975865840911865, "step": 743} +{"train_info/time_between_train_steps": 0.003734111785888672, "step": 743} +{"info/global_step": 744, "train_info/time_within_train_step": 2.82381010055542, "step": 744} +{"train_info/time_between_train_steps": 0.00379180908203125, "step": 744} +{"info/global_step": 745, "train_info/time_within_train_step": 2.7161412239074707, "step": 745} +{"train_info/time_between_train_steps": 0.0036940574645996094, "step": 745} +{"info/global_step": 746, "train_info/time_within_train_step": 2.703261613845825, "step": 746} +{"train_info/time_between_train_steps": 0.004216909408569336, "step": 746} +{"info/global_step": 747, "train_info/time_within_train_step": 2.8777763843536377, "step": 747} +{"train_info/time_between_train_steps": 0.0039403438568115234, "step": 747} +{"info/global_step": 748, "train_info/time_within_train_step": 2.844374418258667, "step": 748} +{"train_info/time_between_train_steps": 0.003984212875366211, "step": 748} +{"info/global_step": 749, "train_info/time_within_train_step": 2.7044177055358887, "step": 749} +{"train_info/time_between_train_steps": 0.004046440124511719, "step": 749} +{"info/global_step": 750, "train_info/time_within_train_step": 3.5773673057556152, "step": 750} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 5466.0, "train_info/memory_max_reserved": 5466.0, "_timestamp": 1746288274, "_runtime": 2296}, "step": 750} +{"logs": {"train/loss": 5.4798, "train/learning_rate": 0.0005, "train/epoch": 0.25, "_timestamp": 1746288274, "_runtime": 2296}, "step": 750} +{"train_info/time_between_train_steps": 0.80765700340271, "step": 750} +{"info/global_step": 751, "train_info/time_within_train_step": 2.693007230758667, "step": 751} +{"train_info/time_between_train_steps": 0.0039899349212646484, "step": 751} +{"info/global_step": 752, "train_info/time_within_train_step": 2.6943955421447754, "step": 752} +{"train_info/time_between_train_steps": 0.0040209293365478516, "step": 752} +{"info/global_step": 753, "train_info/time_within_train_step": 2.6965134143829346, "step": 753} +{"train_info/time_between_train_steps": 0.004117488861083984, "step": 753} +{"info/global_step": 754, "train_info/time_within_train_step": 2.734513759613037, "step": 754} +{"train_info/time_between_train_steps": 0.004000186920166016, "step": 754} +{"info/global_step": 755, "train_info/time_within_train_step": 2.695573329925537, "step": 755} +{"train_info/time_between_train_steps": 0.003916501998901367, "step": 755} +{"info/global_step": 756, "train_info/time_within_train_step": 2.697697401046753, "step": 756} +{"train_info/time_between_train_steps": 0.0041081905364990234, "step": 756} +{"info/global_step": 757, "train_info/time_within_train_step": 2.701155424118042, "step": 757} +{"train_info/time_between_train_steps": 0.004179716110229492, "step": 757} +{"info/global_step": 758, "train_info/time_within_train_step": 2.7013068199157715, "step": 758} +{"train_info/time_between_train_steps": 0.004418611526489258, "step": 758} +{"train_info/time_between_train_steps": 3.126755475997925, "step": 758} +{"info/global_step": 759, "train_info/time_within_train_step": 2.6948764324188232, "step": 759} +{"train_info/time_between_train_steps": 0.003548860549926758, "step": 759} +{"info/global_step": 760, "train_info/time_within_train_step": 2.695556879043579, "step": 760} +{"train_info/time_between_train_steps": 0.0035696029663085938, "step": 760} +{"info/global_step": 761, "train_info/time_within_train_step": 2.696937322616577, "step": 761} +{"train_info/time_between_train_steps": 0.003631591796875, "step": 761} +{"info/global_step": 762, "train_info/time_within_train_step": 3.096351385116577, "step": 762} +{"train_info/time_between_train_steps": 0.003659486770629883, "step": 762} +{"info/global_step": 763, "train_info/time_within_train_step": 2.696506977081299, "step": 763} +{"train_info/time_between_train_steps": 0.0036630630493164062, "step": 763} +{"info/global_step": 764, "train_info/time_within_train_step": 2.6947340965270996, "step": 764} +{"train_info/time_between_train_steps": 0.0035064220428466797, "step": 764} +{"info/global_step": 765, "train_info/time_within_train_step": 2.694762706756592, "step": 765} +{"train_info/time_between_train_steps": 0.0034608840942382812, "step": 765} +{"info/global_step": 766, "train_info/time_within_train_step": 2.694554328918457, "step": 766} +{"train_info/time_between_train_steps": 0.0034389495849609375, "step": 766} +{"info/global_step": 767, "train_info/time_within_train_step": 2.904820203781128, "step": 767} +{"train_info/time_between_train_steps": 0.0034978389739990234, "step": 767} +{"info/global_step": 768, "train_info/time_within_train_step": 2.695444107055664, "step": 768} +{"train_info/time_between_train_steps": 0.0034720897674560547, "step": 768} +{"info/global_step": 769, "train_info/time_within_train_step": 2.70149827003479, "step": 769} +{"train_info/time_between_train_steps": 0.003503561019897461, "step": 769} +{"info/global_step": 770, "train_info/time_within_train_step": 2.696101188659668, "step": 770} +{"train_info/time_between_train_steps": 0.0034818649291992188, "step": 770} +{"info/global_step": 771, "train_info/time_within_train_step": 2.6959969997406006, "step": 771} +{"train_info/time_between_train_steps": 0.003552675247192383, "step": 771} +{"info/global_step": 772, "train_info/time_within_train_step": 2.69777774810791, "step": 772} +{"train_info/time_between_train_steps": 0.0038022994995117188, "step": 772} +{"info/global_step": 773, "train_info/time_within_train_step": 2.7099545001983643, "step": 773} +{"train_info/time_between_train_steps": 0.0034422874450683594, "step": 773} +{"info/global_step": 774, "train_info/time_within_train_step": 2.8801310062408447, "step": 774} +{"train_info/time_between_train_steps": 0.0034918785095214844, "step": 774} +{"info/global_step": 775, "train_info/time_within_train_step": 3.108037233352661, "step": 775} +{"train_info/time_between_train_steps": 0.0035903453826904297, "step": 775} +{"info/global_step": 776, "train_info/time_within_train_step": 2.759657859802246, "step": 776} +{"train_info/time_between_train_steps": 0.0034677982330322266, "step": 776} +{"info/global_step": 777, "train_info/time_within_train_step": 2.693779230117798, "step": 777} +{"train_info/time_between_train_steps": 0.0035278797149658203, "step": 777} +{"info/global_step": 778, "train_info/time_within_train_step": 2.695911169052124, "step": 778} +{"train_info/time_between_train_steps": 0.0035674571990966797, "step": 778} +{"info/global_step": 779, "train_info/time_within_train_step": 2.6953752040863037, "step": 779} +{"train_info/time_between_train_steps": 0.0034813880920410156, "step": 779} +{"info/global_step": 780, "train_info/time_within_train_step": 2.6947414875030518, "step": 780} +{"train_info/time_between_train_steps": 0.0034592151641845703, "step": 780} +{"info/global_step": 781, "train_info/time_within_train_step": 2.6962013244628906, "step": 781} +{"train_info/time_between_train_steps": 0.0034966468811035156, "step": 781} +{"info/global_step": 782, "train_info/time_within_train_step": 3.1610360145568848, "step": 782} +{"train_info/time_between_train_steps": 0.0034852027893066406, "step": 782} +{"info/global_step": 783, "train_info/time_within_train_step": 2.7011189460754395, "step": 783} +{"train_info/time_between_train_steps": 0.0035123825073242188, "step": 783} +{"info/global_step": 784, "train_info/time_within_train_step": 2.696573257446289, "step": 784} +{"train_info/time_between_train_steps": 0.0034606456756591797, "step": 784} +{"info/global_step": 785, "train_info/time_within_train_step": 2.695099115371704, "step": 785} +{"train_info/time_between_train_steps": 0.0037031173706054688, "step": 785} +{"info/global_step": 786, "train_info/time_within_train_step": 2.6937808990478516, "step": 786} +{"train_info/time_between_train_steps": 0.003503084182739258, "step": 786} +{"info/global_step": 787, "train_info/time_within_train_step": 2.7693774700164795, "step": 787} +{"train_info/time_between_train_steps": 0.003460407257080078, "step": 787} +{"info/global_step": 788, "train_info/time_within_train_step": 2.6947240829467773, "step": 788} +{"train_info/time_between_train_steps": 0.003916740417480469, "step": 788} +{"info/global_step": 789, "train_info/time_within_train_step": 2.6918787956237793, "step": 789} +{"train_info/time_between_train_steps": 0.0035436153411865234, "step": 789} +{"info/global_step": 790, "train_info/time_within_train_step": 2.692335605621338, "step": 790} +{"train_info/time_between_train_steps": 0.003481149673461914, "step": 790} +{"info/global_step": 791, "train_info/time_within_train_step": 2.6931962966918945, "step": 791} +{"train_info/time_between_train_steps": 0.003495454788208008, "step": 791} +{"info/global_step": 792, "train_info/time_within_train_step": 2.6929826736450195, "step": 792} +{"train_info/time_between_train_steps": 0.0034906864166259766, "step": 792} +{"info/global_step": 793, "train_info/time_within_train_step": 2.6934823989868164, "step": 793} +{"train_info/time_between_train_steps": 0.0035276412963867188, "step": 793} +{"info/global_step": 794, "train_info/time_within_train_step": 2.693561553955078, "step": 794} +{"train_info/time_between_train_steps": 0.0034461021423339844, "step": 794} +{"info/global_step": 795, "train_info/time_within_train_step": 2.695643186569214, "step": 795} +{"train_info/time_between_train_steps": 0.003501415252685547, "step": 795} +{"info/global_step": 796, "train_info/time_within_train_step": 2.6940062046051025, "step": 796} +{"train_info/time_between_train_steps": 0.003467082977294922, "step": 796} +{"info/global_step": 797, "train_info/time_within_train_step": 2.69327712059021, "step": 797} +{"train_info/time_between_train_steps": 0.003505706787109375, "step": 797} +{"info/global_step": 798, "train_info/time_within_train_step": 2.694514513015747, "step": 798} +{"train_info/time_between_train_steps": 0.0034515857696533203, "step": 798} +{"info/global_step": 799, "train_info/time_within_train_step": 2.69374942779541, "step": 799} +{"train_info/time_between_train_steps": 0.0035676956176757812, "step": 799} +{"info/global_step": 800, "train_info/time_within_train_step": 2.693566083908081, "step": 800} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 5466.0, "train_info/memory_max_reserved": 5466.0, "_timestamp": 1746288429, "_runtime": 2451}, "step": 800} +{"logs": {"train/loss": 5.473, "train/learning_rate": 0.0004888888888888889, "train/epoch": 1.01, "_timestamp": 1746288429, "_runtime": 2451}, "step": 800} +{"train_info/time_between_train_steps": 34.57000231742859, "step": 800} +{"info/global_step": 801, "train_info/time_within_train_step": 2.4698410034179688, "step": 801} +{"train_info/time_between_train_steps": 0.0040018558502197266, "step": 801} +{"info/global_step": 802, "train_info/time_within_train_step": 2.4904983043670654, "step": 802} +{"train_info/time_between_train_steps": 0.0036554336547851562, "step": 802} +{"info/global_step": 803, "train_info/time_within_train_step": 2.6850743293762207, "step": 803} +{"train_info/time_between_train_steps": 0.003658294677734375, "step": 803} +{"info/global_step": 804, "train_info/time_within_train_step": 2.693901538848877, "step": 804} +{"train_info/time_between_train_steps": 0.0036678314208984375, "step": 804} +{"info/global_step": 805, "train_info/time_within_train_step": 2.6937406063079834, "step": 805} +{"train_info/time_between_train_steps": 0.0036859512329101562, "step": 805} +{"info/global_step": 806, "train_info/time_within_train_step": 2.6945748329162598, "step": 806} +{"train_info/time_between_train_steps": 0.0036497116088867188, "step": 806} +{"info/global_step": 807, "train_info/time_within_train_step": 2.6958234310150146, "step": 807} +{"train_info/time_between_train_steps": 0.003653287887573242, "step": 807} +{"info/global_step": 808, "train_info/time_within_train_step": 2.69804048538208, "step": 808} +{"train_info/time_between_train_steps": 0.0035161972045898438, "step": 808} +{"info/global_step": 809, "train_info/time_within_train_step": 2.6951522827148438, "step": 809} +{"train_info/time_between_train_steps": 0.0034956932067871094, "step": 809} +{"info/global_step": 810, "train_info/time_within_train_step": 2.9070212841033936, "step": 810} +{"train_info/time_between_train_steps": 0.003506898880004883, "step": 810} +{"info/global_step": 811, "train_info/time_within_train_step": 2.6954691410064697, "step": 811} +{"train_info/time_between_train_steps": 0.003658771514892578, "step": 811} +{"info/global_step": 812, "train_info/time_within_train_step": 2.802166700363159, "step": 812} +{"train_info/time_between_train_steps": 0.0035452842712402344, "step": 812} +{"info/global_step": 813, "train_info/time_within_train_step": 2.696082592010498, "step": 813} +{"train_info/time_between_train_steps": 0.0034935474395751953, "step": 813} +{"info/global_step": 814, "train_info/time_within_train_step": 2.6986844539642334, "step": 814} +{"train_info/time_between_train_steps": 0.003531932830810547, "step": 814} +{"info/global_step": 815, "train_info/time_within_train_step": 2.697478771209717, "step": 815} +{"train_info/time_between_train_steps": 0.0037412643432617188, "step": 815} +{"info/global_step": 816, "train_info/time_within_train_step": 2.6980838775634766, "step": 816} +{"train_info/time_between_train_steps": 0.003630399703979492, "step": 816} +{"info/global_step": 817, "train_info/time_within_train_step": 2.6967384815216064, "step": 817} +{"train_info/time_between_train_steps": 0.003657817840576172, "step": 817} +{"info/global_step": 818, "train_info/time_within_train_step": 2.697099208831787, "step": 818} +{"train_info/time_between_train_steps": 0.0035104751586914062, "step": 818} +{"info/global_step": 819, "train_info/time_within_train_step": 2.6963090896606445, "step": 819} +{"train_info/time_between_train_steps": 0.0035352706909179688, "step": 819} +{"info/global_step": 820, "train_info/time_within_train_step": 2.69840931892395, "step": 820} +{"train_info/time_between_train_steps": 0.003504514694213867, "step": 820} +{"info/global_step": 821, "train_info/time_within_train_step": 2.812777280807495, "step": 821} +{"train_info/time_between_train_steps": 0.003573179244995117, "step": 821} +{"info/global_step": 822, "train_info/time_within_train_step": 2.697394371032715, "step": 822} +{"train_info/time_between_train_steps": 0.0036802291870117188, "step": 822} +{"info/global_step": 823, "train_info/time_within_train_step": 2.696648597717285, "step": 823} +{"train_info/time_between_train_steps": 0.003718852996826172, "step": 823} +{"info/global_step": 824, "train_info/time_within_train_step": 2.6976513862609863, "step": 824} +{"train_info/time_between_train_steps": 0.0036466121673583984, "step": 824} +{"info/global_step": 825, "train_info/time_within_train_step": 2.696467638015747, "step": 825} +{"train_info/time_between_train_steps": 0.0038788318634033203, "step": 825} +{"info/global_step": 826, "train_info/time_within_train_step": 2.7000844478607178, "step": 826} +{"train_info/time_between_train_steps": 0.003568887710571289, "step": 826} +{"info/global_step": 827, "train_info/time_within_train_step": 2.6985414028167725, "step": 827} +{"train_info/time_between_train_steps": 0.003679990768432617, "step": 827} +{"info/global_step": 828, "train_info/time_within_train_step": 2.699714422225952, "step": 828} +{"train_info/time_between_train_steps": 0.0034706592559814453, "step": 828} +{"info/global_step": 829, "train_info/time_within_train_step": 2.6962409019470215, "step": 829} +{"train_info/time_between_train_steps": 0.003493785858154297, "step": 829} +{"info/global_step": 830, "train_info/time_within_train_step": 2.832233190536499, "step": 830} +{"train_info/time_between_train_steps": 0.0035533905029296875, "step": 830} +{"info/global_step": 831, "train_info/time_within_train_step": 2.9902560710906982, "step": 831} +{"train_info/time_between_train_steps": 0.003545522689819336, "step": 831} +{"info/global_step": 832, "train_info/time_within_train_step": 2.9627861976623535, "step": 832} +{"train_info/time_between_train_steps": 0.0034956932067871094, "step": 832} +{"info/global_step": 833, "train_info/time_within_train_step": 2.700094699859619, "step": 833} +{"train_info/time_between_train_steps": 0.0035278797149658203, "step": 833} +{"info/global_step": 834, "train_info/time_within_train_step": 2.696674108505249, "step": 834} +{"train_info/time_between_train_steps": 0.003530740737915039, "step": 834} +{"info/global_step": 835, "train_info/time_within_train_step": 2.69606614112854, "step": 835} +{"train_info/time_between_train_steps": 0.0035216808319091797, "step": 835} +{"info/global_step": 836, "train_info/time_within_train_step": 2.6973068714141846, "step": 836} +{"train_info/time_between_train_steps": 0.0035047531127929688, "step": 836} +{"info/global_step": 837, "train_info/time_within_train_step": 2.697728157043457, "step": 837} +{"train_info/time_between_train_steps": 0.003469228744506836, "step": 837} +{"info/global_step": 838, "train_info/time_within_train_step": 2.798933982849121, "step": 838} +{"train_info/time_between_train_steps": 0.0034444332122802734, "step": 838} +{"info/global_step": 839, "train_info/time_within_train_step": 2.952378273010254, "step": 839} +{"train_info/time_between_train_steps": 0.0035567283630371094, "step": 839} +{"info/global_step": 840, "train_info/time_within_train_step": 2.8018391132354736, "step": 840} +{"train_info/time_between_train_steps": 0.0034799575805664062, "step": 840} +{"info/global_step": 841, "train_info/time_within_train_step": 2.696192979812622, "step": 841} +{"train_info/time_between_train_steps": 0.0035047531127929688, "step": 841} +{"info/global_step": 842, "train_info/time_within_train_step": 2.698441505432129, "step": 842} +{"train_info/time_between_train_steps": 0.0034852027893066406, "step": 842} +{"info/global_step": 843, "train_info/time_within_train_step": 2.697822093963623, "step": 843} +{"train_info/time_between_train_steps": 0.003475189208984375, "step": 843} +{"info/global_step": 844, "train_info/time_within_train_step": 2.797454357147217, "step": 844} +{"train_info/time_between_train_steps": 0.0035772323608398438, "step": 844} +{"info/global_step": 845, "train_info/time_within_train_step": 2.6965250968933105, "step": 845} +{"train_info/time_between_train_steps": 0.0035538673400878906, "step": 845} +{"info/global_step": 846, "train_info/time_within_train_step": 2.6996757984161377, "step": 846} +{"train_info/time_between_train_steps": 0.0041425228118896484, "step": 846} +{"info/global_step": 847, "train_info/time_within_train_step": 2.699265480041504, "step": 847} +{"train_info/time_between_train_steps": 0.0035254955291748047, "step": 847} +{"info/global_step": 848, "train_info/time_within_train_step": 2.6978342533111572, "step": 848} +{"train_info/time_between_train_steps": 0.004066944122314453, "step": 848} +{"info/global_step": 849, "train_info/time_within_train_step": 2.697685480117798, "step": 849} +{"train_info/time_between_train_steps": 0.003506183624267578, "step": 849} +{"info/global_step": 850, "train_info/time_within_train_step": 2.699460506439209, "step": 850} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 5466.0, "train_info/memory_max_reserved": 5466.0, "_timestamp": 1746288609, "_runtime": 2631}, "step": 850} +{"logs": {"train/loss": 5.3765, "train/learning_rate": 0.0004777777777777777, "train/epoch": 1.03, "_timestamp": 1746288609, "_runtime": 2631}, "step": 850} +{"train_info/time_between_train_steps": 0.02507805824279785, "step": 850} +{"info/global_step": 851, "train_info/time_within_train_step": 2.7259654998779297, "step": 851} +{"train_info/time_between_train_steps": 0.0035829544067382812, "step": 851} +{"info/global_step": 852, "train_info/time_within_train_step": 2.879678726196289, "step": 852} +{"train_info/time_between_train_steps": 0.003607034683227539, "step": 852} +{"info/global_step": 853, "train_info/time_within_train_step": 3.054119110107422, "step": 853} +{"train_info/time_between_train_steps": 0.0035521984100341797, "step": 853} +{"info/global_step": 854, "train_info/time_within_train_step": 2.7392141819000244, "step": 854} +{"train_info/time_between_train_steps": 0.003544330596923828, "step": 854} +{"info/global_step": 855, "train_info/time_within_train_step": 2.698302984237671, "step": 855} +{"train_info/time_between_train_steps": 0.00368499755859375, "step": 855} +{"info/global_step": 856, "train_info/time_within_train_step": 2.6976230144500732, "step": 856} +{"train_info/time_between_train_steps": 0.0035483837127685547, "step": 856} +{"info/global_step": 857, "train_info/time_within_train_step": 2.6973793506622314, "step": 857} +{"train_info/time_between_train_steps": 0.0036191940307617188, "step": 857} +{"info/global_step": 858, "train_info/time_within_train_step": 2.697539806365967, "step": 858} +{"train_info/time_between_train_steps": 0.003549337387084961, "step": 858} +{"info/global_step": 859, "train_info/time_within_train_step": 2.714583396911621, "step": 859} +{"train_info/time_between_train_steps": 0.0035250186920166016, "step": 859} +{"info/global_step": 860, "train_info/time_within_train_step": 2.6952431201934814, "step": 860} +{"train_info/time_between_train_steps": 0.003632783889770508, "step": 860} +{"info/global_step": 861, "train_info/time_within_train_step": 2.6966140270233154, "step": 861} +{"train_info/time_between_train_steps": 0.003665924072265625, "step": 861} +{"info/global_step": 862, "train_info/time_within_train_step": 2.6957180500030518, "step": 862} +{"train_info/time_between_train_steps": 0.0035746097564697266, "step": 862} +{"info/global_step": 863, "train_info/time_within_train_step": 2.6972815990448, "step": 863} +{"train_info/time_between_train_steps": 0.004677772521972656, "step": 863} +{"info/global_step": 864, "train_info/time_within_train_step": 3.182295799255371, "step": 864} +{"train_info/time_between_train_steps": 0.0036971569061279297, "step": 864} +{"info/global_step": 865, "train_info/time_within_train_step": 2.6939821243286133, "step": 865} +{"train_info/time_between_train_steps": 0.0036563873291015625, "step": 865} +{"info/global_step": 866, "train_info/time_within_train_step": 2.6955199241638184, "step": 866} +{"train_info/time_between_train_steps": 0.0036249160766601562, "step": 866} +{"info/global_step": 867, "train_info/time_within_train_step": 2.6970677375793457, "step": 867} +{"train_info/time_between_train_steps": 0.0036177635192871094, "step": 867} +{"info/global_step": 868, "train_info/time_within_train_step": 2.6970131397247314, "step": 868} +{"train_info/time_between_train_steps": 0.0037026405334472656, "step": 868} +{"info/global_step": 869, "train_info/time_within_train_step": 2.699943780899048, "step": 869} +{"train_info/time_between_train_steps": 0.003998517990112305, "step": 869} +{"info/global_step": 870, "train_info/time_within_train_step": 2.703249454498291, "step": 870} +{"train_info/time_between_train_steps": 0.004025459289550781, "step": 870} +{"info/global_step": 871, "train_info/time_within_train_step": 2.7563071250915527, "step": 871} +{"train_info/time_between_train_steps": 0.0038895606994628906, "step": 871} +{"info/global_step": 872, "train_info/time_within_train_step": 2.9179768562316895, "step": 872} +{"train_info/time_between_train_steps": 0.003904581069946289, "step": 872} +{"info/global_step": 873, "train_info/time_within_train_step": 3.051553726196289, "step": 873} +{"train_info/time_between_train_steps": 0.003958463668823242, "step": 873} +{"info/global_step": 874, "train_info/time_within_train_step": 2.7151718139648438, "step": 874} +{"train_info/time_between_train_steps": 0.003880023956298828, "step": 874} +{"info/global_step": 875, "train_info/time_within_train_step": 2.697225570678711, "step": 875} +{"train_info/time_between_train_steps": 0.0039598941802978516, "step": 875} +{"info/global_step": 876, "train_info/time_within_train_step": 2.6975414752960205, "step": 876} +{"train_info/time_between_train_steps": 0.003921031951904297, "step": 876} +{"info/global_step": 877, "train_info/time_within_train_step": 2.6999168395996094, "step": 877} +{"train_info/time_between_train_steps": 0.0038924217224121094, "step": 877} +{"info/global_step": 878, "train_info/time_within_train_step": 2.6978304386138916, "step": 878} +{"train_info/time_between_train_steps": 0.003942251205444336, "step": 878} +{"info/global_step": 879, "train_info/time_within_train_step": 2.6969120502471924, "step": 879} +{"train_info/time_between_train_steps": 0.0038177967071533203, "step": 879} +{"info/global_step": 880, "train_info/time_within_train_step": 2.697981357574463, "step": 880} +{"train_info/time_between_train_steps": 0.004081010818481445, "step": 880} +{"info/global_step": 881, "train_info/time_within_train_step": 2.6969823837280273, "step": 881} +{"train_info/time_between_train_steps": 0.003947734832763672, "step": 881} +{"info/global_step": 882, "train_info/time_within_train_step": 2.9414634704589844, "step": 882} +{"train_info/time_between_train_steps": 0.0038690567016601562, "step": 882} +{"info/global_step": 883, "train_info/time_within_train_step": 2.6961071491241455, "step": 883} +{"train_info/time_between_train_steps": 0.18949532508850098, "step": 883} +{"info/global_step": 884, "train_info/time_within_train_step": 2.711719036102295, "step": 884} +{"train_info/time_between_train_steps": 0.003659486770629883, "step": 884} +{"info/global_step": 885, "train_info/time_within_train_step": 2.6980597972869873, "step": 885} +{"train_info/time_between_train_steps": 0.003683328628540039, "step": 885} +{"info/global_step": 886, "train_info/time_within_train_step": 2.696706771850586, "step": 886} +{"train_info/time_between_train_steps": 0.003683805465698242, "step": 886} +{"info/global_step": 887, "train_info/time_within_train_step": 2.6969621181488037, "step": 887} +{"train_info/time_between_train_steps": 0.0036962032318115234, "step": 887} +{"info/global_step": 888, "train_info/time_within_train_step": 2.716670274734497, "step": 888} +{"train_info/time_between_train_steps": 0.003686666488647461, "step": 888} +{"info/global_step": 889, "train_info/time_within_train_step": 2.826545238494873, "step": 889} +{"train_info/time_between_train_steps": 0.003738880157470703, "step": 889} +{"info/global_step": 890, "train_info/time_within_train_step": 2.9495248794555664, "step": 890} +{"train_info/time_between_train_steps": 0.0037293434143066406, "step": 890} +{"info/global_step": 891, "train_info/time_within_train_step": 2.719876289367676, "step": 891} +{"train_info/time_between_train_steps": 0.0036919116973876953, "step": 891} +{"info/global_step": 892, "train_info/time_within_train_step": 2.698317766189575, "step": 892} +{"train_info/time_between_train_steps": 0.003693819046020508, "step": 892} +{"info/global_step": 893, "train_info/time_within_train_step": 2.6970458030700684, "step": 893} +{"train_info/time_between_train_steps": 0.003702402114868164, "step": 893} +{"info/global_step": 894, "train_info/time_within_train_step": 2.697298765182495, "step": 894} +{"train_info/time_between_train_steps": 0.003644704818725586, "step": 894} +{"info/global_step": 895, "train_info/time_within_train_step": 4.048845529556274, "step": 895} +{"train_info/time_between_train_steps": 0.0037577152252197266, "step": 895} +{"info/global_step": 896, "train_info/time_within_train_step": 2.6955385208129883, "step": 896} +{"train_info/time_between_train_steps": 0.0037310123443603516, "step": 896} +{"info/global_step": 897, "train_info/time_within_train_step": 2.6979799270629883, "step": 897} +{"train_info/time_between_train_steps": 0.003688335418701172, "step": 897} +{"info/global_step": 898, "train_info/time_within_train_step": 2.6976003646850586, "step": 898} +{"train_info/time_between_train_steps": 0.00370025634765625, "step": 898} +{"info/global_step": 899, "train_info/time_within_train_step": 2.7001068592071533, "step": 899} +{"train_info/time_between_train_steps": 0.003771066665649414, "step": 899} +{"info/global_step": 900, "train_info/time_within_train_step": 2.6985549926757812, "step": 900} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 5466.0, "train_info/memory_max_reserved": 5466.0, "_timestamp": 1746288757, "_runtime": 2779}, "step": 900} +{"logs": {"train/loss": 5.3335, "train/learning_rate": 0.0004666666666666666, "train/epoch": 1.05, "_timestamp": 1746288757, "_runtime": 2779}, "step": 900} +{"train_info/time_between_train_steps": 41.09962320327759, "step": 900} +{"info/global_step": 901, "train_info/time_within_train_step": 2.4738409519195557, "step": 901} +{"train_info/time_between_train_steps": 0.003731250762939453, "step": 901} +{"info/global_step": 902, "train_info/time_within_train_step": 2.536184072494507, "step": 902} +{"train_info/time_between_train_steps": 0.003657817840576172, "step": 902} +{"info/global_step": 903, "train_info/time_within_train_step": 2.6674747467041016, "step": 903} +{"train_info/time_between_train_steps": 0.003814697265625, "step": 903} +{"info/global_step": 904, "train_info/time_within_train_step": 2.6905529499053955, "step": 904} +{"train_info/time_between_train_steps": 0.0037081241607666016, "step": 904} +{"info/global_step": 905, "train_info/time_within_train_step": 2.6910510063171387, "step": 905} +{"train_info/time_between_train_steps": 0.0036945343017578125, "step": 905} +{"info/global_step": 906, "train_info/time_within_train_step": 2.693345308303833, "step": 906} +{"train_info/time_between_train_steps": 0.0036797523498535156, "step": 906} +{"info/global_step": 907, "train_info/time_within_train_step": 2.6953060626983643, "step": 907} +{"train_info/time_between_train_steps": 0.003813028335571289, "step": 907} +{"info/global_step": 908, "train_info/time_within_train_step": 2.696596384048462, "step": 908} +{"train_info/time_between_train_steps": 0.0036840438842773438, "step": 908} +{"info/global_step": 909, "train_info/time_within_train_step": 2.698399782180786, "step": 909} +{"train_info/time_between_train_steps": 0.003698110580444336, "step": 909} +{"info/global_step": 910, "train_info/time_within_train_step": 2.7769060134887695, "step": 910} +{"train_info/time_between_train_steps": 0.004060268402099609, "step": 910} +{"info/global_step": 911, "train_info/time_within_train_step": 2.9345383644104004, "step": 911} +{"train_info/time_between_train_steps": 0.003709077835083008, "step": 911} +{"info/global_step": 912, "train_info/time_within_train_step": 2.9953460693359375, "step": 912} +{"train_info/time_between_train_steps": 0.003659963607788086, "step": 912} +{"info/global_step": 913, "train_info/time_within_train_step": 2.71352481842041, "step": 913} +{"train_info/time_between_train_steps": 0.0036535263061523438, "step": 913} +{"info/global_step": 914, "train_info/time_within_train_step": 2.6983485221862793, "step": 914} +{"train_info/time_between_train_steps": 0.003653287887573242, "step": 914} +{"info/global_step": 915, "train_info/time_within_train_step": 2.6977555751800537, "step": 915} +{"train_info/time_between_train_steps": 0.0036292076110839844, "step": 915} +{"info/global_step": 916, "train_info/time_within_train_step": 2.7004339694976807, "step": 916} +{"train_info/time_between_train_steps": 0.003632783889770508, "step": 916} +{"info/global_step": 917, "train_info/time_within_train_step": 2.6980526447296143, "step": 917} +{"train_info/time_between_train_steps": 0.0035872459411621094, "step": 917} +{"info/global_step": 918, "train_info/time_within_train_step": 2.6971166133880615, "step": 918} +{"train_info/time_between_train_steps": 0.0036284923553466797, "step": 918} +{"info/global_step": 919, "train_info/time_within_train_step": 2.7845332622528076, "step": 919} +{"train_info/time_between_train_steps": 0.0036745071411132812, "step": 919} +{"info/global_step": 920, "train_info/time_within_train_step": 3.021531820297241, "step": 920} +{"train_info/time_between_train_steps": 0.003645658493041992, "step": 920} +{"info/global_step": 921, "train_info/time_within_train_step": 2.7555623054504395, "step": 921} +{"train_info/time_between_train_steps": 0.0037102699279785156, "step": 921} +{"info/global_step": 922, "train_info/time_within_train_step": 2.7000551223754883, "step": 922} +{"train_info/time_between_train_steps": 0.003655672073364258, "step": 922} +{"info/global_step": 923, "train_info/time_within_train_step": 2.825782537460327, "step": 923} +{"train_info/time_between_train_steps": 0.003678560256958008, "step": 923} +{"info/global_step": 924, "train_info/time_within_train_step": 2.8455381393432617, "step": 924} +{"train_info/time_between_train_steps": 0.0035791397094726562, "step": 924} +{"info/global_step": 925, "train_info/time_within_train_step": 2.7163236141204834, "step": 925} +{"train_info/time_between_train_steps": 0.0036537647247314453, "step": 925} +{"info/global_step": 926, "train_info/time_within_train_step": 3.043050765991211, "step": 926} +{"train_info/time_between_train_steps": 0.003599882125854492, "step": 926} +{"info/global_step": 927, "train_info/time_within_train_step": 2.700770139694214, "step": 927} +{"train_info/time_between_train_steps": 0.0035190582275390625, "step": 927} +{"info/global_step": 928, "train_info/time_within_train_step": 2.7105987071990967, "step": 928} +{"train_info/time_between_train_steps": 0.003516674041748047, "step": 928} +{"info/global_step": 929, "train_info/time_within_train_step": 2.9395010471343994, "step": 929} +{"train_info/time_between_train_steps": 0.0035996437072753906, "step": 929} +{"info/global_step": 930, "train_info/time_within_train_step": 2.873438596725464, "step": 930} +{"train_info/time_between_train_steps": 0.003522157669067383, "step": 930} +{"info/global_step": 931, "train_info/time_within_train_step": 2.71690034866333, "step": 931} +{"train_info/time_between_train_steps": 0.003557443618774414, "step": 931} +{"info/global_step": 932, "train_info/time_within_train_step": 2.6963157653808594, "step": 932} +{"train_info/time_between_train_steps": 0.003472566604614258, "step": 932} +{"info/global_step": 933, "train_info/time_within_train_step": 2.698227882385254, "step": 933} +{"train_info/time_between_train_steps": 0.0035872459411621094, "step": 933} +{"info/global_step": 934, "train_info/time_within_train_step": 2.7877161502838135, "step": 934} +{"train_info/time_between_train_steps": 0.003591299057006836, "step": 934} +{"info/global_step": 935, "train_info/time_within_train_step": 2.9301252365112305, "step": 935} +{"train_info/time_between_train_steps": 0.003602743148803711, "step": 935} +{"info/global_step": 936, "train_info/time_within_train_step": 2.7377371788024902, "step": 936} +{"train_info/time_between_train_steps": 0.003551006317138672, "step": 936} +{"info/global_step": 937, "train_info/time_within_train_step": 2.7140119075775146, "step": 937} +{"train_info/time_between_train_steps": 0.0035381317138671875, "step": 937} +{"info/global_step": 938, "train_info/time_within_train_step": 2.8922548294067383, "step": 938} +{"train_info/time_between_train_steps": 0.0035321712493896484, "step": 938} +{"info/global_step": 939, "train_info/time_within_train_step": 2.8686273097991943, "step": 939} +{"train_info/time_between_train_steps": 0.003519296646118164, "step": 939} +{"info/global_step": 940, "train_info/time_within_train_step": 2.7299606800079346, "step": 940} +{"train_info/time_between_train_steps": 0.003666400909423828, "step": 940} +{"info/global_step": 941, "train_info/time_within_train_step": 2.738415479660034, "step": 941} +{"train_info/time_between_train_steps": 0.0035719871520996094, "step": 941} +{"info/global_step": 942, "train_info/time_within_train_step": 2.876800298690796, "step": 942} +{"train_info/time_between_train_steps": 0.0035517215728759766, "step": 942} +{"info/global_step": 943, "train_info/time_within_train_step": 2.781684637069702, "step": 943} +{"train_info/time_between_train_steps": 0.003854513168334961, "step": 943} +{"info/global_step": 944, "train_info/time_within_train_step": 2.7072808742523193, "step": 944} +{"train_info/time_between_train_steps": 0.004067420959472656, "step": 944} +{"info/global_step": 945, "train_info/time_within_train_step": 3.323967456817627, "step": 945} +{"train_info/time_between_train_steps": 0.004075050354003906, "step": 945} +{"info/global_step": 946, "train_info/time_within_train_step": 2.883242607116699, "step": 946} +{"train_info/time_between_train_steps": 0.0037622451782226562, "step": 946} +{"info/global_step": 947, "train_info/time_within_train_step": 2.6943132877349854, "step": 947} +{"train_info/time_between_train_steps": 0.0037055015563964844, "step": 947} +{"info/global_step": 948, "train_info/time_within_train_step": 2.6931369304656982, "step": 948} +{"train_info/time_between_train_steps": 0.003694295883178711, "step": 948} +{"info/global_step": 949, "train_info/time_within_train_step": 2.6977269649505615, "step": 949} +{"train_info/time_between_train_steps": 0.0036399364471435547, "step": 949} +{"info/global_step": 950, "train_info/time_within_train_step": 2.696561813354492, "step": 950} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 5466.0, "train_info/memory_max_reserved": 5466.0, "_timestamp": 1746288943, "_runtime": 2965}, "step": 950} +{"logs": {"train/loss": 5.2909, "train/learning_rate": 0.00045555555555555556, "train/epoch": 1.06, "_timestamp": 1746288943, "_runtime": 2965}, "step": 950} +{"train_info/time_between_train_steps": 0.031139850616455078, "step": 950} +{"info/global_step": 951, "train_info/time_within_train_step": 2.6956896781921387, "step": 951} +{"train_info/time_between_train_steps": 0.0037016868591308594, "step": 951} +{"info/global_step": 952, "train_info/time_within_train_step": 2.695054292678833, "step": 952} +{"train_info/time_between_train_steps": 0.003610372543334961, "step": 952} +{"info/global_step": 953, "train_info/time_within_train_step": 2.695786476135254, "step": 953} +{"train_info/time_between_train_steps": 0.0038123130798339844, "step": 953} +{"info/global_step": 954, "train_info/time_within_train_step": 2.696422815322876, "step": 954} +{"train_info/time_between_train_steps": 0.0036017894744873047, "step": 954} +{"info/global_step": 955, "train_info/time_within_train_step": 2.6961371898651123, "step": 955} +{"train_info/time_between_train_steps": 0.0036919116973876953, "step": 955} +{"info/global_step": 956, "train_info/time_within_train_step": 2.6968817710876465, "step": 956} +{"train_info/time_between_train_steps": 0.0036542415618896484, "step": 956} +{"info/global_step": 957, "train_info/time_within_train_step": 2.6972272396087646, "step": 957} +{"train_info/time_between_train_steps": 0.003732919692993164, "step": 957} +{"info/global_step": 958, "train_info/time_within_train_step": 2.698357343673706, "step": 958} +{"train_info/time_between_train_steps": 0.0036246776580810547, "step": 958} +{"info/global_step": 959, "train_info/time_within_train_step": 2.6957383155822754, "step": 959} +{"train_info/time_between_train_steps": 0.003591775894165039, "step": 959} +{"info/global_step": 960, "train_info/time_within_train_step": 2.7589166164398193, "step": 960} +{"train_info/time_between_train_steps": 0.0036821365356445312, "step": 960} +{"info/global_step": 961, "train_info/time_within_train_step": 2.893137216567993, "step": 961} +{"train_info/time_between_train_steps": 0.0036020278930664062, "step": 961} +{"info/global_step": 962, "train_info/time_within_train_step": 2.863692045211792, "step": 962} +{"train_info/time_between_train_steps": 0.003701448440551758, "step": 962} +{"info/global_step": 963, "train_info/time_within_train_step": 2.7042508125305176, "step": 963} +{"train_info/time_between_train_steps": 0.0036852359771728516, "step": 963} +{"info/global_step": 964, "train_info/time_within_train_step": 2.698288917541504, "step": 964} +{"train_info/time_between_train_steps": 0.003606557846069336, "step": 964} +{"info/global_step": 965, "train_info/time_within_train_step": 2.7016117572784424, "step": 965} +{"train_info/time_between_train_steps": 0.0036630630493164062, "step": 965} +{"info/global_step": 966, "train_info/time_within_train_step": 2.7775304317474365, "step": 966} +{"train_info/time_between_train_steps": 0.0036406517028808594, "step": 966} +{"info/global_step": 967, "train_info/time_within_train_step": 2.997864007949829, "step": 967} +{"train_info/time_between_train_steps": 0.0037364959716796875, "step": 967} +{"info/global_step": 968, "train_info/time_within_train_step": 2.7444775104522705, "step": 968} +{"train_info/time_between_train_steps": 0.003696441650390625, "step": 968} +{"info/global_step": 969, "train_info/time_within_train_step": 2.6990444660186768, "step": 969} +{"train_info/time_between_train_steps": 0.003692626953125, "step": 969} +{"info/global_step": 970, "train_info/time_within_train_step": 2.698610544204712, "step": 970} +{"train_info/time_between_train_steps": 0.003704071044921875, "step": 970} +{"info/global_step": 971, "train_info/time_within_train_step": 2.722754955291748, "step": 971} +{"train_info/time_between_train_steps": 0.0036416053771972656, "step": 971} +{"info/global_step": 972, "train_info/time_within_train_step": 2.876946210861206, "step": 972} +{"train_info/time_between_train_steps": 0.0037696361541748047, "step": 972} +{"info/global_step": 973, "train_info/time_within_train_step": 2.756014585494995, "step": 973} +{"train_info/time_between_train_steps": 0.003896951675415039, "step": 973} +{"info/global_step": 974, "train_info/time_within_train_step": 2.6976969242095947, "step": 974} +{"train_info/time_between_train_steps": 0.00408172607421875, "step": 974} +{"info/global_step": 975, "train_info/time_within_train_step": 2.697770595550537, "step": 975} +{"train_info/time_between_train_steps": 0.003794431686401367, "step": 975} +{"info/global_step": 976, "train_info/time_within_train_step": 2.7241933345794678, "step": 976} +{"train_info/time_between_train_steps": 0.0039048194885253906, "step": 976} +{"info/global_step": 977, "train_info/time_within_train_step": 2.8306217193603516, "step": 977} +{"train_info/time_between_train_steps": 0.0039441585540771484, "step": 977} +{"info/global_step": 978, "train_info/time_within_train_step": 3.142195463180542, "step": 978} +{"train_info/time_between_train_steps": 0.003579378128051758, "step": 978} +{"info/global_step": 979, "train_info/time_within_train_step": 2.69938588142395, "step": 979} +{"train_info/time_between_train_steps": 0.0036020278930664062, "step": 979} +{"info/global_step": 980, "train_info/time_within_train_step": 2.696923017501831, "step": 980} +{"train_info/time_between_train_steps": 0.0035552978515625, "step": 980} +{"info/global_step": 981, "train_info/time_within_train_step": 2.696559429168701, "step": 981} +{"train_info/time_between_train_steps": 0.0035228729248046875, "step": 981} +{"info/global_step": 982, "train_info/time_within_train_step": 2.7176787853240967, "step": 982} +{"train_info/time_between_train_steps": 0.003507852554321289, "step": 982} +{"info/global_step": 983, "train_info/time_within_train_step": 2.9804539680480957, "step": 983} +{"train_info/time_between_train_steps": 0.0036499500274658203, "step": 983} +{"info/global_step": 984, "train_info/time_within_train_step": 2.9090142250061035, "step": 984} +{"train_info/time_between_train_steps": 0.0036733150482177734, "step": 984} +{"info/global_step": 985, "train_info/time_within_train_step": 2.7846524715423584, "step": 985} +{"train_info/time_between_train_steps": 0.003686189651489258, "step": 985} +{"info/global_step": 986, "train_info/time_within_train_step": 2.7362136840820312, "step": 986} +{"train_info/time_between_train_steps": 0.003547191619873047, "step": 986} +{"info/global_step": 987, "train_info/time_within_train_step": 2.7241263389587402, "step": 987} +{"train_info/time_between_train_steps": 0.003618955612182617, "step": 987} +{"info/global_step": 988, "train_info/time_within_train_step": 2.8096094131469727, "step": 988} +{"train_info/time_between_train_steps": 0.003504514694213867, "step": 988} +{"info/global_step": 989, "train_info/time_within_train_step": 2.745948314666748, "step": 989} +{"train_info/time_between_train_steps": 0.003626585006713867, "step": 989} +{"info/global_step": 990, "train_info/time_within_train_step": 2.7758235931396484, "step": 990} +{"train_info/time_between_train_steps": 0.0035109519958496094, "step": 990} +{"info/global_step": 991, "train_info/time_within_train_step": 2.9133903980255127, "step": 991} +{"train_info/time_between_train_steps": 0.0035698413848876953, "step": 991} +{"info/global_step": 992, "train_info/time_within_train_step": 2.73335862159729, "step": 992} +{"train_info/time_between_train_steps": 0.003556489944458008, "step": 992} +{"info/global_step": 993, "train_info/time_within_train_step": 2.7030832767486572, "step": 993} +{"train_info/time_between_train_steps": 0.00357818603515625, "step": 993} +{"info/global_step": 994, "train_info/time_within_train_step": 2.8759145736694336, "step": 994} +{"train_info/time_between_train_steps": 0.003674745559692383, "step": 994} +{"info/global_step": 995, "train_info/time_within_train_step": 2.9215633869171143, "step": 995} +{"train_info/time_between_train_steps": 0.003671884536743164, "step": 995} +{"info/global_step": 996, "train_info/time_within_train_step": 2.8219363689422607, "step": 996} +{"train_info/time_between_train_steps": 0.003638029098510742, "step": 996} +{"info/global_step": 997, "train_info/time_within_train_step": 2.7186777591705322, "step": 997} +{"train_info/time_between_train_steps": 0.0035865306854248047, "step": 997} +{"info/global_step": 998, "train_info/time_within_train_step": 2.730541229248047, "step": 998} +{"train_info/time_between_train_steps": 0.0037508010864257812, "step": 998} +{"info/global_step": 999, "train_info/time_within_train_step": 2.7820241451263428, "step": 999} +{"train_info/time_between_train_steps": 0.0037093162536621094, "step": 999} +{"info/global_step": 1000, "train_info/time_within_train_step": 3.3077778816223145, "step": 1000} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 5466.0, "train_info/memory_max_reserved": 5466.0, "_timestamp": 1746289084, "_runtime": 3106}, "step": 1000} +{"logs": {"train/loss": 5.2443, "train/learning_rate": 0.00044444444444444436, "train/epoch": 1.08, "_timestamp": 1746289084, "_runtime": 3106}, "step": 1000} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746289091, "_runtime": 3113}, "step": 1000} +{"logs": {"eval/loss": 5.493804931640625, "eval/runtime": 5.9984, "eval/samples_per_second": 30.341, "eval/steps_per_second": 1.0, "train/epoch": 1.08, "_timestamp": 1746289091, "_runtime": 3113}, "step": 1000} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746289091, "_runtime": 3113}, "step": 1000} +{"logs": {"eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_loss": 5.493804931640625, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_ppl": 243.180734835711, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_runtime": 5.9984, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_samples_per_second": 30.341, "train/epoch": 1.08, "_timestamp": 1746289091, "_runtime": 3113}, "step": 1000} +{"train_info/time_between_train_steps": 20.482836484909058, "step": 1000} +{"info/global_step": 1001, "train_info/time_within_train_step": 2.490696430206299, "step": 1001} +{"train_info/time_between_train_steps": 0.003779888153076172, "step": 1001} +{"info/global_step": 1002, "train_info/time_within_train_step": 2.50900936126709, "step": 1002} +{"train_info/time_between_train_steps": 0.003818035125732422, "step": 1002} +{"info/global_step": 1003, "train_info/time_within_train_step": 2.6894302368164062, "step": 1003} +{"train_info/time_between_train_steps": 0.003844022750854492, "step": 1003} +{"info/global_step": 1004, "train_info/time_within_train_step": 2.6923632621765137, "step": 1004} +{"train_info/time_between_train_steps": 0.0038034915924072266, "step": 1004} +{"info/global_step": 1005, "train_info/time_within_train_step": 2.694936752319336, "step": 1005} +{"train_info/time_between_train_steps": 0.0038568973541259766, "step": 1005} +{"info/global_step": 1006, "train_info/time_within_train_step": 2.6967933177948, "step": 1006} +{"train_info/time_between_train_steps": 0.003904581069946289, "step": 1006} +{"info/global_step": 1007, "train_info/time_within_train_step": 2.6988046169281006, "step": 1007} +{"train_info/time_between_train_steps": 0.003910064697265625, "step": 1007} +{"info/global_step": 1008, "train_info/time_within_train_step": 2.8413901329040527, "step": 1008} +{"train_info/time_between_train_steps": 0.1708993911743164, "step": 1008} +{"info/global_step": 1009, "train_info/time_within_train_step": 2.715414047241211, "step": 1009} +{"train_info/time_between_train_steps": 0.0036516189575195312, "step": 1009} +{"info/global_step": 1010, "train_info/time_within_train_step": 3.0063607692718506, "step": 1010} +{"train_info/time_between_train_steps": 0.003628253936767578, "step": 1010} +{"info/global_step": 1011, "train_info/time_within_train_step": 2.798556327819824, "step": 1011} +{"train_info/time_between_train_steps": 0.003632783889770508, "step": 1011} +{"info/global_step": 1012, "train_info/time_within_train_step": 2.6979713439941406, "step": 1012} +{"train_info/time_between_train_steps": 0.0036928653717041016, "step": 1012} +{"info/global_step": 1013, "train_info/time_within_train_step": 2.702897787094116, "step": 1013} +{"train_info/time_between_train_steps": 0.004221677780151367, "step": 1013} +{"info/global_step": 1014, "train_info/time_within_train_step": 2.7895402908325195, "step": 1014} +{"train_info/time_between_train_steps": 0.0036907196044921875, "step": 1014} +{"info/global_step": 1015, "train_info/time_within_train_step": 2.8106958866119385, "step": 1015} +{"train_info/time_between_train_steps": 0.003634214401245117, "step": 1015} +{"info/global_step": 1016, "train_info/time_within_train_step": 2.770627975463867, "step": 1016} +{"train_info/time_between_train_steps": 0.003650665283203125, "step": 1016} +{"info/global_step": 1017, "train_info/time_within_train_step": 2.8095970153808594, "step": 1017} +{"train_info/time_between_train_steps": 0.0036592483520507812, "step": 1017} +{"info/global_step": 1018, "train_info/time_within_train_step": 2.81980562210083, "step": 1018} +{"train_info/time_between_train_steps": 0.003689289093017578, "step": 1018} +{"info/global_step": 1019, "train_info/time_within_train_step": 2.738009214401245, "step": 1019} +{"train_info/time_between_train_steps": 0.0035982131958007812, "step": 1019} +{"info/global_step": 1020, "train_info/time_within_train_step": 2.8171064853668213, "step": 1020} +{"train_info/time_between_train_steps": 0.003645181655883789, "step": 1020} +{"info/global_step": 1021, "train_info/time_within_train_step": 2.9300949573516846, "step": 1021} +{"train_info/time_between_train_steps": 0.0036673545837402344, "step": 1021} +{"info/global_step": 1022, "train_info/time_within_train_step": 2.8507487773895264, "step": 1022} +{"train_info/time_between_train_steps": 0.0036771297454833984, "step": 1022} +{"info/global_step": 1023, "train_info/time_within_train_step": 2.7646231651306152, "step": 1023} +{"train_info/time_between_train_steps": 0.003613710403442383, "step": 1023} +{"info/global_step": 1024, "train_info/time_within_train_step": 2.820631742477417, "step": 1024} +{"train_info/time_between_train_steps": 0.003692150115966797, "step": 1024} +{"info/global_step": 1025, "train_info/time_within_train_step": 2.8809947967529297, "step": 1025} +{"train_info/time_between_train_steps": 0.0078067779541015625, "step": 1025} +{"info/global_step": 1026, "train_info/time_within_train_step": 2.966966390609741, "step": 1026} +{"train_info/time_between_train_steps": 0.003754138946533203, "step": 1026} +{"info/global_step": 1027, "train_info/time_within_train_step": 2.8834452629089355, "step": 1027} +{"train_info/time_between_train_steps": 0.003644704818725586, "step": 1027} +{"info/global_step": 1028, "train_info/time_within_train_step": 2.7578799724578857, "step": 1028} +{"train_info/time_between_train_steps": 0.007348060607910156, "step": 1028} +{"info/global_step": 1029, "train_info/time_within_train_step": 2.8185243606567383, "step": 1029} +{"train_info/time_between_train_steps": 0.0038251876831054688, "step": 1029} +{"info/global_step": 1030, "train_info/time_within_train_step": 2.9025373458862305, "step": 1030} +{"train_info/time_between_train_steps": 0.003636598587036133, "step": 1030} +{"info/global_step": 1031, "train_info/time_within_train_step": 2.8587546348571777, "step": 1031} +{"train_info/time_between_train_steps": 0.003724336624145508, "step": 1031} +{"info/global_step": 1032, "train_info/time_within_train_step": 3.0270609855651855, "step": 1032} +{"train_info/time_between_train_steps": 0.003560304641723633, "step": 1032} +{"info/global_step": 1033, "train_info/time_within_train_step": 2.7115986347198486, "step": 1033} +{"train_info/time_between_train_steps": 0.003468036651611328, "step": 1033} +{"info/global_step": 1034, "train_info/time_within_train_step": 2.981989860534668, "step": 1034} +{"train_info/time_between_train_steps": 0.0035758018493652344, "step": 1034} +{"info/global_step": 1035, "train_info/time_within_train_step": 3.0238513946533203, "step": 1035} +{"train_info/time_between_train_steps": 0.0034987926483154297, "step": 1035} +{"info/global_step": 1036, "train_info/time_within_train_step": 2.8407492637634277, "step": 1036} +{"train_info/time_between_train_steps": 0.003507852554321289, "step": 1036} +{"info/global_step": 1037, "train_info/time_within_train_step": 2.7542996406555176, "step": 1037} +{"train_info/time_between_train_steps": 0.0034787654876708984, "step": 1037} +{"info/global_step": 1038, "train_info/time_within_train_step": 2.7609944343566895, "step": 1038} +{"train_info/time_between_train_steps": 0.003573179244995117, "step": 1038} +{"info/global_step": 1039, "train_info/time_within_train_step": 2.828617572784424, "step": 1039} +{"train_info/time_between_train_steps": 0.0034863948822021484, "step": 1039} +{"info/global_step": 1040, "train_info/time_within_train_step": 2.864379644393921, "step": 1040} +{"train_info/time_between_train_steps": 0.0034646987915039062, "step": 1040} +{"info/global_step": 1041, "train_info/time_within_train_step": 2.808583974838257, "step": 1041} +{"train_info/time_between_train_steps": 0.0034477710723876953, "step": 1041} +{"info/global_step": 1042, "train_info/time_within_train_step": 2.8023386001586914, "step": 1042} +{"train_info/time_between_train_steps": 0.003517627716064453, "step": 1042} +{"info/global_step": 1043, "train_info/time_within_train_step": 2.722646713256836, "step": 1043} +{"train_info/time_between_train_steps": 0.003484010696411133, "step": 1043} +{"info/global_step": 1044, "train_info/time_within_train_step": 2.746802806854248, "step": 1044} +{"train_info/time_between_train_steps": 0.0035600662231445312, "step": 1044} +{"info/global_step": 1045, "train_info/time_within_train_step": 2.861288070678711, "step": 1045} +{"train_info/time_between_train_steps": 0.003541707992553711, "step": 1045} +{"info/global_step": 1046, "train_info/time_within_train_step": 2.8970348834991455, "step": 1046} +{"train_info/time_between_train_steps": 0.003504037857055664, "step": 1046} +{"info/global_step": 1047, "train_info/time_within_train_step": 2.808119058609009, "step": 1047} +{"train_info/time_between_train_steps": 0.0034737586975097656, "step": 1047} +{"info/global_step": 1048, "train_info/time_within_train_step": 2.8055388927459717, "step": 1048} +{"train_info/time_between_train_steps": 0.003514528274536133, "step": 1048} +{"info/global_step": 1049, "train_info/time_within_train_step": 2.8639779090881348, "step": 1049} +{"train_info/time_between_train_steps": 0.0034818649291992188, "step": 1049} +{"info/global_step": 1050, "train_info/time_within_train_step": 2.8043370246887207, "step": 1050} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746289248, "_runtime": 3270}, "step": 1050} +{"logs": {"train/loss": 5.2005, "train/learning_rate": 0.0004333333333333333, "train/epoch": 1.1, "_timestamp": 1746289248, "_runtime": 3270}, "step": 1050} +{"train_info/time_between_train_steps": 0.025693655014038086, "step": 1050} +{"info/global_step": 1051, "train_info/time_within_train_step": 2.8101887702941895, "step": 1051} +{"train_info/time_between_train_steps": 0.003557443618774414, "step": 1051} +{"info/global_step": 1052, "train_info/time_within_train_step": 2.800370216369629, "step": 1052} +{"train_info/time_between_train_steps": 0.0035626888275146484, "step": 1052} +{"info/global_step": 1053, "train_info/time_within_train_step": 2.759531259536743, "step": 1053} +{"train_info/time_between_train_steps": 0.004504680633544922, "step": 1053} +{"info/global_step": 1054, "train_info/time_within_train_step": 2.8073387145996094, "step": 1054} +{"train_info/time_between_train_steps": 0.003563404083251953, "step": 1054} +{"info/global_step": 1055, "train_info/time_within_train_step": 2.800961971282959, "step": 1055} +{"train_info/time_between_train_steps": 0.0035028457641601562, "step": 1055} +{"info/global_step": 1056, "train_info/time_within_train_step": 2.8225085735321045, "step": 1056} +{"train_info/time_between_train_steps": 0.0035169124603271484, "step": 1056} +{"info/global_step": 1057, "train_info/time_within_train_step": 2.701983690261841, "step": 1057} +{"train_info/time_between_train_steps": 0.0035643577575683594, "step": 1057} +{"info/global_step": 1058, "train_info/time_within_train_step": 2.711181879043579, "step": 1058} +{"train_info/time_between_train_steps": 0.0035469532012939453, "step": 1058} +{"info/global_step": 1059, "train_info/time_within_train_step": 2.761686086654663, "step": 1059} +{"train_info/time_between_train_steps": 0.0035457611083984375, "step": 1059} +{"info/global_step": 1060, "train_info/time_within_train_step": 2.8338513374328613, "step": 1060} +{"train_info/time_between_train_steps": 0.0035982131958007812, "step": 1060} +{"info/global_step": 1061, "train_info/time_within_train_step": 2.8329734802246094, "step": 1061} +{"train_info/time_between_train_steps": 0.0035715103149414062, "step": 1061} +{"info/global_step": 1062, "train_info/time_within_train_step": 2.7738425731658936, "step": 1062} +{"train_info/time_between_train_steps": 0.0035295486450195312, "step": 1062} +{"info/global_step": 1063, "train_info/time_within_train_step": 2.7509665489196777, "step": 1063} +{"train_info/time_between_train_steps": 0.003559589385986328, "step": 1063} +{"info/global_step": 1064, "train_info/time_within_train_step": 2.783228874206543, "step": 1064} +{"train_info/time_between_train_steps": 0.0038144588470458984, "step": 1064} +{"info/global_step": 1065, "train_info/time_within_train_step": 2.7782504558563232, "step": 1065} +{"train_info/time_between_train_steps": 0.0035767555236816406, "step": 1065} +{"info/global_step": 1066, "train_info/time_within_train_step": 2.7709579467773438, "step": 1066} +{"train_info/time_between_train_steps": 0.0035555362701416016, "step": 1066} +{"info/global_step": 1067, "train_info/time_within_train_step": 2.7147927284240723, "step": 1067} +{"train_info/time_between_train_steps": 0.0035698413848876953, "step": 1067} +{"info/global_step": 1068, "train_info/time_within_train_step": 2.7928972244262695, "step": 1068} +{"train_info/time_between_train_steps": 0.003606557846069336, "step": 1068} +{"info/global_step": 1069, "train_info/time_within_train_step": 2.8818159103393555, "step": 1069} +{"train_info/time_between_train_steps": 0.003506183624267578, "step": 1069} +{"info/global_step": 1070, "train_info/time_within_train_step": 2.7303407192230225, "step": 1070} +{"train_info/time_between_train_steps": 0.0035347938537597656, "step": 1070} +{"info/global_step": 1071, "train_info/time_within_train_step": 2.824812889099121, "step": 1071} +{"train_info/time_between_train_steps": 0.003508329391479492, "step": 1071} +{"info/global_step": 1072, "train_info/time_within_train_step": 2.7612602710723877, "step": 1072} +{"train_info/time_between_train_steps": 0.003484487533569336, "step": 1072} +{"info/global_step": 1073, "train_info/time_within_train_step": 2.8903133869171143, "step": 1073} +{"train_info/time_between_train_steps": 0.0035512447357177734, "step": 1073} +{"info/global_step": 1074, "train_info/time_within_train_step": 2.7422125339508057, "step": 1074} +{"train_info/time_between_train_steps": 0.0035295486450195312, "step": 1074} +{"info/global_step": 1075, "train_info/time_within_train_step": 2.7087836265563965, "step": 1075} +{"train_info/time_between_train_steps": 0.0035512447357177734, "step": 1075} +{"info/global_step": 1076, "train_info/time_within_train_step": 2.7475359439849854, "step": 1076} +{"train_info/time_between_train_steps": 0.0035741329193115234, "step": 1076} +{"info/global_step": 1077, "train_info/time_within_train_step": 2.8032822608947754, "step": 1077} +{"train_info/time_between_train_steps": 0.003541231155395508, "step": 1077} +{"info/global_step": 1078, "train_info/time_within_train_step": 2.7443737983703613, "step": 1078} +{"train_info/time_between_train_steps": 0.0035572052001953125, "step": 1078} +{"info/global_step": 1079, "train_info/time_within_train_step": 2.7407419681549072, "step": 1079} +{"train_info/time_between_train_steps": 0.00365447998046875, "step": 1079} +{"info/global_step": 1080, "train_info/time_within_train_step": 2.826669454574585, "step": 1080} +{"train_info/time_between_train_steps": 0.0036203861236572266, "step": 1080} +{"info/global_step": 1081, "train_info/time_within_train_step": 2.6956300735473633, "step": 1081} +{"train_info/time_between_train_steps": 0.003551483154296875, "step": 1081} +{"info/global_step": 1082, "train_info/time_within_train_step": 2.6931519508361816, "step": 1082} +{"train_info/time_between_train_steps": 0.00359344482421875, "step": 1082} +{"info/global_step": 1083, "train_info/time_within_train_step": 2.694600820541382, "step": 1083} +{"train_info/time_between_train_steps": 0.0035452842712402344, "step": 1083} +{"info/global_step": 1084, "train_info/time_within_train_step": 2.6939945220947266, "step": 1084} +{"train_info/time_between_train_steps": 0.003627300262451172, "step": 1084} +{"info/global_step": 1085, "train_info/time_within_train_step": 2.6958961486816406, "step": 1085} +{"train_info/time_between_train_steps": 0.0035784244537353516, "step": 1085} +{"info/global_step": 1086, "train_info/time_within_train_step": 2.6950182914733887, "step": 1086} +{"train_info/time_between_train_steps": 0.0035943984985351562, "step": 1086} +{"info/global_step": 1087, "train_info/time_within_train_step": 2.6953327655792236, "step": 1087} +{"train_info/time_between_train_steps": 0.0035364627838134766, "step": 1087} +{"info/global_step": 1088, "train_info/time_within_train_step": 2.6965925693511963, "step": 1088} +{"train_info/time_between_train_steps": 0.0035681724548339844, "step": 1088} +{"info/global_step": 1089, "train_info/time_within_train_step": 2.697352409362793, "step": 1089} +{"train_info/time_between_train_steps": 0.0035812854766845703, "step": 1089} +{"info/global_step": 1090, "train_info/time_within_train_step": 2.6975131034851074, "step": 1090} +{"train_info/time_between_train_steps": 0.003647327423095703, "step": 1090} +{"info/global_step": 1091, "train_info/time_within_train_step": 2.6998038291931152, "step": 1091} +{"train_info/time_between_train_steps": 0.003711700439453125, "step": 1091} +{"info/global_step": 1092, "train_info/time_within_train_step": 2.698878526687622, "step": 1092} +{"train_info/time_between_train_steps": 0.003636598587036133, "step": 1092} +{"info/global_step": 1093, "train_info/time_within_train_step": 2.6984028816223145, "step": 1093} +{"train_info/time_between_train_steps": 0.003619670867919922, "step": 1093} +{"info/global_step": 1094, "train_info/time_within_train_step": 2.698712110519409, "step": 1094} +{"train_info/time_between_train_steps": 0.0035300254821777344, "step": 1094} +{"info/global_step": 1095, "train_info/time_within_train_step": 2.6978843212127686, "step": 1095} +{"train_info/time_between_train_steps": 0.003595113754272461, "step": 1095} +{"info/global_step": 1096, "train_info/time_within_train_step": 2.698204755783081, "step": 1096} +{"train_info/time_between_train_steps": 0.003555774688720703, "step": 1096} +{"info/global_step": 1097, "train_info/time_within_train_step": 2.7411859035491943, "step": 1097} +{"train_info/time_between_train_steps": 0.0034949779510498047, "step": 1097} +{"info/global_step": 1098, "train_info/time_within_train_step": 3.0222527980804443, "step": 1098} +{"train_info/time_between_train_steps": 0.0035779476165771484, "step": 1098} +{"info/global_step": 1099, "train_info/time_within_train_step": 2.891813278198242, "step": 1099} +{"train_info/time_between_train_steps": 0.003524303436279297, "step": 1099} +{"info/global_step": 1100, "train_info/time_within_train_step": 2.695674419403076, "step": 1100} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746289391, "_runtime": 3413}, "step": 1100} +{"logs": {"train/loss": 5.1719, "train/learning_rate": 0.0004222222222222222, "train/epoch": 1.11, "_timestamp": 1746289391, "_runtime": 3413}, "step": 1100} +{"train_info/time_between_train_steps": 14.164521217346191, "step": 1100} +{"info/global_step": 1101, "train_info/time_within_train_step": 2.4723756313323975, "step": 1101} +{"train_info/time_between_train_steps": 0.003638029098510742, "step": 1101} +{"info/global_step": 1102, "train_info/time_within_train_step": 2.515077829360962, "step": 1102} +{"train_info/time_between_train_steps": 0.003571748733520508, "step": 1102} +{"info/global_step": 1103, "train_info/time_within_train_step": 2.690751075744629, "step": 1103} +{"train_info/time_between_train_steps": 0.003530263900756836, "step": 1103} +{"info/global_step": 1104, "train_info/time_within_train_step": 2.6936655044555664, "step": 1104} +{"train_info/time_between_train_steps": 0.003566741943359375, "step": 1104} +{"info/global_step": 1105, "train_info/time_within_train_step": 2.6936185359954834, "step": 1105} +{"train_info/time_between_train_steps": 0.0036449432373046875, "step": 1105} +{"info/global_step": 1106, "train_info/time_within_train_step": 2.695918560028076, "step": 1106} +{"train_info/time_between_train_steps": 0.0035064220428466797, "step": 1106} +{"info/global_step": 1107, "train_info/time_within_train_step": 2.6960999965667725, "step": 1107} +{"train_info/time_between_train_steps": 0.0035753250122070312, "step": 1107} +{"info/global_step": 1108, "train_info/time_within_train_step": 3.066704750061035, "step": 1108} +{"train_info/time_between_train_steps": 0.0035848617553710938, "step": 1108} +{"info/global_step": 1109, "train_info/time_within_train_step": 2.8818368911743164, "step": 1109} +{"train_info/time_between_train_steps": 0.003606557846069336, "step": 1109} +{"info/global_step": 1110, "train_info/time_within_train_step": 3.18608021736145, "step": 1110} +{"train_info/time_between_train_steps": 0.003649473190307617, "step": 1110} +{"info/global_step": 1111, "train_info/time_within_train_step": 2.7641732692718506, "step": 1111} +{"train_info/time_between_train_steps": 0.003582000732421875, "step": 1111} +{"info/global_step": 1112, "train_info/time_within_train_step": 2.698225259780884, "step": 1112} +{"train_info/time_between_train_steps": 0.003579854965209961, "step": 1112} +{"info/global_step": 1113, "train_info/time_within_train_step": 2.700035810470581, "step": 1113} +{"train_info/time_between_train_steps": 0.003543376922607422, "step": 1113} +{"info/global_step": 1114, "train_info/time_within_train_step": 2.899263858795166, "step": 1114} +{"train_info/time_between_train_steps": 0.003532886505126953, "step": 1114} +{"info/global_step": 1115, "train_info/time_within_train_step": 3.014089822769165, "step": 1115} +{"train_info/time_between_train_steps": 0.0035223960876464844, "step": 1115} +{"info/global_step": 1116, "train_info/time_within_train_step": 2.843628406524658, "step": 1116} +{"train_info/time_between_train_steps": 0.003641366958618164, "step": 1116} +{"info/global_step": 1117, "train_info/time_within_train_step": 2.6996562480926514, "step": 1117} +{"train_info/time_between_train_steps": 0.003595113754272461, "step": 1117} +{"info/global_step": 1118, "train_info/time_within_train_step": 2.7007272243499756, "step": 1118} +{"train_info/time_between_train_steps": 0.0043065547943115234, "step": 1118} +{"info/global_step": 1119, "train_info/time_within_train_step": 2.902039051055908, "step": 1119} +{"train_info/time_between_train_steps": 0.0036683082580566406, "step": 1119} +{"info/global_step": 1120, "train_info/time_within_train_step": 2.901346445083618, "step": 1120} +{"train_info/time_between_train_steps": 0.0036258697509765625, "step": 1120} +{"info/global_step": 1121, "train_info/time_within_train_step": 2.8109798431396484, "step": 1121} +{"train_info/time_between_train_steps": 0.0036194324493408203, "step": 1121} +{"info/global_step": 1122, "train_info/time_within_train_step": 2.750844955444336, "step": 1122} +{"train_info/time_between_train_steps": 0.003796100616455078, "step": 1122} +{"info/global_step": 1123, "train_info/time_within_train_step": 2.869873523712158, "step": 1123} +{"train_info/time_between_train_steps": 0.004329204559326172, "step": 1123} +{"info/global_step": 1124, "train_info/time_within_train_step": 2.966766834259033, "step": 1124} +{"train_info/time_between_train_steps": 0.004285573959350586, "step": 1124} +{"info/global_step": 1125, "train_info/time_within_train_step": 2.8530197143554688, "step": 1125} +{"train_info/time_between_train_steps": 0.004057884216308594, "step": 1125} +{"info/global_step": 1126, "train_info/time_within_train_step": 2.7715821266174316, "step": 1126} +{"train_info/time_between_train_steps": 0.004020214080810547, "step": 1126} +{"info/global_step": 1127, "train_info/time_within_train_step": 2.7585887908935547, "step": 1127} +{"train_info/time_between_train_steps": 0.003931522369384766, "step": 1127} +{"info/global_step": 1128, "train_info/time_within_train_step": 2.8942904472351074, "step": 1128} +{"train_info/time_between_train_steps": 0.0049059391021728516, "step": 1128} +{"info/global_step": 1129, "train_info/time_within_train_step": 2.9141340255737305, "step": 1129} +{"train_info/time_between_train_steps": 0.004117488861083984, "step": 1129} +{"info/global_step": 1130, "train_info/time_within_train_step": 2.852145195007324, "step": 1130} +{"train_info/time_between_train_steps": 0.004060029983520508, "step": 1130} +{"info/global_step": 1131, "train_info/time_within_train_step": 2.908281087875366, "step": 1131} +{"train_info/time_between_train_steps": 0.003973722457885742, "step": 1131} +{"info/global_step": 1132, "train_info/time_within_train_step": 2.7790772914886475, "step": 1132} +{"train_info/time_between_train_steps": 0.003973484039306641, "step": 1132} +{"info/global_step": 1133, "train_info/time_within_train_step": 2.787997007369995, "step": 1133} +{"train_info/time_between_train_steps": 0.20029401779174805, "step": 1133} +{"info/global_step": 1134, "train_info/time_within_train_step": 2.758023738861084, "step": 1134} +{"train_info/time_between_train_steps": 0.0037965774536132812, "step": 1134} +{"info/global_step": 1135, "train_info/time_within_train_step": 2.757375955581665, "step": 1135} +{"train_info/time_between_train_steps": 0.003757953643798828, "step": 1135} +{"info/global_step": 1136, "train_info/time_within_train_step": 2.8513741493225098, "step": 1136} +{"train_info/time_between_train_steps": 0.003765583038330078, "step": 1136} +{"info/global_step": 1137, "train_info/time_within_train_step": 2.868475914001465, "step": 1137} +{"train_info/time_between_train_steps": 0.0038139820098876953, "step": 1137} +{"info/global_step": 1138, "train_info/time_within_train_step": 2.8658483028411865, "step": 1138} +{"train_info/time_between_train_steps": 0.0038139820098876953, "step": 1138} +{"info/global_step": 1139, "train_info/time_within_train_step": 2.7997817993164062, "step": 1139} +{"train_info/time_between_train_steps": 0.0037484169006347656, "step": 1139} +{"info/global_step": 1140, "train_info/time_within_train_step": 2.772765636444092, "step": 1140} +{"train_info/time_between_train_steps": 0.003760814666748047, "step": 1140} +{"info/global_step": 1141, "train_info/time_within_train_step": 2.8002052307128906, "step": 1141} +{"train_info/time_between_train_steps": 0.0036492347717285156, "step": 1141} +{"info/global_step": 1142, "train_info/time_within_train_step": 2.850813150405884, "step": 1142} +{"train_info/time_between_train_steps": 0.003786325454711914, "step": 1142} +{"info/global_step": 1143, "train_info/time_within_train_step": 2.8798837661743164, "step": 1143} +{"train_info/time_between_train_steps": 0.0037157535552978516, "step": 1143} +{"info/global_step": 1144, "train_info/time_within_train_step": 2.8185410499572754, "step": 1144} +{"train_info/time_between_train_steps": 0.003681182861328125, "step": 1144} +{"info/global_step": 1145, "train_info/time_within_train_step": 2.7675888538360596, "step": 1145} +{"train_info/time_between_train_steps": 0.003654956817626953, "step": 1145} +{"info/global_step": 1146, "train_info/time_within_train_step": 2.856402635574341, "step": 1146} +{"train_info/time_between_train_steps": 0.003699779510498047, "step": 1146} +{"info/global_step": 1147, "train_info/time_within_train_step": 2.826970100402832, "step": 1147} +{"train_info/time_between_train_steps": 0.004755973815917969, "step": 1147} +{"info/global_step": 1148, "train_info/time_within_train_step": 2.8141491413116455, "step": 1148} +{"train_info/time_between_train_steps": 0.003924131393432617, "step": 1148} +{"info/global_step": 1149, "train_info/time_within_train_step": 2.822970390319824, "step": 1149} +{"train_info/time_between_train_steps": 0.004194974899291992, "step": 1149} +{"info/global_step": 1150, "train_info/time_within_train_step": 2.743384599685669, "step": 1150} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746289548, "_runtime": 3570}, "step": 1150} +{"logs": {"train/loss": 5.1256, "train/learning_rate": 0.0004111111111111111, "train/epoch": 1.13, "_timestamp": 1746289548, "_runtime": 3570}, "step": 1150} +{"train_info/time_between_train_steps": 0.0268552303314209, "step": 1150} +{"info/global_step": 1151, "train_info/time_within_train_step": 2.7818753719329834, "step": 1151} +{"train_info/time_between_train_steps": 0.004019021987915039, "step": 1151} +{"info/global_step": 1152, "train_info/time_within_train_step": 2.8560144901275635, "step": 1152} +{"train_info/time_between_train_steps": 0.003983736038208008, "step": 1152} +{"info/global_step": 1153, "train_info/time_within_train_step": 2.7492923736572266, "step": 1153} +{"train_info/time_between_train_steps": 0.003900766372680664, "step": 1153} +{"info/global_step": 1154, "train_info/time_within_train_step": 2.7350025177001953, "step": 1154} +{"train_info/time_between_train_steps": 0.003946781158447266, "step": 1154} +{"info/global_step": 1155, "train_info/time_within_train_step": 2.7202963829040527, "step": 1155} +{"train_info/time_between_train_steps": 0.003968715667724609, "step": 1155} +{"info/global_step": 1156, "train_info/time_within_train_step": 2.798441171646118, "step": 1156} +{"train_info/time_between_train_steps": 0.0037984848022460938, "step": 1156} +{"info/global_step": 1157, "train_info/time_within_train_step": 2.8266990184783936, "step": 1157} +{"train_info/time_between_train_steps": 0.003931760787963867, "step": 1157} +{"info/global_step": 1158, "train_info/time_within_train_step": 2.7707359790802, "step": 1158} +{"train_info/time_between_train_steps": 0.003932476043701172, "step": 1158} +{"info/global_step": 1159, "train_info/time_within_train_step": 2.790231466293335, "step": 1159} +{"train_info/time_between_train_steps": 0.003866910934448242, "step": 1159} +{"info/global_step": 1160, "train_info/time_within_train_step": 2.8336105346679688, "step": 1160} +{"train_info/time_between_train_steps": 0.003912448883056641, "step": 1160} +{"info/global_step": 1161, "train_info/time_within_train_step": 2.7779805660247803, "step": 1161} +{"train_info/time_between_train_steps": 0.003885030746459961, "step": 1161} +{"info/global_step": 1162, "train_info/time_within_train_step": 2.769620895385742, "step": 1162} +{"train_info/time_between_train_steps": 0.007622241973876953, "step": 1162} +{"info/global_step": 1163, "train_info/time_within_train_step": 2.845188617706299, "step": 1163} +{"train_info/time_between_train_steps": 0.0052945613861083984, "step": 1163} +{"info/global_step": 1164, "train_info/time_within_train_step": 2.8520009517669678, "step": 1164} +{"train_info/time_between_train_steps": 0.00768280029296875, "step": 1164} +{"info/global_step": 1165, "train_info/time_within_train_step": 2.733541488647461, "step": 1165} +{"train_info/time_between_train_steps": 0.00420069694519043, "step": 1165} +{"info/global_step": 1166, "train_info/time_within_train_step": 2.7069568634033203, "step": 1166} +{"train_info/time_between_train_steps": 0.003954172134399414, "step": 1166} +{"info/global_step": 1167, "train_info/time_within_train_step": 2.79708194732666, "step": 1167} +{"train_info/time_between_train_steps": 0.003980875015258789, "step": 1167} +{"info/global_step": 1168, "train_info/time_within_train_step": 2.839622974395752, "step": 1168} +{"train_info/time_between_train_steps": 0.0038924217224121094, "step": 1168} +{"info/global_step": 1169, "train_info/time_within_train_step": 2.780663013458252, "step": 1169} +{"train_info/time_between_train_steps": 0.003949642181396484, "step": 1169} +{"info/global_step": 1170, "train_info/time_within_train_step": 2.7166781425476074, "step": 1170} +{"train_info/time_between_train_steps": 0.003951549530029297, "step": 1170} +{"info/global_step": 1171, "train_info/time_within_train_step": 2.8494157791137695, "step": 1171} +{"train_info/time_between_train_steps": 0.003907918930053711, "step": 1171} +{"info/global_step": 1172, "train_info/time_within_train_step": 2.771714448928833, "step": 1172} +{"train_info/time_between_train_steps": 0.003877401351928711, "step": 1172} +{"info/global_step": 1173, "train_info/time_within_train_step": 2.6973378658294678, "step": 1173} +{"train_info/time_between_train_steps": 0.0038671493530273438, "step": 1173} +{"info/global_step": 1174, "train_info/time_within_train_step": 2.730534315109253, "step": 1174} +{"train_info/time_between_train_steps": 0.003998756408691406, "step": 1174} +{"info/global_step": 1175, "train_info/time_within_train_step": 2.83429217338562, "step": 1175} +{"train_info/time_between_train_steps": 0.0038912296295166016, "step": 1175} +{"info/global_step": 1176, "train_info/time_within_train_step": 2.809976577758789, "step": 1176} +{"train_info/time_between_train_steps": 0.0039520263671875, "step": 1176} +{"info/global_step": 1177, "train_info/time_within_train_step": 2.7511909008026123, "step": 1177} +{"train_info/time_between_train_steps": 0.004027128219604492, "step": 1177} +{"info/global_step": 1178, "train_info/time_within_train_step": 2.7360587120056152, "step": 1178} +{"train_info/time_between_train_steps": 0.0039517879486083984, "step": 1178} +{"info/global_step": 1179, "train_info/time_within_train_step": 2.8042495250701904, "step": 1179} +{"train_info/time_between_train_steps": 0.004023075103759766, "step": 1179} +{"info/global_step": 1180, "train_info/time_within_train_step": 2.7452991008758545, "step": 1180} +{"train_info/time_between_train_steps": 0.003942966461181641, "step": 1180} +{"info/global_step": 1181, "train_info/time_within_train_step": 2.69950532913208, "step": 1181} +{"train_info/time_between_train_steps": 0.003887653350830078, "step": 1181} +{"info/global_step": 1182, "train_info/time_within_train_step": 2.768657922744751, "step": 1182} +{"train_info/time_between_train_steps": 0.0041468143463134766, "step": 1182} +{"info/global_step": 1183, "train_info/time_within_train_step": 2.7970755100250244, "step": 1183} +{"train_info/time_between_train_steps": 0.003981351852416992, "step": 1183} +{"info/global_step": 1184, "train_info/time_within_train_step": 2.735147714614868, "step": 1184} +{"train_info/time_between_train_steps": 0.004047870635986328, "step": 1184} +{"info/global_step": 1185, "train_info/time_within_train_step": 2.783012628555298, "step": 1185} +{"train_info/time_between_train_steps": 0.00397491455078125, "step": 1185} +{"info/global_step": 1186, "train_info/time_within_train_step": 2.7925970554351807, "step": 1186} +{"train_info/time_between_train_steps": 0.003963947296142578, "step": 1186} +{"info/global_step": 1187, "train_info/time_within_train_step": 2.734424352645874, "step": 1187} +{"train_info/time_between_train_steps": 0.003928184509277344, "step": 1187} +{"info/global_step": 1188, "train_info/time_within_train_step": 2.758561611175537, "step": 1188} +{"train_info/time_between_train_steps": 0.003880739212036133, "step": 1188} +{"info/global_step": 1189, "train_info/time_within_train_step": 2.8495752811431885, "step": 1189} +{"train_info/time_between_train_steps": 0.003931522369384766, "step": 1189} +{"info/global_step": 1190, "train_info/time_within_train_step": 2.7525618076324463, "step": 1190} +{"train_info/time_between_train_steps": 0.003841400146484375, "step": 1190} +{"info/global_step": 1191, "train_info/time_within_train_step": 2.717536211013794, "step": 1191} +{"train_info/time_between_train_steps": 0.004530668258666992, "step": 1191} +{"info/global_step": 1192, "train_info/time_within_train_step": 2.7527315616607666, "step": 1192} +{"train_info/time_between_train_steps": 0.003854513168334961, "step": 1192} +{"info/global_step": 1193, "train_info/time_within_train_step": 3.193981647491455, "step": 1193} +{"train_info/time_between_train_steps": 0.003599405288696289, "step": 1193} +{"info/global_step": 1194, "train_info/time_within_train_step": 2.69700288772583, "step": 1194} +{"train_info/time_between_train_steps": 0.003642559051513672, "step": 1194} +{"info/global_step": 1195, "train_info/time_within_train_step": 2.701613426208496, "step": 1195} +{"train_info/time_between_train_steps": 0.003557920455932617, "step": 1195} +{"info/global_step": 1196, "train_info/time_within_train_step": 2.7322299480438232, "step": 1196} +{"train_info/time_between_train_steps": 0.0036263465881347656, "step": 1196} +{"info/global_step": 1197, "train_info/time_within_train_step": 2.797508716583252, "step": 1197} +{"train_info/time_between_train_steps": 0.0035893917083740234, "step": 1197} +{"info/global_step": 1198, "train_info/time_within_train_step": 2.9974582195281982, "step": 1198} +{"train_info/time_between_train_steps": 0.0036263465881347656, "step": 1198} +{"info/global_step": 1199, "train_info/time_within_train_step": 2.787191152572632, "step": 1199} +{"train_info/time_between_train_steps": 0.0035903453826904297, "step": 1199} +{"info/global_step": 1200, "train_info/time_within_train_step": 2.699788808822632, "step": 1200} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746289690, "_runtime": 3712}, "step": 1200} +{"logs": {"train/loss": 5.096, "train/learning_rate": 0.00039999999999999996, "train/epoch": 1.15, "_timestamp": 1746289690, "_runtime": 3712}, "step": 1200} +{"train_info/time_between_train_steps": 14.329864740371704, "step": 1200} +{"info/global_step": 1201, "train_info/time_within_train_step": 2.474046230316162, "step": 1201} +{"train_info/time_between_train_steps": 0.003583669662475586, "step": 1201} +{"info/global_step": 1202, "train_info/time_within_train_step": 2.5309057235717773, "step": 1202} +{"train_info/time_between_train_steps": 0.0037767887115478516, "step": 1202} +{"info/global_step": 1203, "train_info/time_within_train_step": 2.6893603801727295, "step": 1203} +{"train_info/time_between_train_steps": 0.0037338733673095703, "step": 1203} +{"info/global_step": 1204, "train_info/time_within_train_step": 2.7002980709075928, "step": 1204} +{"train_info/time_between_train_steps": 0.0035049915313720703, "step": 1204} +{"info/global_step": 1205, "train_info/time_within_train_step": 2.692837715148926, "step": 1205} +{"train_info/time_between_train_steps": 0.0034592151641845703, "step": 1205} +{"info/global_step": 1206, "train_info/time_within_train_step": 2.6963512897491455, "step": 1206} +{"train_info/time_between_train_steps": 0.0034942626953125, "step": 1206} +{"info/global_step": 1207, "train_info/time_within_train_step": 2.6959407329559326, "step": 1207} +{"train_info/time_between_train_steps": 0.0035638809204101562, "step": 1207} +{"info/global_step": 1208, "train_info/time_within_train_step": 2.9322941303253174, "step": 1208} +{"train_info/time_between_train_steps": 0.0034830570220947266, "step": 1208} +{"info/global_step": 1209, "train_info/time_within_train_step": 3.0088276863098145, "step": 1209} +{"train_info/time_between_train_steps": 0.0034940242767333984, "step": 1209} +{"info/global_step": 1210, "train_info/time_within_train_step": 3.190250873565674, "step": 1210} +{"train_info/time_between_train_steps": 0.003429889678955078, "step": 1210} +{"info/global_step": 1211, "train_info/time_within_train_step": 2.770646572113037, "step": 1211} +{"train_info/time_between_train_steps": 0.0035915374755859375, "step": 1211} +{"info/global_step": 1212, "train_info/time_within_train_step": 2.6952919960021973, "step": 1212} +{"train_info/time_between_train_steps": 0.0034308433532714844, "step": 1212} +{"info/global_step": 1213, "train_info/time_within_train_step": 2.6961781978607178, "step": 1213} +{"train_info/time_between_train_steps": 0.003444194793701172, "step": 1213} +{"info/global_step": 1214, "train_info/time_within_train_step": 2.695446014404297, "step": 1214} +{"train_info/time_between_train_steps": 0.003426074981689453, "step": 1214} +{"info/global_step": 1215, "train_info/time_within_train_step": 2.6949713230133057, "step": 1215} +{"train_info/time_between_train_steps": 0.0033903121948242188, "step": 1215} +{"info/global_step": 1216, "train_info/time_within_train_step": 2.696291208267212, "step": 1216} +{"train_info/time_between_train_steps": 0.0034134387969970703, "step": 1216} +{"info/global_step": 1217, "train_info/time_within_train_step": 2.7644975185394287, "step": 1217} +{"train_info/time_between_train_steps": 0.0034041404724121094, "step": 1217} +{"info/global_step": 1218, "train_info/time_within_train_step": 2.807861089706421, "step": 1218} +{"train_info/time_between_train_steps": 0.006856679916381836, "step": 1218} +{"info/global_step": 1219, "train_info/time_within_train_step": 2.824462652206421, "step": 1219} +{"train_info/time_between_train_steps": 0.006883144378662109, "step": 1219} +{"info/global_step": 1220, "train_info/time_within_train_step": 2.7218258380889893, "step": 1220} +{"train_info/time_between_train_steps": 0.0034220218658447266, "step": 1220} +{"info/global_step": 1221, "train_info/time_within_train_step": 2.6972758769989014, "step": 1221} +{"train_info/time_between_train_steps": 0.0034515857696533203, "step": 1221} +{"info/global_step": 1222, "train_info/time_within_train_step": 2.7257332801818848, "step": 1222} +{"train_info/time_between_train_steps": 0.0034537315368652344, "step": 1222} +{"info/global_step": 1223, "train_info/time_within_train_step": 2.796713352203369, "step": 1223} +{"train_info/time_between_train_steps": 0.003399372100830078, "step": 1223} +{"info/global_step": 1224, "train_info/time_within_train_step": 2.7469663619995117, "step": 1224} +{"train_info/time_between_train_steps": 0.003396272659301758, "step": 1224} +{"info/global_step": 1225, "train_info/time_within_train_step": 2.7588155269622803, "step": 1225} +{"train_info/time_between_train_steps": 0.0035009384155273438, "step": 1225} +{"info/global_step": 1226, "train_info/time_within_train_step": 2.832914352416992, "step": 1226} +{"train_info/time_between_train_steps": 0.003426790237426758, "step": 1226} +{"info/global_step": 1227, "train_info/time_within_train_step": 2.8074746131896973, "step": 1227} +{"train_info/time_between_train_steps": 0.0033960342407226562, "step": 1227} +{"info/global_step": 1228, "train_info/time_within_train_step": 2.760929822921753, "step": 1228} +{"train_info/time_between_train_steps": 0.0034220218658447266, "step": 1228} +{"info/global_step": 1229, "train_info/time_within_train_step": 2.8324570655822754, "step": 1229} +{"train_info/time_between_train_steps": 0.003356456756591797, "step": 1229} +{"info/global_step": 1230, "train_info/time_within_train_step": 2.835911989212036, "step": 1230} +{"train_info/time_between_train_steps": 0.003348827362060547, "step": 1230} +{"info/global_step": 1231, "train_info/time_within_train_step": 2.831559658050537, "step": 1231} +{"train_info/time_between_train_steps": 0.0034303665161132812, "step": 1231} +{"info/global_step": 1232, "train_info/time_within_train_step": 2.778573989868164, "step": 1232} +{"train_info/time_between_train_steps": 0.00342559814453125, "step": 1232} +{"info/global_step": 1233, "train_info/time_within_train_step": 2.7822885513305664, "step": 1233} +{"train_info/time_between_train_steps": 0.0033986568450927734, "step": 1233} +{"info/global_step": 1234, "train_info/time_within_train_step": 2.8666412830352783, "step": 1234} +{"train_info/time_between_train_steps": 0.0033457279205322266, "step": 1234} +{"info/global_step": 1235, "train_info/time_within_train_step": 3.1711854934692383, "step": 1235} +{"train_info/time_between_train_steps": 0.003209829330444336, "step": 1235} +{"info/global_step": 1236, "train_info/time_within_train_step": 2.6960947513580322, "step": 1236} +{"train_info/time_between_train_steps": 0.003286123275756836, "step": 1236} +{"info/global_step": 1237, "train_info/time_within_train_step": 2.7013583183288574, "step": 1237} +{"train_info/time_between_train_steps": 0.0032994747161865234, "step": 1237} +{"info/global_step": 1238, "train_info/time_within_train_step": 2.962599277496338, "step": 1238} +{"train_info/time_between_train_steps": 0.0032854080200195312, "step": 1238} +{"info/global_step": 1239, "train_info/time_within_train_step": 2.956484317779541, "step": 1239} +{"train_info/time_between_train_steps": 0.0032444000244140625, "step": 1239} +{"info/global_step": 1240, "train_info/time_within_train_step": 2.794055700302124, "step": 1240} +{"train_info/time_between_train_steps": 0.0032896995544433594, "step": 1240} +{"info/global_step": 1241, "train_info/time_within_train_step": 2.724590301513672, "step": 1241} +{"train_info/time_between_train_steps": 0.003348112106323242, "step": 1241} +{"info/global_step": 1242, "train_info/time_within_train_step": 2.8083953857421875, "step": 1242} +{"train_info/time_between_train_steps": 0.003232240676879883, "step": 1242} +{"info/global_step": 1243, "train_info/time_within_train_step": 2.84169340133667, "step": 1243} +{"train_info/time_between_train_steps": 0.003397226333618164, "step": 1243} +{"info/global_step": 1244, "train_info/time_within_train_step": 2.7950284481048584, "step": 1244} +{"train_info/time_between_train_steps": 0.0032958984375, "step": 1244} +{"info/global_step": 1245, "train_info/time_within_train_step": 2.699322462081909, "step": 1245} +{"train_info/time_between_train_steps": 0.003307342529296875, "step": 1245} +{"info/global_step": 1246, "train_info/time_within_train_step": 2.708019256591797, "step": 1246} +{"train_info/time_between_train_steps": 0.0032477378845214844, "step": 1246} +{"info/global_step": 1247, "train_info/time_within_train_step": 2.982058048248291, "step": 1247} +{"train_info/time_between_train_steps": 0.0033740997314453125, "step": 1247} +{"info/global_step": 1248, "train_info/time_within_train_step": 2.9543564319610596, "step": 1248} +{"train_info/time_between_train_steps": 0.0033330917358398438, "step": 1248} +{"info/global_step": 1249, "train_info/time_within_train_step": 2.778128147125244, "step": 1249} +{"train_info/time_between_train_steps": 0.003280162811279297, "step": 1249} +{"info/global_step": 1250, "train_info/time_within_train_step": 3.2609059810638428, "step": 1250} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746289847, "_runtime": 3869}, "step": 1250} +{"logs": {"train/loss": 5.0655, "train/learning_rate": 0.00038888888888888887, "train/epoch": 1.16, "_timestamp": 1746289847, "_runtime": 3869}, "step": 1250} +{"train_info/time_between_train_steps": 0.041810035705566406, "step": 1250} +{"info/global_step": 1251, "train_info/time_within_train_step": 2.6949970722198486, "step": 1251} +{"train_info/time_between_train_steps": 0.0033278465270996094, "step": 1251} +{"info/global_step": 1252, "train_info/time_within_train_step": 2.697296619415283, "step": 1252} +{"train_info/time_between_train_steps": 0.0034096240997314453, "step": 1252} +{"info/global_step": 1253, "train_info/time_within_train_step": 2.7170581817626953, "step": 1253} +{"train_info/time_between_train_steps": 0.003438711166381836, "step": 1253} +{"info/global_step": 1254, "train_info/time_within_train_step": 2.695946216583252, "step": 1254} +{"train_info/time_between_train_steps": 0.003491640090942383, "step": 1254} +{"info/global_step": 1255, "train_info/time_within_train_step": 2.6987671852111816, "step": 1255} +{"train_info/time_between_train_steps": 0.0035979747772216797, "step": 1255} +{"info/global_step": 1256, "train_info/time_within_train_step": 2.699312686920166, "step": 1256} +{"train_info/time_between_train_steps": 0.003523111343383789, "step": 1256} +{"info/global_step": 1257, "train_info/time_within_train_step": 2.699448823928833, "step": 1257} +{"train_info/time_between_train_steps": 0.003542184829711914, "step": 1257} +{"info/global_step": 1258, "train_info/time_within_train_step": 2.700132131576538, "step": 1258} +{"train_info/time_between_train_steps": 0.0035457611083984375, "step": 1258} +{"info/global_step": 1259, "train_info/time_within_train_step": 2.6996893882751465, "step": 1259} +{"train_info/time_between_train_steps": 0.003557920455932617, "step": 1259} +{"info/global_step": 1260, "train_info/time_within_train_step": 2.7776784896850586, "step": 1260} +{"train_info/time_between_train_steps": 0.0035240650177001953, "step": 1260} +{"info/global_step": 1261, "train_info/time_within_train_step": 2.9800736904144287, "step": 1261} +{"train_info/time_between_train_steps": 0.003665447235107422, "step": 1261} +{"info/global_step": 1262, "train_info/time_within_train_step": 2.7862772941589355, "step": 1262} +{"train_info/time_between_train_steps": 0.003545522689819336, "step": 1262} +{"info/global_step": 1263, "train_info/time_within_train_step": 2.6993753910064697, "step": 1263} +{"train_info/time_between_train_steps": 0.003541231155395508, "step": 1263} +{"info/global_step": 1264, "train_info/time_within_train_step": 2.6998085975646973, "step": 1264} +{"train_info/time_between_train_steps": 0.0035343170166015625, "step": 1264} +{"info/global_step": 1265, "train_info/time_within_train_step": 2.7424733638763428, "step": 1265} +{"train_info/time_between_train_steps": 0.0034928321838378906, "step": 1265} +{"info/global_step": 1266, "train_info/time_within_train_step": 2.6999402046203613, "step": 1266} +{"train_info/time_between_train_steps": 0.003442525863647461, "step": 1266} +{"info/global_step": 1267, "train_info/time_within_train_step": 2.7638516426086426, "step": 1267} +{"train_info/time_between_train_steps": 0.0034699440002441406, "step": 1267} +{"info/global_step": 1268, "train_info/time_within_train_step": 2.953946590423584, "step": 1268} +{"train_info/time_between_train_steps": 0.0034689903259277344, "step": 1268} +{"info/global_step": 1269, "train_info/time_within_train_step": 2.8238272666931152, "step": 1269} +{"train_info/time_between_train_steps": 0.00351715087890625, "step": 1269} +{"info/global_step": 1270, "train_info/time_within_train_step": 2.707087755203247, "step": 1270} +{"train_info/time_between_train_steps": 0.003487825393676758, "step": 1270} +{"info/global_step": 1271, "train_info/time_within_train_step": 2.714719533920288, "step": 1271} +{"train_info/time_between_train_steps": 0.0034990310668945312, "step": 1271} +{"info/global_step": 1272, "train_info/time_within_train_step": 2.7993886470794678, "step": 1272} +{"train_info/time_between_train_steps": 0.0034601688385009766, "step": 1272} +{"info/global_step": 1273, "train_info/time_within_train_step": 2.7587454319000244, "step": 1273} +{"train_info/time_between_train_steps": 0.003458261489868164, "step": 1273} +{"info/global_step": 1274, "train_info/time_within_train_step": 2.7570109367370605, "step": 1274} +{"train_info/time_between_train_steps": 0.0035195350646972656, "step": 1274} +{"info/global_step": 1275, "train_info/time_within_train_step": 2.725811719894409, "step": 1275} +{"train_info/time_between_train_steps": 0.0034933090209960938, "step": 1275} +{"info/global_step": 1276, "train_info/time_within_train_step": 2.7643814086914062, "step": 1276} +{"train_info/time_between_train_steps": 0.003507852554321289, "step": 1276} +{"info/global_step": 1277, "train_info/time_within_train_step": 2.7974884510040283, "step": 1277} +{"train_info/time_between_train_steps": 0.003454446792602539, "step": 1277} +{"info/global_step": 1278, "train_info/time_within_train_step": 2.7350893020629883, "step": 1278} +{"train_info/time_between_train_steps": 0.003560781478881836, "step": 1278} +{"info/global_step": 1279, "train_info/time_within_train_step": 2.7075908184051514, "step": 1279} +{"train_info/time_between_train_steps": 0.0035009384155273438, "step": 1279} +{"info/global_step": 1280, "train_info/time_within_train_step": 2.699110746383667, "step": 1280} +{"train_info/time_between_train_steps": 0.0034704208374023438, "step": 1280} +{"info/global_step": 1281, "train_info/time_within_train_step": 2.699192762374878, "step": 1281} +{"train_info/time_between_train_steps": 0.0034308433532714844, "step": 1281} +{"info/global_step": 1282, "train_info/time_within_train_step": 2.81329083442688, "step": 1282} +{"train_info/time_between_train_steps": 0.0035071372985839844, "step": 1282} +{"info/global_step": 1283, "train_info/time_within_train_step": 2.8810408115386963, "step": 1283} +{"train_info/time_between_train_steps": 0.003488779067993164, "step": 1283} +{"info/global_step": 1284, "train_info/time_within_train_step": 2.7648751735687256, "step": 1284} +{"train_info/time_between_train_steps": 0.003421783447265625, "step": 1284} +{"info/global_step": 1285, "train_info/time_within_train_step": 2.7010955810546875, "step": 1285} +{"train_info/time_between_train_steps": 0.0035212039947509766, "step": 1285} +{"info/global_step": 1286, "train_info/time_within_train_step": 2.7733654975891113, "step": 1286} +{"train_info/time_between_train_steps": 0.003640413284301758, "step": 1286} +{"info/global_step": 1287, "train_info/time_within_train_step": 2.7890121936798096, "step": 1287} +{"train_info/time_between_train_steps": 0.003565549850463867, "step": 1287} +{"info/global_step": 1288, "train_info/time_within_train_step": 2.7160263061523438, "step": 1288} +{"train_info/time_between_train_steps": 0.003566265106201172, "step": 1288} +{"info/global_step": 1289, "train_info/time_within_train_step": 2.7393085956573486, "step": 1289} +{"train_info/time_between_train_steps": 0.0035600662231445312, "step": 1289} +{"info/global_step": 1290, "train_info/time_within_train_step": 2.7503397464752197, "step": 1290} +{"train_info/time_between_train_steps": 0.003513813018798828, "step": 1290} +{"info/global_step": 1291, "train_info/time_within_train_step": 2.754979372024536, "step": 1291} +{"train_info/time_between_train_steps": 0.0036504268646240234, "step": 1291} +{"info/global_step": 1292, "train_info/time_within_train_step": 2.720931053161621, "step": 1292} +{"train_info/time_between_train_steps": 0.00370025634765625, "step": 1292} +{"info/global_step": 1293, "train_info/time_within_train_step": 2.7124786376953125, "step": 1293} +{"train_info/time_between_train_steps": 0.003478527069091797, "step": 1293} +{"info/global_step": 1294, "train_info/time_within_train_step": 2.7468807697296143, "step": 1294} +{"train_info/time_between_train_steps": 0.0034682750701904297, "step": 1294} +{"info/global_step": 1295, "train_info/time_within_train_step": 2.77284574508667, "step": 1295} +{"train_info/time_between_train_steps": 0.003414154052734375, "step": 1295} +{"info/global_step": 1296, "train_info/time_within_train_step": 2.7449252605438232, "step": 1296} +{"train_info/time_between_train_steps": 0.0035219192504882812, "step": 1296} +{"info/global_step": 1297, "train_info/time_within_train_step": 2.7323696613311768, "step": 1297} +{"train_info/time_between_train_steps": 0.003427743911743164, "step": 1297} +{"info/global_step": 1298, "train_info/time_within_train_step": 2.8360390663146973, "step": 1298} +{"train_info/time_between_train_steps": 0.0035049915313720703, "step": 1298} +{"info/global_step": 1299, "train_info/time_within_train_step": 2.723583221435547, "step": 1299} +{"train_info/time_between_train_steps": 0.0035245418548583984, "step": 1299} +{"info/global_step": 1300, "train_info/time_within_train_step": 2.7226667404174805, "step": 1300} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746289988, "_runtime": 4010}, "step": 1300} +{"logs": {"train/loss": 5.0278, "train/learning_rate": 0.00037777777777777777, "train/epoch": 1.18, "_timestamp": 1746289988, "_runtime": 4010}, "step": 1300} +{"train_info/time_between_train_steps": 13.94506287574768, "step": 1300} +{"info/global_step": 1301, "train_info/time_within_train_step": 2.471558094024658, "step": 1301} +{"train_info/time_between_train_steps": 0.0034928321838378906, "step": 1301} +{"info/global_step": 1302, "train_info/time_within_train_step": 2.5166306495666504, "step": 1302} +{"train_info/time_between_train_steps": 0.003446817398071289, "step": 1302} +{"info/global_step": 1303, "train_info/time_within_train_step": 2.6900036334991455, "step": 1303} +{"train_info/time_between_train_steps": 0.003504037857055664, "step": 1303} +{"info/global_step": 1304, "train_info/time_within_train_step": 2.6931393146514893, "step": 1304} +{"train_info/time_between_train_steps": 0.003613710403442383, "step": 1304} +{"info/global_step": 1305, "train_info/time_within_train_step": 2.694228172302246, "step": 1305} +{"train_info/time_between_train_steps": 0.003542184829711914, "step": 1305} +{"info/global_step": 1306, "train_info/time_within_train_step": 2.697204351425171, "step": 1306} +{"train_info/time_between_train_steps": 0.003575563430786133, "step": 1306} +{"info/global_step": 1307, "train_info/time_within_train_step": 2.698277711868286, "step": 1307} +{"train_info/time_between_train_steps": 0.0036432743072509766, "step": 1307} +{"info/global_step": 1308, "train_info/time_within_train_step": 2.9508681297302246, "step": 1308} +{"train_info/time_between_train_steps": 0.0036156177520751953, "step": 1308} +{"info/global_step": 1309, "train_info/time_within_train_step": 3.0102014541625977, "step": 1309} +{"train_info/time_between_train_steps": 0.0037841796875, "step": 1309} +{"info/global_step": 1310, "train_info/time_within_train_step": 2.9260306358337402, "step": 1310} +{"train_info/time_between_train_steps": 0.003791332244873047, "step": 1310} +{"info/global_step": 1311, "train_info/time_within_train_step": 2.699888229370117, "step": 1311} +{"train_info/time_between_train_steps": 0.0036041736602783203, "step": 1311} +{"info/global_step": 1312, "train_info/time_within_train_step": 2.6997129917144775, "step": 1312} +{"train_info/time_between_train_steps": 0.0036520957946777344, "step": 1312} +{"info/global_step": 1313, "train_info/time_within_train_step": 2.698122262954712, "step": 1313} +{"train_info/time_between_train_steps": 0.0035092830657958984, "step": 1313} +{"info/global_step": 1314, "train_info/time_within_train_step": 2.6971940994262695, "step": 1314} +{"train_info/time_between_train_steps": 0.0036525726318359375, "step": 1314} +{"info/global_step": 1315, "train_info/time_within_train_step": 2.9546139240264893, "step": 1315} +{"train_info/time_between_train_steps": 0.003297567367553711, "step": 1315} +{"info/global_step": 1316, "train_info/time_within_train_step": 2.6953229904174805, "step": 1316} +{"train_info/time_between_train_steps": 0.003316640853881836, "step": 1316} +{"info/global_step": 1317, "train_info/time_within_train_step": 2.696774959564209, "step": 1317} +{"train_info/time_between_train_steps": 0.003345489501953125, "step": 1317} +{"info/global_step": 1318, "train_info/time_within_train_step": 2.7174901962280273, "step": 1318} +{"train_info/time_between_train_steps": 0.003293752670288086, "step": 1318} +{"info/global_step": 1319, "train_info/time_within_train_step": 2.7935268878936768, "step": 1319} +{"train_info/time_between_train_steps": 0.0033044815063476562, "step": 1319} +{"info/global_step": 1320, "train_info/time_within_train_step": 2.9878764152526855, "step": 1320} +{"train_info/time_between_train_steps": 0.0033638477325439453, "step": 1320} +{"info/global_step": 1321, "train_info/time_within_train_step": 2.7472760677337646, "step": 1321} +{"train_info/time_between_train_steps": 0.0034351348876953125, "step": 1321} +{"info/global_step": 1322, "train_info/time_within_train_step": 2.6987476348876953, "step": 1322} +{"train_info/time_between_train_steps": 0.0037109851837158203, "step": 1322} +{"info/global_step": 1323, "train_info/time_within_train_step": 2.6981499195098877, "step": 1323} +{"train_info/time_between_train_steps": 0.0037064552307128906, "step": 1323} +{"info/global_step": 1324, "train_info/time_within_train_step": 2.696955442428589, "step": 1324} +{"train_info/time_between_train_steps": 0.0036745071411132812, "step": 1324} +{"info/global_step": 1325, "train_info/time_within_train_step": 2.7524499893188477, "step": 1325} +{"train_info/time_between_train_steps": 0.0036547183990478516, "step": 1325} +{"info/global_step": 1326, "train_info/time_within_train_step": 2.8545374870300293, "step": 1326} +{"train_info/time_between_train_steps": 0.0037691593170166016, "step": 1326} +{"info/global_step": 1327, "train_info/time_within_train_step": 2.7050466537475586, "step": 1327} +{"train_info/time_between_train_steps": 0.003549337387084961, "step": 1327} +{"info/global_step": 1328, "train_info/time_within_train_step": 2.6975860595703125, "step": 1328} +{"train_info/time_between_train_steps": 0.003601551055908203, "step": 1328} +{"info/global_step": 1329, "train_info/time_within_train_step": 2.697078227996826, "step": 1329} +{"train_info/time_between_train_steps": 0.0035948753356933594, "step": 1329} +{"info/global_step": 1330, "train_info/time_within_train_step": 2.725083351135254, "step": 1330} +{"train_info/time_between_train_steps": 0.003592252731323242, "step": 1330} +{"info/global_step": 1331, "train_info/time_within_train_step": 2.8593950271606445, "step": 1331} +{"train_info/time_between_train_steps": 0.00401759147644043, "step": 1331} +{"info/global_step": 1332, "train_info/time_within_train_step": 2.7653892040252686, "step": 1332} +{"train_info/time_between_train_steps": 0.0034966468811035156, "step": 1332} +{"info/global_step": 1333, "train_info/time_within_train_step": 2.7218785285949707, "step": 1333} +{"train_info/time_between_train_steps": 0.0036020278930664062, "step": 1333} +{"info/global_step": 1334, "train_info/time_within_train_step": 2.9369473457336426, "step": 1334} +{"train_info/time_between_train_steps": 0.003506183624267578, "step": 1334} +{"info/global_step": 1335, "train_info/time_within_train_step": 2.7123711109161377, "step": 1335} +{"train_info/time_between_train_steps": 0.003496885299682617, "step": 1335} +{"info/global_step": 1336, "train_info/time_within_train_step": 2.699683427810669, "step": 1336} +{"train_info/time_between_train_steps": 0.003519773483276367, "step": 1336} +{"info/global_step": 1337, "train_info/time_within_train_step": 2.806443452835083, "step": 1337} +{"train_info/time_between_train_steps": 0.0035195350646972656, "step": 1337} +{"info/global_step": 1338, "train_info/time_within_train_step": 2.8200440406799316, "step": 1338} +{"train_info/time_between_train_steps": 0.0035126209259033203, "step": 1338} +{"info/global_step": 1339, "train_info/time_within_train_step": 2.744959592819214, "step": 1339} +{"train_info/time_between_train_steps": 0.0035390853881835938, "step": 1339} +{"info/global_step": 1340, "train_info/time_within_train_step": 2.728914976119995, "step": 1340} +{"train_info/time_between_train_steps": 0.0038161277770996094, "step": 1340} +{"info/global_step": 1341, "train_info/time_within_train_step": 2.7616891860961914, "step": 1341} +{"train_info/time_between_train_steps": 0.0036749839782714844, "step": 1341} +{"info/global_step": 1342, "train_info/time_within_train_step": 2.768171548843384, "step": 1342} +{"train_info/time_between_train_steps": 0.003762960433959961, "step": 1342} +{"info/global_step": 1343, "train_info/time_within_train_step": 2.7003252506256104, "step": 1343} +{"train_info/time_between_train_steps": 0.0036122798919677734, "step": 1343} +{"info/global_step": 1344, "train_info/time_within_train_step": 2.758800745010376, "step": 1344} +{"train_info/time_between_train_steps": 0.003687143325805664, "step": 1344} +{"info/global_step": 1345, "train_info/time_within_train_step": 2.914173126220703, "step": 1345} +{"train_info/time_between_train_steps": 0.0035867691040039062, "step": 1345} +{"info/global_step": 1346, "train_info/time_within_train_step": 2.7141060829162598, "step": 1346} +{"train_info/time_between_train_steps": 0.0036437511444091797, "step": 1346} +{"info/global_step": 1347, "train_info/time_within_train_step": 2.697608232498169, "step": 1347} +{"train_info/time_between_train_steps": 0.003515481948852539, "step": 1347} +{"info/global_step": 1348, "train_info/time_within_train_step": 2.6999664306640625, "step": 1348} +{"train_info/time_between_train_steps": 0.0035767555236816406, "step": 1348} +{"info/global_step": 1349, "train_info/time_within_train_step": 2.8744139671325684, "step": 1349} +{"train_info/time_between_train_steps": 0.003493785858154297, "step": 1349} +{"info/global_step": 1350, "train_info/time_within_train_step": 2.882998466491699, "step": 1350} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746290143, "_runtime": 4165}, "step": 1350} +{"logs": {"train/loss": 4.9883, "train/learning_rate": 0.00036666666666666667, "train/epoch": 1.2, "_timestamp": 1746290143, "_runtime": 4165}, "step": 1350} +{"train_info/time_between_train_steps": 0.026781558990478516, "step": 1350} +{"info/global_step": 1351, "train_info/time_within_train_step": 2.77905535697937, "step": 1351} +{"train_info/time_between_train_steps": 0.003592967987060547, "step": 1351} +{"info/global_step": 1352, "train_info/time_within_train_step": 2.704848527908325, "step": 1352} +{"train_info/time_between_train_steps": 0.003674745559692383, "step": 1352} +{"info/global_step": 1353, "train_info/time_within_train_step": 2.7959940433502197, "step": 1353} +{"train_info/time_between_train_steps": 0.003616809844970703, "step": 1353} +{"info/global_step": 1354, "train_info/time_within_train_step": 2.713921546936035, "step": 1354} +{"train_info/time_between_train_steps": 0.0036058425903320312, "step": 1354} +{"info/global_step": 1355, "train_info/time_within_train_step": 2.739363193511963, "step": 1355} +{"train_info/time_between_train_steps": 0.003633260726928711, "step": 1355} +{"info/global_step": 1356, "train_info/time_within_train_step": 2.787179708480835, "step": 1356} +{"train_info/time_between_train_steps": 0.003632783889770508, "step": 1356} +{"info/global_step": 1357, "train_info/time_within_train_step": 2.8047878742218018, "step": 1357} +{"train_info/time_between_train_steps": 0.0036323070526123047, "step": 1357} +{"info/global_step": 1358, "train_info/time_within_train_step": 2.7470452785491943, "step": 1358} +{"train_info/time_between_train_steps": 0.0036039352416992188, "step": 1358} +{"info/global_step": 1359, "train_info/time_within_train_step": 2.744535446166992, "step": 1359} +{"train_info/time_between_train_steps": 0.003535032272338867, "step": 1359} +{"info/global_step": 1360, "train_info/time_within_train_step": 2.8347151279449463, "step": 1360} +{"train_info/time_between_train_steps": 0.0037271976470947266, "step": 1360} +{"info/global_step": 1361, "train_info/time_within_train_step": 2.750488519668579, "step": 1361} +{"train_info/time_between_train_steps": 0.0035016536712646484, "step": 1361} +{"info/global_step": 1362, "train_info/time_within_train_step": 2.727400064468384, "step": 1362} +{"train_info/time_between_train_steps": 0.0035903453826904297, "step": 1362} +{"info/global_step": 1363, "train_info/time_within_train_step": 2.8040878772735596, "step": 1363} +{"train_info/time_between_train_steps": 0.0036172866821289062, "step": 1363} +{"info/global_step": 1364, "train_info/time_within_train_step": 2.7421298027038574, "step": 1364} +{"train_info/time_between_train_steps": 0.003615140914916992, "step": 1364} +{"info/global_step": 1365, "train_info/time_within_train_step": 2.7285280227661133, "step": 1365} +{"train_info/time_between_train_steps": 0.0034813880920410156, "step": 1365} +{"info/global_step": 1366, "train_info/time_within_train_step": 2.7818992137908936, "step": 1366} +{"train_info/time_between_train_steps": 0.0036127567291259766, "step": 1366} +{"info/global_step": 1367, "train_info/time_within_train_step": 2.746792793273926, "step": 1367} +{"train_info/time_between_train_steps": 0.0036487579345703125, "step": 1367} +{"info/global_step": 1368, "train_info/time_within_train_step": 2.7114479541778564, "step": 1368} +{"train_info/time_between_train_steps": 0.0036563873291015625, "step": 1368} +{"info/global_step": 1369, "train_info/time_within_train_step": 2.7658467292785645, "step": 1369} +{"train_info/time_between_train_steps": 0.0034809112548828125, "step": 1369} +{"info/global_step": 1370, "train_info/time_within_train_step": 2.7573812007904053, "step": 1370} +{"train_info/time_between_train_steps": 0.003591299057006836, "step": 1370} +{"info/global_step": 1371, "train_info/time_within_train_step": 2.7188467979431152, "step": 1371} +{"train_info/time_between_train_steps": 0.0036826133728027344, "step": 1371} +{"info/global_step": 1372, "train_info/time_within_train_step": 2.758188009262085, "step": 1372} +{"train_info/time_between_train_steps": 0.0035223960876464844, "step": 1372} +{"info/global_step": 1373, "train_info/time_within_train_step": 2.747951030731201, "step": 1373} +{"train_info/time_between_train_steps": 0.0035545825958251953, "step": 1373} +{"info/global_step": 1374, "train_info/time_within_train_step": 2.744757890701294, "step": 1374} +{"train_info/time_between_train_steps": 0.003475189208984375, "step": 1374} +{"info/global_step": 1375, "train_info/time_within_train_step": 2.728712558746338, "step": 1375} +{"train_info/time_between_train_steps": 0.0034837722778320312, "step": 1375} +{"info/global_step": 1376, "train_info/time_within_train_step": 2.755145311355591, "step": 1376} +{"train_info/time_between_train_steps": 0.003458261489868164, "step": 1376} +{"info/global_step": 1377, "train_info/time_within_train_step": 2.733510732650757, "step": 1377} +{"train_info/time_between_train_steps": 0.003771543502807617, "step": 1377} +{"info/global_step": 1378, "train_info/time_within_train_step": 2.8012850284576416, "step": 1378} +{"train_info/time_between_train_steps": 0.003635883331298828, "step": 1378} +{"info/global_step": 1379, "train_info/time_within_train_step": 2.729642629623413, "step": 1379} +{"train_info/time_between_train_steps": 0.003621816635131836, "step": 1379} +{"info/global_step": 1380, "train_info/time_within_train_step": 2.7291979789733887, "step": 1380} +{"train_info/time_between_train_steps": 0.0038666725158691406, "step": 1380} +{"info/global_step": 1381, "train_info/time_within_train_step": 2.7033958435058594, "step": 1381} +{"train_info/time_between_train_steps": 0.003577709197998047, "step": 1381} +{"info/global_step": 1382, "train_info/time_within_train_step": 2.7031288146972656, "step": 1382} +{"train_info/time_between_train_steps": 0.004162788391113281, "step": 1382} +{"info/global_step": 1383, "train_info/time_within_train_step": 2.7476885318756104, "step": 1383} +{"train_info/time_between_train_steps": 0.003690481185913086, "step": 1383} +{"info/global_step": 1384, "train_info/time_within_train_step": 2.8088507652282715, "step": 1384} +{"train_info/time_between_train_steps": 0.0036842823028564453, "step": 1384} +{"info/global_step": 1385, "train_info/time_within_train_step": 2.7479560375213623, "step": 1385} +{"train_info/time_between_train_steps": 0.003640413284301758, "step": 1385} +{"info/global_step": 1386, "train_info/time_within_train_step": 2.70416259765625, "step": 1386} +{"train_info/time_between_train_steps": 0.0036652088165283203, "step": 1386} +{"info/global_step": 1387, "train_info/time_within_train_step": 2.7763314247131348, "step": 1387} +{"train_info/time_between_train_steps": 0.0036611557006835938, "step": 1387} +{"info/global_step": 1388, "train_info/time_within_train_step": 2.766808032989502, "step": 1388} +{"train_info/time_between_train_steps": 0.003515005111694336, "step": 1388} +{"info/global_step": 1389, "train_info/time_within_train_step": 2.7009665966033936, "step": 1389} +{"train_info/time_between_train_steps": 0.007010698318481445, "step": 1389} +{"info/global_step": 1390, "train_info/time_within_train_step": 2.834648370742798, "step": 1390} +{"train_info/time_between_train_steps": 0.003726959228515625, "step": 1390} +{"info/global_step": 1391, "train_info/time_within_train_step": 2.7930874824523926, "step": 1391} +{"train_info/time_between_train_steps": 0.003710031509399414, "step": 1391} +{"info/global_step": 1392, "train_info/time_within_train_step": 2.707324743270874, "step": 1392} +{"train_info/time_between_train_steps": 0.003649473190307617, "step": 1392} +{"info/global_step": 1393, "train_info/time_within_train_step": 2.744251251220703, "step": 1393} +{"train_info/time_between_train_steps": 0.0035026073455810547, "step": 1393} +{"info/global_step": 1394, "train_info/time_within_train_step": 2.7052111625671387, "step": 1394} +{"train_info/time_between_train_steps": 0.0036742687225341797, "step": 1394} +{"info/global_step": 1395, "train_info/time_within_train_step": 2.745804786682129, "step": 1395} +{"train_info/time_between_train_steps": 0.0036618709564208984, "step": 1395} +{"info/global_step": 1396, "train_info/time_within_train_step": 2.825761079788208, "step": 1396} +{"train_info/time_between_train_steps": 0.0035796165466308594, "step": 1396} +{"info/global_step": 1397, "train_info/time_within_train_step": 2.7408089637756348, "step": 1397} +{"train_info/time_between_train_steps": 0.003480672836303711, "step": 1397} +{"info/global_step": 1398, "train_info/time_within_train_step": 2.709652900695801, "step": 1398} +{"train_info/time_between_train_steps": 0.0036773681640625, "step": 1398} +{"info/global_step": 1399, "train_info/time_within_train_step": 2.8612663745880127, "step": 1399} +{"train_info/time_between_train_steps": 0.0036554336547851562, "step": 1399} +{"info/global_step": 1400, "train_info/time_within_train_step": 2.7565605640411377, "step": 1400} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746290282, "_runtime": 4304}, "step": 1400} +{"logs": {"train/loss": 4.9785, "train/learning_rate": 0.0003555555555555555, "train/epoch": 1.21, "_timestamp": 1746290282, "_runtime": 4304}, "step": 1400} +{"train_info/time_between_train_steps": 14.037198066711426, "step": 1400} +{"info/global_step": 1401, "train_info/time_within_train_step": 2.4828648567199707, "step": 1401} +{"train_info/time_between_train_steps": 0.0035212039947509766, "step": 1401} +{"info/global_step": 1402, "train_info/time_within_train_step": 2.5146472454071045, "step": 1402} +{"train_info/time_between_train_steps": 0.003529787063598633, "step": 1402} +{"info/global_step": 1403, "train_info/time_within_train_step": 2.6900365352630615, "step": 1403} +{"train_info/time_between_train_steps": 0.0035178661346435547, "step": 1403} +{"info/global_step": 1404, "train_info/time_within_train_step": 2.695392608642578, "step": 1404} +{"train_info/time_between_train_steps": 0.0037508010864257812, "step": 1404} +{"info/global_step": 1405, "train_info/time_within_train_step": 2.8686506748199463, "step": 1405} +{"train_info/time_between_train_steps": 0.003302335739135742, "step": 1405} +{"info/global_step": 1406, "train_info/time_within_train_step": 2.696430206298828, "step": 1406} +{"train_info/time_between_train_steps": 0.003336668014526367, "step": 1406} +{"info/global_step": 1407, "train_info/time_within_train_step": 2.6984140872955322, "step": 1407} +{"train_info/time_between_train_steps": 0.003459453582763672, "step": 1407} +{"info/global_step": 1408, "train_info/time_within_train_step": 2.9244277477264404, "step": 1408} +{"train_info/time_between_train_steps": 0.003450632095336914, "step": 1408} +{"info/global_step": 1409, "train_info/time_within_train_step": 2.9454469680786133, "step": 1409} +{"train_info/time_between_train_steps": 0.0034232139587402344, "step": 1409} +{"info/global_step": 1410, "train_info/time_within_train_step": 3.1174190044403076, "step": 1410} +{"train_info/time_between_train_steps": 0.0034487247467041016, "step": 1410} +{"info/global_step": 1411, "train_info/time_within_train_step": 2.773742198944092, "step": 1411} +{"train_info/time_between_train_steps": 0.0033965110778808594, "step": 1411} +{"info/global_step": 1412, "train_info/time_within_train_step": 2.6985433101654053, "step": 1412} +{"train_info/time_between_train_steps": 0.003376007080078125, "step": 1412} +{"info/global_step": 1413, "train_info/time_within_train_step": 2.698620319366455, "step": 1413} +{"train_info/time_between_train_steps": 0.003481149673461914, "step": 1413} +{"info/global_step": 1414, "train_info/time_within_train_step": 2.699918746948242, "step": 1414} +{"train_info/time_between_train_steps": 0.0036721229553222656, "step": 1414} +{"info/global_step": 1415, "train_info/time_within_train_step": 2.698547124862671, "step": 1415} +{"train_info/time_between_train_steps": 0.0037505626678466797, "step": 1415} +{"info/global_step": 1416, "train_info/time_within_train_step": 2.6985301971435547, "step": 1416} +{"train_info/time_between_train_steps": 0.0035886764526367188, "step": 1416} +{"info/global_step": 1417, "train_info/time_within_train_step": 2.7342612743377686, "step": 1417} +{"train_info/time_between_train_steps": 0.003681182861328125, "step": 1417} +{"info/global_step": 1418, "train_info/time_within_train_step": 2.821291446685791, "step": 1418} +{"train_info/time_between_train_steps": 0.003677845001220703, "step": 1418} +{"info/global_step": 1419, "train_info/time_within_train_step": 3.0254154205322266, "step": 1419} +{"train_info/time_between_train_steps": 0.0035178661346435547, "step": 1419} +{"info/global_step": 1420, "train_info/time_within_train_step": 2.746112823486328, "step": 1420} +{"train_info/time_between_train_steps": 0.0037627220153808594, "step": 1420} +{"info/global_step": 1421, "train_info/time_within_train_step": 2.702174186706543, "step": 1421} +{"train_info/time_between_train_steps": 0.003766775131225586, "step": 1421} +{"info/global_step": 1422, "train_info/time_within_train_step": 2.6998536586761475, "step": 1422} +{"train_info/time_between_train_steps": 0.0037326812744140625, "step": 1422} +{"info/global_step": 1423, "train_info/time_within_train_step": 2.698410749435425, "step": 1423} +{"train_info/time_between_train_steps": 0.0036339759826660156, "step": 1423} +{"info/global_step": 1424, "train_info/time_within_train_step": 2.7034003734588623, "step": 1424} +{"train_info/time_between_train_steps": 0.0036427974700927734, "step": 1424} +{"info/global_step": 1425, "train_info/time_within_train_step": 2.8375535011291504, "step": 1425} +{"train_info/time_between_train_steps": 0.0036072731018066406, "step": 1425} +{"info/global_step": 1426, "train_info/time_within_train_step": 2.805759906768799, "step": 1426} +{"train_info/time_between_train_steps": 0.0035371780395507812, "step": 1426} +{"info/global_step": 1427, "train_info/time_within_train_step": 2.743265151977539, "step": 1427} +{"train_info/time_between_train_steps": 0.003551959991455078, "step": 1427} +{"info/global_step": 1428, "train_info/time_within_train_step": 2.75526762008667, "step": 1428} +{"train_info/time_between_train_steps": 0.0036618709564208984, "step": 1428} +{"info/global_step": 1429, "train_info/time_within_train_step": 2.733139753341675, "step": 1429} +{"train_info/time_between_train_steps": 0.003512144088745117, "step": 1429} +{"info/global_step": 1430, "train_info/time_within_train_step": 2.7317018508911133, "step": 1430} +{"train_info/time_between_train_steps": 0.003606081008911133, "step": 1430} +{"info/global_step": 1431, "train_info/time_within_train_step": 2.798447608947754, "step": 1431} +{"train_info/time_between_train_steps": 0.003686189651489258, "step": 1431} +{"info/global_step": 1432, "train_info/time_within_train_step": 2.7348079681396484, "step": 1432} +{"train_info/time_between_train_steps": 0.003609895706176758, "step": 1432} +{"info/global_step": 1433, "train_info/time_within_train_step": 2.759796380996704, "step": 1433} +{"train_info/time_between_train_steps": 0.003637075424194336, "step": 1433} +{"info/global_step": 1434, "train_info/time_within_train_step": 2.835587739944458, "step": 1434} +{"train_info/time_between_train_steps": 0.003711223602294922, "step": 1434} +{"info/global_step": 1435, "train_info/time_within_train_step": 2.739504814147949, "step": 1435} +{"train_info/time_between_train_steps": 0.003605365753173828, "step": 1435} +{"info/global_step": 1436, "train_info/time_within_train_step": 2.710986852645874, "step": 1436} +{"train_info/time_between_train_steps": 0.0035729408264160156, "step": 1436} +{"info/global_step": 1437, "train_info/time_within_train_step": 2.820033311843872, "step": 1437} +{"train_info/time_between_train_steps": 0.0036008358001708984, "step": 1437} +{"info/global_step": 1438, "train_info/time_within_train_step": 2.758028268814087, "step": 1438} +{"train_info/time_between_train_steps": 0.003719329833984375, "step": 1438} +{"info/global_step": 1439, "train_info/time_within_train_step": 2.761460304260254, "step": 1439} +{"train_info/time_between_train_steps": 0.003799915313720703, "step": 1439} +{"info/global_step": 1440, "train_info/time_within_train_step": 2.765073537826538, "step": 1440} +{"train_info/time_between_train_steps": 0.0037069320678710938, "step": 1440} +{"info/global_step": 1441, "train_info/time_within_train_step": 2.812427282333374, "step": 1441} +{"train_info/time_between_train_steps": 0.003627777099609375, "step": 1441} +{"info/global_step": 1442, "train_info/time_within_train_step": 2.734422445297241, "step": 1442} +{"train_info/time_between_train_steps": 0.003625154495239258, "step": 1442} +{"info/global_step": 1443, "train_info/time_within_train_step": 2.7532260417938232, "step": 1443} +{"train_info/time_between_train_steps": 0.0036313533782958984, "step": 1443} +{"info/global_step": 1444, "train_info/time_within_train_step": 2.8465170860290527, "step": 1444} +{"train_info/time_between_train_steps": 0.0037038326263427734, "step": 1444} +{"info/global_step": 1445, "train_info/time_within_train_step": 2.813739061355591, "step": 1445} +{"train_info/time_between_train_steps": 0.003622293472290039, "step": 1445} +{"info/global_step": 1446, "train_info/time_within_train_step": 2.7462592124938965, "step": 1446} +{"train_info/time_between_train_steps": 0.0036749839782714844, "step": 1446} +{"info/global_step": 1447, "train_info/time_within_train_step": 2.7174129486083984, "step": 1447} +{"train_info/time_between_train_steps": 0.003630399703979492, "step": 1447} +{"info/global_step": 1448, "train_info/time_within_train_step": 2.7997500896453857, "step": 1448} +{"train_info/time_between_train_steps": 0.0037479400634765625, "step": 1448} +{"info/global_step": 1449, "train_info/time_within_train_step": 2.7257564067840576, "step": 1449} +{"train_info/time_between_train_steps": 0.0037016868591308594, "step": 1449} +{"info/global_step": 1450, "train_info/time_within_train_step": 2.702202081680298, "step": 1450} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746290437, "_runtime": 4459}, "step": 1450} +{"logs": {"train/loss": 4.95, "train/learning_rate": 0.0003444444444444444, "train/epoch": 1.23, "_timestamp": 1746290437, "_runtime": 4459}, "step": 1450} +{"train_info/time_between_train_steps": 0.02955770492553711, "step": 1450} +{"info/global_step": 1451, "train_info/time_within_train_step": 2.7385902404785156, "step": 1451} +{"train_info/time_between_train_steps": 0.003799915313720703, "step": 1451} +{"info/global_step": 1452, "train_info/time_within_train_step": 2.75948429107666, "step": 1452} +{"train_info/time_between_train_steps": 0.003648042678833008, "step": 1452} +{"info/global_step": 1453, "train_info/time_within_train_step": 2.735647439956665, "step": 1453} +{"train_info/time_between_train_steps": 0.003856658935546875, "step": 1453} +{"info/global_step": 1454, "train_info/time_within_train_step": 2.7321152687072754, "step": 1454} +{"train_info/time_between_train_steps": 0.0037615299224853516, "step": 1454} +{"info/global_step": 1455, "train_info/time_within_train_step": 2.7008118629455566, "step": 1455} +{"train_info/time_between_train_steps": 0.00360107421875, "step": 1455} +{"info/global_step": 1456, "train_info/time_within_train_step": 2.6983726024627686, "step": 1456} +{"train_info/time_between_train_steps": 0.0037500858306884766, "step": 1456} +{"info/global_step": 1457, "train_info/time_within_train_step": 2.6990814208984375, "step": 1457} +{"train_info/time_between_train_steps": 0.003543853759765625, "step": 1457} +{"info/global_step": 1458, "train_info/time_within_train_step": 2.860384941101074, "step": 1458} +{"train_info/time_between_train_steps": 0.003468036651611328, "step": 1458} +{"info/global_step": 1459, "train_info/time_within_train_step": 2.8661251068115234, "step": 1459} +{"train_info/time_between_train_steps": 0.0035219192504882812, "step": 1459} +{"info/global_step": 1460, "train_info/time_within_train_step": 2.766216516494751, "step": 1460} +{"train_info/time_between_train_steps": 0.0036373138427734375, "step": 1460} +{"info/global_step": 1461, "train_info/time_within_train_step": 2.699500799179077, "step": 1461} +{"train_info/time_between_train_steps": 0.003530740737915039, "step": 1461} +{"info/global_step": 1462, "train_info/time_within_train_step": 2.748518943786621, "step": 1462} +{"train_info/time_between_train_steps": 0.0037300586700439453, "step": 1462} +{"info/global_step": 1463, "train_info/time_within_train_step": 2.712015151977539, "step": 1463} +{"train_info/time_between_train_steps": 0.0035321712493896484, "step": 1463} +{"info/global_step": 1464, "train_info/time_within_train_step": 2.700331926345825, "step": 1464} +{"train_info/time_between_train_steps": 0.003587484359741211, "step": 1464} +{"info/global_step": 1465, "train_info/time_within_train_step": 2.7643942832946777, "step": 1465} +{"train_info/time_between_train_steps": 0.003555774688720703, "step": 1465} +{"info/global_step": 1466, "train_info/time_within_train_step": 2.7688839435577393, "step": 1466} +{"train_info/time_between_train_steps": 0.0035953521728515625, "step": 1466} +{"info/global_step": 1467, "train_info/time_within_train_step": 2.7134265899658203, "step": 1467} +{"train_info/time_between_train_steps": 0.003609895706176758, "step": 1467} +{"info/global_step": 1468, "train_info/time_within_train_step": 2.704686164855957, "step": 1468} +{"train_info/time_between_train_steps": 0.003459930419921875, "step": 1468} +{"info/global_step": 1469, "train_info/time_within_train_step": 2.733036994934082, "step": 1469} +{"train_info/time_between_train_steps": 0.003533601760864258, "step": 1469} +{"info/global_step": 1470, "train_info/time_within_train_step": 2.850074052810669, "step": 1470} +{"train_info/time_between_train_steps": 0.003609180450439453, "step": 1470} +{"info/global_step": 1471, "train_info/time_within_train_step": 2.7597873210906982, "step": 1471} +{"train_info/time_between_train_steps": 0.003699779510498047, "step": 1471} +{"info/global_step": 1472, "train_info/time_within_train_step": 2.702465057373047, "step": 1472} +{"train_info/time_between_train_steps": 0.0035982131958007812, "step": 1472} +{"info/global_step": 1473, "train_info/time_within_train_step": 2.7123727798461914, "step": 1473} +{"train_info/time_between_train_steps": 0.0036127567291259766, "step": 1473} +{"info/global_step": 1474, "train_info/time_within_train_step": 2.812727212905884, "step": 1474} +{"train_info/time_between_train_steps": 0.0035064220428466797, "step": 1474} +{"info/global_step": 1475, "train_info/time_within_train_step": 2.7636544704437256, "step": 1475} +{"train_info/time_between_train_steps": 0.0035736560821533203, "step": 1475} +{"info/global_step": 1476, "train_info/time_within_train_step": 2.7005741596221924, "step": 1476} +{"train_info/time_between_train_steps": 0.0035495758056640625, "step": 1476} +{"info/global_step": 1477, "train_info/time_within_train_step": 2.7273612022399902, "step": 1477} +{"train_info/time_between_train_steps": 0.0035123825073242188, "step": 1477} +{"info/global_step": 1478, "train_info/time_within_train_step": 2.7850873470306396, "step": 1478} +{"train_info/time_between_train_steps": 0.0034186840057373047, "step": 1478} +{"info/global_step": 1479, "train_info/time_within_train_step": 2.7250890731811523, "step": 1479} +{"train_info/time_between_train_steps": 0.0034432411193847656, "step": 1479} +{"info/global_step": 1480, "train_info/time_within_train_step": 2.7195513248443604, "step": 1480} +{"train_info/time_between_train_steps": 0.003547191619873047, "step": 1480} +{"info/global_step": 1481, "train_info/time_within_train_step": 2.744624376296997, "step": 1481} +{"train_info/time_between_train_steps": 0.0035200119018554688, "step": 1481} +{"info/global_step": 1482, "train_info/time_within_train_step": 2.7204513549804688, "step": 1482} +{"train_info/time_between_train_steps": 0.003548860549926758, "step": 1482} +{"info/global_step": 1483, "train_info/time_within_train_step": 2.7263057231903076, "step": 1483} +{"train_info/time_between_train_steps": 0.00337982177734375, "step": 1483} +{"info/global_step": 1484, "train_info/time_within_train_step": 2.732583522796631, "step": 1484} +{"train_info/time_between_train_steps": 0.003459453582763672, "step": 1484} +{"info/global_step": 1485, "train_info/time_within_train_step": 2.7274231910705566, "step": 1485} +{"train_info/time_between_train_steps": 0.0033845901489257812, "step": 1485} +{"info/global_step": 1486, "train_info/time_within_train_step": 2.8262405395507812, "step": 1486} +{"train_info/time_between_train_steps": 0.003665447235107422, "step": 1486} +{"info/global_step": 1487, "train_info/time_within_train_step": 2.7052199840545654, "step": 1487} +{"train_info/time_between_train_steps": 0.003463268280029297, "step": 1487} +{"info/global_step": 1488, "train_info/time_within_train_step": 2.7023680210113525, "step": 1488} +{"train_info/time_between_train_steps": 0.003601551055908203, "step": 1488} +{"info/global_step": 1489, "train_info/time_within_train_step": 2.7002463340759277, "step": 1489} +{"train_info/time_between_train_steps": 0.003486156463623047, "step": 1489} +{"info/global_step": 1490, "train_info/time_within_train_step": 2.733806610107422, "step": 1490} +{"train_info/time_between_train_steps": 0.0035271644592285156, "step": 1490} +{"info/global_step": 1491, "train_info/time_within_train_step": 2.8835246562957764, "step": 1491} +{"train_info/time_between_train_steps": 0.003517627716064453, "step": 1491} +{"info/global_step": 1492, "train_info/time_within_train_step": 2.7231040000915527, "step": 1492} +{"train_info/time_between_train_steps": 0.003524303436279297, "step": 1492} +{"info/global_step": 1493, "train_info/time_within_train_step": 2.699467182159424, "step": 1493} +{"train_info/time_between_train_steps": 0.0035467147827148438, "step": 1493} +{"info/global_step": 1494, "train_info/time_within_train_step": 2.6998238563537598, "step": 1494} +{"train_info/time_between_train_steps": 0.003614187240600586, "step": 1494} +{"info/global_step": 1495, "train_info/time_within_train_step": 2.77663516998291, "step": 1495} +{"train_info/time_between_train_steps": 0.003595590591430664, "step": 1495} +{"info/global_step": 1496, "train_info/time_within_train_step": 2.850938558578491, "step": 1496} +{"train_info/time_between_train_steps": 0.0035681724548339844, "step": 1496} +{"info/global_step": 1497, "train_info/time_within_train_step": 2.7343175411224365, "step": 1497} +{"train_info/time_between_train_steps": 0.0038406848907470703, "step": 1497} +{"info/global_step": 1498, "train_info/time_within_train_step": 2.7619547843933105, "step": 1498} +{"train_info/time_between_train_steps": 0.003517627716064453, "step": 1498} +{"info/global_step": 1499, "train_info/time_within_train_step": 2.699042558670044, "step": 1499} +{"train_info/time_between_train_steps": 0.003692626953125, "step": 1499} +{"info/global_step": 1500, "train_info/time_within_train_step": 3.301513910293579, "step": 1500} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746290577, "_runtime": 4599}, "step": 1500} +{"logs": {"train/loss": 4.9236, "train/learning_rate": 0.0003333333333333333, "train/epoch": 1.25, "_timestamp": 1746290577, "_runtime": 4599}, "step": 1500} +{"train_info/time_between_train_steps": 14.678784847259521, "step": 1500} +{"info/global_step": 1501, "train_info/time_within_train_step": 2.4859323501586914, "step": 1501} +{"train_info/time_between_train_steps": 0.003991365432739258, "step": 1501} +{"info/global_step": 1502, "train_info/time_within_train_step": 2.503350019454956, "step": 1502} +{"train_info/time_between_train_steps": 0.004140377044677734, "step": 1502} +{"info/global_step": 1503, "train_info/time_within_train_step": 2.6840901374816895, "step": 1503} +{"train_info/time_between_train_steps": 0.0038352012634277344, "step": 1503} +{"info/global_step": 1504, "train_info/time_within_train_step": 2.7038824558258057, "step": 1504} +{"train_info/time_between_train_steps": 0.0043430328369140625, "step": 1504} +{"info/global_step": 1505, "train_info/time_within_train_step": 2.6969199180603027, "step": 1505} +{"train_info/time_between_train_steps": 0.00787496566772461, "step": 1505} +{"info/global_step": 1506, "train_info/time_within_train_step": 2.69840407371521, "step": 1506} +{"train_info/time_between_train_steps": 0.007822275161743164, "step": 1506} +{"info/global_step": 1507, "train_info/time_within_train_step": 2.699773073196411, "step": 1507} +{"train_info/time_between_train_steps": 0.007608175277709961, "step": 1507} +{"info/global_step": 1508, "train_info/time_within_train_step": 2.863093376159668, "step": 1508} +{"train_info/time_between_train_steps": 0.0042896270751953125, "step": 1508} +{"info/global_step": 1509, "train_info/time_within_train_step": 3.0318000316619873, "step": 1509} +{"train_info/time_between_train_steps": 0.0040247440338134766, "step": 1509} +{"info/global_step": 1510, "train_info/time_within_train_step": 3.072175979614258, "step": 1510} +{"train_info/time_between_train_steps": 0.004189729690551758, "step": 1510} +{"info/global_step": 1511, "train_info/time_within_train_step": 2.7288620471954346, "step": 1511} +{"train_info/time_between_train_steps": 0.0040130615234375, "step": 1511} +{"info/global_step": 1512, "train_info/time_within_train_step": 2.7003607749938965, "step": 1512} +{"train_info/time_between_train_steps": 0.004193782806396484, "step": 1512} +{"info/global_step": 1513, "train_info/time_within_train_step": 2.702228307723999, "step": 1513} +{"train_info/time_between_train_steps": 0.004046201705932617, "step": 1513} +{"info/global_step": 1514, "train_info/time_within_train_step": 2.701936721801758, "step": 1514} +{"train_info/time_between_train_steps": 0.004069805145263672, "step": 1514} +{"info/global_step": 1515, "train_info/time_within_train_step": 2.702829599380493, "step": 1515} +{"train_info/time_between_train_steps": 0.004183769226074219, "step": 1515} +{"info/global_step": 1516, "train_info/time_within_train_step": 2.7395071983337402, "step": 1516} +{"train_info/time_between_train_steps": 0.004568576812744141, "step": 1516} +{"train_info/time_between_train_steps": 3.0999655723571777, "step": 1516} +{"info/global_step": 1517, "train_info/time_within_train_step": 2.7229089736938477, "step": 1517} +{"train_info/time_between_train_steps": 0.003516674041748047, "step": 1517} +{"info/global_step": 1518, "train_info/time_within_train_step": 2.9207520484924316, "step": 1518} +{"train_info/time_between_train_steps": 0.003544330596923828, "step": 1518} +{"info/global_step": 1519, "train_info/time_within_train_step": 2.6958391666412354, "step": 1519} +{"train_info/time_between_train_steps": 0.003511667251586914, "step": 1519} +{"info/global_step": 1520, "train_info/time_within_train_step": 2.6974592208862305, "step": 1520} +{"train_info/time_between_train_steps": 0.0035758018493652344, "step": 1520} +{"info/global_step": 1521, "train_info/time_within_train_step": 2.6963229179382324, "step": 1521} +{"train_info/time_between_train_steps": 0.003674745559692383, "step": 1521} +{"info/global_step": 1522, "train_info/time_within_train_step": 2.696559190750122, "step": 1522} +{"train_info/time_between_train_steps": 0.003713846206665039, "step": 1522} +{"info/global_step": 1523, "train_info/time_within_train_step": 2.7024779319763184, "step": 1523} +{"train_info/time_between_train_steps": 0.003572702407836914, "step": 1523} +{"info/global_step": 1524, "train_info/time_within_train_step": 2.69789457321167, "step": 1524} +{"train_info/time_between_train_steps": 0.003533601760864258, "step": 1524} +{"info/global_step": 1525, "train_info/time_within_train_step": 2.698457956314087, "step": 1525} +{"train_info/time_between_train_steps": 0.003597736358642578, "step": 1525} +{"info/global_step": 1526, "train_info/time_within_train_step": 2.6989903450012207, "step": 1526} +{"train_info/time_between_train_steps": 0.0036253929138183594, "step": 1526} +{"info/global_step": 1527, "train_info/time_within_train_step": 2.701202154159546, "step": 1527} +{"train_info/time_between_train_steps": 0.003729104995727539, "step": 1527} +{"info/global_step": 1528, "train_info/time_within_train_step": 2.769209861755371, "step": 1528} +{"train_info/time_between_train_steps": 0.00411224365234375, "step": 1528} +{"info/global_step": 1529, "train_info/time_within_train_step": 2.8261265754699707, "step": 1529} +{"train_info/time_between_train_steps": 0.004159688949584961, "step": 1529} +{"info/global_step": 1530, "train_info/time_within_train_step": 3.005600929260254, "step": 1530} +{"train_info/time_between_train_steps": 0.003924131393432617, "step": 1530} +{"info/global_step": 1531, "train_info/time_within_train_step": 2.7353782653808594, "step": 1531} +{"train_info/time_between_train_steps": 0.00407862663269043, "step": 1531} +{"info/global_step": 1532, "train_info/time_within_train_step": 2.700800657272339, "step": 1532} +{"train_info/time_between_train_steps": 0.0038607120513916016, "step": 1532} +{"info/global_step": 1533, "train_info/time_within_train_step": 2.699491262435913, "step": 1533} +{"train_info/time_between_train_steps": 0.0038423538208007812, "step": 1533} +{"info/global_step": 1534, "train_info/time_within_train_step": 2.701089859008789, "step": 1534} +{"train_info/time_between_train_steps": 0.0039403438568115234, "step": 1534} +{"info/global_step": 1535, "train_info/time_within_train_step": 2.7037670612335205, "step": 1535} +{"train_info/time_between_train_steps": 0.003975629806518555, "step": 1535} +{"info/global_step": 1536, "train_info/time_within_train_step": 2.7151544094085693, "step": 1536} +{"train_info/time_between_train_steps": 0.0040683746337890625, "step": 1536} +{"info/global_step": 1537, "train_info/time_within_train_step": 2.918778657913208, "step": 1537} +{"train_info/time_between_train_steps": 0.0045130252838134766, "step": 1537} +{"info/global_step": 1538, "train_info/time_within_train_step": 2.9552903175354004, "step": 1538} +{"train_info/time_between_train_steps": 0.003810882568359375, "step": 1538} +{"info/global_step": 1539, "train_info/time_within_train_step": 2.7081851959228516, "step": 1539} +{"train_info/time_between_train_steps": 0.004010915756225586, "step": 1539} +{"info/global_step": 1540, "train_info/time_within_train_step": 2.7028164863586426, "step": 1540} +{"train_info/time_between_train_steps": 0.003993034362792969, "step": 1540} +{"info/global_step": 1541, "train_info/time_within_train_step": 2.7019567489624023, "step": 1541} +{"train_info/time_between_train_steps": 0.0038826465606689453, "step": 1541} +{"info/global_step": 1542, "train_info/time_within_train_step": 2.7003226280212402, "step": 1542} +{"train_info/time_between_train_steps": 0.0037865638732910156, "step": 1542} +{"info/global_step": 1543, "train_info/time_within_train_step": 2.768364429473877, "step": 1543} +{"train_info/time_between_train_steps": 0.003835916519165039, "step": 1543} +{"info/global_step": 1544, "train_info/time_within_train_step": 2.9687628746032715, "step": 1544} +{"train_info/time_between_train_steps": 0.0037946701049804688, "step": 1544} +{"info/global_step": 1545, "train_info/time_within_train_step": 2.8186144828796387, "step": 1545} +{"train_info/time_between_train_steps": 0.003798961639404297, "step": 1545} +{"info/global_step": 1546, "train_info/time_within_train_step": 2.7020246982574463, "step": 1546} +{"train_info/time_between_train_steps": 0.0038139820098876953, "step": 1546} +{"info/global_step": 1547, "train_info/time_within_train_step": 2.69901180267334, "step": 1547} +{"train_info/time_between_train_steps": 0.0037164688110351562, "step": 1547} +{"info/global_step": 1548, "train_info/time_within_train_step": 2.7588629722595215, "step": 1548} +{"train_info/time_between_train_steps": 0.0037081241607666016, "step": 1548} +{"info/global_step": 1549, "train_info/time_within_train_step": 2.945976734161377, "step": 1549} +{"train_info/time_between_train_steps": 0.003638029098510742, "step": 1549} +{"info/global_step": 1550, "train_info/time_within_train_step": 2.740553379058838, "step": 1550} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746290735, "_runtime": 4757}, "step": 1550} +{"logs": {"train/loss": 4.9317, "train/learning_rate": 0.0003222222222222222, "train/epoch": 2.01, "_timestamp": 1746290735, "_runtime": 4757}, "step": 1550} +{"train_info/time_between_train_steps": 0.02434062957763672, "step": 1550} +{"info/global_step": 1551, "train_info/time_within_train_step": 2.6996757984161377, "step": 1551} +{"train_info/time_between_train_steps": 0.0037491321563720703, "step": 1551} +{"info/global_step": 1552, "train_info/time_within_train_step": 2.747070789337158, "step": 1552} +{"train_info/time_between_train_steps": 0.003713369369506836, "step": 1552} +{"info/global_step": 1553, "train_info/time_within_train_step": 2.938610076904297, "step": 1553} +{"train_info/time_between_train_steps": 0.003741741180419922, "step": 1553} +{"info/global_step": 1554, "train_info/time_within_train_step": 2.820486307144165, "step": 1554} +{"train_info/time_between_train_steps": 0.0038993358612060547, "step": 1554} +{"info/global_step": 1555, "train_info/time_within_train_step": 2.7131428718566895, "step": 1555} +{"train_info/time_between_train_steps": 0.0038268566131591797, "step": 1555} +{"info/global_step": 1556, "train_info/time_within_train_step": 2.7024648189544678, "step": 1556} +{"train_info/time_between_train_steps": 0.0038263797760009766, "step": 1556} +{"info/global_step": 1557, "train_info/time_within_train_step": 3.020078182220459, "step": 1557} +{"train_info/time_between_train_steps": 0.003698587417602539, "step": 1557} +{"info/global_step": 1558, "train_info/time_within_train_step": 2.698301076889038, "step": 1558} +{"train_info/time_between_train_steps": 0.0036020278930664062, "step": 1558} +{"info/global_step": 1559, "train_info/time_within_train_step": 2.6979458332061768, "step": 1559} +{"train_info/time_between_train_steps": 0.0035767555236816406, "step": 1559} +{"info/global_step": 1560, "train_info/time_within_train_step": 2.7871010303497314, "step": 1560} +{"train_info/time_between_train_steps": 0.003641366958618164, "step": 1560} +{"info/global_step": 1561, "train_info/time_within_train_step": 2.867324113845825, "step": 1561} +{"train_info/time_between_train_steps": 0.0039179325103759766, "step": 1561} +{"info/global_step": 1562, "train_info/time_within_train_step": 2.752986192703247, "step": 1562} +{"train_info/time_between_train_steps": 0.003566741943359375, "step": 1562} +{"info/global_step": 1563, "train_info/time_within_train_step": 2.6987714767456055, "step": 1563} +{"train_info/time_between_train_steps": 0.003572225570678711, "step": 1563} +{"info/global_step": 1564, "train_info/time_within_train_step": 2.7041099071502686, "step": 1564} +{"train_info/time_between_train_steps": 0.0035982131958007812, "step": 1564} +{"info/global_step": 1565, "train_info/time_within_train_step": 2.7207460403442383, "step": 1565} +{"train_info/time_between_train_steps": 0.0035495758056640625, "step": 1565} +{"info/global_step": 1566, "train_info/time_within_train_step": 2.7350516319274902, "step": 1566} +{"train_info/time_between_train_steps": 0.0035827159881591797, "step": 1566} +{"info/global_step": 1567, "train_info/time_within_train_step": 2.8027145862579346, "step": 1567} +{"train_info/time_between_train_steps": 0.003628969192504883, "step": 1567} +{"info/global_step": 1568, "train_info/time_within_train_step": 2.7695391178131104, "step": 1568} +{"train_info/time_between_train_steps": 0.0035858154296875, "step": 1568} +{"info/global_step": 1569, "train_info/time_within_train_step": 2.7148566246032715, "step": 1569} +{"train_info/time_between_train_steps": 0.0036497116088867188, "step": 1569} +{"info/global_step": 1570, "train_info/time_within_train_step": 2.777218818664551, "step": 1570} +{"train_info/time_between_train_steps": 0.0035674571990966797, "step": 1570} +{"info/global_step": 1571, "train_info/time_within_train_step": 2.810257911682129, "step": 1571} +{"train_info/time_between_train_steps": 0.00356292724609375, "step": 1571} +{"info/global_step": 1572, "train_info/time_within_train_step": 2.705352783203125, "step": 1572} +{"train_info/time_between_train_steps": 0.0036618709564208984, "step": 1572} +{"info/global_step": 1573, "train_info/time_within_train_step": 2.6999146938323975, "step": 1573} +{"train_info/time_between_train_steps": 0.0036423206329345703, "step": 1573} +{"info/global_step": 1574, "train_info/time_within_train_step": 2.699758291244507, "step": 1574} +{"train_info/time_between_train_steps": 0.0036547183990478516, "step": 1574} +{"info/global_step": 1575, "train_info/time_within_train_step": 2.772972583770752, "step": 1575} +{"train_info/time_between_train_steps": 0.00363922119140625, "step": 1575} +{"info/global_step": 1576, "train_info/time_within_train_step": 2.92429518699646, "step": 1576} +{"train_info/time_between_train_steps": 0.0035681724548339844, "step": 1576} +{"info/global_step": 1577, "train_info/time_within_train_step": 2.757094144821167, "step": 1577} +{"train_info/time_between_train_steps": 0.0037746429443359375, "step": 1577} +{"info/global_step": 1578, "train_info/time_within_train_step": 2.7009847164154053, "step": 1578} +{"train_info/time_between_train_steps": 0.0037984848022460938, "step": 1578} +{"info/global_step": 1579, "train_info/time_within_train_step": 2.826137065887451, "step": 1579} +{"train_info/time_between_train_steps": 0.0036516189575195312, "step": 1579} +{"info/global_step": 1580, "train_info/time_within_train_step": 2.700118064880371, "step": 1580} +{"train_info/time_between_train_steps": 0.0039026737213134766, "step": 1580} +{"info/global_step": 1581, "train_info/time_within_train_step": 2.9789352416992188, "step": 1581} +{"train_info/time_between_train_steps": 0.0035860538482666016, "step": 1581} +{"info/global_step": 1582, "train_info/time_within_train_step": 2.6958394050598145, "step": 1582} +{"train_info/time_between_train_steps": 0.003561735153198242, "step": 1582} +{"info/global_step": 1583, "train_info/time_within_train_step": 2.695981979370117, "step": 1583} +{"train_info/time_between_train_steps": 0.003513336181640625, "step": 1583} +{"info/global_step": 1584, "train_info/time_within_train_step": 2.698216199874878, "step": 1584} +{"train_info/time_between_train_steps": 0.0035920143127441406, "step": 1584} +{"info/global_step": 1585, "train_info/time_within_train_step": 2.6968047618865967, "step": 1585} +{"train_info/time_between_train_steps": 0.003573894500732422, "step": 1585} +{"info/global_step": 1586, "train_info/time_within_train_step": 2.697626829147339, "step": 1586} +{"train_info/time_between_train_steps": 0.0036232471466064453, "step": 1586} +{"info/global_step": 1587, "train_info/time_within_train_step": 2.6975131034851074, "step": 1587} +{"train_info/time_between_train_steps": 0.003467082977294922, "step": 1587} +{"info/global_step": 1588, "train_info/time_within_train_step": 2.6964874267578125, "step": 1588} +{"train_info/time_between_train_steps": 0.003564596176147461, "step": 1588} +{"info/global_step": 1589, "train_info/time_within_train_step": 2.6951048374176025, "step": 1589} +{"train_info/time_between_train_steps": 0.003607511520385742, "step": 1589} +{"info/global_step": 1590, "train_info/time_within_train_step": 2.6944644451141357, "step": 1590} +{"train_info/time_between_train_steps": 0.0035543441772460938, "step": 1590} +{"info/global_step": 1591, "train_info/time_within_train_step": 2.6977341175079346, "step": 1591} +{"train_info/time_between_train_steps": 0.0034897327423095703, "step": 1591} +{"info/global_step": 1592, "train_info/time_within_train_step": 2.6949222087860107, "step": 1592} +{"train_info/time_between_train_steps": 0.0035598278045654297, "step": 1592} +{"info/global_step": 1593, "train_info/time_within_train_step": 2.695209503173828, "step": 1593} +{"train_info/time_between_train_steps": 0.003535747528076172, "step": 1593} +{"info/global_step": 1594, "train_info/time_within_train_step": 2.694127321243286, "step": 1594} +{"train_info/time_between_train_steps": 0.003585338592529297, "step": 1594} +{"info/global_step": 1595, "train_info/time_within_train_step": 2.6950368881225586, "step": 1595} +{"train_info/time_between_train_steps": 0.0036745071411132812, "step": 1595} +{"info/global_step": 1596, "train_info/time_within_train_step": 2.6955106258392334, "step": 1596} +{"train_info/time_between_train_steps": 0.0036020278930664062, "step": 1596} +{"info/global_step": 1597, "train_info/time_within_train_step": 2.695622205734253, "step": 1597} +{"train_info/time_between_train_steps": 0.0036301612854003906, "step": 1597} +{"info/global_step": 1598, "train_info/time_within_train_step": 2.695373296737671, "step": 1598} +{"train_info/time_between_train_steps": 0.0038938522338867188, "step": 1598} +{"info/global_step": 1599, "train_info/time_within_train_step": 2.697519540786743, "step": 1599} +{"train_info/time_between_train_steps": 0.004060029983520508, "step": 1599} +{"info/global_step": 1600, "train_info/time_within_train_step": 2.6971402168273926, "step": 1600} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746290880, "_runtime": 4902}, "step": 1600} +{"logs": {"train/loss": 4.8668, "train/learning_rate": 0.00031111111111111107, "train/epoch": 2.03, "_timestamp": 1746290880, "_runtime": 4902}, "step": 1600} +{"train_info/time_between_train_steps": 36.086138010025024, "step": 1600} +{"info/global_step": 1601, "train_info/time_within_train_step": 2.4938571453094482, "step": 1601} +{"train_info/time_between_train_steps": 0.004158735275268555, "step": 1601} +{"info/global_step": 1602, "train_info/time_within_train_step": 2.5033841133117676, "step": 1602} +{"train_info/time_between_train_steps": 0.004168272018432617, "step": 1602} +{"info/global_step": 1603, "train_info/time_within_train_step": 2.6784110069274902, "step": 1603} +{"train_info/time_between_train_steps": 0.004090547561645508, "step": 1603} +{"info/global_step": 1604, "train_info/time_within_train_step": 2.693915605545044, "step": 1604} +{"train_info/time_between_train_steps": 0.004309892654418945, "step": 1604} +{"info/global_step": 1605, "train_info/time_within_train_step": 2.6950008869171143, "step": 1605} +{"train_info/time_between_train_steps": 0.0040874481201171875, "step": 1605} +{"info/global_step": 1606, "train_info/time_within_train_step": 2.6960654258728027, "step": 1606} +{"train_info/time_between_train_steps": 0.004083395004272461, "step": 1606} +{"info/global_step": 1607, "train_info/time_within_train_step": 2.6993370056152344, "step": 1607} +{"train_info/time_between_train_steps": 0.0041925907135009766, "step": 1607} +{"info/global_step": 1608, "train_info/time_within_train_step": 2.699321746826172, "step": 1608} +{"train_info/time_between_train_steps": 0.0041120052337646484, "step": 1608} +{"info/global_step": 1609, "train_info/time_within_train_step": 2.6975293159484863, "step": 1609} +{"train_info/time_between_train_steps": 0.004143953323364258, "step": 1609} +{"info/global_step": 1610, "train_info/time_within_train_step": 2.736948013305664, "step": 1610} +{"train_info/time_between_train_steps": 0.005293130874633789, "step": 1610} +{"info/global_step": 1611, "train_info/time_within_train_step": 2.840723991394043, "step": 1611} +{"train_info/time_between_train_steps": 0.004018545150756836, "step": 1611} +{"info/global_step": 1612, "train_info/time_within_train_step": 2.966200590133667, "step": 1612} +{"train_info/time_between_train_steps": 0.00399470329284668, "step": 1612} +{"info/global_step": 1613, "train_info/time_within_train_step": 2.7483270168304443, "step": 1613} +{"train_info/time_between_train_steps": 0.003969907760620117, "step": 1613} +{"info/global_step": 1614, "train_info/time_within_train_step": 2.6999640464782715, "step": 1614} +{"train_info/time_between_train_steps": 0.0039806365966796875, "step": 1614} +{"info/global_step": 1615, "train_info/time_within_train_step": 2.699765920639038, "step": 1615} +{"train_info/time_between_train_steps": 0.004060029983520508, "step": 1615} +{"info/global_step": 1616, "train_info/time_within_train_step": 2.699408531188965, "step": 1616} +{"train_info/time_between_train_steps": 0.004275083541870117, "step": 1616} +{"info/global_step": 1617, "train_info/time_within_train_step": 2.702971935272217, "step": 1617} +{"train_info/time_between_train_steps": 0.003938436508178711, "step": 1617} +{"info/global_step": 1618, "train_info/time_within_train_step": 2.7015559673309326, "step": 1618} +{"train_info/time_between_train_steps": 0.0039446353912353516, "step": 1618} +{"info/global_step": 1619, "train_info/time_within_train_step": 2.7006237506866455, "step": 1619} +{"train_info/time_between_train_steps": 0.003977775573730469, "step": 1619} +{"info/global_step": 1620, "train_info/time_within_train_step": 2.698686122894287, "step": 1620} +{"train_info/time_between_train_steps": 0.0039136409759521484, "step": 1620} +{"info/global_step": 1621, "train_info/time_within_train_step": 2.6998705863952637, "step": 1621} +{"train_info/time_between_train_steps": 0.003999233245849609, "step": 1621} +{"info/global_step": 1622, "train_info/time_within_train_step": 2.698749303817749, "step": 1622} +{"train_info/time_between_train_steps": 0.003936767578125, "step": 1622} +{"info/global_step": 1623, "train_info/time_within_train_step": 2.700495481491089, "step": 1623} +{"train_info/time_between_train_steps": 0.0038878917694091797, "step": 1623} +{"info/global_step": 1624, "train_info/time_within_train_step": 2.698927402496338, "step": 1624} +{"train_info/time_between_train_steps": 0.0039942264556884766, "step": 1624} +{"info/global_step": 1625, "train_info/time_within_train_step": 3.085651159286499, "step": 1625} +{"train_info/time_between_train_steps": 0.0038428306579589844, "step": 1625} +{"info/global_step": 1626, "train_info/time_within_train_step": 2.698483943939209, "step": 1626} +{"train_info/time_between_train_steps": 0.003802061080932617, "step": 1626} +{"info/global_step": 1627, "train_info/time_within_train_step": 2.6991453170776367, "step": 1627} +{"train_info/time_between_train_steps": 0.003930568695068359, "step": 1627} +{"info/global_step": 1628, "train_info/time_within_train_step": 2.6990129947662354, "step": 1628} +{"train_info/time_between_train_steps": 0.0037806034088134766, "step": 1628} +{"info/global_step": 1629, "train_info/time_within_train_step": 2.6984775066375732, "step": 1629} +{"train_info/time_between_train_steps": 0.0037431716918945312, "step": 1629} +{"info/global_step": 1630, "train_info/time_within_train_step": 2.699676275253296, "step": 1630} +{"train_info/time_between_train_steps": 0.003864765167236328, "step": 1630} +{"info/global_step": 1631, "train_info/time_within_train_step": 2.6989567279815674, "step": 1631} +{"train_info/time_between_train_steps": 0.00382232666015625, "step": 1631} +{"info/global_step": 1632, "train_info/time_within_train_step": 2.698621988296509, "step": 1632} +{"train_info/time_between_train_steps": 0.003826141357421875, "step": 1632} +{"info/global_step": 1633, "train_info/time_within_train_step": 2.7007339000701904, "step": 1633} +{"train_info/time_between_train_steps": 0.0038819313049316406, "step": 1633} +{"info/global_step": 1634, "train_info/time_within_train_step": 2.7013018131256104, "step": 1634} +{"train_info/time_between_train_steps": 0.003824472427368164, "step": 1634} +{"info/global_step": 1635, "train_info/time_within_train_step": 2.7011477947235107, "step": 1635} +{"train_info/time_between_train_steps": 0.003966093063354492, "step": 1635} +{"info/global_step": 1636, "train_info/time_within_train_step": 2.6996922492980957, "step": 1636} +{"train_info/time_between_train_steps": 0.003777027130126953, "step": 1636} +{"info/global_step": 1637, "train_info/time_within_train_step": 2.7001075744628906, "step": 1637} +{"train_info/time_between_train_steps": 0.003709077835083008, "step": 1637} +{"info/global_step": 1638, "train_info/time_within_train_step": 2.6998677253723145, "step": 1638} +{"train_info/time_between_train_steps": 0.003738880157470703, "step": 1638} +{"info/global_step": 1639, "train_info/time_within_train_step": 2.7004759311676025, "step": 1639} +{"train_info/time_between_train_steps": 0.003740549087524414, "step": 1639} +{"info/global_step": 1640, "train_info/time_within_train_step": 2.69909405708313, "step": 1640} +{"train_info/time_between_train_steps": 0.003834247589111328, "step": 1640} +{"info/global_step": 1641, "train_info/time_within_train_step": 2.699212074279785, "step": 1641} +{"train_info/time_between_train_steps": 0.16795659065246582, "step": 1641} +{"info/global_step": 1642, "train_info/time_within_train_step": 2.6997950077056885, "step": 1642} +{"train_info/time_between_train_steps": 0.0036661624908447266, "step": 1642} +{"info/global_step": 1643, "train_info/time_within_train_step": 2.698978900909424, "step": 1643} +{"train_info/time_between_train_steps": 0.003648042678833008, "step": 1643} +{"info/global_step": 1644, "train_info/time_within_train_step": 2.700181245803833, "step": 1644} +{"train_info/time_between_train_steps": 0.003732919692993164, "step": 1644} +{"info/global_step": 1645, "train_info/time_within_train_step": 2.7001523971557617, "step": 1645} +{"train_info/time_between_train_steps": 0.0037643909454345703, "step": 1645} +{"info/global_step": 1646, "train_info/time_within_train_step": 2.7862493991851807, "step": 1646} +{"train_info/time_between_train_steps": 0.0036432743072509766, "step": 1646} +{"info/global_step": 1647, "train_info/time_within_train_step": 2.698000192642212, "step": 1647} +{"train_info/time_between_train_steps": 0.0036940574645996094, "step": 1647} +{"info/global_step": 1648, "train_info/time_within_train_step": 2.934291362762451, "step": 1648} +{"train_info/time_between_train_steps": 0.003777742385864258, "step": 1648} +{"info/global_step": 1649, "train_info/time_within_train_step": 2.698399066925049, "step": 1649} +{"train_info/time_between_train_steps": 0.00385284423828125, "step": 1649} +{"info/global_step": 1650, "train_info/time_within_train_step": 2.697620153427124, "step": 1650} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746291061, "_runtime": 5083}, "step": 1650} +{"logs": {"train/loss": 4.8461, "train/learning_rate": 0.0003, "train/epoch": 2.04, "_timestamp": 1746291061, "_runtime": 5083}, "step": 1650} +{"train_info/time_between_train_steps": 0.04958844184875488, "step": 1650} +{"info/global_step": 1651, "train_info/time_within_train_step": 2.697967290878296, "step": 1651} +{"train_info/time_between_train_steps": 0.0038840770721435547, "step": 1651} +{"info/global_step": 1652, "train_info/time_within_train_step": 2.6979105472564697, "step": 1652} +{"train_info/time_between_train_steps": 0.003907203674316406, "step": 1652} +{"info/global_step": 1653, "train_info/time_within_train_step": 2.698646306991577, "step": 1653} +{"train_info/time_between_train_steps": 0.00395655632019043, "step": 1653} +{"info/global_step": 1654, "train_info/time_within_train_step": 2.69899582862854, "step": 1654} +{"train_info/time_between_train_steps": 0.0041425228118896484, "step": 1654} +{"info/global_step": 1655, "train_info/time_within_train_step": 2.6987667083740234, "step": 1655} +{"train_info/time_between_train_steps": 0.0039288997650146484, "step": 1655} +{"info/global_step": 1656, "train_info/time_within_train_step": 2.7001092433929443, "step": 1656} +{"train_info/time_between_train_steps": 0.004052639007568359, "step": 1656} +{"info/global_step": 1657, "train_info/time_within_train_step": 2.698587656021118, "step": 1657} +{"train_info/time_between_train_steps": 0.003993034362792969, "step": 1657} +{"info/global_step": 1658, "train_info/time_within_train_step": 2.6997530460357666, "step": 1658} +{"train_info/time_between_train_steps": 0.003922700881958008, "step": 1658} +{"info/global_step": 1659, "train_info/time_within_train_step": 2.70025634765625, "step": 1659} +{"train_info/time_between_train_steps": 0.003907680511474609, "step": 1659} +{"info/global_step": 1660, "train_info/time_within_train_step": 2.6992928981781006, "step": 1660} +{"train_info/time_between_train_steps": 0.004035234451293945, "step": 1660} +{"info/global_step": 1661, "train_info/time_within_train_step": 2.7700119018554688, "step": 1661} +{"train_info/time_between_train_steps": 0.0038917064666748047, "step": 1661} +{"info/global_step": 1662, "train_info/time_within_train_step": 2.701073169708252, "step": 1662} +{"train_info/time_between_train_steps": 0.00391697883605957, "step": 1662} +{"info/global_step": 1663, "train_info/time_within_train_step": 3.4255733489990234, "step": 1663} +{"train_info/time_between_train_steps": 0.0039539337158203125, "step": 1663} +{"info/global_step": 1664, "train_info/time_within_train_step": 2.6980135440826416, "step": 1664} +{"train_info/time_between_train_steps": 0.0038619041442871094, "step": 1664} +{"info/global_step": 1665, "train_info/time_within_train_step": 3.060357093811035, "step": 1665} +{"train_info/time_between_train_steps": 0.0035898685455322266, "step": 1665} +{"info/global_step": 1666, "train_info/time_within_train_step": 2.69724178314209, "step": 1666} +{"train_info/time_between_train_steps": 0.0035991668701171875, "step": 1666} +{"info/global_step": 1667, "train_info/time_within_train_step": 2.696706771850586, "step": 1667} +{"train_info/time_between_train_steps": 0.003599405288696289, "step": 1667} +{"info/global_step": 1668, "train_info/time_within_train_step": 2.7045180797576904, "step": 1668} +{"train_info/time_between_train_steps": 0.0036089420318603516, "step": 1668} +{"info/global_step": 1669, "train_info/time_within_train_step": 2.69897198677063, "step": 1669} +{"train_info/time_between_train_steps": 0.0036127567291259766, "step": 1669} +{"info/global_step": 1670, "train_info/time_within_train_step": 2.6975767612457275, "step": 1670} +{"train_info/time_between_train_steps": 0.0035858154296875, "step": 1670} +{"info/global_step": 1671, "train_info/time_within_train_step": 2.6987125873565674, "step": 1671} +{"train_info/time_between_train_steps": 0.00357818603515625, "step": 1671} +{"info/global_step": 1672, "train_info/time_within_train_step": 2.7006123065948486, "step": 1672} +{"train_info/time_between_train_steps": 0.0036368370056152344, "step": 1672} +{"info/global_step": 1673, "train_info/time_within_train_step": 2.697939157485962, "step": 1673} +{"train_info/time_between_train_steps": 0.003584623336791992, "step": 1673} +{"info/global_step": 1674, "train_info/time_within_train_step": 2.6983706951141357, "step": 1674} +{"train_info/time_between_train_steps": 0.0035576820373535156, "step": 1674} +{"info/global_step": 1675, "train_info/time_within_train_step": 2.702063798904419, "step": 1675} +{"train_info/time_between_train_steps": 0.0036134719848632812, "step": 1675} +{"info/global_step": 1676, "train_info/time_within_train_step": 2.7814245223999023, "step": 1676} +{"train_info/time_between_train_steps": 0.003606557846069336, "step": 1676} +{"info/global_step": 1677, "train_info/time_within_train_step": 2.9736764430999756, "step": 1677} +{"train_info/time_between_train_steps": 0.0036096572875976562, "step": 1677} +{"info/global_step": 1678, "train_info/time_within_train_step": 2.802074432373047, "step": 1678} +{"train_info/time_between_train_steps": 0.0035583972930908203, "step": 1678} +{"info/global_step": 1679, "train_info/time_within_train_step": 2.6988370418548584, "step": 1679} +{"train_info/time_between_train_steps": 0.0037984848022460938, "step": 1679} +{"info/global_step": 1680, "train_info/time_within_train_step": 2.6974191665649414, "step": 1680} +{"train_info/time_between_train_steps": 0.003525257110595703, "step": 1680} +{"info/global_step": 1681, "train_info/time_within_train_step": 2.6976892948150635, "step": 1681} +{"train_info/time_between_train_steps": 0.0037555694580078125, "step": 1681} +{"info/global_step": 1682, "train_info/time_within_train_step": 2.6973278522491455, "step": 1682} +{"train_info/time_between_train_steps": 0.0036177635192871094, "step": 1682} +{"info/global_step": 1683, "train_info/time_within_train_step": 2.7002313137054443, "step": 1683} +{"train_info/time_between_train_steps": 0.0035741329193115234, "step": 1683} +{"info/global_step": 1684, "train_info/time_within_train_step": 2.6973180770874023, "step": 1684} +{"train_info/time_between_train_steps": 0.0035827159881591797, "step": 1684} +{"info/global_step": 1685, "train_info/time_within_train_step": 2.6969010829925537, "step": 1685} +{"train_info/time_between_train_steps": 0.0036323070526123047, "step": 1685} +{"info/global_step": 1686, "train_info/time_within_train_step": 2.6984033584594727, "step": 1686} +{"train_info/time_between_train_steps": 0.0036470890045166016, "step": 1686} +{"info/global_step": 1687, "train_info/time_within_train_step": 2.6995811462402344, "step": 1687} +{"train_info/time_between_train_steps": 0.0036704540252685547, "step": 1687} +{"info/global_step": 1688, "train_info/time_within_train_step": 2.6979305744171143, "step": 1688} +{"train_info/time_between_train_steps": 0.0036144256591796875, "step": 1688} +{"info/global_step": 1689, "train_info/time_within_train_step": 2.6996333599090576, "step": 1689} +{"train_info/time_between_train_steps": 0.003612041473388672, "step": 1689} +{"info/global_step": 1690, "train_info/time_within_train_step": 2.6976544857025146, "step": 1690} +{"train_info/time_between_train_steps": 0.003586292266845703, "step": 1690} +{"info/global_step": 1691, "train_info/time_within_train_step": 2.6980631351470947, "step": 1691} +{"train_info/time_between_train_steps": 0.0036077499389648438, "step": 1691} +{"info/global_step": 1692, "train_info/time_within_train_step": 2.699096441268921, "step": 1692} +{"train_info/time_between_train_steps": 0.003686189651489258, "step": 1692} +{"info/global_step": 1693, "train_info/time_within_train_step": 2.6991007328033447, "step": 1693} +{"train_info/time_between_train_steps": 0.003601551055908203, "step": 1693} +{"info/global_step": 1694, "train_info/time_within_train_step": 2.698939323425293, "step": 1694} +{"train_info/time_between_train_steps": 0.003589630126953125, "step": 1694} +{"info/global_step": 1695, "train_info/time_within_train_step": 2.6980597972869873, "step": 1695} +{"train_info/time_between_train_steps": 0.0035653114318847656, "step": 1695} +{"info/global_step": 1696, "train_info/time_within_train_step": 2.6998653411865234, "step": 1696} +{"train_info/time_between_train_steps": 0.0036170482635498047, "step": 1696} +{"info/global_step": 1697, "train_info/time_within_train_step": 2.718625545501709, "step": 1697} +{"train_info/time_between_train_steps": 0.0036253929138183594, "step": 1697} +{"info/global_step": 1698, "train_info/time_within_train_step": 2.700958728790283, "step": 1698} +{"train_info/time_between_train_steps": 0.0035889148712158203, "step": 1698} +{"info/global_step": 1699, "train_info/time_within_train_step": 2.69852352142334, "step": 1699} +{"train_info/time_between_train_steps": 0.0035827159881591797, "step": 1699} +{"info/global_step": 1700, "train_info/time_within_train_step": 2.6993608474731445, "step": 1700} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746291206, "_runtime": 5228}, "step": 1700} +{"logs": {"train/loss": 4.8275, "train/learning_rate": 0.0002888888888888888, "train/epoch": 2.06, "_timestamp": 1746291206, "_runtime": 5228}, "step": 1700} +{"train_info/time_between_train_steps": 33.321579933166504, "step": 1700} +{"info/global_step": 1701, "train_info/time_within_train_step": 2.4889798164367676, "step": 1701} +{"train_info/time_between_train_steps": 0.003559112548828125, "step": 1701} +{"info/global_step": 1702, "train_info/time_within_train_step": 2.468393564224243, "step": 1702} +{"train_info/time_between_train_steps": 0.0037217140197753906, "step": 1702} +{"info/global_step": 1703, "train_info/time_within_train_step": 3.0186498165130615, "step": 1703} +{"train_info/time_between_train_steps": 0.0035829544067382812, "step": 1703} +{"info/global_step": 1704, "train_info/time_within_train_step": 2.851508617401123, "step": 1704} +{"train_info/time_between_train_steps": 0.0035653114318847656, "step": 1704} +{"info/global_step": 1705, "train_info/time_within_train_step": 2.6920859813690186, "step": 1705} +{"train_info/time_between_train_steps": 0.003692626953125, "step": 1705} +{"info/global_step": 1706, "train_info/time_within_train_step": 2.6951053142547607, "step": 1706} +{"train_info/time_between_train_steps": 0.004044532775878906, "step": 1706} +{"info/global_step": 1707, "train_info/time_within_train_step": 2.697335958480835, "step": 1707} +{"train_info/time_between_train_steps": 0.0039997100830078125, "step": 1707} +{"info/global_step": 1708, "train_info/time_within_train_step": 2.6992204189300537, "step": 1708} +{"train_info/time_between_train_steps": 0.004077434539794922, "step": 1708} +{"info/global_step": 1709, "train_info/time_within_train_step": 2.700179100036621, "step": 1709} +{"train_info/time_between_train_steps": 0.003972530364990234, "step": 1709} +{"info/global_step": 1710, "train_info/time_within_train_step": 2.8495383262634277, "step": 1710} +{"train_info/time_between_train_steps": 0.004026651382446289, "step": 1710} +{"info/global_step": 1711, "train_info/time_within_train_step": 2.894127130508423, "step": 1711} +{"train_info/time_between_train_steps": 0.004101276397705078, "step": 1711} +{"info/global_step": 1712, "train_info/time_within_train_step": 2.902364730834961, "step": 1712} +{"train_info/time_between_train_steps": 0.0039730072021484375, "step": 1712} +{"info/global_step": 1713, "train_info/time_within_train_step": 2.6961514949798584, "step": 1713} +{"train_info/time_between_train_steps": 0.003920555114746094, "step": 1713} +{"info/global_step": 1714, "train_info/time_within_train_step": 2.6977593898773193, "step": 1714} +{"train_info/time_between_train_steps": 0.004051923751831055, "step": 1714} +{"info/global_step": 1715, "train_info/time_within_train_step": 2.6981043815612793, "step": 1715} +{"train_info/time_between_train_steps": 0.004000663757324219, "step": 1715} +{"info/global_step": 1716, "train_info/time_within_train_step": 2.6973607540130615, "step": 1716} +{"train_info/time_between_train_steps": 0.003838062286376953, "step": 1716} +{"info/global_step": 1717, "train_info/time_within_train_step": 2.69901704788208, "step": 1717} +{"train_info/time_between_train_steps": 0.004107475280761719, "step": 1717} +{"info/global_step": 1718, "train_info/time_within_train_step": 2.700174570083618, "step": 1718} +{"train_info/time_between_train_steps": 0.003970623016357422, "step": 1718} +{"info/global_step": 1719, "train_info/time_within_train_step": 2.700760841369629, "step": 1719} +{"train_info/time_between_train_steps": 0.003981828689575195, "step": 1719} +{"info/global_step": 1720, "train_info/time_within_train_step": 2.6994948387145996, "step": 1720} +{"train_info/time_between_train_steps": 0.0039463043212890625, "step": 1720} +{"info/global_step": 1721, "train_info/time_within_train_step": 2.6996910572052, "step": 1721} +{"train_info/time_between_train_steps": 0.004004955291748047, "step": 1721} +{"info/global_step": 1722, "train_info/time_within_train_step": 2.6991100311279297, "step": 1722} +{"train_info/time_between_train_steps": 0.003931999206542969, "step": 1722} +{"info/global_step": 1723, "train_info/time_within_train_step": 2.69883131980896, "step": 1723} +{"train_info/time_between_train_steps": 0.004042625427246094, "step": 1723} +{"info/global_step": 1724, "train_info/time_within_train_step": 2.700228214263916, "step": 1724} +{"train_info/time_between_train_steps": 0.0041332244873046875, "step": 1724} +{"info/global_step": 1725, "train_info/time_within_train_step": 2.698650360107422, "step": 1725} +{"train_info/time_between_train_steps": 0.003982067108154297, "step": 1725} +{"info/global_step": 1726, "train_info/time_within_train_step": 2.697786331176758, "step": 1726} +{"train_info/time_between_train_steps": 0.00397491455078125, "step": 1726} +{"info/global_step": 1727, "train_info/time_within_train_step": 3.0093319416046143, "step": 1727} +{"train_info/time_between_train_steps": 0.004091739654541016, "step": 1727} +{"info/global_step": 1728, "train_info/time_within_train_step": 2.6991055011749268, "step": 1728} +{"train_info/time_between_train_steps": 0.004038572311401367, "step": 1728} +{"info/global_step": 1729, "train_info/time_within_train_step": 2.6991963386535645, "step": 1729} +{"train_info/time_between_train_steps": 0.004088163375854492, "step": 1729} +{"info/global_step": 1730, "train_info/time_within_train_step": 2.699280261993408, "step": 1730} +{"train_info/time_between_train_steps": 0.004003047943115234, "step": 1730} +{"info/global_step": 1731, "train_info/time_within_train_step": 2.697610855102539, "step": 1731} +{"train_info/time_between_train_steps": 0.00397038459777832, "step": 1731} +{"info/global_step": 1732, "train_info/time_within_train_step": 2.6983418464660645, "step": 1732} +{"train_info/time_between_train_steps": 0.003930807113647461, "step": 1732} +{"info/global_step": 1733, "train_info/time_within_train_step": 2.697558641433716, "step": 1733} +{"train_info/time_between_train_steps": 0.0038518905639648438, "step": 1733} +{"info/global_step": 1734, "train_info/time_within_train_step": 2.698927164077759, "step": 1734} +{"train_info/time_between_train_steps": 0.003945112228393555, "step": 1734} +{"info/global_step": 1735, "train_info/time_within_train_step": 2.6977455615997314, "step": 1735} +{"train_info/time_between_train_steps": 0.003996372222900391, "step": 1735} +{"info/global_step": 1736, "train_info/time_within_train_step": 2.6993088722229004, "step": 1736} +{"train_info/time_between_train_steps": 0.003906726837158203, "step": 1736} +{"info/global_step": 1737, "train_info/time_within_train_step": 2.697641372680664, "step": 1737} +{"train_info/time_between_train_steps": 0.0038957595825195312, "step": 1737} +{"info/global_step": 1738, "train_info/time_within_train_step": 2.6992175579071045, "step": 1738} +{"train_info/time_between_train_steps": 0.0039691925048828125, "step": 1738} +{"info/global_step": 1739, "train_info/time_within_train_step": 2.6998088359832764, "step": 1739} +{"train_info/time_between_train_steps": 0.003924846649169922, "step": 1739} +{"info/global_step": 1740, "train_info/time_within_train_step": 2.700551748275757, "step": 1740} +{"train_info/time_between_train_steps": 0.0038857460021972656, "step": 1740} +{"info/global_step": 1741, "train_info/time_within_train_step": 2.7010889053344727, "step": 1741} +{"train_info/time_between_train_steps": 0.0039691925048828125, "step": 1741} +{"info/global_step": 1742, "train_info/time_within_train_step": 3.0801784992218018, "step": 1742} +{"train_info/time_between_train_steps": 0.0036530494689941406, "step": 1742} +{"info/global_step": 1743, "train_info/time_within_train_step": 2.7032277584075928, "step": 1743} +{"train_info/time_between_train_steps": 0.003614664077758789, "step": 1743} +{"info/global_step": 1744, "train_info/time_within_train_step": 2.7387614250183105, "step": 1744} +{"train_info/time_between_train_steps": 0.003625631332397461, "step": 1744} +{"info/global_step": 1745, "train_info/time_within_train_step": 2.9227724075317383, "step": 1745} +{"train_info/time_between_train_steps": 0.0036559104919433594, "step": 1745} +{"info/global_step": 1746, "train_info/time_within_train_step": 2.978428602218628, "step": 1746} +{"train_info/time_between_train_steps": 0.0037031173706054688, "step": 1746} +{"info/global_step": 1747, "train_info/time_within_train_step": 2.700789213180542, "step": 1747} +{"train_info/time_between_train_steps": 0.003682374954223633, "step": 1747} +{"info/global_step": 1748, "train_info/time_within_train_step": 2.697887659072876, "step": 1748} +{"train_info/time_between_train_steps": 0.003602266311645508, "step": 1748} +{"info/global_step": 1749, "train_info/time_within_train_step": 3.275129795074463, "step": 1749} +{"train_info/time_between_train_steps": 0.0041501522064208984, "step": 1749} +{"info/global_step": 1750, "train_info/time_within_train_step": 2.6978793144226074, "step": 1750} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746291386, "_runtime": 5408}, "step": 1750} +{"logs": {"train/loss": 4.7996, "train/learning_rate": 0.0002777777777777778, "train/epoch": 2.08, "_timestamp": 1746291386, "_runtime": 5408}, "step": 1750} +{"train_info/time_between_train_steps": 0.07500028610229492, "step": 1750} +{"info/global_step": 1751, "train_info/time_within_train_step": 2.69743275642395, "step": 1751} +{"train_info/time_between_train_steps": 0.003704071044921875, "step": 1751} +{"info/global_step": 1752, "train_info/time_within_train_step": 2.6978061199188232, "step": 1752} +{"train_info/time_between_train_steps": 0.00357818603515625, "step": 1752} +{"info/global_step": 1753, "train_info/time_within_train_step": 2.6982429027557373, "step": 1753} +{"train_info/time_between_train_steps": 0.0036253929138183594, "step": 1753} +{"info/global_step": 1754, "train_info/time_within_train_step": 2.6986193656921387, "step": 1754} +{"train_info/time_between_train_steps": 0.003605365753173828, "step": 1754} +{"info/global_step": 1755, "train_info/time_within_train_step": 2.9795124530792236, "step": 1755} +{"train_info/time_between_train_steps": 0.0036344528198242188, "step": 1755} +{"info/global_step": 1756, "train_info/time_within_train_step": 2.6993496417999268, "step": 1756} +{"train_info/time_between_train_steps": 0.0035915374755859375, "step": 1756} +{"info/global_step": 1757, "train_info/time_within_train_step": 2.700194835662842, "step": 1757} +{"train_info/time_between_train_steps": 0.003735780715942383, "step": 1757} +{"info/global_step": 1758, "train_info/time_within_train_step": 2.6989476680755615, "step": 1758} +{"train_info/time_between_train_steps": 0.003660917282104492, "step": 1758} +{"info/global_step": 1759, "train_info/time_within_train_step": 2.6991348266601562, "step": 1759} +{"train_info/time_between_train_steps": 0.0036857128143310547, "step": 1759} +{"info/global_step": 1760, "train_info/time_within_train_step": 2.6974053382873535, "step": 1760} +{"train_info/time_between_train_steps": 0.004040956497192383, "step": 1760} +{"info/global_step": 1761, "train_info/time_within_train_step": 2.700345754623413, "step": 1761} +{"train_info/time_between_train_steps": 0.003841876983642578, "step": 1761} +{"info/global_step": 1762, "train_info/time_within_train_step": 2.699951648712158, "step": 1762} +{"train_info/time_between_train_steps": 0.0041959285736083984, "step": 1762} +{"info/global_step": 1763, "train_info/time_within_train_step": 2.6989352703094482, "step": 1763} +{"train_info/time_between_train_steps": 0.0038976669311523438, "step": 1763} +{"info/global_step": 1764, "train_info/time_within_train_step": 2.697868824005127, "step": 1764} +{"train_info/time_between_train_steps": 0.0040149688720703125, "step": 1764} +{"info/global_step": 1765, "train_info/time_within_train_step": 2.6993119716644287, "step": 1765} +{"train_info/time_between_train_steps": 0.007459163665771484, "step": 1765} +{"info/global_step": 1766, "train_info/time_within_train_step": 2.6989638805389404, "step": 1766} +{"train_info/time_between_train_steps": 0.18578457832336426, "step": 1766} +{"info/global_step": 1767, "train_info/time_within_train_step": 2.699272632598877, "step": 1767} +{"train_info/time_between_train_steps": 0.003803730010986328, "step": 1767} +{"info/global_step": 1768, "train_info/time_within_train_step": 2.697906494140625, "step": 1768} +{"train_info/time_between_train_steps": 0.007355213165283203, "step": 1768} +{"info/global_step": 1769, "train_info/time_within_train_step": 2.699334144592285, "step": 1769} +{"train_info/time_between_train_steps": 0.0037941932678222656, "step": 1769} +{"info/global_step": 1770, "train_info/time_within_train_step": 2.6982593536376953, "step": 1770} +{"train_info/time_between_train_steps": 0.0036950111389160156, "step": 1770} +{"info/global_step": 1771, "train_info/time_within_train_step": 2.697568655014038, "step": 1771} +{"train_info/time_between_train_steps": 0.0037398338317871094, "step": 1771} +{"info/global_step": 1772, "train_info/time_within_train_step": 2.698806047439575, "step": 1772} +{"train_info/time_between_train_steps": 0.0068798065185546875, "step": 1772} +{"info/global_step": 1773, "train_info/time_within_train_step": 2.7007863521575928, "step": 1773} +{"train_info/time_between_train_steps": 0.003705739974975586, "step": 1773} +{"info/global_step": 1774, "train_info/time_within_train_step": 2.69708251953125, "step": 1774} +{"train_info/time_between_train_steps": 0.003738880157470703, "step": 1774} +{"info/global_step": 1775, "train_info/time_within_train_step": 2.779320001602173, "step": 1775} +{"train_info/time_between_train_steps": 0.0036652088165283203, "step": 1775} +{"info/global_step": 1776, "train_info/time_within_train_step": 3.000352144241333, "step": 1776} +{"train_info/time_between_train_steps": 0.003724813461303711, "step": 1776} +{"info/global_step": 1777, "train_info/time_within_train_step": 2.9638960361480713, "step": 1777} +{"train_info/time_between_train_steps": 0.0037212371826171875, "step": 1777} +{"info/global_step": 1778, "train_info/time_within_train_step": 2.704317808151245, "step": 1778} +{"train_info/time_between_train_steps": 0.0037412643432617188, "step": 1778} +{"info/global_step": 1779, "train_info/time_within_train_step": 2.6992805004119873, "step": 1779} +{"train_info/time_between_train_steps": 0.0037474632263183594, "step": 1779} +{"info/global_step": 1780, "train_info/time_within_train_step": 2.6991913318634033, "step": 1780} +{"train_info/time_between_train_steps": 0.0036821365356445312, "step": 1780} +{"info/global_step": 1781, "train_info/time_within_train_step": 2.697571277618408, "step": 1781} +{"train_info/time_between_train_steps": 0.0036923885345458984, "step": 1781} +{"info/global_step": 1782, "train_info/time_within_train_step": 2.696214437484741, "step": 1782} +{"train_info/time_between_train_steps": 0.003705263137817383, "step": 1782} +{"info/global_step": 1783, "train_info/time_within_train_step": 2.6989939212799072, "step": 1783} +{"train_info/time_between_train_steps": 0.003779172897338867, "step": 1783} +{"info/global_step": 1784, "train_info/time_within_train_step": 2.699733257293701, "step": 1784} +{"train_info/time_between_train_steps": 0.0037581920623779297, "step": 1784} +{"info/global_step": 1785, "train_info/time_within_train_step": 2.69919753074646, "step": 1785} +{"train_info/time_between_train_steps": 0.003951311111450195, "step": 1785} +{"info/global_step": 1786, "train_info/time_within_train_step": 2.6988041400909424, "step": 1786} +{"train_info/time_between_train_steps": 0.003888368606567383, "step": 1786} +{"info/global_step": 1787, "train_info/time_within_train_step": 2.699920654296875, "step": 1787} +{"train_info/time_between_train_steps": 0.00397181510925293, "step": 1787} +{"info/global_step": 1788, "train_info/time_within_train_step": 2.7003889083862305, "step": 1788} +{"train_info/time_between_train_steps": 0.004113197326660156, "step": 1788} +{"info/global_step": 1789, "train_info/time_within_train_step": 2.6993825435638428, "step": 1789} +{"train_info/time_between_train_steps": 0.0039806365966796875, "step": 1789} +{"info/global_step": 1790, "train_info/time_within_train_step": 2.700118064880371, "step": 1790} +{"train_info/time_between_train_steps": 0.003924131393432617, "step": 1790} +{"info/global_step": 1791, "train_info/time_within_train_step": 2.700150728225708, "step": 1791} +{"train_info/time_between_train_steps": 0.0038499832153320312, "step": 1791} +{"info/global_step": 1792, "train_info/time_within_train_step": 2.6994340419769287, "step": 1792} +{"train_info/time_between_train_steps": 0.003923177719116211, "step": 1792} +{"info/global_step": 1793, "train_info/time_within_train_step": 2.700167417526245, "step": 1793} +{"train_info/time_between_train_steps": 0.003968477249145508, "step": 1793} +{"info/global_step": 1794, "train_info/time_within_train_step": 2.700671434402466, "step": 1794} +{"train_info/time_between_train_steps": 0.003946065902709961, "step": 1794} +{"info/global_step": 1795, "train_info/time_within_train_step": 2.7637362480163574, "step": 1795} +{"train_info/time_between_train_steps": 0.0038683414459228516, "step": 1795} +{"info/global_step": 1796, "train_info/time_within_train_step": 2.9593629837036133, "step": 1796} +{"train_info/time_between_train_steps": 0.003950595855712891, "step": 1796} +{"info/global_step": 1797, "train_info/time_within_train_step": 2.917933464050293, "step": 1797} +{"train_info/time_between_train_steps": 0.003942251205444336, "step": 1797} +{"info/global_step": 1798, "train_info/time_within_train_step": 2.7010841369628906, "step": 1798} +{"train_info/time_between_train_steps": 0.003907680511474609, "step": 1798} +{"info/global_step": 1799, "train_info/time_within_train_step": 2.698775053024292, "step": 1799} +{"train_info/time_between_train_steps": 0.003930330276489258, "step": 1799} +{"info/global_step": 1800, "train_info/time_within_train_step": 2.697632074356079, "step": 1800} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746291532, "_runtime": 5554}, "step": 1800} +{"logs": {"train/loss": 4.7694, "train/learning_rate": 0.0002666666666666666, "train/epoch": 2.09, "_timestamp": 1746291532, "_runtime": 5554}, "step": 1800} +{"train_info/time_between_train_steps": 33.90987682342529, "step": 1800} +{"info/global_step": 1801, "train_info/time_within_train_step": 2.4862003326416016, "step": 1801} +{"train_info/time_between_train_steps": 0.004616737365722656, "step": 1801} +{"info/global_step": 1802, "train_info/time_within_train_step": 2.4872071743011475, "step": 1802} +{"train_info/time_between_train_steps": 0.00490880012512207, "step": 1802} +{"info/global_step": 1803, "train_info/time_within_train_step": 2.6784918308258057, "step": 1803} +{"train_info/time_between_train_steps": 0.004932403564453125, "step": 1803} +{"info/global_step": 1804, "train_info/time_within_train_step": 2.697084903717041, "step": 1804} +{"train_info/time_between_train_steps": 0.004222869873046875, "step": 1804} +{"info/global_step": 1805, "train_info/time_within_train_step": 2.8461122512817383, "step": 1805} +{"train_info/time_between_train_steps": 0.004871845245361328, "step": 1805} +{"info/global_step": 1806, "train_info/time_within_train_step": 2.7038843631744385, "step": 1806} +{"train_info/time_between_train_steps": 0.004982948303222656, "step": 1806} +{"info/global_step": 1807, "train_info/time_within_train_step": 2.7008516788482666, "step": 1807} +{"train_info/time_between_train_steps": 0.004239797592163086, "step": 1807} +{"info/global_step": 1808, "train_info/time_within_train_step": 2.6998987197875977, "step": 1808} +{"train_info/time_between_train_steps": 0.004452705383300781, "step": 1808} +{"info/global_step": 1809, "train_info/time_within_train_step": 2.7020061016082764, "step": 1809} +{"train_info/time_between_train_steps": 0.004400968551635742, "step": 1809} +{"info/global_step": 1810, "train_info/time_within_train_step": 2.701176643371582, "step": 1810} +{"train_info/time_between_train_steps": 0.004010915756225586, "step": 1810} +{"info/global_step": 1811, "train_info/time_within_train_step": 2.8738274574279785, "step": 1811} +{"train_info/time_between_train_steps": 0.0040857791900634766, "step": 1811} +{"info/global_step": 1812, "train_info/time_within_train_step": 3.0751070976257324, "step": 1812} +{"train_info/time_between_train_steps": 0.004227399826049805, "step": 1812} +{"info/global_step": 1813, "train_info/time_within_train_step": 2.820972204208374, "step": 1813} +{"train_info/time_between_train_steps": 0.004013538360595703, "step": 1813} +{"info/global_step": 1814, "train_info/time_within_train_step": 2.7013723850250244, "step": 1814} +{"train_info/time_between_train_steps": 0.004115581512451172, "step": 1814} +{"info/global_step": 1815, "train_info/time_within_train_step": 2.6991775035858154, "step": 1815} +{"train_info/time_between_train_steps": 0.004452705383300781, "step": 1815} +{"info/global_step": 1816, "train_info/time_within_train_step": 2.700312376022339, "step": 1816} +{"train_info/time_between_train_steps": 0.004201650619506836, "step": 1816} +{"info/global_step": 1817, "train_info/time_within_train_step": 3.1042025089263916, "step": 1817} +{"train_info/time_between_train_steps": 0.003678560256958008, "step": 1817} +{"info/global_step": 1818, "train_info/time_within_train_step": 2.6974034309387207, "step": 1818} +{"train_info/time_between_train_steps": 0.0037152767181396484, "step": 1818} +{"info/global_step": 1819, "train_info/time_within_train_step": 2.6994199752807617, "step": 1819} +{"train_info/time_between_train_steps": 0.0036363601684570312, "step": 1819} +{"info/global_step": 1820, "train_info/time_within_train_step": 2.6974799633026123, "step": 1820} +{"train_info/time_between_train_steps": 0.003644227981567383, "step": 1820} +{"info/global_step": 1821, "train_info/time_within_train_step": 2.6986136436462402, "step": 1821} +{"train_info/time_between_train_steps": 0.003608226776123047, "step": 1821} +{"info/global_step": 1822, "train_info/time_within_train_step": 2.6982643604278564, "step": 1822} +{"train_info/time_between_train_steps": 0.0036346912384033203, "step": 1822} +{"info/global_step": 1823, "train_info/time_within_train_step": 2.6993072032928467, "step": 1823} +{"train_info/time_between_train_steps": 0.0036499500274658203, "step": 1823} +{"info/global_step": 1824, "train_info/time_within_train_step": 2.699108123779297, "step": 1824} +{"train_info/time_between_train_steps": 0.0036284923553466797, "step": 1824} +{"info/global_step": 1825, "train_info/time_within_train_step": 2.6987128257751465, "step": 1825} +{"train_info/time_between_train_steps": 0.003664255142211914, "step": 1825} +{"info/global_step": 1826, "train_info/time_within_train_step": 2.7008962631225586, "step": 1826} +{"train_info/time_between_train_steps": 0.0037131309509277344, "step": 1826} +{"info/global_step": 1827, "train_info/time_within_train_step": 2.6994452476501465, "step": 1827} +{"train_info/time_between_train_steps": 0.0037691593170166016, "step": 1827} +{"info/global_step": 1828, "train_info/time_within_train_step": 2.6992878913879395, "step": 1828} +{"train_info/time_between_train_steps": 0.004041433334350586, "step": 1828} +{"info/global_step": 1829, "train_info/time_within_train_step": 2.8822004795074463, "step": 1829} +{"train_info/time_between_train_steps": 0.004042148590087891, "step": 1829} +{"info/global_step": 1830, "train_info/time_within_train_step": 2.6987359523773193, "step": 1830} +{"train_info/time_between_train_steps": 0.004014730453491211, "step": 1830} +{"info/global_step": 1831, "train_info/time_within_train_step": 2.698115825653076, "step": 1831} +{"train_info/time_between_train_steps": 0.0038232803344726562, "step": 1831} +{"info/global_step": 1832, "train_info/time_within_train_step": 2.700831651687622, "step": 1832} +{"train_info/time_between_train_steps": 0.003876924514770508, "step": 1832} +{"info/global_step": 1833, "train_info/time_within_train_step": 2.6992437839508057, "step": 1833} +{"train_info/time_between_train_steps": 0.003838777542114258, "step": 1833} +{"info/global_step": 1834, "train_info/time_within_train_step": 2.69838285446167, "step": 1834} +{"train_info/time_between_train_steps": 0.0037796497344970703, "step": 1834} +{"info/global_step": 1835, "train_info/time_within_train_step": 2.697377920150757, "step": 1835} +{"train_info/time_between_train_steps": 0.0037894248962402344, "step": 1835} +{"info/global_step": 1836, "train_info/time_within_train_step": 2.6989448070526123, "step": 1836} +{"train_info/time_between_train_steps": 0.003778696060180664, "step": 1836} +{"info/global_step": 1837, "train_info/time_within_train_step": 2.69810152053833, "step": 1837} +{"train_info/time_between_train_steps": 0.0037393569946289062, "step": 1837} +{"info/global_step": 1838, "train_info/time_within_train_step": 2.6998186111450195, "step": 1838} +{"train_info/time_between_train_steps": 0.003779888153076172, "step": 1838} +{"info/global_step": 1839, "train_info/time_within_train_step": 2.6994574069976807, "step": 1839} +{"train_info/time_between_train_steps": 0.003776073455810547, "step": 1839} +{"info/global_step": 1840, "train_info/time_within_train_step": 2.6989617347717285, "step": 1840} +{"train_info/time_between_train_steps": 0.0038034915924072266, "step": 1840} +{"info/global_step": 1841, "train_info/time_within_train_step": 2.6987481117248535, "step": 1841} +{"train_info/time_between_train_steps": 0.0037212371826171875, "step": 1841} +{"info/global_step": 1842, "train_info/time_within_train_step": 2.701145887374878, "step": 1842} +{"train_info/time_between_train_steps": 0.0037724971771240234, "step": 1842} +{"info/global_step": 1843, "train_info/time_within_train_step": 2.7266366481781006, "step": 1843} +{"train_info/time_between_train_steps": 0.0037598609924316406, "step": 1843} +{"info/global_step": 1844, "train_info/time_within_train_step": 2.823507070541382, "step": 1844} +{"train_info/time_between_train_steps": 0.003761768341064453, "step": 1844} +{"info/global_step": 1845, "train_info/time_within_train_step": 2.8998818397521973, "step": 1845} +{"train_info/time_between_train_steps": 0.0038318634033203125, "step": 1845} +{"info/global_step": 1846, "train_info/time_within_train_step": 2.747741937637329, "step": 1846} +{"train_info/time_between_train_steps": 0.004129171371459961, "step": 1846} +{"info/global_step": 1847, "train_info/time_within_train_step": 3.214160203933716, "step": 1847} +{"train_info/time_between_train_steps": 0.00410771369934082, "step": 1847} +{"info/global_step": 1848, "train_info/time_within_train_step": 2.699223041534424, "step": 1848} +{"train_info/time_between_train_steps": 0.004183769226074219, "step": 1848} +{"info/global_step": 1849, "train_info/time_within_train_step": 2.697531223297119, "step": 1849} +{"train_info/time_between_train_steps": 0.004037141799926758, "step": 1849} +{"info/global_step": 1850, "train_info/time_within_train_step": 2.699578046798706, "step": 1850} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746291712, "_runtime": 5734}, "step": 1850} +{"logs": {"train/loss": 4.7622, "train/learning_rate": 0.00025555555555555553, "train/epoch": 2.11, "_timestamp": 1746291712, "_runtime": 5734}, "step": 1850} +{"train_info/time_between_train_steps": 0.026488780975341797, "step": 1850} +{"info/global_step": 1851, "train_info/time_within_train_step": 2.699542999267578, "step": 1851} +{"train_info/time_between_train_steps": 0.003999471664428711, "step": 1851} +{"info/global_step": 1852, "train_info/time_within_train_step": 2.782783269882202, "step": 1852} +{"train_info/time_between_train_steps": 0.004024505615234375, "step": 1852} +{"info/global_step": 1853, "train_info/time_within_train_step": 2.6986494064331055, "step": 1853} +{"train_info/time_between_train_steps": 0.004031658172607422, "step": 1853} +{"info/global_step": 1854, "train_info/time_within_train_step": 2.6973092555999756, "step": 1854} +{"train_info/time_between_train_steps": 0.004052162170410156, "step": 1854} +{"info/global_step": 1855, "train_info/time_within_train_step": 2.696721076965332, "step": 1855} +{"train_info/time_between_train_steps": 0.003939390182495117, "step": 1855} +{"info/global_step": 1856, "train_info/time_within_train_step": 3.0930187702178955, "step": 1856} +{"train_info/time_between_train_steps": 0.003641843795776367, "step": 1856} +{"info/global_step": 1857, "train_info/time_within_train_step": 2.696882724761963, "step": 1857} +{"train_info/time_between_train_steps": 0.0036230087280273438, "step": 1857} +{"info/global_step": 1858, "train_info/time_within_train_step": 2.6969563961029053, "step": 1858} +{"train_info/time_between_train_steps": 0.0035970211029052734, "step": 1858} +{"info/global_step": 1859, "train_info/time_within_train_step": 2.697373867034912, "step": 1859} +{"train_info/time_between_train_steps": 0.0036242008209228516, "step": 1859} +{"info/global_step": 1860, "train_info/time_within_train_step": 2.6966402530670166, "step": 1860} +{"train_info/time_between_train_steps": 0.0037164688110351562, "step": 1860} +{"info/global_step": 1861, "train_info/time_within_train_step": 2.6958625316619873, "step": 1861} +{"train_info/time_between_train_steps": 0.0035505294799804688, "step": 1861} +{"info/global_step": 1862, "train_info/time_within_train_step": 2.7063238620758057, "step": 1862} +{"train_info/time_between_train_steps": 0.0035958290100097656, "step": 1862} +{"info/global_step": 1863, "train_info/time_within_train_step": 2.698251485824585, "step": 1863} +{"train_info/time_between_train_steps": 0.003587007522583008, "step": 1863} +{"info/global_step": 1864, "train_info/time_within_train_step": 2.6961421966552734, "step": 1864} +{"train_info/time_between_train_steps": 0.0035545825958251953, "step": 1864} +{"info/global_step": 1865, "train_info/time_within_train_step": 2.696101665496826, "step": 1865} +{"train_info/time_between_train_steps": 0.003534555435180664, "step": 1865} +{"info/global_step": 1866, "train_info/time_within_train_step": 2.6968941688537598, "step": 1866} +{"train_info/time_between_train_steps": 0.0036683082580566406, "step": 1866} +{"info/global_step": 1867, "train_info/time_within_train_step": 2.7035746574401855, "step": 1867} +{"train_info/time_between_train_steps": 0.003633260726928711, "step": 1867} +{"info/global_step": 1868, "train_info/time_within_train_step": 2.6991889476776123, "step": 1868} +{"train_info/time_between_train_steps": 0.0036568641662597656, "step": 1868} +{"info/global_step": 1869, "train_info/time_within_train_step": 2.6987829208374023, "step": 1869} +{"train_info/time_between_train_steps": 0.0035886764526367188, "step": 1869} +{"info/global_step": 1870, "train_info/time_within_train_step": 2.698213577270508, "step": 1870} +{"train_info/time_between_train_steps": 0.0036957263946533203, "step": 1870} +{"info/global_step": 1871, "train_info/time_within_train_step": 2.6981241703033447, "step": 1871} +{"train_info/time_between_train_steps": 0.004190921783447266, "step": 1871} +{"info/global_step": 1872, "train_info/time_within_train_step": 2.7012240886688232, "step": 1872} +{"train_info/time_between_train_steps": 0.0041294097900390625, "step": 1872} +{"info/global_step": 1873, "train_info/time_within_train_step": 2.701630115509033, "step": 1873} +{"train_info/time_between_train_steps": 0.0039746761322021484, "step": 1873} +{"info/global_step": 1874, "train_info/time_within_train_step": 2.6978554725646973, "step": 1874} +{"train_info/time_between_train_steps": 0.003991603851318359, "step": 1874} +{"info/global_step": 1875, "train_info/time_within_train_step": 2.699890613555908, "step": 1875} +{"train_info/time_between_train_steps": 0.0040166378021240234, "step": 1875} +{"info/global_step": 1876, "train_info/time_within_train_step": 2.782723903656006, "step": 1876} +{"train_info/time_between_train_steps": 0.0040187835693359375, "step": 1876} +{"info/global_step": 1877, "train_info/time_within_train_step": 2.9378597736358643, "step": 1877} +{"train_info/time_between_train_steps": 0.004198551177978516, "step": 1877} +{"info/global_step": 1878, "train_info/time_within_train_step": 2.8157472610473633, "step": 1878} +{"train_info/time_between_train_steps": 0.004088401794433594, "step": 1878} +{"info/global_step": 1879, "train_info/time_within_train_step": 2.699955940246582, "step": 1879} +{"train_info/time_between_train_steps": 0.004030704498291016, "step": 1879} +{"info/global_step": 1880, "train_info/time_within_train_step": 2.700958490371704, "step": 1880} +{"train_info/time_between_train_steps": 0.004068851470947266, "step": 1880} +{"info/global_step": 1881, "train_info/time_within_train_step": 2.7001094818115234, "step": 1881} +{"train_info/time_between_train_steps": 0.004155874252319336, "step": 1881} +{"info/global_step": 1882, "train_info/time_within_train_step": 2.6997952461242676, "step": 1882} +{"train_info/time_between_train_steps": 0.003987789154052734, "step": 1882} +{"info/global_step": 1883, "train_info/time_within_train_step": 2.6970441341400146, "step": 1883} +{"train_info/time_between_train_steps": 0.0038824081420898438, "step": 1883} +{"info/global_step": 1884, "train_info/time_within_train_step": 2.699277639389038, "step": 1884} +{"train_info/time_between_train_steps": 0.003998756408691406, "step": 1884} +{"info/global_step": 1885, "train_info/time_within_train_step": 2.699583053588867, "step": 1885} +{"train_info/time_between_train_steps": 0.003971099853515625, "step": 1885} +{"info/global_step": 1886, "train_info/time_within_train_step": 2.6988863945007324, "step": 1886} +{"train_info/time_between_train_steps": 0.003940105438232422, "step": 1886} +{"info/global_step": 1887, "train_info/time_within_train_step": 2.6997029781341553, "step": 1887} +{"train_info/time_between_train_steps": 0.003896474838256836, "step": 1887} +{"info/global_step": 1888, "train_info/time_within_train_step": 2.76112961769104, "step": 1888} +{"train_info/time_between_train_steps": 0.004173994064331055, "step": 1888} +{"info/global_step": 1889, "train_info/time_within_train_step": 2.710681676864624, "step": 1889} +{"train_info/time_between_train_steps": 0.003963947296142578, "step": 1889} +{"info/global_step": 1890, "train_info/time_within_train_step": 2.699313163757324, "step": 1890} +{"train_info/time_between_train_steps": 0.003972053527832031, "step": 1890} +{"info/global_step": 1891, "train_info/time_within_train_step": 2.7008988857269287, "step": 1891} +{"train_info/time_between_train_steps": 0.18829965591430664, "step": 1891} +{"info/global_step": 1892, "train_info/time_within_train_step": 2.7002475261688232, "step": 1892} +{"train_info/time_between_train_steps": 0.003805398941040039, "step": 1892} +{"info/global_step": 1893, "train_info/time_within_train_step": 2.7001545429229736, "step": 1893} +{"train_info/time_between_train_steps": 0.003757476806640625, "step": 1893} +{"info/global_step": 1894, "train_info/time_within_train_step": 2.70031476020813, "step": 1894} +{"train_info/time_between_train_steps": 0.003838062286376953, "step": 1894} +{"info/global_step": 1895, "train_info/time_within_train_step": 2.7516725063323975, "step": 1895} +{"train_info/time_between_train_steps": 0.0037877559661865234, "step": 1895} +{"info/global_step": 1896, "train_info/time_within_train_step": 2.8462321758270264, "step": 1896} +{"train_info/time_between_train_steps": 0.0037064552307128906, "step": 1896} +{"info/global_step": 1897, "train_info/time_within_train_step": 2.782310962677002, "step": 1897} +{"train_info/time_between_train_steps": 0.0037250518798828125, "step": 1897} +{"info/global_step": 1898, "train_info/time_within_train_step": 2.7005295753479004, "step": 1898} +{"train_info/time_between_train_steps": 0.0037217140197753906, "step": 1898} +{"info/global_step": 1899, "train_info/time_within_train_step": 2.7020249366760254, "step": 1899} +{"train_info/time_between_train_steps": 0.003936052322387695, "step": 1899} +{"info/global_step": 1900, "train_info/time_within_train_step": 2.703472375869751, "step": 1900} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746291855, "_runtime": 5877}, "step": 1900} +{"logs": {"train/loss": 4.7345, "train/learning_rate": 0.00024444444444444443, "train/epoch": 2.13, "_timestamp": 1746291855, "_runtime": 5877}, "step": 1900} +{"train_info/time_between_train_steps": 32.37481427192688, "step": 1900} +{"info/global_step": 1901, "train_info/time_within_train_step": 2.4780540466308594, "step": 1901} +{"train_info/time_between_train_steps": 0.004073143005371094, "step": 1901} +{"info/global_step": 1902, "train_info/time_within_train_step": 2.484135627746582, "step": 1902} +{"train_info/time_between_train_steps": 0.004002809524536133, "step": 1902} +{"info/global_step": 1903, "train_info/time_within_train_step": 2.649609088897705, "step": 1903} +{"train_info/time_between_train_steps": 0.004048824310302734, "step": 1903} +{"info/global_step": 1904, "train_info/time_within_train_step": 2.7261083126068115, "step": 1904} +{"train_info/time_between_train_steps": 0.004275083541870117, "step": 1904} +{"info/global_step": 1905, "train_info/time_within_train_step": 2.6955747604370117, "step": 1905} +{"train_info/time_between_train_steps": 0.004094362258911133, "step": 1905} +{"info/global_step": 1906, "train_info/time_within_train_step": 2.69592547416687, "step": 1906} +{"train_info/time_between_train_steps": 0.004092216491699219, "step": 1906} +{"info/global_step": 1907, "train_info/time_within_train_step": 2.7012417316436768, "step": 1907} +{"train_info/time_between_train_steps": 0.003929853439331055, "step": 1907} +{"info/global_step": 1908, "train_info/time_within_train_step": 2.697415351867676, "step": 1908} +{"train_info/time_between_train_steps": 0.0039806365966796875, "step": 1908} +{"info/global_step": 1909, "train_info/time_within_train_step": 2.69929575920105, "step": 1909} +{"train_info/time_between_train_steps": 0.004093170166015625, "step": 1909} +{"info/global_step": 1910, "train_info/time_within_train_step": 2.701993465423584, "step": 1910} +{"train_info/time_between_train_steps": 0.004447221755981445, "step": 1910} +{"info/global_step": 1911, "train_info/time_within_train_step": 2.9110069274902344, "step": 1911} +{"train_info/time_between_train_steps": 0.003974437713623047, "step": 1911} +{"info/global_step": 1912, "train_info/time_within_train_step": 3.034802198410034, "step": 1912} +{"train_info/time_between_train_steps": 0.003994941711425781, "step": 1912} +{"info/global_step": 1913, "train_info/time_within_train_step": 2.891242504119873, "step": 1913} +{"train_info/time_between_train_steps": 0.0043027400970458984, "step": 1913} +{"info/global_step": 1914, "train_info/time_within_train_step": 2.697807788848877, "step": 1914} +{"train_info/time_between_train_steps": 0.004085540771484375, "step": 1914} +{"info/global_step": 1915, "train_info/time_within_train_step": 2.697108507156372, "step": 1915} +{"train_info/time_between_train_steps": 0.0039043426513671875, "step": 1915} +{"info/global_step": 1916, "train_info/time_within_train_step": 2.698119640350342, "step": 1916} +{"train_info/time_between_train_steps": 0.004000186920166016, "step": 1916} +{"info/global_step": 1917, "train_info/time_within_train_step": 2.697561740875244, "step": 1917} +{"train_info/time_between_train_steps": 0.004033803939819336, "step": 1917} +{"info/global_step": 1918, "train_info/time_within_train_step": 2.698606252670288, "step": 1918} +{"train_info/time_between_train_steps": 0.004060029983520508, "step": 1918} +{"info/global_step": 1919, "train_info/time_within_train_step": 2.6987125873565674, "step": 1919} +{"train_info/time_between_train_steps": 0.003985881805419922, "step": 1919} +{"info/global_step": 1920, "train_info/time_within_train_step": 2.6977663040161133, "step": 1920} +{"train_info/time_between_train_steps": 0.003953218460083008, "step": 1920} +{"info/global_step": 1921, "train_info/time_within_train_step": 2.6979682445526123, "step": 1921} +{"train_info/time_between_train_steps": 0.003975629806518555, "step": 1921} +{"info/global_step": 1922, "train_info/time_within_train_step": 2.6989099979400635, "step": 1922} +{"train_info/time_between_train_steps": 0.003943920135498047, "step": 1922} +{"info/global_step": 1923, "train_info/time_within_train_step": 2.699769973754883, "step": 1923} +{"train_info/time_between_train_steps": 0.003923177719116211, "step": 1923} +{"info/global_step": 1924, "train_info/time_within_train_step": 2.6976823806762695, "step": 1924} +{"train_info/time_between_train_steps": 0.003916501998901367, "step": 1924} +{"info/global_step": 1925, "train_info/time_within_train_step": 2.6974689960479736, "step": 1925} +{"train_info/time_between_train_steps": 0.004179954528808594, "step": 1925} +{"info/global_step": 1926, "train_info/time_within_train_step": 3.092986822128296, "step": 1926} +{"train_info/time_between_train_steps": 0.0036270618438720703, "step": 1926} +{"info/global_step": 1927, "train_info/time_within_train_step": 2.7049365043640137, "step": 1927} +{"train_info/time_between_train_steps": 0.0037746429443359375, "step": 1927} +{"info/global_step": 1928, "train_info/time_within_train_step": 2.6991612911224365, "step": 1928} +{"train_info/time_between_train_steps": 0.003809690475463867, "step": 1928} +{"info/global_step": 1929, "train_info/time_within_train_step": 2.6981759071350098, "step": 1929} +{"train_info/time_between_train_steps": 0.0036122798919677734, "step": 1929} +{"info/global_step": 1930, "train_info/time_within_train_step": 2.6829724311828613, "step": 1930} +{"train_info/time_between_train_steps": 0.003742218017578125, "step": 1930} +{"info/global_step": 1931, "train_info/time_within_train_step": 2.6950337886810303, "step": 1931} +{"train_info/time_between_train_steps": 0.003810882568359375, "step": 1931} +{"info/global_step": 1932, "train_info/time_within_train_step": 2.697188138961792, "step": 1932} +{"train_info/time_between_train_steps": 0.0041942596435546875, "step": 1932} +{"info/global_step": 1933, "train_info/time_within_train_step": 2.696079730987549, "step": 1933} +{"train_info/time_between_train_steps": 0.004137754440307617, "step": 1933} +{"info/global_step": 1934, "train_info/time_within_train_step": 2.698843479156494, "step": 1934} +{"train_info/time_between_train_steps": 0.0041887760162353516, "step": 1934} +{"info/global_step": 1935, "train_info/time_within_train_step": 2.698693037033081, "step": 1935} +{"train_info/time_between_train_steps": 0.004210948944091797, "step": 1935} +{"info/global_step": 1936, "train_info/time_within_train_step": 2.6972362995147705, "step": 1936} +{"train_info/time_between_train_steps": 0.004166603088378906, "step": 1936} +{"info/global_step": 1937, "train_info/time_within_train_step": 2.698572874069214, "step": 1937} +{"train_info/time_between_train_steps": 0.004110813140869141, "step": 1937} +{"info/global_step": 1938, "train_info/time_within_train_step": 2.6985881328582764, "step": 1938} +{"train_info/time_between_train_steps": 0.0041675567626953125, "step": 1938} +{"info/global_step": 1939, "train_info/time_within_train_step": 2.700110673904419, "step": 1939} +{"train_info/time_between_train_steps": 0.004197359085083008, "step": 1939} +{"info/global_step": 1940, "train_info/time_within_train_step": 2.6992011070251465, "step": 1940} +{"train_info/time_between_train_steps": 0.00410008430480957, "step": 1940} +{"info/global_step": 1941, "train_info/time_within_train_step": 2.7007389068603516, "step": 1941} +{"train_info/time_between_train_steps": 0.004227399826049805, "step": 1941} +{"info/global_step": 1942, "train_info/time_within_train_step": 2.700220823287964, "step": 1942} +{"train_info/time_between_train_steps": 0.004178047180175781, "step": 1942} +{"info/global_step": 1943, "train_info/time_within_train_step": 2.7005741596221924, "step": 1943} +{"train_info/time_between_train_steps": 0.004098415374755859, "step": 1943} +{"info/global_step": 1944, "train_info/time_within_train_step": 2.7012267112731934, "step": 1944} +{"train_info/time_between_train_steps": 0.0041561126708984375, "step": 1944} +{"info/global_step": 1945, "train_info/time_within_train_step": 2.7020702362060547, "step": 1945} +{"train_info/time_between_train_steps": 0.004896402359008789, "step": 1945} +{"info/global_step": 1946, "train_info/time_within_train_step": 2.7002158164978027, "step": 1946} +{"train_info/time_between_train_steps": 0.003993511199951172, "step": 1946} +{"info/global_step": 1947, "train_info/time_within_train_step": 2.7017462253570557, "step": 1947} +{"train_info/time_between_train_steps": 0.004243612289428711, "step": 1947} +{"info/global_step": 1948, "train_info/time_within_train_step": 2.832879066467285, "step": 1948} +{"train_info/time_between_train_steps": 0.004021167755126953, "step": 1948} +{"info/global_step": 1949, "train_info/time_within_train_step": 3.0857083797454834, "step": 1949} +{"train_info/time_between_train_steps": 0.004213094711303711, "step": 1949} +{"info/global_step": 1950, "train_info/time_within_train_step": 2.757119655609131, "step": 1950} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746292036, "_runtime": 6058}, "step": 1950} +{"logs": {"train/loss": 4.7142, "train/learning_rate": 0.0002333333333333333, "train/epoch": 2.14, "_timestamp": 1746292036, "_runtime": 6058}, "step": 1950} +{"train_info/time_between_train_steps": 0.3502810001373291, "step": 1950} +{"info/global_step": 1951, "train_info/time_within_train_step": 2.6982405185699463, "step": 1951} +{"train_info/time_between_train_steps": 0.004049539566040039, "step": 1951} +{"info/global_step": 1952, "train_info/time_within_train_step": 2.6983420848846436, "step": 1952} +{"train_info/time_between_train_steps": 0.0040531158447265625, "step": 1952} +{"info/global_step": 1953, "train_info/time_within_train_step": 2.698575019836426, "step": 1953} +{"train_info/time_between_train_steps": 0.0039653778076171875, "step": 1953} +{"info/global_step": 1954, "train_info/time_within_train_step": 2.758727788925171, "step": 1954} +{"train_info/time_between_train_steps": 0.0037610530853271484, "step": 1954} +{"info/global_step": 1955, "train_info/time_within_train_step": 2.698974609375, "step": 1955} +{"train_info/time_between_train_steps": 0.003713846206665039, "step": 1955} +{"info/global_step": 1956, "train_info/time_within_train_step": 2.6972827911376953, "step": 1956} +{"train_info/time_between_train_steps": 0.003858327865600586, "step": 1956} +{"info/global_step": 1957, "train_info/time_within_train_step": 2.69994854927063, "step": 1957} +{"train_info/time_between_train_steps": 0.003858804702758789, "step": 1957} +{"info/global_step": 1958, "train_info/time_within_train_step": 2.697941303253174, "step": 1958} +{"train_info/time_between_train_steps": 0.0037665367126464844, "step": 1958} +{"info/global_step": 1959, "train_info/time_within_train_step": 2.699681282043457, "step": 1959} +{"train_info/time_between_train_steps": 0.0037794113159179688, "step": 1959} +{"info/global_step": 1960, "train_info/time_within_train_step": 2.6990463733673096, "step": 1960} +{"train_info/time_between_train_steps": 0.003956317901611328, "step": 1960} +{"info/global_step": 1961, "train_info/time_within_train_step": 2.6998138427734375, "step": 1961} +{"train_info/time_between_train_steps": 0.003751993179321289, "step": 1961} +{"info/global_step": 1962, "train_info/time_within_train_step": 3.0053911209106445, "step": 1962} +{"train_info/time_between_train_steps": 0.0038738250732421875, "step": 1962} +{"info/global_step": 1963, "train_info/time_within_train_step": 2.6980581283569336, "step": 1963} +{"train_info/time_between_train_steps": 0.003509044647216797, "step": 1963} +{"info/global_step": 1964, "train_info/time_within_train_step": 2.6974689960479736, "step": 1964} +{"train_info/time_between_train_steps": 0.00405120849609375, "step": 1964} +{"info/global_step": 1965, "train_info/time_within_train_step": 2.698328971862793, "step": 1965} +{"train_info/time_between_train_steps": 0.0036787986755371094, "step": 1965} +{"info/global_step": 1966, "train_info/time_within_train_step": 3.07786226272583, "step": 1966} +{"train_info/time_between_train_steps": 0.004065990447998047, "step": 1966} +{"info/global_step": 1967, "train_info/time_within_train_step": 2.6983096599578857, "step": 1967} +{"train_info/time_between_train_steps": 0.0034301280975341797, "step": 1967} +{"info/global_step": 1968, "train_info/time_within_train_step": 2.6965272426605225, "step": 1968} +{"train_info/time_between_train_steps": 0.003292083740234375, "step": 1968} +{"info/global_step": 1969, "train_info/time_within_train_step": 2.696913480758667, "step": 1969} +{"train_info/time_between_train_steps": 0.0033075809478759766, "step": 1969} +{"info/global_step": 1970, "train_info/time_within_train_step": 2.699211359024048, "step": 1970} +{"train_info/time_between_train_steps": 0.0034465789794921875, "step": 1970} +{"info/global_step": 1971, "train_info/time_within_train_step": 2.6997108459472656, "step": 1971} +{"train_info/time_between_train_steps": 0.0036857128143310547, "step": 1971} +{"info/global_step": 1972, "train_info/time_within_train_step": 2.6978559494018555, "step": 1972} +{"train_info/time_between_train_steps": 0.003681182861328125, "step": 1972} +{"info/global_step": 1973, "train_info/time_within_train_step": 2.6985886096954346, "step": 1973} +{"train_info/time_between_train_steps": 0.0035665035247802734, "step": 1973} +{"info/global_step": 1974, "train_info/time_within_train_step": 2.696857452392578, "step": 1974} +{"train_info/time_between_train_steps": 0.0037055015563964844, "step": 1974} +{"info/global_step": 1975, "train_info/time_within_train_step": 2.6980133056640625, "step": 1975} +{"train_info/time_between_train_steps": 0.0035142898559570312, "step": 1975} +{"info/global_step": 1976, "train_info/time_within_train_step": 2.6985998153686523, "step": 1976} +{"train_info/time_between_train_steps": 0.003676891326904297, "step": 1976} +{"info/global_step": 1977, "train_info/time_within_train_step": 2.699105978012085, "step": 1977} +{"train_info/time_between_train_steps": 0.0036597251892089844, "step": 1977} +{"info/global_step": 1978, "train_info/time_within_train_step": 2.698054075241089, "step": 1978} +{"train_info/time_between_train_steps": 0.0034797191619873047, "step": 1978} +{"info/global_step": 1979, "train_info/time_within_train_step": 2.698204278945923, "step": 1979} +{"train_info/time_between_train_steps": 0.003502368927001953, "step": 1979} +{"info/global_step": 1980, "train_info/time_within_train_step": 2.701361894607544, "step": 1980} +{"train_info/time_between_train_steps": 0.0036389827728271484, "step": 1980} +{"info/global_step": 1981, "train_info/time_within_train_step": 2.741128921508789, "step": 1981} +{"train_info/time_between_train_steps": 0.003551006317138672, "step": 1981} +{"info/global_step": 1982, "train_info/time_within_train_step": 2.9574623107910156, "step": 1982} +{"train_info/time_between_train_steps": 0.00357818603515625, "step": 1982} +{"info/global_step": 1983, "train_info/time_within_train_step": 2.9922335147857666, "step": 1983} +{"train_info/time_between_train_steps": 0.003639698028564453, "step": 1983} +{"info/global_step": 1984, "train_info/time_within_train_step": 2.6950020790100098, "step": 1984} +{"train_info/time_between_train_steps": 0.003661632537841797, "step": 1984} +{"info/global_step": 1985, "train_info/time_within_train_step": 2.6954424381256104, "step": 1985} +{"train_info/time_between_train_steps": 0.0035109519958496094, "step": 1985} +{"info/global_step": 1986, "train_info/time_within_train_step": 2.6973583698272705, "step": 1986} +{"train_info/time_between_train_steps": 0.0035736560821533203, "step": 1986} +{"info/global_step": 1987, "train_info/time_within_train_step": 2.6968154907226562, "step": 1987} +{"train_info/time_between_train_steps": 0.0035903453826904297, "step": 1987} +{"info/global_step": 1988, "train_info/time_within_train_step": 2.8428752422332764, "step": 1988} +{"train_info/time_between_train_steps": 0.003675222396850586, "step": 1988} +{"info/global_step": 1989, "train_info/time_within_train_step": 2.6969192028045654, "step": 1989} +{"train_info/time_between_train_steps": 0.003704071044921875, "step": 1989} +{"info/global_step": 1990, "train_info/time_within_train_step": 2.6983540058135986, "step": 1990} +{"train_info/time_between_train_steps": 0.0036885738372802734, "step": 1990} +{"info/global_step": 1991, "train_info/time_within_train_step": 2.698004722595215, "step": 1991} +{"train_info/time_between_train_steps": 0.0035991668701171875, "step": 1991} +{"info/global_step": 1992, "train_info/time_within_train_step": 2.7000579833984375, "step": 1992} +{"train_info/time_between_train_steps": 0.003649473190307617, "step": 1992} +{"info/global_step": 1993, "train_info/time_within_train_step": 2.6995973587036133, "step": 1993} +{"train_info/time_between_train_steps": 0.0036695003509521484, "step": 1993} +{"info/global_step": 1994, "train_info/time_within_train_step": 2.697277784347534, "step": 1994} +{"train_info/time_between_train_steps": 0.0036199092864990234, "step": 1994} +{"info/global_step": 1995, "train_info/time_within_train_step": 2.6980016231536865, "step": 1995} +{"train_info/time_between_train_steps": 0.0036132335662841797, "step": 1995} +{"info/global_step": 1996, "train_info/time_within_train_step": 2.6982340812683105, "step": 1996} +{"train_info/time_between_train_steps": 0.003671884536743164, "step": 1996} +{"info/global_step": 1997, "train_info/time_within_train_step": 2.6997764110565186, "step": 1997} +{"train_info/time_between_train_steps": 0.0038862228393554688, "step": 1997} +{"info/global_step": 1998, "train_info/time_within_train_step": 2.6989119052886963, "step": 1998} +{"train_info/time_between_train_steps": 0.0036051273345947266, "step": 1998} +{"info/global_step": 1999, "train_info/time_within_train_step": 3.302065134048462, "step": 1999} +{"train_info/time_between_train_steps": 0.0036067962646484375, "step": 1999} +{"info/global_step": 2000, "train_info/time_within_train_step": 2.696369171142578, "step": 2000} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746292182, "_runtime": 6204}, "step": 2000} +{"logs": {"train/loss": 4.6988, "train/learning_rate": 0.00022222222222222218, "train/epoch": 2.16, "_timestamp": 1746292182, "_runtime": 6204}, "step": 2000} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746292187, "_runtime": 6209}, "step": 2000} +{"logs": {"eval/loss": 5.084012985229492, "eval/runtime": 5.3939, "eval/samples_per_second": 33.742, "eval/steps_per_second": 1.112, "train/epoch": 2.16, "_timestamp": 1746292187, "_runtime": 6209}, "step": 2000} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746292187, "_runtime": 6209}, "step": 2000} +{"logs": {"eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_loss": 5.084012985229492, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_ppl": 161.42053613050612, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_runtime": 5.3939, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_samples_per_second": 33.742, "train/epoch": 2.16, "_timestamp": 1746292187, "_runtime": 6209}, "step": 2000} +{"train_info/time_between_train_steps": 38.94654321670532, "step": 2000} +{"info/global_step": 2001, "train_info/time_within_train_step": 2.483752727508545, "step": 2001} +{"train_info/time_between_train_steps": 0.0036268234252929688, "step": 2001} +{"info/global_step": 2002, "train_info/time_within_train_step": 2.4803123474121094, "step": 2002} +{"train_info/time_between_train_steps": 0.003620147705078125, "step": 2002} +{"info/global_step": 2003, "train_info/time_within_train_step": 2.6496596336364746, "step": 2003} +{"train_info/time_between_train_steps": 0.0036585330963134766, "step": 2003} +{"info/global_step": 2004, "train_info/time_within_train_step": 2.6927056312561035, "step": 2004} +{"train_info/time_between_train_steps": 0.003534078598022461, "step": 2004} +{"info/global_step": 2005, "train_info/time_within_train_step": 2.6941134929656982, "step": 2005} +{"train_info/time_between_train_steps": 0.003527402877807617, "step": 2005} +{"info/global_step": 2006, "train_info/time_within_train_step": 2.6969218254089355, "step": 2006} +{"train_info/time_between_train_steps": 0.0037381649017333984, "step": 2006} +{"info/global_step": 2007, "train_info/time_within_train_step": 2.6968295574188232, "step": 2007} +{"train_info/time_between_train_steps": 0.003657102584838867, "step": 2007} +{"info/global_step": 2008, "train_info/time_within_train_step": 2.698641777038574, "step": 2008} +{"train_info/time_between_train_steps": 0.0036504268646240234, "step": 2008} +{"info/global_step": 2009, "train_info/time_within_train_step": 2.6977901458740234, "step": 2009} +{"train_info/time_between_train_steps": 0.003515005111694336, "step": 2009} +{"info/global_step": 2010, "train_info/time_within_train_step": 2.737373113632202, "step": 2010} +{"train_info/time_between_train_steps": 0.003596782684326172, "step": 2010} +{"info/global_step": 2011, "train_info/time_within_train_step": 2.8304264545440674, "step": 2011} +{"train_info/time_between_train_steps": 0.0036115646362304688, "step": 2011} +{"info/global_step": 2012, "train_info/time_within_train_step": 3.0314102172851562, "step": 2012} +{"train_info/time_between_train_steps": 0.0036389827728271484, "step": 2012} +{"info/global_step": 2013, "train_info/time_within_train_step": 2.7663979530334473, "step": 2013} +{"train_info/time_between_train_steps": 0.003601551055908203, "step": 2013} +{"info/global_step": 2014, "train_info/time_within_train_step": 2.7039613723754883, "step": 2014} +{"train_info/time_between_train_steps": 0.004017353057861328, "step": 2014} +{"info/global_step": 2015, "train_info/time_within_train_step": 2.701646089553833, "step": 2015} +{"train_info/time_between_train_steps": 0.0038042068481445312, "step": 2015} +{"info/global_step": 2016, "train_info/time_within_train_step": 2.7018282413482666, "step": 2016} +{"train_info/time_between_train_steps": 0.003749847412109375, "step": 2016} +{"info/global_step": 2017, "train_info/time_within_train_step": 2.7007999420166016, "step": 2017} +{"train_info/time_between_train_steps": 0.0036568641662597656, "step": 2017} +{"info/global_step": 2018, "train_info/time_within_train_step": 2.696678638458252, "step": 2018} +{"train_info/time_between_train_steps": 0.003701925277709961, "step": 2018} +{"info/global_step": 2019, "train_info/time_within_train_step": 2.6973330974578857, "step": 2019} +{"train_info/time_between_train_steps": 0.0036890506744384766, "step": 2019} +{"info/global_step": 2020, "train_info/time_within_train_step": 2.7008397579193115, "step": 2020} +{"train_info/time_between_train_steps": 0.0037889480590820312, "step": 2020} +{"info/global_step": 2021, "train_info/time_within_train_step": 2.702458381652832, "step": 2021} +{"train_info/time_between_train_steps": 0.003991603851318359, "step": 2021} +{"info/global_step": 2022, "train_info/time_within_train_step": 2.7509663105010986, "step": 2022} +{"train_info/time_between_train_steps": 0.003693103790283203, "step": 2022} +{"info/global_step": 2023, "train_info/time_within_train_step": 2.7001636028289795, "step": 2023} +{"train_info/time_between_train_steps": 0.0037255287170410156, "step": 2023} +{"info/global_step": 2024, "train_info/time_within_train_step": 2.6987144947052, "step": 2024} +{"train_info/time_between_train_steps": 0.00363922119140625, "step": 2024} +{"info/global_step": 2025, "train_info/time_within_train_step": 2.6974985599517822, "step": 2025} +{"train_info/time_between_train_steps": 0.003630399703979492, "step": 2025} +{"info/global_step": 2026, "train_info/time_within_train_step": 2.699629068374634, "step": 2026} +{"train_info/time_between_train_steps": 0.00362396240234375, "step": 2026} +{"info/global_step": 2027, "train_info/time_within_train_step": 3.0233078002929688, "step": 2027} +{"train_info/time_between_train_steps": 0.0033943653106689453, "step": 2027} +{"info/global_step": 2028, "train_info/time_within_train_step": 2.69966983795166, "step": 2028} +{"train_info/time_between_train_steps": 0.0036351680755615234, "step": 2028} +{"info/global_step": 2029, "train_info/time_within_train_step": 2.701233386993408, "step": 2029} +{"train_info/time_between_train_steps": 0.0037224292755126953, "step": 2029} +{"info/global_step": 2030, "train_info/time_within_train_step": 2.697023391723633, "step": 2030} +{"train_info/time_between_train_steps": 0.003564596176147461, "step": 2030} +{"info/global_step": 2031, "train_info/time_within_train_step": 2.702725648880005, "step": 2031} +{"train_info/time_between_train_steps": 0.003579854965209961, "step": 2031} +{"info/global_step": 2032, "train_info/time_within_train_step": 2.6973965167999268, "step": 2032} +{"train_info/time_between_train_steps": 0.003650665283203125, "step": 2032} +{"info/global_step": 2033, "train_info/time_within_train_step": 2.6974244117736816, "step": 2033} +{"train_info/time_between_train_steps": 0.0035436153411865234, "step": 2033} +{"info/global_step": 2034, "train_info/time_within_train_step": 2.6976354122161865, "step": 2034} +{"train_info/time_between_train_steps": 0.0036211013793945312, "step": 2034} +{"info/global_step": 2035, "train_info/time_within_train_step": 2.697993516921997, "step": 2035} +{"train_info/time_between_train_steps": 0.0035305023193359375, "step": 2035} +{"info/global_step": 2036, "train_info/time_within_train_step": 2.6998698711395264, "step": 2036} +{"train_info/time_between_train_steps": 0.0035266876220703125, "step": 2036} +{"info/global_step": 2037, "train_info/time_within_train_step": 2.6995697021484375, "step": 2037} +{"train_info/time_between_train_steps": 0.003545522689819336, "step": 2037} +{"info/global_step": 2038, "train_info/time_within_train_step": 2.700845956802368, "step": 2038} +{"train_info/time_between_train_steps": 0.003701448440551758, "step": 2038} +{"info/global_step": 2039, "train_info/time_within_train_step": 2.698688268661499, "step": 2039} +{"train_info/time_between_train_steps": 0.0035872459411621094, "step": 2039} +{"info/global_step": 2040, "train_info/time_within_train_step": 2.6992242336273193, "step": 2040} +{"train_info/time_between_train_steps": 0.003675699234008789, "step": 2040} +{"info/global_step": 2041, "train_info/time_within_train_step": 2.69851016998291, "step": 2041} +{"train_info/time_between_train_steps": 0.003618001937866211, "step": 2041} +{"info/global_step": 2042, "train_info/time_within_train_step": 2.698399066925049, "step": 2042} +{"train_info/time_between_train_steps": 0.003534555435180664, "step": 2042} +{"info/global_step": 2043, "train_info/time_within_train_step": 2.7001914978027344, "step": 2043} +{"train_info/time_between_train_steps": 0.003698587417602539, "step": 2043} +{"info/global_step": 2044, "train_info/time_within_train_step": 2.697002410888672, "step": 2044} +{"train_info/time_between_train_steps": 0.0035424232482910156, "step": 2044} +{"info/global_step": 2045, "train_info/time_within_train_step": 2.697186231613159, "step": 2045} +{"train_info/time_between_train_steps": 0.0036008358001708984, "step": 2045} +{"info/global_step": 2046, "train_info/time_within_train_step": 2.6988208293914795, "step": 2046} +{"train_info/time_between_train_steps": 0.003674745559692383, "step": 2046} +{"info/global_step": 2047, "train_info/time_within_train_step": 2.6959996223449707, "step": 2047} +{"train_info/time_between_train_steps": 0.0037713050842285156, "step": 2047} +{"info/global_step": 2048, "train_info/time_within_train_step": 2.6970133781433105, "step": 2048} +{"train_info/time_between_train_steps": 0.003773212432861328, "step": 2048} +{"info/global_step": 2049, "train_info/time_within_train_step": 2.6996665000915527, "step": 2049} +{"train_info/time_between_train_steps": 0.0037033557891845703, "step": 2049} +{"info/global_step": 2050, "train_info/time_within_train_step": 2.700157403945923, "step": 2050} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746292366, "_runtime": 6388}, "step": 2050} +{"logs": {"train/loss": 4.6722, "train/learning_rate": 0.0002111111111111111, "train/epoch": 2.18, "_timestamp": 1746292366, "_runtime": 6388}, "step": 2050} +{"train_info/time_between_train_steps": 0.025905132293701172, "step": 2050} +{"info/global_step": 2051, "train_info/time_within_train_step": 2.700725555419922, "step": 2051} +{"train_info/time_between_train_steps": 0.004507780075073242, "step": 2051} +{"info/global_step": 2052, "train_info/time_within_train_step": 2.6994614601135254, "step": 2052} +{"train_info/time_between_train_steps": 0.0035610198974609375, "step": 2052} +{"info/global_step": 2053, "train_info/time_within_train_step": 2.6988131999969482, "step": 2053} +{"train_info/time_between_train_steps": 0.003454446792602539, "step": 2053} +{"info/global_step": 2054, "train_info/time_within_train_step": 2.695707321166992, "step": 2054} +{"train_info/time_between_train_steps": 0.0035369396209716797, "step": 2054} +{"info/global_step": 2055, "train_info/time_within_train_step": 2.753135919570923, "step": 2055} +{"train_info/time_between_train_steps": 0.003492116928100586, "step": 2055} +{"info/global_step": 2056, "train_info/time_within_train_step": 2.6961987018585205, "step": 2056} +{"train_info/time_between_train_steps": 0.0036592483520507812, "step": 2056} +{"info/global_step": 2057, "train_info/time_within_train_step": 2.699873208999634, "step": 2057} +{"train_info/time_between_train_steps": 0.003655672073364258, "step": 2057} +{"info/global_step": 2058, "train_info/time_within_train_step": 2.6972899436950684, "step": 2058} +{"train_info/time_between_train_steps": 0.0035715103149414062, "step": 2058} +{"info/global_step": 2059, "train_info/time_within_train_step": 2.6967313289642334, "step": 2059} +{"train_info/time_between_train_steps": 0.003739595413208008, "step": 2059} +{"info/global_step": 2060, "train_info/time_within_train_step": 2.696899652481079, "step": 2060} +{"train_info/time_between_train_steps": 0.003623485565185547, "step": 2060} +{"info/global_step": 2061, "train_info/time_within_train_step": 2.69732928276062, "step": 2061} +{"train_info/time_between_train_steps": 0.0035293102264404297, "step": 2061} +{"info/global_step": 2062, "train_info/time_within_train_step": 3.1073720455169678, "step": 2062} +{"train_info/time_between_train_steps": 0.003531217575073242, "step": 2062} +{"info/global_step": 2063, "train_info/time_within_train_step": 2.6996335983276367, "step": 2063} +{"train_info/time_between_train_steps": 0.0036211013793945312, "step": 2063} +{"info/global_step": 2064, "train_info/time_within_train_step": 2.6982812881469727, "step": 2064} +{"train_info/time_between_train_steps": 0.0035665035247802734, "step": 2064} +{"info/global_step": 2065, "train_info/time_within_train_step": 2.6997382640838623, "step": 2065} +{"train_info/time_between_train_steps": 0.003718852996826172, "step": 2065} +{"info/global_step": 2066, "train_info/time_within_train_step": 2.6994881629943848, "step": 2066} +{"train_info/time_between_train_steps": 0.0036411285400390625, "step": 2066} +{"info/global_step": 2067, "train_info/time_within_train_step": 2.6997876167297363, "step": 2067} +{"train_info/time_between_train_steps": 0.003609180450439453, "step": 2067} +{"info/global_step": 2068, "train_info/time_within_train_step": 2.698680877685547, "step": 2068} +{"train_info/time_between_train_steps": 0.003597259521484375, "step": 2068} +{"info/global_step": 2069, "train_info/time_within_train_step": 2.6979868412017822, "step": 2069} +{"train_info/time_between_train_steps": 0.0035250186920166016, "step": 2069} +{"info/global_step": 2070, "train_info/time_within_train_step": 2.698803663253784, "step": 2070} +{"train_info/time_between_train_steps": 0.0035676956176757812, "step": 2070} +{"info/global_step": 2071, "train_info/time_within_train_step": 2.697136402130127, "step": 2071} +{"train_info/time_between_train_steps": 0.0035445690155029297, "step": 2071} +{"info/global_step": 2072, "train_info/time_within_train_step": 2.6990246772766113, "step": 2072} +{"train_info/time_between_train_steps": 0.0035147666931152344, "step": 2072} +{"info/global_step": 2073, "train_info/time_within_train_step": 2.696735143661499, "step": 2073} +{"train_info/time_between_train_steps": 0.003586292266845703, "step": 2073} +{"info/global_step": 2074, "train_info/time_within_train_step": 2.699333906173706, "step": 2074} +{"train_info/time_between_train_steps": 0.003589630126953125, "step": 2074} +{"info/global_step": 2075, "train_info/time_within_train_step": 2.7129886150360107, "step": 2075} +{"train_info/time_between_train_steps": 0.0035614967346191406, "step": 2075} +{"info/global_step": 2076, "train_info/time_within_train_step": 2.698181629180908, "step": 2076} +{"train_info/time_between_train_steps": 0.0035469532012939453, "step": 2076} +{"info/global_step": 2077, "train_info/time_within_train_step": 2.6985673904418945, "step": 2077} +{"train_info/time_between_train_steps": 0.003537416458129883, "step": 2077} +{"info/global_step": 2078, "train_info/time_within_train_step": 2.738327980041504, "step": 2078} +{"train_info/time_between_train_steps": 0.003596067428588867, "step": 2078} +{"info/global_step": 2079, "train_info/time_within_train_step": 2.9998185634613037, "step": 2079} +{"train_info/time_between_train_steps": 0.003532886505126953, "step": 2079} +{"info/global_step": 2080, "train_info/time_within_train_step": 2.848392963409424, "step": 2080} +{"train_info/time_between_train_steps": 0.0036067962646484375, "step": 2080} +{"info/global_step": 2081, "train_info/time_within_train_step": 2.698169231414795, "step": 2081} +{"train_info/time_between_train_steps": 0.0035114288330078125, "step": 2081} +{"info/global_step": 2082, "train_info/time_within_train_step": 2.6983189582824707, "step": 2082} +{"train_info/time_between_train_steps": 0.003557443618774414, "step": 2082} +{"info/global_step": 2083, "train_info/time_within_train_step": 2.7002508640289307, "step": 2083} +{"train_info/time_between_train_steps": 0.004889965057373047, "step": 2083} +{"info/global_step": 2084, "train_info/time_within_train_step": 2.697110891342163, "step": 2084} +{"train_info/time_between_train_steps": 0.006970405578613281, "step": 2084} +{"info/global_step": 2085, "train_info/time_within_train_step": 2.6991074085235596, "step": 2085} +{"train_info/time_between_train_steps": 0.0035657882690429688, "step": 2085} +{"info/global_step": 2086, "train_info/time_within_train_step": 2.6998519897460938, "step": 2086} +{"train_info/time_between_train_steps": 0.007054328918457031, "step": 2086} +{"info/global_step": 2087, "train_info/time_within_train_step": 2.700031042098999, "step": 2087} +{"train_info/time_between_train_steps": 0.0070171356201171875, "step": 2087} +{"info/global_step": 2088, "train_info/time_within_train_step": 2.6988019943237305, "step": 2088} +{"train_info/time_between_train_steps": 0.006996870040893555, "step": 2088} +{"info/global_step": 2089, "train_info/time_within_train_step": 2.699618339538574, "step": 2089} +{"train_info/time_between_train_steps": 0.003640890121459961, "step": 2089} +{"info/global_step": 2090, "train_info/time_within_train_step": 2.699979543685913, "step": 2090} +{"train_info/time_between_train_steps": 0.0036666393280029297, "step": 2090} +{"info/global_step": 2091, "train_info/time_within_train_step": 2.6997008323669434, "step": 2091} +{"train_info/time_between_train_steps": 0.003527402877807617, "step": 2091} +{"info/global_step": 2092, "train_info/time_within_train_step": 2.700310230255127, "step": 2092} +{"train_info/time_between_train_steps": 0.003720998764038086, "step": 2092} +{"info/global_step": 2093, "train_info/time_within_train_step": 2.6988399028778076, "step": 2093} +{"train_info/time_between_train_steps": 0.003943681716918945, "step": 2093} +{"info/global_step": 2094, "train_info/time_within_train_step": 2.698538303375244, "step": 2094} +{"train_info/time_between_train_steps": 0.003529787063598633, "step": 2094} +{"info/global_step": 2095, "train_info/time_within_train_step": 2.7006731033325195, "step": 2095} +{"train_info/time_between_train_steps": 0.0036199092864990234, "step": 2095} +{"info/global_step": 2096, "train_info/time_within_train_step": 2.713998794555664, "step": 2096} +{"train_info/time_between_train_steps": 0.003687143325805664, "step": 2096} +{"info/global_step": 2097, "train_info/time_within_train_step": 2.6993415355682373, "step": 2097} +{"train_info/time_between_train_steps": 0.0034651756286621094, "step": 2097} +{"info/global_step": 2098, "train_info/time_within_train_step": 2.699451446533203, "step": 2098} +{"train_info/time_between_train_steps": 0.003560304641723633, "step": 2098} +{"info/global_step": 2099, "train_info/time_within_train_step": 2.712838649749756, "step": 2099} +{"train_info/time_between_train_steps": 0.0035140514373779297, "step": 2099} +{"info/global_step": 2100, "train_info/time_within_train_step": 2.7548160552978516, "step": 2100} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746292511, "_runtime": 6533}, "step": 2100} +{"logs": {"train/loss": 4.6452, "train/learning_rate": 0.00019999999999999998, "train/epoch": 2.19, "_timestamp": 1746292511, "_runtime": 6533}, "step": 2100} +{"train_info/time_between_train_steps": 33.232171058654785, "step": 2100} +{"info/global_step": 2101, "train_info/time_within_train_step": 2.4829094409942627, "step": 2101} +{"train_info/time_between_train_steps": 0.003705263137817383, "step": 2101} +{"info/global_step": 2102, "train_info/time_within_train_step": 2.4720537662506104, "step": 2102} +{"train_info/time_between_train_steps": 0.003627777099609375, "step": 2102} +{"info/global_step": 2103, "train_info/time_within_train_step": 2.621704339981079, "step": 2103} +{"train_info/time_between_train_steps": 0.00353240966796875, "step": 2103} +{"info/global_step": 2104, "train_info/time_within_train_step": 2.6914334297180176, "step": 2104} +{"train_info/time_between_train_steps": 0.0038461685180664062, "step": 2104} +{"info/global_step": 2105, "train_info/time_within_train_step": 2.6932260990142822, "step": 2105} +{"train_info/time_between_train_steps": 0.003727436065673828, "step": 2105} +{"info/global_step": 2106, "train_info/time_within_train_step": 2.767148971557617, "step": 2106} +{"train_info/time_between_train_steps": 0.0038030147552490234, "step": 2106} +{"info/global_step": 2107, "train_info/time_within_train_step": 2.6967482566833496, "step": 2107} +{"train_info/time_between_train_steps": 0.003771066665649414, "step": 2107} +{"info/global_step": 2108, "train_info/time_within_train_step": 2.698627471923828, "step": 2108} +{"train_info/time_between_train_steps": 0.0037577152252197266, "step": 2108} +{"info/global_step": 2109, "train_info/time_within_train_step": 2.698457717895508, "step": 2109} +{"train_info/time_between_train_steps": 0.00385284423828125, "step": 2109} +{"info/global_step": 2110, "train_info/time_within_train_step": 2.6997714042663574, "step": 2110} +{"train_info/time_between_train_steps": 0.003701925277709961, "step": 2110} +{"info/global_step": 2111, "train_info/time_within_train_step": 2.976100206375122, "step": 2111} +{"train_info/time_between_train_steps": 0.0036268234252929688, "step": 2111} +{"info/global_step": 2112, "train_info/time_within_train_step": 2.8985140323638916, "step": 2112} +{"train_info/time_between_train_steps": 0.003902912139892578, "step": 2112} +{"info/global_step": 2113, "train_info/time_within_train_step": 2.8019447326660156, "step": 2113} +{"train_info/time_between_train_steps": 0.0038957595825195312, "step": 2113} +{"info/global_step": 2114, "train_info/time_within_train_step": 2.701409339904785, "step": 2114} +{"train_info/time_between_train_steps": 0.0037195682525634766, "step": 2114} +{"info/global_step": 2115, "train_info/time_within_train_step": 2.7016782760620117, "step": 2115} +{"train_info/time_between_train_steps": 0.003850698471069336, "step": 2115} +{"info/global_step": 2116, "train_info/time_within_train_step": 2.7003173828125, "step": 2116} +{"train_info/time_between_train_steps": 0.0040094852447509766, "step": 2116} +{"info/global_step": 2117, "train_info/time_within_train_step": 2.702977180480957, "step": 2117} +{"train_info/time_between_train_steps": 0.0037381649017333984, "step": 2117} +{"info/global_step": 2118, "train_info/time_within_train_step": 2.700289487838745, "step": 2118} +{"train_info/time_between_train_steps": 0.003690481185913086, "step": 2118} +{"info/global_step": 2119, "train_info/time_within_train_step": 2.701930284500122, "step": 2119} +{"train_info/time_between_train_steps": 0.003909587860107422, "step": 2119} +{"info/global_step": 2120, "train_info/time_within_train_step": 2.7024784088134766, "step": 2120} +{"train_info/time_between_train_steps": 0.0037338733673095703, "step": 2120} +{"info/global_step": 2121, "train_info/time_within_train_step": 2.7015178203582764, "step": 2121} +{"train_info/time_between_train_steps": 0.0037567615509033203, "step": 2121} +{"info/global_step": 2122, "train_info/time_within_train_step": 2.9023635387420654, "step": 2122} +{"train_info/time_between_train_steps": 0.0037610530853271484, "step": 2122} +{"info/global_step": 2123, "train_info/time_within_train_step": 2.781358242034912, "step": 2123} +{"train_info/time_between_train_steps": 0.0039446353912353516, "step": 2123} +{"info/global_step": 2124, "train_info/time_within_train_step": 2.699862003326416, "step": 2124} +{"train_info/time_between_train_steps": 0.003805398941040039, "step": 2124} +{"info/global_step": 2125, "train_info/time_within_train_step": 2.6997604370117188, "step": 2125} +{"train_info/time_between_train_steps": 0.0037822723388671875, "step": 2125} +{"info/global_step": 2126, "train_info/time_within_train_step": 2.6985485553741455, "step": 2126} +{"train_info/time_between_train_steps": 0.003773212432861328, "step": 2126} +{"info/global_step": 2127, "train_info/time_within_train_step": 2.8126888275146484, "step": 2127} +{"train_info/time_between_train_steps": 0.003757953643798828, "step": 2127} +{"info/global_step": 2128, "train_info/time_within_train_step": 2.6999523639678955, "step": 2128} +{"train_info/time_between_train_steps": 0.0037488937377929688, "step": 2128} +{"info/global_step": 2129, "train_info/time_within_train_step": 2.6997063159942627, "step": 2129} +{"train_info/time_between_train_steps": 0.003829479217529297, "step": 2129} +{"info/global_step": 2130, "train_info/time_within_train_step": 2.699068784713745, "step": 2130} +{"train_info/time_between_train_steps": 0.0037190914154052734, "step": 2130} +{"info/global_step": 2131, "train_info/time_within_train_step": 2.698725700378418, "step": 2131} +{"train_info/time_between_train_steps": 0.003694295883178711, "step": 2131} +{"info/global_step": 2132, "train_info/time_within_train_step": 2.700033664703369, "step": 2132} +{"train_info/time_between_train_steps": 0.003673076629638672, "step": 2132} +{"info/global_step": 2133, "train_info/time_within_train_step": 2.7003729343414307, "step": 2133} +{"train_info/time_between_train_steps": 0.0036945343017578125, "step": 2133} +{"info/global_step": 2134, "train_info/time_within_train_step": 2.6988701820373535, "step": 2134} +{"train_info/time_between_train_steps": 0.0041539669036865234, "step": 2134} +{"info/global_step": 2135, "train_info/time_within_train_step": 2.736644983291626, "step": 2135} +{"train_info/time_between_train_steps": 0.0037665367126464844, "step": 2135} +{"info/global_step": 2136, "train_info/time_within_train_step": 2.7004306316375732, "step": 2136} +{"train_info/time_between_train_steps": 0.003722667694091797, "step": 2136} +{"info/global_step": 2137, "train_info/time_within_train_step": 2.7003448009490967, "step": 2137} +{"train_info/time_between_train_steps": 0.003714323043823242, "step": 2137} +{"info/global_step": 2138, "train_info/time_within_train_step": 2.700587511062622, "step": 2138} +{"train_info/time_between_train_steps": 0.004812479019165039, "step": 2138} +{"info/global_step": 2139, "train_info/time_within_train_step": 2.7007217407226562, "step": 2139} +{"train_info/time_between_train_steps": 0.003803730010986328, "step": 2139} +{"info/global_step": 2140, "train_info/time_within_train_step": 2.701368570327759, "step": 2140} +{"train_info/time_between_train_steps": 0.0037856101989746094, "step": 2140} +{"info/global_step": 2141, "train_info/time_within_train_step": 2.700033187866211, "step": 2141} +{"train_info/time_between_train_steps": 0.003731966018676758, "step": 2141} +{"info/global_step": 2142, "train_info/time_within_train_step": 2.6998274326324463, "step": 2142} +{"train_info/time_between_train_steps": 0.0037505626678466797, "step": 2142} +{"info/global_step": 2143, "train_info/time_within_train_step": 2.7010631561279297, "step": 2143} +{"train_info/time_between_train_steps": 0.0037975311279296875, "step": 2143} +{"info/global_step": 2144, "train_info/time_within_train_step": 2.699014186859131, "step": 2144} +{"train_info/time_between_train_steps": 0.004328727722167969, "step": 2144} +{"info/global_step": 2145, "train_info/time_within_train_step": 2.7005887031555176, "step": 2145} +{"train_info/time_between_train_steps": 0.0037679672241210938, "step": 2145} +{"info/global_step": 2146, "train_info/time_within_train_step": 2.7008938789367676, "step": 2146} +{"train_info/time_between_train_steps": 0.0037200450897216797, "step": 2146} +{"info/global_step": 2147, "train_info/time_within_train_step": 2.7020671367645264, "step": 2147} +{"train_info/time_between_train_steps": 0.0037674903869628906, "step": 2147} +{"info/global_step": 2148, "train_info/time_within_train_step": 2.7195544242858887, "step": 2148} +{"train_info/time_between_train_steps": 0.0036830902099609375, "step": 2148} +{"info/global_step": 2149, "train_info/time_within_train_step": 2.7023143768310547, "step": 2149} +{"train_info/time_between_train_steps": 0.003774404525756836, "step": 2149} +{"info/global_step": 2150, "train_info/time_within_train_step": 2.699244499206543, "step": 2150} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746292687, "_runtime": 6709}, "step": 2150} +{"logs": {"train/loss": 4.6364, "train/learning_rate": 0.00018888888888888888, "train/epoch": 2.21, "_timestamp": 1746292687, "_runtime": 6709}, "step": 2150} +{"train_info/time_between_train_steps": 0.02392125129699707, "step": 2150} +{"info/global_step": 2151, "train_info/time_within_train_step": 2.740839958190918, "step": 2151} +{"train_info/time_between_train_steps": 0.0036668777465820312, "step": 2151} +{"info/global_step": 2152, "train_info/time_within_train_step": 2.8856544494628906, "step": 2152} +{"train_info/time_between_train_steps": 0.0036983489990234375, "step": 2152} +{"info/global_step": 2153, "train_info/time_within_train_step": 2.7926907539367676, "step": 2153} +{"train_info/time_between_train_steps": 0.0036759376525878906, "step": 2153} +{"info/global_step": 2154, "train_info/time_within_train_step": 2.715773820877075, "step": 2154} +{"train_info/time_between_train_steps": 0.003566265106201172, "step": 2154} +{"info/global_step": 2155, "train_info/time_within_train_step": 2.7243967056274414, "step": 2155} +{"train_info/time_between_train_steps": 0.003760099411010742, "step": 2155} +{"info/global_step": 2156, "train_info/time_within_train_step": 2.806161642074585, "step": 2156} +{"train_info/time_between_train_steps": 0.0037152767181396484, "step": 2156} +{"info/global_step": 2157, "train_info/time_within_train_step": 2.7383244037628174, "step": 2157} +{"train_info/time_between_train_steps": 0.0035796165466308594, "step": 2157} +{"info/global_step": 2158, "train_info/time_within_train_step": 2.6970462799072266, "step": 2158} +{"train_info/time_between_train_steps": 0.003447294235229492, "step": 2158} +{"info/global_step": 2159, "train_info/time_within_train_step": 2.6979172229766846, "step": 2159} +{"train_info/time_between_train_steps": 0.003662109375, "step": 2159} +{"info/global_step": 2160, "train_info/time_within_train_step": 2.6983399391174316, "step": 2160} +{"train_info/time_between_train_steps": 0.0036356449127197266, "step": 2160} +{"info/global_step": 2161, "train_info/time_within_train_step": 2.6987409591674805, "step": 2161} +{"train_info/time_between_train_steps": 0.003654956817626953, "step": 2161} +{"info/global_step": 2162, "train_info/time_within_train_step": 2.6984071731567383, "step": 2162} +{"train_info/time_between_train_steps": 0.0035047531127929688, "step": 2162} +{"info/global_step": 2163, "train_info/time_within_train_step": 2.6994705200195312, "step": 2163} +{"train_info/time_between_train_steps": 0.0035326480865478516, "step": 2163} +{"info/global_step": 2164, "train_info/time_within_train_step": 2.6992084980010986, "step": 2164} +{"train_info/time_between_train_steps": 0.0035293102264404297, "step": 2164} +{"info/global_step": 2165, "train_info/time_within_train_step": 2.6996333599090576, "step": 2165} +{"train_info/time_between_train_steps": 0.003542661666870117, "step": 2165} +{"info/global_step": 2166, "train_info/time_within_train_step": 2.6996920108795166, "step": 2166} +{"train_info/time_between_train_steps": 0.0035238265991210938, "step": 2166} +{"info/global_step": 2167, "train_info/time_within_train_step": 2.701625347137451, "step": 2167} +{"train_info/time_between_train_steps": 0.003549814224243164, "step": 2167} +{"info/global_step": 2168, "train_info/time_within_train_step": 2.702548027038574, "step": 2168} +{"train_info/time_between_train_steps": 0.0034966468811035156, "step": 2168} +{"info/global_step": 2169, "train_info/time_within_train_step": 2.6974399089813232, "step": 2169} +{"train_info/time_between_train_steps": 0.0034532546997070312, "step": 2169} +{"info/global_step": 2170, "train_info/time_within_train_step": 2.6994872093200684, "step": 2170} +{"train_info/time_between_train_steps": 0.0035347938537597656, "step": 2170} +{"info/global_step": 2171, "train_info/time_within_train_step": 2.698505401611328, "step": 2171} +{"train_info/time_between_train_steps": 0.0034999847412109375, "step": 2171} +{"info/global_step": 2172, "train_info/time_within_train_step": 2.6979830265045166, "step": 2172} +{"train_info/time_between_train_steps": 0.003526926040649414, "step": 2172} +{"info/global_step": 2173, "train_info/time_within_train_step": 2.69754695892334, "step": 2173} +{"train_info/time_between_train_steps": 0.0035703182220458984, "step": 2173} +{"info/global_step": 2174, "train_info/time_within_train_step": 2.69735050201416, "step": 2174} +{"train_info/time_between_train_steps": 0.003481149673461914, "step": 2174} +{"info/global_step": 2175, "train_info/time_within_train_step": 2.6972622871398926, "step": 2175} +{"train_info/time_between_train_steps": 0.0034821033477783203, "step": 2175} +{"info/global_step": 2176, "train_info/time_within_train_step": 2.7005770206451416, "step": 2176} +{"train_info/time_between_train_steps": 0.0035550594329833984, "step": 2176} +{"info/global_step": 2177, "train_info/time_within_train_step": 2.6973118782043457, "step": 2177} +{"train_info/time_between_train_steps": 0.0034224987030029297, "step": 2177} +{"info/global_step": 2178, "train_info/time_within_train_step": 2.7832956314086914, "step": 2178} +{"train_info/time_between_train_steps": 0.003475189208984375, "step": 2178} +{"info/global_step": 2179, "train_info/time_within_train_step": 2.7509586811065674, "step": 2179} +{"train_info/time_between_train_steps": 0.0035152435302734375, "step": 2179} +{"info/global_step": 2180, "train_info/time_within_train_step": 2.6974563598632812, "step": 2180} +{"train_info/time_between_train_steps": 0.0035033226013183594, "step": 2180} +{"info/global_step": 2181, "train_info/time_within_train_step": 2.697568893432617, "step": 2181} +{"train_info/time_between_train_steps": 0.003487825393676758, "step": 2181} +{"info/global_step": 2182, "train_info/time_within_train_step": 2.697599411010742, "step": 2182} +{"train_info/time_between_train_steps": 0.0034933090209960938, "step": 2182} +{"info/global_step": 2183, "train_info/time_within_train_step": 2.6970293521881104, "step": 2183} +{"train_info/time_between_train_steps": 0.0035963058471679688, "step": 2183} +{"info/global_step": 2184, "train_info/time_within_train_step": 2.6976702213287354, "step": 2184} +{"train_info/time_between_train_steps": 0.0034668445587158203, "step": 2184} +{"info/global_step": 2185, "train_info/time_within_train_step": 2.6921563148498535, "step": 2185} +{"train_info/time_between_train_steps": 0.0034568309783935547, "step": 2185} +{"info/global_step": 2186, "train_info/time_within_train_step": 2.694101572036743, "step": 2186} +{"train_info/time_between_train_steps": 0.0034554004669189453, "step": 2186} +{"info/global_step": 2187, "train_info/time_within_train_step": 2.6939916610717773, "step": 2187} +{"train_info/time_between_train_steps": 0.003403186798095703, "step": 2187} +{"info/global_step": 2188, "train_info/time_within_train_step": 2.6938538551330566, "step": 2188} +{"train_info/time_between_train_steps": 0.0034410953521728516, "step": 2188} +{"info/global_step": 2189, "train_info/time_within_train_step": 2.694957971572876, "step": 2189} +{"train_info/time_between_train_steps": 0.0034661293029785156, "step": 2189} +{"info/global_step": 2190, "train_info/time_within_train_step": 2.712000846862793, "step": 2190} +{"train_info/time_between_train_steps": 0.003576040267944336, "step": 2190} +{"info/global_step": 2191, "train_info/time_within_train_step": 2.6974875926971436, "step": 2191} +{"train_info/time_between_train_steps": 0.0035746097564697266, "step": 2191} +{"info/global_step": 2192, "train_info/time_within_train_step": 2.6979639530181885, "step": 2192} +{"train_info/time_between_train_steps": 0.003572225570678711, "step": 2192} +{"info/global_step": 2193, "train_info/time_within_train_step": 2.6982829570770264, "step": 2193} +{"train_info/time_between_train_steps": 0.0035643577575683594, "step": 2193} +{"info/global_step": 2194, "train_info/time_within_train_step": 2.699174642562866, "step": 2194} +{"train_info/time_between_train_steps": 0.003697633743286133, "step": 2194} +{"info/global_step": 2195, "train_info/time_within_train_step": 2.69580078125, "step": 2195} +{"train_info/time_between_train_steps": 0.0035369396209716797, "step": 2195} +{"info/global_step": 2196, "train_info/time_within_train_step": 2.6947615146636963, "step": 2196} +{"train_info/time_between_train_steps": 0.0034766197204589844, "step": 2196} +{"info/global_step": 2197, "train_info/time_within_train_step": 2.6964149475097656, "step": 2197} +{"train_info/time_between_train_steps": 0.003607511520385742, "step": 2197} +{"info/global_step": 2198, "train_info/time_within_train_step": 2.710771083831787, "step": 2198} +{"train_info/time_between_train_steps": 0.003603219985961914, "step": 2198} +{"info/global_step": 2199, "train_info/time_within_train_step": 2.6985409259796143, "step": 2199} +{"train_info/time_between_train_steps": 0.0035774707794189453, "step": 2199} +{"info/global_step": 2200, "train_info/time_within_train_step": 2.6981663703918457, "step": 2200} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746292832, "_runtime": 6854}, "step": 2200} +{"logs": {"train/loss": 4.6236, "train/learning_rate": 0.00017777777777777776, "train/epoch": 2.23, "_timestamp": 1746292832, "_runtime": 6854}, "step": 2200} +{"train_info/time_between_train_steps": 33.219870805740356, "step": 2200} +{"info/global_step": 2201, "train_info/time_within_train_step": 2.488020658493042, "step": 2201} +{"train_info/time_between_train_steps": 0.003872394561767578, "step": 2201} +{"info/global_step": 2202, "train_info/time_within_train_step": 2.463034152984619, "step": 2202} +{"train_info/time_between_train_steps": 0.0037145614624023438, "step": 2202} +{"info/global_step": 2203, "train_info/time_within_train_step": 2.7637734413146973, "step": 2203} +{"train_info/time_between_train_steps": 0.003354310989379883, "step": 2203} +{"info/global_step": 2204, "train_info/time_within_train_step": 2.694706916809082, "step": 2204} +{"train_info/time_between_train_steps": 0.003914356231689453, "step": 2204} +{"info/global_step": 2205, "train_info/time_within_train_step": 2.695279598236084, "step": 2205} +{"train_info/time_between_train_steps": 0.003704071044921875, "step": 2205} +{"info/global_step": 2206, "train_info/time_within_train_step": 2.694910764694214, "step": 2206} +{"train_info/time_between_train_steps": 0.004622936248779297, "step": 2206} +{"info/global_step": 2207, "train_info/time_within_train_step": 2.6951794624328613, "step": 2207} +{"train_info/time_between_train_steps": 0.0036377906799316406, "step": 2207} +{"info/global_step": 2208, "train_info/time_within_train_step": 2.6957433223724365, "step": 2208} +{"train_info/time_between_train_steps": 0.003604888916015625, "step": 2208} +{"info/global_step": 2209, "train_info/time_within_train_step": 2.6964380741119385, "step": 2209} +{"train_info/time_between_train_steps": 0.0036144256591796875, "step": 2209} +{"info/global_step": 2210, "train_info/time_within_train_step": 2.69745135307312, "step": 2210} +{"train_info/time_between_train_steps": 0.003531217575073242, "step": 2210} +{"info/global_step": 2211, "train_info/time_within_train_step": 2.722440719604492, "step": 2211} +{"train_info/time_between_train_steps": 0.003503561019897461, "step": 2211} +{"info/global_step": 2212, "train_info/time_within_train_step": 2.864884853363037, "step": 2212} +{"train_info/time_between_train_steps": 0.003671884536743164, "step": 2212} +{"info/global_step": 2213, "train_info/time_within_train_step": 2.91749906539917, "step": 2213} +{"train_info/time_between_train_steps": 0.0037429332733154297, "step": 2213} +{"info/global_step": 2214, "train_info/time_within_train_step": 2.8243889808654785, "step": 2214} +{"train_info/time_between_train_steps": 0.0037276744842529297, "step": 2214} +{"info/global_step": 2215, "train_info/time_within_train_step": 2.698194980621338, "step": 2215} +{"train_info/time_between_train_steps": 0.003700733184814453, "step": 2215} +{"info/global_step": 2216, "train_info/time_within_train_step": 2.698835611343384, "step": 2216} +{"train_info/time_between_train_steps": 0.0037736892700195312, "step": 2216} +{"info/global_step": 2217, "train_info/time_within_train_step": 2.6965749263763428, "step": 2217} +{"train_info/time_between_train_steps": 0.003753662109375, "step": 2217} +{"info/global_step": 2218, "train_info/time_within_train_step": 2.6970818042755127, "step": 2218} +{"train_info/time_between_train_steps": 0.003650665283203125, "step": 2218} +{"info/global_step": 2219, "train_info/time_within_train_step": 2.6975321769714355, "step": 2219} +{"train_info/time_between_train_steps": 0.0035805702209472656, "step": 2219} +{"info/global_step": 2220, "train_info/time_within_train_step": 2.6974594593048096, "step": 2220} +{"train_info/time_between_train_steps": 0.0037593841552734375, "step": 2220} +{"info/global_step": 2221, "train_info/time_within_train_step": 2.698312282562256, "step": 2221} +{"train_info/time_between_train_steps": 0.003628253936767578, "step": 2221} +{"info/global_step": 2222, "train_info/time_within_train_step": 2.6961169242858887, "step": 2222} +{"train_info/time_between_train_steps": 0.003679990768432617, "step": 2222} +{"info/global_step": 2223, "train_info/time_within_train_step": 2.700471878051758, "step": 2223} +{"train_info/time_between_train_steps": 0.003778219223022461, "step": 2223} +{"info/global_step": 2224, "train_info/time_within_train_step": 2.698376178741455, "step": 2224} +{"train_info/time_between_train_steps": 0.0037119388580322266, "step": 2224} +{"info/global_step": 2225, "train_info/time_within_train_step": 2.700056791305542, "step": 2225} +{"train_info/time_between_train_steps": 0.003651142120361328, "step": 2225} +{"info/global_step": 2226, "train_info/time_within_train_step": 2.700202465057373, "step": 2226} +{"train_info/time_between_train_steps": 0.0035889148712158203, "step": 2226} +{"info/global_step": 2227, "train_info/time_within_train_step": 2.698338031768799, "step": 2227} +{"train_info/time_between_train_steps": 0.0036897659301757812, "step": 2227} +{"info/global_step": 2228, "train_info/time_within_train_step": 2.700235605239868, "step": 2228} +{"train_info/time_between_train_steps": 0.0038175582885742188, "step": 2228} +{"info/global_step": 2229, "train_info/time_within_train_step": 2.8092663288116455, "step": 2229} +{"train_info/time_between_train_steps": 0.0036592483520507812, "step": 2229} +{"info/global_step": 2230, "train_info/time_within_train_step": 2.6979641914367676, "step": 2230} +{"train_info/time_between_train_steps": 0.0035495758056640625, "step": 2230} +{"info/global_step": 2231, "train_info/time_within_train_step": 2.6982595920562744, "step": 2231} +{"train_info/time_between_train_steps": 0.003690958023071289, "step": 2231} +{"info/global_step": 2232, "train_info/time_within_train_step": 2.6974329948425293, "step": 2232} +{"train_info/time_between_train_steps": 0.0036644935607910156, "step": 2232} +{"info/global_step": 2233, "train_info/time_within_train_step": 2.701291561126709, "step": 2233} +{"train_info/time_between_train_steps": 0.0036072731018066406, "step": 2233} +{"info/global_step": 2234, "train_info/time_within_train_step": 2.698277711868286, "step": 2234} +{"train_info/time_between_train_steps": 0.005475044250488281, "step": 2234} +{"info/global_step": 2235, "train_info/time_within_train_step": 2.6975114345550537, "step": 2235} +{"train_info/time_between_train_steps": 0.003701925277709961, "step": 2235} +{"info/global_step": 2236, "train_info/time_within_train_step": 2.6997251510620117, "step": 2236} +{"train_info/time_between_train_steps": 0.003622293472290039, "step": 2236} +{"info/global_step": 2237, "train_info/time_within_train_step": 2.6993744373321533, "step": 2237} +{"train_info/time_between_train_steps": 0.0035593509674072266, "step": 2237} +{"info/global_step": 2238, "train_info/time_within_train_step": 2.698791742324829, "step": 2238} +{"train_info/time_between_train_steps": 0.0036535263061523438, "step": 2238} +{"info/global_step": 2239, "train_info/time_within_train_step": 2.6985208988189697, "step": 2239} +{"train_info/time_between_train_steps": 0.003640890121459961, "step": 2239} +{"info/global_step": 2240, "train_info/time_within_train_step": 2.80057692527771, "step": 2240} +{"train_info/time_between_train_steps": 0.003446340560913086, "step": 2240} +{"info/global_step": 2241, "train_info/time_within_train_step": 2.6978492736816406, "step": 2241} +{"train_info/time_between_train_steps": 0.0033898353576660156, "step": 2241} +{"info/global_step": 2242, "train_info/time_within_train_step": 2.744885206222534, "step": 2242} +{"train_info/time_between_train_steps": 0.003426074981689453, "step": 2242} +{"info/global_step": 2243, "train_info/time_within_train_step": 2.6981570720672607, "step": 2243} +{"train_info/time_between_train_steps": 0.003763437271118164, "step": 2243} +{"info/global_step": 2244, "train_info/time_within_train_step": 2.6970198154449463, "step": 2244} +{"train_info/time_between_train_steps": 0.0034825801849365234, "step": 2244} +{"info/global_step": 2245, "train_info/time_within_train_step": 2.6974382400512695, "step": 2245} +{"train_info/time_between_train_steps": 0.003313302993774414, "step": 2245} +{"info/global_step": 2246, "train_info/time_within_train_step": 2.7012853622436523, "step": 2246} +{"train_info/time_between_train_steps": 0.0035839080810546875, "step": 2246} +{"info/global_step": 2247, "train_info/time_within_train_step": 2.6989243030548096, "step": 2247} +{"train_info/time_between_train_steps": 0.004140615463256836, "step": 2247} +{"info/global_step": 2248, "train_info/time_within_train_step": 2.6984665393829346, "step": 2248} +{"train_info/time_between_train_steps": 0.003495931625366211, "step": 2248} +{"info/global_step": 2249, "train_info/time_within_train_step": 3.2901031970977783, "step": 2249} +{"train_info/time_between_train_steps": 0.00890350341796875, "step": 2249} +{"info/global_step": 2250, "train_info/time_within_train_step": 2.703409194946289, "step": 2250} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746293009, "_runtime": 7031}, "step": 2250} +{"logs": {"train/loss": 4.6008, "train/learning_rate": 0.00016666666666666666, "train/epoch": 2.24, "_timestamp": 1746293009, "_runtime": 7031}, "step": 2250} +{"train_info/time_between_train_steps": 0.025266647338867188, "step": 2250} +{"info/global_step": 2251, "train_info/time_within_train_step": 2.7035281658172607, "step": 2251} +{"train_info/time_between_train_steps": 0.004330158233642578, "step": 2251} +{"info/global_step": 2252, "train_info/time_within_train_step": 2.701021432876587, "step": 2252} +{"train_info/time_between_train_steps": 0.0038459300994873047, "step": 2252} +{"info/global_step": 2253, "train_info/time_within_train_step": 2.701155185699463, "step": 2253} +{"train_info/time_between_train_steps": 0.004152774810791016, "step": 2253} +{"info/global_step": 2254, "train_info/time_within_train_step": 2.7007405757904053, "step": 2254} +{"train_info/time_between_train_steps": 0.004306793212890625, "step": 2254} +{"info/global_step": 2255, "train_info/time_within_train_step": 2.7022557258605957, "step": 2255} +{"train_info/time_between_train_steps": 0.00395655632019043, "step": 2255} +{"info/global_step": 2256, "train_info/time_within_train_step": 2.700411081314087, "step": 2256} +{"train_info/time_between_train_steps": 0.003950357437133789, "step": 2256} +{"info/global_step": 2257, "train_info/time_within_train_step": 2.6993820667266846, "step": 2257} +{"train_info/time_between_train_steps": 0.003683805465698242, "step": 2257} +{"info/global_step": 2258, "train_info/time_within_train_step": 2.701150417327881, "step": 2258} +{"train_info/time_between_train_steps": 0.003852367401123047, "step": 2258} +{"info/global_step": 2259, "train_info/time_within_train_step": 2.699084997177124, "step": 2259} +{"train_info/time_between_train_steps": 0.0039861202239990234, "step": 2259} +{"info/global_step": 2260, "train_info/time_within_train_step": 2.699951410293579, "step": 2260} +{"train_info/time_between_train_steps": 0.003943204879760742, "step": 2260} +{"info/global_step": 2261, "train_info/time_within_train_step": 2.726069688796997, "step": 2261} +{"train_info/time_between_train_steps": 0.005478858947753906, "step": 2261} +{"info/global_step": 2262, "train_info/time_within_train_step": 2.704568386077881, "step": 2262} +{"train_info/time_between_train_steps": 0.0040018558502197266, "step": 2262} +{"info/global_step": 2263, "train_info/time_within_train_step": 2.7217016220092773, "step": 2263} +{"train_info/time_between_train_steps": 0.004039287567138672, "step": 2263} +{"info/global_step": 2264, "train_info/time_within_train_step": 2.7002298831939697, "step": 2264} +{"train_info/time_between_train_steps": 0.004047870635986328, "step": 2264} +{"info/global_step": 2265, "train_info/time_within_train_step": 2.7019765377044678, "step": 2265} +{"train_info/time_between_train_steps": 0.004256725311279297, "step": 2265} +{"info/global_step": 2266, "train_info/time_within_train_step": 2.7012746334075928, "step": 2266} +{"train_info/time_between_train_steps": 0.004119873046875, "step": 2266} +{"info/global_step": 2267, "train_info/time_within_train_step": 2.7028374671936035, "step": 2267} +{"train_info/time_between_train_steps": 0.004186868667602539, "step": 2267} +{"info/global_step": 2268, "train_info/time_within_train_step": 2.700591564178467, "step": 2268} +{"train_info/time_between_train_steps": 0.0041544437408447266, "step": 2268} +{"info/global_step": 2269, "train_info/time_within_train_step": 2.702483654022217, "step": 2269} +{"train_info/time_between_train_steps": 0.009282112121582031, "step": 2269} +{"info/global_step": 2270, "train_info/time_within_train_step": 2.7345504760742188, "step": 2270} +{"train_info/time_between_train_steps": 0.004051923751831055, "step": 2270} +{"info/global_step": 2271, "train_info/time_within_train_step": 2.701322317123413, "step": 2271} +{"train_info/time_between_train_steps": 0.003966808319091797, "step": 2271} +{"info/global_step": 2272, "train_info/time_within_train_step": 2.7018232345581055, "step": 2272} +{"train_info/time_between_train_steps": 0.0043582916259765625, "step": 2272} +{"info/global_step": 2273, "train_info/time_within_train_step": 2.7027931213378906, "step": 2273} +{"train_info/time_between_train_steps": 0.004281520843505859, "step": 2273} +{"info/global_step": 2274, "train_info/time_within_train_step": 2.7017297744750977, "step": 2274} +{"train_info/time_between_train_steps": 0.004651784896850586, "step": 2274} +{"train_info/time_between_train_steps": 3.243345260620117, "step": 2274} +{"info/global_step": 2275, "train_info/time_within_train_step": 2.690669298171997, "step": 2275} +{"train_info/time_between_train_steps": 0.0035126209259033203, "step": 2275} +{"info/global_step": 2276, "train_info/time_within_train_step": 2.694366455078125, "step": 2276} +{"train_info/time_between_train_steps": 0.0037622451782226562, "step": 2276} +{"info/global_step": 2277, "train_info/time_within_train_step": 2.6951301097869873, "step": 2277} +{"train_info/time_between_train_steps": 0.0036313533782958984, "step": 2277} +{"info/global_step": 2278, "train_info/time_within_train_step": 2.6969501972198486, "step": 2278} +{"train_info/time_between_train_steps": 0.003717184066772461, "step": 2278} +{"info/global_step": 2279, "train_info/time_within_train_step": 2.6963765621185303, "step": 2279} +{"train_info/time_between_train_steps": 0.003624439239501953, "step": 2279} +{"info/global_step": 2280, "train_info/time_within_train_step": 2.696272373199463, "step": 2280} +{"train_info/time_between_train_steps": 0.003934621810913086, "step": 2280} +{"info/global_step": 2281, "train_info/time_within_train_step": 2.696188449859619, "step": 2281} +{"train_info/time_between_train_steps": 0.0038270950317382812, "step": 2281} +{"info/global_step": 2282, "train_info/time_within_train_step": 2.697983503341675, "step": 2282} +{"train_info/time_between_train_steps": 0.003616809844970703, "step": 2282} +{"info/global_step": 2283, "train_info/time_within_train_step": 2.727365255355835, "step": 2283} +{"train_info/time_between_train_steps": 0.003586292266845703, "step": 2283} +{"info/global_step": 2284, "train_info/time_within_train_step": 2.6979057788848877, "step": 2284} +{"train_info/time_between_train_steps": 0.0037446022033691406, "step": 2284} +{"info/global_step": 2285, "train_info/time_within_train_step": 2.698823928833008, "step": 2285} +{"train_info/time_between_train_steps": 0.0038814544677734375, "step": 2285} +{"info/global_step": 2286, "train_info/time_within_train_step": 2.6991729736328125, "step": 2286} +{"train_info/time_between_train_steps": 0.0037767887115478516, "step": 2286} +{"info/global_step": 2287, "train_info/time_within_train_step": 2.7471096515655518, "step": 2287} +{"train_info/time_between_train_steps": 0.003957509994506836, "step": 2287} +{"info/global_step": 2288, "train_info/time_within_train_step": 2.7293763160705566, "step": 2288} +{"train_info/time_between_train_steps": 0.0041120052337646484, "step": 2288} +{"info/global_step": 2289, "train_info/time_within_train_step": 2.707437515258789, "step": 2289} +{"train_info/time_between_train_steps": 0.0039141178131103516, "step": 2289} +{"info/global_step": 2290, "train_info/time_within_train_step": 2.9815995693206787, "step": 2290} +{"train_info/time_between_train_steps": 0.0038106441497802734, "step": 2290} +{"info/global_step": 2291, "train_info/time_within_train_step": 2.702765941619873, "step": 2291} +{"train_info/time_between_train_steps": 0.0038673877716064453, "step": 2291} +{"info/global_step": 2292, "train_info/time_within_train_step": 2.7027053833007812, "step": 2292} +{"train_info/time_between_train_steps": 0.003774881362915039, "step": 2292} +{"info/global_step": 2293, "train_info/time_within_train_step": 2.702080249786377, "step": 2293} +{"train_info/time_between_train_steps": 0.0038154125213623047, "step": 2293} +{"info/global_step": 2294, "train_info/time_within_train_step": 2.7034924030303955, "step": 2294} +{"train_info/time_between_train_steps": 0.0038840770721435547, "step": 2294} +{"info/global_step": 2295, "train_info/time_within_train_step": 2.70251202583313, "step": 2295} +{"train_info/time_between_train_steps": 0.0037970542907714844, "step": 2295} +{"info/global_step": 2296, "train_info/time_within_train_step": 2.7049028873443604, "step": 2296} +{"train_info/time_between_train_steps": 0.0046844482421875, "step": 2296} +{"info/global_step": 2297, "train_info/time_within_train_step": 2.703850746154785, "step": 2297} +{"train_info/time_between_train_steps": 0.003883838653564453, "step": 2297} +{"info/global_step": 2298, "train_info/time_within_train_step": 2.7036685943603516, "step": 2298} +{"train_info/time_between_train_steps": 0.0037915706634521484, "step": 2298} +{"info/global_step": 2299, "train_info/time_within_train_step": 2.700958728790283, "step": 2299} +{"train_info/time_between_train_steps": 0.0039255619049072266, "step": 2299} +{"info/global_step": 2300, "train_info/time_within_train_step": 2.8535280227661133, "step": 2300} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746293154, "_runtime": 7176}, "step": 2300} +{"logs": {"train/loss": 4.6189, "train/learning_rate": 0.00015555555555555554, "train/epoch": 3.01, "_timestamp": 1746293154, "_runtime": 7176}, "step": 2300} +{"train_info/time_between_train_steps": 14.57427167892456, "step": 2300} +{"info/global_step": 2301, "train_info/time_within_train_step": 2.4995996952056885, "step": 2301} +{"train_info/time_between_train_steps": 0.004132747650146484, "step": 2301} +{"info/global_step": 2302, "train_info/time_within_train_step": 2.5033555030822754, "step": 2302} +{"train_info/time_between_train_steps": 0.004102468490600586, "step": 2302} +{"info/global_step": 2303, "train_info/time_within_train_step": 2.693065643310547, "step": 2303} +{"train_info/time_between_train_steps": 0.0040247440338134766, "step": 2303} +{"info/global_step": 2304, "train_info/time_within_train_step": 2.697495937347412, "step": 2304} +{"train_info/time_between_train_steps": 0.0038847923278808594, "step": 2304} +{"info/global_step": 2305, "train_info/time_within_train_step": 2.6991138458251953, "step": 2305} +{"train_info/time_between_train_steps": 0.004036664962768555, "step": 2305} +{"info/global_step": 2306, "train_info/time_within_train_step": 2.6994004249572754, "step": 2306} +{"train_info/time_between_train_steps": 0.0039043426513671875, "step": 2306} +{"info/global_step": 2307, "train_info/time_within_train_step": 2.7002675533294678, "step": 2307} +{"train_info/time_between_train_steps": 0.0040853023529052734, "step": 2307} +{"info/global_step": 2308, "train_info/time_within_train_step": 2.7033653259277344, "step": 2308} +{"train_info/time_between_train_steps": 0.0039293766021728516, "step": 2308} +{"info/global_step": 2309, "train_info/time_within_train_step": 2.925349712371826, "step": 2309} +{"train_info/time_between_train_steps": 0.0038895606994628906, "step": 2309} +{"info/global_step": 2310, "train_info/time_within_train_step": 3.022475481033325, "step": 2310} +{"train_info/time_between_train_steps": 0.003848552703857422, "step": 2310} +{"info/global_step": 2311, "train_info/time_within_train_step": 2.8290319442749023, "step": 2311} +{"train_info/time_between_train_steps": 0.0038192272186279297, "step": 2311} +{"info/global_step": 2312, "train_info/time_within_train_step": 2.7018463611602783, "step": 2312} +{"train_info/time_between_train_steps": 0.003909111022949219, "step": 2312} +{"info/global_step": 2313, "train_info/time_within_train_step": 2.701146125793457, "step": 2313} +{"train_info/time_between_train_steps": 0.003964662551879883, "step": 2313} +{"info/global_step": 2314, "train_info/time_within_train_step": 2.7010815143585205, "step": 2314} +{"train_info/time_between_train_steps": 0.003867626190185547, "step": 2314} +{"info/global_step": 2315, "train_info/time_within_train_step": 2.7005186080932617, "step": 2315} +{"train_info/time_between_train_steps": 0.0038673877716064453, "step": 2315} +{"info/global_step": 2316, "train_info/time_within_train_step": 2.6996028423309326, "step": 2316} +{"train_info/time_between_train_steps": 0.003896951675415039, "step": 2316} +{"info/global_step": 2317, "train_info/time_within_train_step": 2.7013766765594482, "step": 2317} +{"train_info/time_between_train_steps": 0.003917694091796875, "step": 2317} +{"info/global_step": 2318, "train_info/time_within_train_step": 2.7022058963775635, "step": 2318} +{"train_info/time_between_train_steps": 0.0038962364196777344, "step": 2318} +{"info/global_step": 2319, "train_info/time_within_train_step": 2.7014501094818115, "step": 2319} +{"train_info/time_between_train_steps": 0.0038597583770751953, "step": 2319} +{"info/global_step": 2320, "train_info/time_within_train_step": 2.703136682510376, "step": 2320} +{"train_info/time_between_train_steps": 0.003835439682006836, "step": 2320} +{"info/global_step": 2321, "train_info/time_within_train_step": 2.703171968460083, "step": 2321} +{"train_info/time_between_train_steps": 0.003857851028442383, "step": 2321} +{"info/global_step": 2322, "train_info/time_within_train_step": 2.7044999599456787, "step": 2322} +{"train_info/time_between_train_steps": 0.0038759708404541016, "step": 2322} +{"info/global_step": 2323, "train_info/time_within_train_step": 2.706507682800293, "step": 2323} +{"train_info/time_between_train_steps": 0.0038373470306396484, "step": 2323} +{"info/global_step": 2324, "train_info/time_within_train_step": 2.701345443725586, "step": 2324} +{"train_info/time_between_train_steps": 0.0039000511169433594, "step": 2324} +{"info/global_step": 2325, "train_info/time_within_train_step": 2.709594249725342, "step": 2325} +{"train_info/time_between_train_steps": 0.0038957595825195312, "step": 2325} +{"info/global_step": 2326, "train_info/time_within_train_step": 2.7901628017425537, "step": 2326} +{"train_info/time_between_train_steps": 0.004418849945068359, "step": 2326} +{"info/global_step": 2327, "train_info/time_within_train_step": 2.9161603450775146, "step": 2327} +{"train_info/time_between_train_steps": 0.003804922103881836, "step": 2327} +{"info/global_step": 2328, "train_info/time_within_train_step": 2.707481622695923, "step": 2328} +{"train_info/time_between_train_steps": 0.003902912139892578, "step": 2328} +{"info/global_step": 2329, "train_info/time_within_train_step": 2.7000486850738525, "step": 2329} +{"train_info/time_between_train_steps": 0.0037186145782470703, "step": 2329} +{"info/global_step": 2330, "train_info/time_within_train_step": 2.6987128257751465, "step": 2330} +{"train_info/time_between_train_steps": 0.003818988800048828, "step": 2330} +{"info/global_step": 2331, "train_info/time_within_train_step": 2.7010748386383057, "step": 2331} +{"train_info/time_between_train_steps": 0.003855466842651367, "step": 2331} +{"info/global_step": 2332, "train_info/time_within_train_step": 2.700042963027954, "step": 2332} +{"train_info/time_between_train_steps": 0.0037751197814941406, "step": 2332} +{"info/global_step": 2333, "train_info/time_within_train_step": 2.7010841369628906, "step": 2333} +{"train_info/time_between_train_steps": 0.00379180908203125, "step": 2333} +{"info/global_step": 2334, "train_info/time_within_train_step": 2.7018508911132812, "step": 2334} +{"train_info/time_between_train_steps": 0.004099130630493164, "step": 2334} +{"info/global_step": 2335, "train_info/time_within_train_step": 2.701833486557007, "step": 2335} +{"train_info/time_between_train_steps": 0.004221916198730469, "step": 2335} +{"info/global_step": 2336, "train_info/time_within_train_step": 2.702010154724121, "step": 2336} +{"train_info/time_between_train_steps": 0.004309892654418945, "step": 2336} +{"info/global_step": 2337, "train_info/time_within_train_step": 2.874527931213379, "step": 2337} +{"train_info/time_between_train_steps": 0.0037565231323242188, "step": 2337} +{"info/global_step": 2338, "train_info/time_within_train_step": 2.700089454650879, "step": 2338} +{"train_info/time_between_train_steps": 0.0037910938262939453, "step": 2338} +{"info/global_step": 2339, "train_info/time_within_train_step": 2.7013485431671143, "step": 2339} +{"train_info/time_between_train_steps": 0.0037910938262939453, "step": 2339} +{"info/global_step": 2340, "train_info/time_within_train_step": 2.6995208263397217, "step": 2340} +{"train_info/time_between_train_steps": 0.003828287124633789, "step": 2340} +{"info/global_step": 2341, "train_info/time_within_train_step": 2.716142416000366, "step": 2341} +{"train_info/time_between_train_steps": 0.004220008850097656, "step": 2341} +{"info/global_step": 2342, "train_info/time_within_train_step": 2.7075233459472656, "step": 2342} +{"train_info/time_between_train_steps": 0.004262208938598633, "step": 2342} +{"info/global_step": 2343, "train_info/time_within_train_step": 2.716330051422119, "step": 2343} +{"train_info/time_between_train_steps": 0.00424957275390625, "step": 2343} +{"info/global_step": 2344, "train_info/time_within_train_step": 2.780980348587036, "step": 2344} +{"train_info/time_between_train_steps": 0.00428318977355957, "step": 2344} +{"info/global_step": 2345, "train_info/time_within_train_step": 2.7049410343170166, "step": 2345} +{"train_info/time_between_train_steps": 0.004061222076416016, "step": 2345} +{"info/global_step": 2346, "train_info/time_within_train_step": 2.6986467838287354, "step": 2346} +{"train_info/time_between_train_steps": 0.004330158233642578, "step": 2346} +{"info/global_step": 2347, "train_info/time_within_train_step": 2.707794189453125, "step": 2347} +{"train_info/time_between_train_steps": 0.004251718521118164, "step": 2347} +{"info/global_step": 2348, "train_info/time_within_train_step": 2.745617628097534, "step": 2348} +{"train_info/time_between_train_steps": 0.00396275520324707, "step": 2348} +{"info/global_step": 2349, "train_info/time_within_train_step": 2.711419105529785, "step": 2349} +{"train_info/time_between_train_steps": 0.0040912628173828125, "step": 2349} +{"info/global_step": 2350, "train_info/time_within_train_step": 2.728015899658203, "step": 2350} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746293307, "_runtime": 7329}, "step": 2350} +{"logs": {"train/loss": 4.564, "train/learning_rate": 0.0001444444444444444, "train/epoch": 3.03, "_timestamp": 1746293307, "_runtime": 7329}, "step": 2350} +{"train_info/time_between_train_steps": 0.028858661651611328, "step": 2350} +{"info/global_step": 2351, "train_info/time_within_train_step": 2.7160420417785645, "step": 2351} +{"train_info/time_between_train_steps": 0.003958940505981445, "step": 2351} +{"info/global_step": 2352, "train_info/time_within_train_step": 2.7006688117980957, "step": 2352} +{"train_info/time_between_train_steps": 0.0042231082916259766, "step": 2352} +{"info/global_step": 2353, "train_info/time_within_train_step": 2.771681070327759, "step": 2353} +{"train_info/time_between_train_steps": 0.004220485687255859, "step": 2353} +{"info/global_step": 2354, "train_info/time_within_train_step": 2.869077444076538, "step": 2354} +{"train_info/time_between_train_steps": 0.004183053970336914, "step": 2354} +{"info/global_step": 2355, "train_info/time_within_train_step": 2.712160110473633, "step": 2355} +{"train_info/time_between_train_steps": 0.004006147384643555, "step": 2355} +{"info/global_step": 2356, "train_info/time_within_train_step": 2.699758529663086, "step": 2356} +{"train_info/time_between_train_steps": 0.004162788391113281, "step": 2356} +{"info/global_step": 2357, "train_info/time_within_train_step": 2.6985878944396973, "step": 2357} +{"train_info/time_between_train_steps": 0.00404047966003418, "step": 2357} +{"info/global_step": 2358, "train_info/time_within_train_step": 2.7370617389678955, "step": 2358} +{"train_info/time_between_train_steps": 0.004067659378051758, "step": 2358} +{"info/global_step": 2359, "train_info/time_within_train_step": 2.7078933715820312, "step": 2359} +{"train_info/time_between_train_steps": 0.004094839096069336, "step": 2359} +{"info/global_step": 2360, "train_info/time_within_train_step": 2.702559232711792, "step": 2360} +{"train_info/time_between_train_steps": 0.004036664962768555, "step": 2360} +{"info/global_step": 2361, "train_info/time_within_train_step": 2.7010390758514404, "step": 2361} +{"train_info/time_between_train_steps": 0.004193782806396484, "step": 2361} +{"info/global_step": 2362, "train_info/time_within_train_step": 2.701150894165039, "step": 2362} +{"train_info/time_between_train_steps": 0.004044771194458008, "step": 2362} +{"info/global_step": 2363, "train_info/time_within_train_step": 2.7031896114349365, "step": 2363} +{"train_info/time_between_train_steps": 0.004081249237060547, "step": 2363} +{"info/global_step": 2364, "train_info/time_within_train_step": 2.702136278152466, "step": 2364} +{"train_info/time_between_train_steps": 0.0039713382720947266, "step": 2364} +{"info/global_step": 2365, "train_info/time_within_train_step": 3.1479220390319824, "step": 2365} +{"train_info/time_between_train_steps": 0.003701925277709961, "step": 2365} +{"info/global_step": 2366, "train_info/time_within_train_step": 2.699591875076294, "step": 2366} +{"train_info/time_between_train_steps": 0.0036389827728271484, "step": 2366} +{"info/global_step": 2367, "train_info/time_within_train_step": 2.6980764865875244, "step": 2367} +{"train_info/time_between_train_steps": 0.0036499500274658203, "step": 2367} +{"info/global_step": 2368, "train_info/time_within_train_step": 2.69968843460083, "step": 2368} +{"train_info/time_between_train_steps": 0.0036487579345703125, "step": 2368} +{"info/global_step": 2369, "train_info/time_within_train_step": 2.6994171142578125, "step": 2369} +{"train_info/time_between_train_steps": 0.003631114959716797, "step": 2369} +{"info/global_step": 2370, "train_info/time_within_train_step": 2.700512409210205, "step": 2370} +{"train_info/time_between_train_steps": 0.003759622573852539, "step": 2370} +{"info/global_step": 2371, "train_info/time_within_train_step": 2.7006871700286865, "step": 2371} +{"train_info/time_between_train_steps": 0.0036530494689941406, "step": 2371} +{"info/global_step": 2372, "train_info/time_within_train_step": 2.7372400760650635, "step": 2372} +{"train_info/time_between_train_steps": 0.003696441650390625, "step": 2372} +{"info/global_step": 2373, "train_info/time_within_train_step": 2.69960355758667, "step": 2373} +{"train_info/time_between_train_steps": 0.003556966781616211, "step": 2373} +{"info/global_step": 2374, "train_info/time_within_train_step": 2.698103904724121, "step": 2374} +{"train_info/time_between_train_steps": 0.0036509037017822266, "step": 2374} +{"info/global_step": 2375, "train_info/time_within_train_step": 2.6976985931396484, "step": 2375} +{"train_info/time_between_train_steps": 0.0035555362701416016, "step": 2375} +{"info/global_step": 2376, "train_info/time_within_train_step": 2.6978871822357178, "step": 2376} +{"train_info/time_between_train_steps": 0.0036764144897460938, "step": 2376} +{"info/global_step": 2377, "train_info/time_within_train_step": 2.6989312171936035, "step": 2377} +{"train_info/time_between_train_steps": 0.003617525100708008, "step": 2377} +{"info/global_step": 2378, "train_info/time_within_train_step": 2.700166702270508, "step": 2378} +{"train_info/time_between_train_steps": 0.0035865306854248047, "step": 2378} +{"info/global_step": 2379, "train_info/time_within_train_step": 2.77872896194458, "step": 2379} +{"train_info/time_between_train_steps": 0.0036673545837402344, "step": 2379} +{"info/global_step": 2380, "train_info/time_within_train_step": 2.8060460090637207, "step": 2380} +{"train_info/time_between_train_steps": 0.0036525726318359375, "step": 2380} +{"info/global_step": 2381, "train_info/time_within_train_step": 2.7065975666046143, "step": 2381} +{"train_info/time_between_train_steps": 0.003771066665649414, "step": 2381} +{"info/global_step": 2382, "train_info/time_within_train_step": 2.6992993354797363, "step": 2382} +{"train_info/time_between_train_steps": 0.003920793533325195, "step": 2382} +{"info/global_step": 2383, "train_info/time_within_train_step": 2.700773239135742, "step": 2383} +{"train_info/time_between_train_steps": 0.004144906997680664, "step": 2383} +{"info/global_step": 2384, "train_info/time_within_train_step": 2.700314521789551, "step": 2384} +{"train_info/time_between_train_steps": 0.003855466842651367, "step": 2384} +{"info/global_step": 2385, "train_info/time_within_train_step": 2.6992974281311035, "step": 2385} +{"train_info/time_between_train_steps": 0.003809213638305664, "step": 2385} +{"info/global_step": 2386, "train_info/time_within_train_step": 2.701294183731079, "step": 2386} +{"train_info/time_between_train_steps": 0.0038356781005859375, "step": 2386} +{"info/global_step": 2387, "train_info/time_within_train_step": 2.7022581100463867, "step": 2387} +{"train_info/time_between_train_steps": 0.0038299560546875, "step": 2387} +{"info/global_step": 2388, "train_info/time_within_train_step": 2.7315118312835693, "step": 2388} +{"train_info/time_between_train_steps": 0.003955841064453125, "step": 2388} +{"info/global_step": 2389, "train_info/time_within_train_step": 2.7170658111572266, "step": 2389} +{"train_info/time_between_train_steps": 0.0038542747497558594, "step": 2389} +{"info/global_step": 2390, "train_info/time_within_train_step": 2.701843500137329, "step": 2390} +{"train_info/time_between_train_steps": 0.003952980041503906, "step": 2390} +{"info/global_step": 2391, "train_info/time_within_train_step": 2.7010836601257324, "step": 2391} +{"train_info/time_between_train_steps": 0.0038399696350097656, "step": 2391} +{"info/global_step": 2392, "train_info/time_within_train_step": 2.700589418411255, "step": 2392} +{"train_info/time_between_train_steps": 0.003866434097290039, "step": 2392} +{"info/global_step": 2393, "train_info/time_within_train_step": 2.7017195224761963, "step": 2393} +{"train_info/time_between_train_steps": 0.00388336181640625, "step": 2393} +{"info/global_step": 2394, "train_info/time_within_train_step": 2.7394497394561768, "step": 2394} +{"train_info/time_between_train_steps": 0.003905773162841797, "step": 2394} +{"info/global_step": 2395, "train_info/time_within_train_step": 2.722654342651367, "step": 2395} +{"train_info/time_between_train_steps": 0.003823995590209961, "step": 2395} +{"info/global_step": 2396, "train_info/time_within_train_step": 2.699742555618286, "step": 2396} +{"train_info/time_between_train_steps": 0.003902912139892578, "step": 2396} +{"info/global_step": 2397, "train_info/time_within_train_step": 2.6992452144622803, "step": 2397} +{"train_info/time_between_train_steps": 0.0037925243377685547, "step": 2397} +{"info/global_step": 2398, "train_info/time_within_train_step": 2.699892997741699, "step": 2398} +{"train_info/time_between_train_steps": 0.0038318634033203125, "step": 2398} +{"info/global_step": 2399, "train_info/time_within_train_step": 2.6989192962646484, "step": 2399} +{"train_info/time_between_train_steps": 0.16658902168273926, "step": 2399} +{"info/global_step": 2400, "train_info/time_within_train_step": 2.696868896484375, "step": 2400} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746293446, "_runtime": 7468}, "step": 2400} +{"logs": {"train/loss": 4.5505, "train/learning_rate": 0.0001333333333333333, "train/epoch": 3.04, "_timestamp": 1746293446, "_runtime": 7468}, "step": 2400} +{"train_info/time_between_train_steps": 17.471428155899048, "step": 2400} +{"info/global_step": 2401, "train_info/time_within_train_step": 2.4964919090270996, "step": 2401} +{"train_info/time_between_train_steps": 0.003720521926879883, "step": 2401} +{"info/global_step": 2402, "train_info/time_within_train_step": 2.491211414337158, "step": 2402} +{"train_info/time_between_train_steps": 0.0037102699279785156, "step": 2402} +{"info/global_step": 2403, "train_info/time_within_train_step": 2.6597979068756104, "step": 2403} +{"train_info/time_between_train_steps": 0.0037996768951416016, "step": 2403} +{"info/global_step": 2404, "train_info/time_within_train_step": 2.6934597492218018, "step": 2404} +{"train_info/time_between_train_steps": 0.0036706924438476562, "step": 2404} +{"info/global_step": 2405, "train_info/time_within_train_step": 2.6961746215820312, "step": 2405} +{"train_info/time_between_train_steps": 0.003771543502807617, "step": 2405} +{"info/global_step": 2406, "train_info/time_within_train_step": 2.6983585357666016, "step": 2406} +{"train_info/time_between_train_steps": 0.0038924217224121094, "step": 2406} +{"info/global_step": 2407, "train_info/time_within_train_step": 2.698960781097412, "step": 2407} +{"train_info/time_between_train_steps": 0.003915071487426758, "step": 2407} +{"info/global_step": 2408, "train_info/time_within_train_step": 2.6999075412750244, "step": 2408} +{"train_info/time_between_train_steps": 0.00405430793762207, "step": 2408} +{"info/global_step": 2409, "train_info/time_within_train_step": 2.6991794109344482, "step": 2409} +{"train_info/time_between_train_steps": 0.003960847854614258, "step": 2409} +{"info/global_step": 2410, "train_info/time_within_train_step": 3.0619122982025146, "step": 2410} +{"train_info/time_between_train_steps": 0.004111766815185547, "step": 2410} +{"info/global_step": 2411, "train_info/time_within_train_step": 2.7017757892608643, "step": 2411} +{"train_info/time_between_train_steps": 0.003900289535522461, "step": 2411} +{"info/global_step": 2412, "train_info/time_within_train_step": 2.6990277767181396, "step": 2412} +{"train_info/time_between_train_steps": 0.003914833068847656, "step": 2412} +{"info/global_step": 2413, "train_info/time_within_train_step": 2.6993823051452637, "step": 2413} +{"train_info/time_between_train_steps": 0.003949403762817383, "step": 2413} +{"info/global_step": 2414, "train_info/time_within_train_step": 2.7020022869110107, "step": 2414} +{"train_info/time_between_train_steps": 0.003918170928955078, "step": 2414} +{"info/global_step": 2415, "train_info/time_within_train_step": 2.7013673782348633, "step": 2415} +{"train_info/time_between_train_steps": 0.003920555114746094, "step": 2415} +{"info/global_step": 2416, "train_info/time_within_train_step": 2.7018349170684814, "step": 2416} +{"train_info/time_between_train_steps": 0.0039937496185302734, "step": 2416} +{"info/global_step": 2417, "train_info/time_within_train_step": 2.8248939514160156, "step": 2417} +{"train_info/time_between_train_steps": 0.0038902759552001953, "step": 2417} +{"info/global_step": 2418, "train_info/time_within_train_step": 2.8599624633789062, "step": 2418} +{"train_info/time_between_train_steps": 0.00388336181640625, "step": 2418} +{"info/global_step": 2419, "train_info/time_within_train_step": 2.9767823219299316, "step": 2419} +{"train_info/time_between_train_steps": 0.003949403762817383, "step": 2419} +{"info/global_step": 2420, "train_info/time_within_train_step": 2.723583698272705, "step": 2420} +{"train_info/time_between_train_steps": 0.003851175308227539, "step": 2420} +{"info/global_step": 2421, "train_info/time_within_train_step": 2.698796510696411, "step": 2421} +{"train_info/time_between_train_steps": 0.0038154125213623047, "step": 2421} +{"info/global_step": 2422, "train_info/time_within_train_step": 2.6985507011413574, "step": 2422} +{"train_info/time_between_train_steps": 0.0038917064666748047, "step": 2422} +{"info/global_step": 2423, "train_info/time_within_train_step": 2.6994879245758057, "step": 2423} +{"train_info/time_between_train_steps": 0.0038619041442871094, "step": 2423} +{"info/global_step": 2424, "train_info/time_within_train_step": 2.701146364212036, "step": 2424} +{"train_info/time_between_train_steps": 0.003887176513671875, "step": 2424} +{"info/global_step": 2425, "train_info/time_within_train_step": 2.70096492767334, "step": 2425} +{"train_info/time_between_train_steps": 0.003921985626220703, "step": 2425} +{"info/global_step": 2426, "train_info/time_within_train_step": 2.7001190185546875, "step": 2426} +{"train_info/time_between_train_steps": 0.003833770751953125, "step": 2426} +{"info/global_step": 2427, "train_info/time_within_train_step": 2.7373862266540527, "step": 2427} +{"train_info/time_between_train_steps": 0.0038166046142578125, "step": 2427} +{"info/global_step": 2428, "train_info/time_within_train_step": 2.8614349365234375, "step": 2428} +{"train_info/time_between_train_steps": 0.004003763198852539, "step": 2428} +{"info/global_step": 2429, "train_info/time_within_train_step": 2.7399065494537354, "step": 2429} +{"train_info/time_between_train_steps": 0.004002571105957031, "step": 2429} +{"info/global_step": 2430, "train_info/time_within_train_step": 2.702122926712036, "step": 2430} +{"train_info/time_between_train_steps": 0.003949880599975586, "step": 2430} +{"info/global_step": 2431, "train_info/time_within_train_step": 2.7022950649261475, "step": 2431} +{"train_info/time_between_train_steps": 0.003996133804321289, "step": 2431} +{"info/global_step": 2432, "train_info/time_within_train_step": 3.0729706287384033, "step": 2432} +{"train_info/time_between_train_steps": 0.0036771297454833984, "step": 2432} +{"info/global_step": 2433, "train_info/time_within_train_step": 2.7003884315490723, "step": 2433} +{"train_info/time_between_train_steps": 0.003773927688598633, "step": 2433} +{"info/global_step": 2434, "train_info/time_within_train_step": 2.7010984420776367, "step": 2434} +{"train_info/time_between_train_steps": 0.003609895706176758, "step": 2434} +{"info/global_step": 2435, "train_info/time_within_train_step": 2.700380802154541, "step": 2435} +{"train_info/time_between_train_steps": 0.003598928451538086, "step": 2435} +{"info/global_step": 2436, "train_info/time_within_train_step": 2.7010116577148438, "step": 2436} +{"train_info/time_between_train_steps": 0.003592252731323242, "step": 2436} +{"info/global_step": 2437, "train_info/time_within_train_step": 2.7336912155151367, "step": 2437} +{"train_info/time_between_train_steps": 0.003618955612182617, "step": 2437} +{"info/global_step": 2438, "train_info/time_within_train_step": 2.978764533996582, "step": 2438} +{"train_info/time_between_train_steps": 0.0036220550537109375, "step": 2438} +{"info/global_step": 2439, "train_info/time_within_train_step": 2.756225347518921, "step": 2439} +{"train_info/time_between_train_steps": 0.003612995147705078, "step": 2439} +{"info/global_step": 2440, "train_info/time_within_train_step": 2.700024366378784, "step": 2440} +{"train_info/time_between_train_steps": 0.003573179244995117, "step": 2440} +{"info/global_step": 2441, "train_info/time_within_train_step": 2.7003977298736572, "step": 2441} +{"train_info/time_between_train_steps": 0.003590822219848633, "step": 2441} +{"info/global_step": 2442, "train_info/time_within_train_step": 2.697260856628418, "step": 2442} +{"train_info/time_between_train_steps": 0.003611326217651367, "step": 2442} +{"info/global_step": 2443, "train_info/time_within_train_step": 2.698484182357788, "step": 2443} +{"train_info/time_between_train_steps": 0.0035119056701660156, "step": 2443} +{"info/global_step": 2444, "train_info/time_within_train_step": 2.6997079849243164, "step": 2444} +{"train_info/time_between_train_steps": 0.0035381317138671875, "step": 2444} +{"info/global_step": 2445, "train_info/time_within_train_step": 2.70060396194458, "step": 2445} +{"train_info/time_between_train_steps": 0.0036242008209228516, "step": 2445} +{"info/global_step": 2446, "train_info/time_within_train_step": 2.699246883392334, "step": 2446} +{"train_info/time_between_train_steps": 0.003623485565185547, "step": 2446} +{"info/global_step": 2447, "train_info/time_within_train_step": 2.6991467475891113, "step": 2447} +{"train_info/time_between_train_steps": 0.0036411285400390625, "step": 2447} +{"info/global_step": 2448, "train_info/time_within_train_step": 2.7017014026641846, "step": 2448} +{"train_info/time_between_train_steps": 0.0036308765411376953, "step": 2448} +{"info/global_step": 2449, "train_info/time_within_train_step": 2.7048799991607666, "step": 2449} +{"train_info/time_between_train_steps": 0.0037500858306884766, "step": 2449} +{"info/global_step": 2450, "train_info/time_within_train_step": 2.821833848953247, "step": 2450} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746293605, "_runtime": 7627}, "step": 2450} +{"logs": {"train/loss": 4.5283, "train/learning_rate": 0.00012222222222222221, "train/epoch": 3.06, "_timestamp": 1746293605, "_runtime": 7627}, "step": 2450} +{"train_info/time_between_train_steps": 0.0253448486328125, "step": 2450} +{"info/global_step": 2451, "train_info/time_within_train_step": 2.7735722064971924, "step": 2451} +{"train_info/time_between_train_steps": 0.004059791564941406, "step": 2451} +{"info/global_step": 2452, "train_info/time_within_train_step": 2.739762783050537, "step": 2452} +{"train_info/time_between_train_steps": 0.0038843154907226562, "step": 2452} +{"info/global_step": 2453, "train_info/time_within_train_step": 2.702892303466797, "step": 2453} +{"train_info/time_between_train_steps": 0.004179239273071289, "step": 2453} +{"info/global_step": 2454, "train_info/time_within_train_step": 2.701427936553955, "step": 2454} +{"train_info/time_between_train_steps": 0.003833293914794922, "step": 2454} +{"info/global_step": 2455, "train_info/time_within_train_step": 2.7004055976867676, "step": 2455} +{"train_info/time_between_train_steps": 0.003827333450317383, "step": 2455} +{"info/global_step": 2456, "train_info/time_within_train_step": 2.6988437175750732, "step": 2456} +{"train_info/time_between_train_steps": 0.0038602352142333984, "step": 2456} +{"info/global_step": 2457, "train_info/time_within_train_step": 2.699272632598877, "step": 2457} +{"train_info/time_between_train_steps": 0.003928422927856445, "step": 2457} +{"info/global_step": 2458, "train_info/time_within_train_step": 2.7011635303497314, "step": 2458} +{"train_info/time_between_train_steps": 0.0039026737213134766, "step": 2458} +{"info/global_step": 2459, "train_info/time_within_train_step": 2.700934886932373, "step": 2459} +{"train_info/time_between_train_steps": 0.003816843032836914, "step": 2459} +{"info/global_step": 2460, "train_info/time_within_train_step": 2.701573133468628, "step": 2460} +{"train_info/time_between_train_steps": 0.003953456878662109, "step": 2460} +{"info/global_step": 2461, "train_info/time_within_train_step": 2.7595291137695312, "step": 2461} +{"train_info/time_between_train_steps": 0.0037856101989746094, "step": 2461} +{"info/global_step": 2462, "train_info/time_within_train_step": 2.9710097312927246, "step": 2462} +{"train_info/time_between_train_steps": 0.003677845001220703, "step": 2462} +{"info/global_step": 2463, "train_info/time_within_train_step": 2.6985690593719482, "step": 2463} +{"train_info/time_between_train_steps": 0.003660917282104492, "step": 2463} +{"info/global_step": 2464, "train_info/time_within_train_step": 2.6980605125427246, "step": 2464} +{"train_info/time_between_train_steps": 0.003679990768432617, "step": 2464} +{"info/global_step": 2465, "train_info/time_within_train_step": 2.7010579109191895, "step": 2465} +{"train_info/time_between_train_steps": 0.003690481185913086, "step": 2465} +{"info/global_step": 2466, "train_info/time_within_train_step": 2.6999876499176025, "step": 2466} +{"train_info/time_between_train_steps": 0.0037598609924316406, "step": 2466} +{"info/global_step": 2467, "train_info/time_within_train_step": 2.700446367263794, "step": 2467} +{"train_info/time_between_train_steps": 0.003686666488647461, "step": 2467} +{"info/global_step": 2468, "train_info/time_within_train_step": 2.700342893600464, "step": 2468} +{"train_info/time_between_train_steps": 0.0037789344787597656, "step": 2468} +{"info/global_step": 2469, "train_info/time_within_train_step": 2.723618984222412, "step": 2469} +{"train_info/time_between_train_steps": 0.003690958023071289, "step": 2469} +{"info/global_step": 2470, "train_info/time_within_train_step": 2.82055401802063, "step": 2470} +{"train_info/time_between_train_steps": 0.003644704818725586, "step": 2470} +{"info/global_step": 2471, "train_info/time_within_train_step": 3.067905902862549, "step": 2471} +{"train_info/time_between_train_steps": 0.003573894500732422, "step": 2471} +{"info/global_step": 2472, "train_info/time_within_train_step": 2.6988608837127686, "step": 2472} +{"train_info/time_between_train_steps": 0.0035979747772216797, "step": 2472} +{"info/global_step": 2473, "train_info/time_within_train_step": 2.6990222930908203, "step": 2473} +{"train_info/time_between_train_steps": 0.003673553466796875, "step": 2473} +{"info/global_step": 2474, "train_info/time_within_train_step": 2.6983747482299805, "step": 2474} +{"train_info/time_between_train_steps": 0.003875255584716797, "step": 2474} +{"info/global_step": 2475, "train_info/time_within_train_step": 2.7006897926330566, "step": 2475} +{"train_info/time_between_train_steps": 0.003922462463378906, "step": 2475} +{"info/global_step": 2476, "train_info/time_within_train_step": 2.702545404434204, "step": 2476} +{"train_info/time_between_train_steps": 0.003924131393432617, "step": 2476} +{"info/global_step": 2477, "train_info/time_within_train_step": 2.701167345046997, "step": 2477} +{"train_info/time_between_train_steps": 0.003953456878662109, "step": 2477} +{"info/global_step": 2478, "train_info/time_within_train_step": 2.7004377841949463, "step": 2478} +{"train_info/time_between_train_steps": 0.003894329071044922, "step": 2478} +{"info/global_step": 2479, "train_info/time_within_train_step": 2.7003109455108643, "step": 2479} +{"train_info/time_between_train_steps": 0.003965616226196289, "step": 2479} +{"info/global_step": 2480, "train_info/time_within_train_step": 2.6994521617889404, "step": 2480} +{"train_info/time_between_train_steps": 0.003885507583618164, "step": 2480} +{"info/global_step": 2481, "train_info/time_within_train_step": 2.6981825828552246, "step": 2481} +{"train_info/time_between_train_steps": 0.003878355026245117, "step": 2481} +{"info/global_step": 2482, "train_info/time_within_train_step": 2.702582836151123, "step": 2482} +{"train_info/time_between_train_steps": 0.004054069519042969, "step": 2482} +{"info/global_step": 2483, "train_info/time_within_train_step": 2.701834201812744, "step": 2483} +{"train_info/time_between_train_steps": 0.003973960876464844, "step": 2483} +{"info/global_step": 2484, "train_info/time_within_train_step": 2.701066255569458, "step": 2484} +{"train_info/time_between_train_steps": 0.003871440887451172, "step": 2484} +{"info/global_step": 2485, "train_info/time_within_train_step": 2.699937343597412, "step": 2485} +{"train_info/time_between_train_steps": 0.0038123130798339844, "step": 2485} +{"info/global_step": 2486, "train_info/time_within_train_step": 2.7016890048980713, "step": 2486} +{"train_info/time_between_train_steps": 0.0038466453552246094, "step": 2486} +{"info/global_step": 2487, "train_info/time_within_train_step": 2.7001020908355713, "step": 2487} +{"train_info/time_between_train_steps": 0.003852367401123047, "step": 2487} +{"info/global_step": 2488, "train_info/time_within_train_step": 2.700270652770996, "step": 2488} +{"train_info/time_between_train_steps": 0.003935337066650391, "step": 2488} +{"info/global_step": 2489, "train_info/time_within_train_step": 2.699486017227173, "step": 2489} +{"train_info/time_between_train_steps": 0.0038788318634033203, "step": 2489} +{"info/global_step": 2490, "train_info/time_within_train_step": 2.6991984844207764, "step": 2490} +{"train_info/time_between_train_steps": 0.004042148590087891, "step": 2490} +{"info/global_step": 2491, "train_info/time_within_train_step": 2.6995162963867188, "step": 2491} +{"train_info/time_between_train_steps": 0.003843545913696289, "step": 2491} +{"info/global_step": 2492, "train_info/time_within_train_step": 2.6986136436462402, "step": 2492} +{"train_info/time_between_train_steps": 0.003810882568359375, "step": 2492} +{"info/global_step": 2493, "train_info/time_within_train_step": 2.699932813644409, "step": 2493} +{"train_info/time_between_train_steps": 0.00386810302734375, "step": 2493} +{"info/global_step": 2494, "train_info/time_within_train_step": 2.6998744010925293, "step": 2494} +{"train_info/time_between_train_steps": 0.003856182098388672, "step": 2494} +{"info/global_step": 2495, "train_info/time_within_train_step": 2.6999351978302, "step": 2495} +{"train_info/time_between_train_steps": 0.0039098262786865234, "step": 2495} +{"info/global_step": 2496, "train_info/time_within_train_step": 2.701221466064453, "step": 2496} +{"train_info/time_between_train_steps": 0.003834247589111328, "step": 2496} +{"info/global_step": 2497, "train_info/time_within_train_step": 2.701122522354126, "step": 2497} +{"train_info/time_between_train_steps": 0.003816843032836914, "step": 2497} +{"info/global_step": 2498, "train_info/time_within_train_step": 2.7017364501953125, "step": 2498} +{"train_info/time_between_train_steps": 0.0038788318634033203, "step": 2498} +{"info/global_step": 2499, "train_info/time_within_train_step": 3.283613443374634, "step": 2499} +{"train_info/time_between_train_steps": 0.003918886184692383, "step": 2499} +{"info/global_step": 2500, "train_info/time_within_train_step": 2.7003014087677, "step": 2500} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746293744, "_runtime": 7766}, "step": 2500} +{"logs": {"train/loss": 4.5213, "train/learning_rate": 0.00011111111111111109, "train/epoch": 3.08, "_timestamp": 1746293744, "_runtime": 7766}, "step": 2500} +{"train_info/time_between_train_steps": 16.781566381454468, "step": 2500} +{"info/global_step": 2501, "train_info/time_within_train_step": 2.5012588500976562, "step": 2501} +{"train_info/time_between_train_steps": 0.0038232803344726562, "step": 2501} +{"info/global_step": 2502, "train_info/time_within_train_step": 2.500131130218506, "step": 2502} +{"train_info/time_between_train_steps": 0.003870248794555664, "step": 2502} +{"info/global_step": 2503, "train_info/time_within_train_step": 2.67529559135437, "step": 2503} +{"train_info/time_between_train_steps": 0.003999948501586914, "step": 2503} +{"info/global_step": 2504, "train_info/time_within_train_step": 2.8630573749542236, "step": 2504} +{"train_info/time_between_train_steps": 0.003854990005493164, "step": 2504} +{"info/global_step": 2505, "train_info/time_within_train_step": 2.6977274417877197, "step": 2505} +{"train_info/time_between_train_steps": 0.003830432891845703, "step": 2505} +{"info/global_step": 2506, "train_info/time_within_train_step": 2.6940619945526123, "step": 2506} +{"train_info/time_between_train_steps": 0.003805875778198242, "step": 2506} +{"info/global_step": 2507, "train_info/time_within_train_step": 2.696603536605835, "step": 2507} +{"train_info/time_between_train_steps": 0.0037431716918945312, "step": 2507} +{"info/global_step": 2508, "train_info/time_within_train_step": 2.6981911659240723, "step": 2508} +{"train_info/time_between_train_steps": 0.003694772720336914, "step": 2508} +{"info/global_step": 2509, "train_info/time_within_train_step": 2.845960855484009, "step": 2509} +{"train_info/time_between_train_steps": 0.003794431686401367, "step": 2509} +{"info/global_step": 2510, "train_info/time_within_train_step": 2.9357762336730957, "step": 2510} +{"train_info/time_between_train_steps": 0.0037834644317626953, "step": 2510} +{"info/global_step": 2511, "train_info/time_within_train_step": 3.050614595413208, "step": 2511} +{"train_info/time_between_train_steps": 0.003755807876586914, "step": 2511} +{"info/global_step": 2512, "train_info/time_within_train_step": 2.7201712131500244, "step": 2512} +{"train_info/time_between_train_steps": 0.003825664520263672, "step": 2512} +{"info/global_step": 2513, "train_info/time_within_train_step": 2.6991209983825684, "step": 2513} +{"train_info/time_between_train_steps": 0.0038242340087890625, "step": 2513} +{"info/global_step": 2514, "train_info/time_within_train_step": 2.699096918106079, "step": 2514} +{"train_info/time_between_train_steps": 0.003803253173828125, "step": 2514} +{"info/global_step": 2515, "train_info/time_within_train_step": 2.698012590408325, "step": 2515} +{"train_info/time_between_train_steps": 0.003787994384765625, "step": 2515} +{"info/global_step": 2516, "train_info/time_within_train_step": 2.698113203048706, "step": 2516} +{"train_info/time_between_train_steps": 0.0038182735443115234, "step": 2516} +{"info/global_step": 2517, "train_info/time_within_train_step": 2.6984996795654297, "step": 2517} +{"train_info/time_between_train_steps": 0.0038063526153564453, "step": 2517} +{"info/global_step": 2518, "train_info/time_within_train_step": 2.698982000350952, "step": 2518} +{"train_info/time_between_train_steps": 0.003927946090698242, "step": 2518} +{"info/global_step": 2519, "train_info/time_within_train_step": 2.7020926475524902, "step": 2519} +{"train_info/time_between_train_steps": 0.003890514373779297, "step": 2519} +{"info/global_step": 2520, "train_info/time_within_train_step": 2.701371669769287, "step": 2520} +{"train_info/time_between_train_steps": 0.003930330276489258, "step": 2520} +{"info/global_step": 2521, "train_info/time_within_train_step": 2.7016608715057373, "step": 2521} +{"train_info/time_between_train_steps": 0.003948211669921875, "step": 2521} +{"info/global_step": 2522, "train_info/time_within_train_step": 2.7103352546691895, "step": 2522} +{"train_info/time_between_train_steps": 0.003915548324584961, "step": 2522} +{"info/global_step": 2523, "train_info/time_within_train_step": 2.972109079360962, "step": 2523} +{"train_info/time_between_train_steps": 0.003937959671020508, "step": 2523} +{"info/global_step": 2524, "train_info/time_within_train_step": 2.853336811065674, "step": 2524} +{"train_info/time_between_train_steps": 0.1808149814605713, "step": 2524} +{"info/global_step": 2525, "train_info/time_within_train_step": 2.7003400325775146, "step": 2525} +{"train_info/time_between_train_steps": 0.0037877559661865234, "step": 2525} +{"info/global_step": 2526, "train_info/time_within_train_step": 2.6996054649353027, "step": 2526} +{"train_info/time_between_train_steps": 0.003808259963989258, "step": 2526} +{"info/global_step": 2527, "train_info/time_within_train_step": 2.701308250427246, "step": 2527} +{"train_info/time_between_train_steps": 0.0037872791290283203, "step": 2527} +{"info/global_step": 2528, "train_info/time_within_train_step": 2.700106143951416, "step": 2528} +{"train_info/time_between_train_steps": 0.0037262439727783203, "step": 2528} +{"info/global_step": 2529, "train_info/time_within_train_step": 2.699406862258911, "step": 2529} +{"train_info/time_between_train_steps": 0.0037381649017333984, "step": 2529} +{"info/global_step": 2530, "train_info/time_within_train_step": 2.7010059356689453, "step": 2530} +{"train_info/time_between_train_steps": 0.003730297088623047, "step": 2530} +{"info/global_step": 2531, "train_info/time_within_train_step": 2.6995396614074707, "step": 2531} +{"train_info/time_between_train_steps": 0.0037508010864257812, "step": 2531} +{"info/global_step": 2532, "train_info/time_within_train_step": 2.701504945755005, "step": 2532} +{"train_info/time_between_train_steps": 0.003729581832885742, "step": 2532} +{"info/global_step": 2533, "train_info/time_within_train_step": 3.079174280166626, "step": 2533} +{"train_info/time_between_train_steps": 0.003688812255859375, "step": 2533} +{"info/global_step": 2534, "train_info/time_within_train_step": 2.6978707313537598, "step": 2534} +{"train_info/time_between_train_steps": 0.003730297088623047, "step": 2534} +{"info/global_step": 2535, "train_info/time_within_train_step": 2.695263385772705, "step": 2535} +{"train_info/time_between_train_steps": 0.0036766529083251953, "step": 2535} +{"info/global_step": 2536, "train_info/time_within_train_step": 2.695263624191284, "step": 2536} +{"train_info/time_between_train_steps": 0.003692626953125, "step": 2536} +{"info/global_step": 2537, "train_info/time_within_train_step": 2.696235179901123, "step": 2537} +{"train_info/time_between_train_steps": 0.003747224807739258, "step": 2537} +{"info/global_step": 2538, "train_info/time_within_train_step": 2.697659492492676, "step": 2538} +{"train_info/time_between_train_steps": 0.003735780715942383, "step": 2538} +{"info/global_step": 2539, "train_info/time_within_train_step": 2.6974828243255615, "step": 2539} +{"train_info/time_between_train_steps": 0.003715038299560547, "step": 2539} +{"info/global_step": 2540, "train_info/time_within_train_step": 2.6976444721221924, "step": 2540} +{"train_info/time_between_train_steps": 0.0038099288940429688, "step": 2540} +{"info/global_step": 2541, "train_info/time_within_train_step": 2.697864055633545, "step": 2541} +{"train_info/time_between_train_steps": 0.0037262439727783203, "step": 2541} +{"info/global_step": 2542, "train_info/time_within_train_step": 2.6984825134277344, "step": 2542} +{"train_info/time_between_train_steps": 0.0037674903869628906, "step": 2542} +{"info/global_step": 2543, "train_info/time_within_train_step": 2.698998212814331, "step": 2543} +{"train_info/time_between_train_steps": 0.003719329833984375, "step": 2543} +{"info/global_step": 2544, "train_info/time_within_train_step": 2.697946786880493, "step": 2544} +{"train_info/time_between_train_steps": 0.0037183761596679688, "step": 2544} +{"info/global_step": 2545, "train_info/time_within_train_step": 2.6982884407043457, "step": 2545} +{"train_info/time_between_train_steps": 0.0037033557891845703, "step": 2545} +{"info/global_step": 2546, "train_info/time_within_train_step": 2.696359395980835, "step": 2546} +{"train_info/time_between_train_steps": 0.003735780715942383, "step": 2546} +{"info/global_step": 2547, "train_info/time_within_train_step": 2.698437452316284, "step": 2547} +{"train_info/time_between_train_steps": 0.0037581920623779297, "step": 2547} +{"info/global_step": 2548, "train_info/time_within_train_step": 2.699551582336426, "step": 2548} +{"train_info/time_between_train_steps": 0.00394892692565918, "step": 2548} +{"info/global_step": 2549, "train_info/time_within_train_step": 2.6986873149871826, "step": 2549} +{"train_info/time_between_train_steps": 0.0037963390350341797, "step": 2549} +{"info/global_step": 2550, "train_info/time_within_train_step": 2.7001898288726807, "step": 2550} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746293903, "_runtime": 7925}, "step": 2550} +{"logs": {"train/loss": 4.49, "train/learning_rate": 9.999999999999999e-05, "train/epoch": 3.09, "_timestamp": 1746293903, "_runtime": 7925}, "step": 2550} +{"train_info/time_between_train_steps": 0.02450251579284668, "step": 2550} +{"info/global_step": 2551, "train_info/time_within_train_step": 2.70058274269104, "step": 2551} +{"train_info/time_between_train_steps": 0.0039370059967041016, "step": 2551} +{"info/global_step": 2552, "train_info/time_within_train_step": 2.696892261505127, "step": 2552} +{"train_info/time_between_train_steps": 0.003979206085205078, "step": 2552} +{"info/global_step": 2553, "train_info/time_within_train_step": 2.701122999191284, "step": 2553} +{"train_info/time_between_train_steps": 0.0039825439453125, "step": 2553} +{"info/global_step": 2554, "train_info/time_within_train_step": 2.701125144958496, "step": 2554} +{"train_info/time_between_train_steps": 0.004029512405395508, "step": 2554} +{"info/global_step": 2555, "train_info/time_within_train_step": 2.700411796569824, "step": 2555} +{"train_info/time_between_train_steps": 0.003977537155151367, "step": 2555} +{"info/global_step": 2556, "train_info/time_within_train_step": 2.7014429569244385, "step": 2556} +{"train_info/time_between_train_steps": 0.003963470458984375, "step": 2556} +{"info/global_step": 2557, "train_info/time_within_train_step": 2.701258420944214, "step": 2557} +{"train_info/time_between_train_steps": 0.004003047943115234, "step": 2557} +{"info/global_step": 2558, "train_info/time_within_train_step": 3.0920450687408447, "step": 2558} +{"train_info/time_between_train_steps": 0.003572702407836914, "step": 2558} +{"info/global_step": 2559, "train_info/time_within_train_step": 2.698206901550293, "step": 2559} +{"train_info/time_between_train_steps": 0.0035369396209716797, "step": 2559} +{"info/global_step": 2560, "train_info/time_within_train_step": 2.697514533996582, "step": 2560} +{"train_info/time_between_train_steps": 0.003643035888671875, "step": 2560} +{"info/global_step": 2561, "train_info/time_within_train_step": 2.6982343196868896, "step": 2561} +{"train_info/time_between_train_steps": 0.003588438034057617, "step": 2561} +{"info/global_step": 2562, "train_info/time_within_train_step": 2.711372137069702, "step": 2562} +{"train_info/time_between_train_steps": 0.003664255142211914, "step": 2562} +{"info/global_step": 2563, "train_info/time_within_train_step": 2.773686647415161, "step": 2563} +{"train_info/time_between_train_steps": 0.003874540328979492, "step": 2563} +{"info/global_step": 2564, "train_info/time_within_train_step": 2.935506820678711, "step": 2564} +{"train_info/time_between_train_steps": 0.003577709197998047, "step": 2564} +{"info/global_step": 2565, "train_info/time_within_train_step": 2.7032222747802734, "step": 2565} +{"train_info/time_between_train_steps": 0.0035543441772460938, "step": 2565} +{"info/global_step": 2566, "train_info/time_within_train_step": 2.6982131004333496, "step": 2566} +{"train_info/time_between_train_steps": 0.003560304641723633, "step": 2566} +{"info/global_step": 2567, "train_info/time_within_train_step": 2.69710111618042, "step": 2567} +{"train_info/time_between_train_steps": 0.003574371337890625, "step": 2567} +{"info/global_step": 2568, "train_info/time_within_train_step": 2.6977250576019287, "step": 2568} +{"train_info/time_between_train_steps": 0.0035347938537597656, "step": 2568} +{"info/global_step": 2569, "train_info/time_within_train_step": 2.6974129676818848, "step": 2569} +{"train_info/time_between_train_steps": 0.0035505294799804688, "step": 2569} +{"info/global_step": 2570, "train_info/time_within_train_step": 2.697936534881592, "step": 2570} +{"train_info/time_between_train_steps": 0.003560781478881836, "step": 2570} +{"info/global_step": 2571, "train_info/time_within_train_step": 2.69852352142334, "step": 2571} +{"train_info/time_between_train_steps": 0.0035898685455322266, "step": 2571} +{"info/global_step": 2572, "train_info/time_within_train_step": 2.69844388961792, "step": 2572} +{"train_info/time_between_train_steps": 0.0035855770111083984, "step": 2572} +{"info/global_step": 2573, "train_info/time_within_train_step": 2.7004714012145996, "step": 2573} +{"train_info/time_between_train_steps": 0.0035598278045654297, "step": 2573} +{"info/global_step": 2574, "train_info/time_within_train_step": 2.6989521980285645, "step": 2574} +{"train_info/time_between_train_steps": 0.003528594970703125, "step": 2574} +{"info/global_step": 2575, "train_info/time_within_train_step": 2.717498540878296, "step": 2575} +{"train_info/time_between_train_steps": 0.0035605430603027344, "step": 2575} +{"info/global_step": 2576, "train_info/time_within_train_step": 2.8842554092407227, "step": 2576} +{"train_info/time_between_train_steps": 0.003635406494140625, "step": 2576} +{"info/global_step": 2577, "train_info/time_within_train_step": 2.726747989654541, "step": 2577} +{"train_info/time_between_train_steps": 0.003597259521484375, "step": 2577} +{"info/global_step": 2578, "train_info/time_within_train_step": 2.6986889839172363, "step": 2578} +{"train_info/time_between_train_steps": 0.0035555362701416016, "step": 2578} +{"info/global_step": 2579, "train_info/time_within_train_step": 2.6975080966949463, "step": 2579} +{"train_info/time_between_train_steps": 0.0035600662231445312, "step": 2579} +{"info/global_step": 2580, "train_info/time_within_train_step": 2.6975903511047363, "step": 2580} +{"train_info/time_between_train_steps": 0.0035088062286376953, "step": 2580} +{"info/global_step": 2581, "train_info/time_within_train_step": 2.7100749015808105, "step": 2581} +{"train_info/time_between_train_steps": 0.0036547183990478516, "step": 2581} +{"info/global_step": 2582, "train_info/time_within_train_step": 2.819253921508789, "step": 2582} +{"train_info/time_between_train_steps": 0.003544330596923828, "step": 2582} +{"info/global_step": 2583, "train_info/time_within_train_step": 2.7579236030578613, "step": 2583} +{"train_info/time_between_train_steps": 0.0035512447357177734, "step": 2583} +{"info/global_step": 2584, "train_info/time_within_train_step": 2.698556423187256, "step": 2584} +{"train_info/time_between_train_steps": 0.0035943984985351562, "step": 2584} +{"info/global_step": 2585, "train_info/time_within_train_step": 2.7167091369628906, "step": 2585} +{"train_info/time_between_train_steps": 0.0035848617553710938, "step": 2585} +{"info/global_step": 2586, "train_info/time_within_train_step": 2.726506233215332, "step": 2586} +{"train_info/time_between_train_steps": 0.0037381649017333984, "step": 2586} +{"info/global_step": 2587, "train_info/time_within_train_step": 2.861870527267456, "step": 2587} +{"train_info/time_between_train_steps": 0.003576993942260742, "step": 2587} +{"info/global_step": 2588, "train_info/time_within_train_step": 2.697309970855713, "step": 2588} +{"train_info/time_between_train_steps": 0.0035779476165771484, "step": 2588} +{"info/global_step": 2589, "train_info/time_within_train_step": 2.707007646560669, "step": 2589} +{"train_info/time_between_train_steps": 0.0035228729248046875, "step": 2589} +{"info/global_step": 2590, "train_info/time_within_train_step": 2.755993366241455, "step": 2590} +{"train_info/time_between_train_steps": 0.003587961196899414, "step": 2590} +{"info/global_step": 2591, "train_info/time_within_train_step": 2.6981871128082275, "step": 2591} +{"train_info/time_between_train_steps": 0.0035293102264404297, "step": 2591} +{"info/global_step": 2592, "train_info/time_within_train_step": 2.6982262134552, "step": 2592} +{"train_info/time_between_train_steps": 0.0035240650177001953, "step": 2592} +{"info/global_step": 2593, "train_info/time_within_train_step": 2.698763370513916, "step": 2593} +{"train_info/time_between_train_steps": 0.003650188446044922, "step": 2593} +{"info/global_step": 2594, "train_info/time_within_train_step": 2.7013158798217773, "step": 2594} +{"train_info/time_between_train_steps": 0.003580331802368164, "step": 2594} +{"info/global_step": 2595, "train_info/time_within_train_step": 2.7794971466064453, "step": 2595} +{"train_info/time_between_train_steps": 0.003606557846069336, "step": 2595} +{"info/global_step": 2596, "train_info/time_within_train_step": 2.739377737045288, "step": 2596} +{"train_info/time_between_train_steps": 0.003616809844970703, "step": 2596} +{"info/global_step": 2597, "train_info/time_within_train_step": 2.700770616531372, "step": 2597} +{"train_info/time_between_train_steps": 0.0036919116973876953, "step": 2597} +{"info/global_step": 2598, "train_info/time_within_train_step": 2.701713800430298, "step": 2598} +{"train_info/time_between_train_steps": 0.00365447998046875, "step": 2598} +{"info/global_step": 2599, "train_info/time_within_train_step": 2.725321054458618, "step": 2599} +{"train_info/time_between_train_steps": 0.003835916519165039, "step": 2599} +{"info/global_step": 2600, "train_info/time_within_train_step": 2.72572660446167, "step": 2600} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746294042, "_runtime": 8064}, "step": 2600} +{"logs": {"train/loss": 4.4891, "train/learning_rate": 8.888888888888888e-05, "train/epoch": 3.11, "_timestamp": 1746294042, "_runtime": 8064}, "step": 2600} +{"train_info/time_between_train_steps": 17.264835596084595, "step": 2600} +{"info/global_step": 2601, "train_info/time_within_train_step": 2.49346661567688, "step": 2601} +{"train_info/time_between_train_steps": 0.004763603210449219, "step": 2601} +{"info/global_step": 2602, "train_info/time_within_train_step": 2.4898593425750732, "step": 2602} +{"train_info/time_between_train_steps": 0.004105806350708008, "step": 2602} +{"info/global_step": 2603, "train_info/time_within_train_step": 2.678424119949341, "step": 2603} +{"train_info/time_between_train_steps": 0.004000425338745117, "step": 2603} +{"info/global_step": 2604, "train_info/time_within_train_step": 2.696514129638672, "step": 2604} +{"train_info/time_between_train_steps": 0.0039670467376708984, "step": 2604} +{"info/global_step": 2605, "train_info/time_within_train_step": 2.695780038833618, "step": 2605} +{"train_info/time_between_train_steps": 0.003964662551879883, "step": 2605} +{"info/global_step": 2606, "train_info/time_within_train_step": 2.6978087425231934, "step": 2606} +{"train_info/time_between_train_steps": 0.003901243209838867, "step": 2606} +{"info/global_step": 2607, "train_info/time_within_train_step": 2.69877552986145, "step": 2607} +{"train_info/time_between_train_steps": 0.003911733627319336, "step": 2607} +{"info/global_step": 2608, "train_info/time_within_train_step": 2.7018673419952393, "step": 2608} +{"train_info/time_between_train_steps": 0.0039060115814208984, "step": 2608} +{"info/global_step": 2609, "train_info/time_within_train_step": 2.919645309448242, "step": 2609} +{"train_info/time_between_train_steps": 0.003949642181396484, "step": 2609} +{"info/global_step": 2610, "train_info/time_within_train_step": 2.733623504638672, "step": 2610} +{"train_info/time_between_train_steps": 0.0039424896240234375, "step": 2610} +{"info/global_step": 2611, "train_info/time_within_train_step": 2.7044100761413574, "step": 2611} +{"train_info/time_between_train_steps": 0.003843545913696289, "step": 2611} +{"info/global_step": 2612, "train_info/time_within_train_step": 2.698611259460449, "step": 2612} +{"train_info/time_between_train_steps": 0.0038983821868896484, "step": 2612} +{"info/global_step": 2613, "train_info/time_within_train_step": 2.6984260082244873, "step": 2613} +{"train_info/time_between_train_steps": 0.0038242340087890625, "step": 2613} +{"info/global_step": 2614, "train_info/time_within_train_step": 2.6996757984161377, "step": 2614} +{"train_info/time_between_train_steps": 0.003960371017456055, "step": 2614} +{"info/global_step": 2615, "train_info/time_within_train_step": 2.6985023021698, "step": 2615} +{"train_info/time_between_train_steps": 0.003902435302734375, "step": 2615} +{"info/global_step": 2616, "train_info/time_within_train_step": 2.699732542037964, "step": 2616} +{"train_info/time_between_train_steps": 0.0038917064666748047, "step": 2616} +{"info/global_step": 2617, "train_info/time_within_train_step": 2.7563774585723877, "step": 2617} +{"train_info/time_between_train_steps": 0.007308244705200195, "step": 2617} +{"info/global_step": 2618, "train_info/time_within_train_step": 2.713479518890381, "step": 2618} +{"train_info/time_between_train_steps": 0.0038335323333740234, "step": 2618} +{"info/global_step": 2619, "train_info/time_within_train_step": 3.0938162803649902, "step": 2619} +{"train_info/time_between_train_steps": 0.00419926643371582, "step": 2619} +{"info/global_step": 2620, "train_info/time_within_train_step": 2.6992008686065674, "step": 2620} +{"train_info/time_between_train_steps": 0.0035982131958007812, "step": 2620} +{"info/global_step": 2621, "train_info/time_within_train_step": 2.697960615158081, "step": 2621} +{"train_info/time_between_train_steps": 0.0036215782165527344, "step": 2621} +{"info/global_step": 2622, "train_info/time_within_train_step": 2.6993248462677, "step": 2622} +{"train_info/time_between_train_steps": 0.003607511520385742, "step": 2622} +{"info/global_step": 2623, "train_info/time_within_train_step": 2.6987311840057373, "step": 2623} +{"train_info/time_between_train_steps": 0.0036339759826660156, "step": 2623} +{"info/global_step": 2624, "train_info/time_within_train_step": 2.703805446624756, "step": 2624} +{"train_info/time_between_train_steps": 0.0037941932678222656, "step": 2624} +{"info/global_step": 2625, "train_info/time_within_train_step": 2.701106309890747, "step": 2625} +{"train_info/time_between_train_steps": 0.003863096237182617, "step": 2625} +{"info/global_step": 2626, "train_info/time_within_train_step": 2.7416486740112305, "step": 2626} +{"train_info/time_between_train_steps": 0.003998994827270508, "step": 2626} +{"info/global_step": 2627, "train_info/time_within_train_step": 2.7232699394226074, "step": 2627} +{"train_info/time_between_train_steps": 0.003782033920288086, "step": 2627} +{"info/global_step": 2628, "train_info/time_within_train_step": 2.6988637447357178, "step": 2628} +{"train_info/time_between_train_steps": 0.0041675567626953125, "step": 2628} +{"info/global_step": 2629, "train_info/time_within_train_step": 2.6986396312713623, "step": 2629} +{"train_info/time_between_train_steps": 0.003974437713623047, "step": 2629} +{"info/global_step": 2630, "train_info/time_within_train_step": 2.7010498046875, "step": 2630} +{"train_info/time_between_train_steps": 0.004168272018432617, "step": 2630} +{"info/global_step": 2631, "train_info/time_within_train_step": 2.701775312423706, "step": 2631} +{"train_info/time_between_train_steps": 0.0039670467376708984, "step": 2631} +{"info/global_step": 2632, "train_info/time_within_train_step": 2.7367398738861084, "step": 2632} +{"train_info/time_between_train_steps": 0.003993988037109375, "step": 2632} +{"info/global_step": 2633, "train_info/time_within_train_step": 2.840278387069702, "step": 2633} +{"train_info/time_between_train_steps": 0.0040171146392822266, "step": 2633} +{"info/global_step": 2634, "train_info/time_within_train_step": 2.743342399597168, "step": 2634} +{"train_info/time_between_train_steps": 0.003982067108154297, "step": 2634} +{"info/global_step": 2635, "train_info/time_within_train_step": 2.7002429962158203, "step": 2635} +{"train_info/time_between_train_steps": 0.00406336784362793, "step": 2635} +{"info/global_step": 2636, "train_info/time_within_train_step": 2.6995797157287598, "step": 2636} +{"train_info/time_between_train_steps": 0.003945112228393555, "step": 2636} +{"info/global_step": 2637, "train_info/time_within_train_step": 2.707263231277466, "step": 2637} +{"train_info/time_between_train_steps": 0.003918647766113281, "step": 2637} +{"info/global_step": 2638, "train_info/time_within_train_step": 2.7211852073669434, "step": 2638} +{"train_info/time_between_train_steps": 0.0038309097290039062, "step": 2638} +{"info/global_step": 2639, "train_info/time_within_train_step": 2.6985695362091064, "step": 2639} +{"train_info/time_between_train_steps": 0.003858327865600586, "step": 2639} +{"info/global_step": 2640, "train_info/time_within_train_step": 2.706843376159668, "step": 2640} +{"train_info/time_between_train_steps": 0.0038366317749023438, "step": 2640} +{"info/global_step": 2641, "train_info/time_within_train_step": 2.7136123180389404, "step": 2641} +{"train_info/time_between_train_steps": 0.0037567615509033203, "step": 2641} +{"info/global_step": 2642, "train_info/time_within_train_step": 2.706022262573242, "step": 2642} +{"train_info/time_between_train_steps": 0.003907918930053711, "step": 2642} +{"info/global_step": 2643, "train_info/time_within_train_step": 2.698915719985962, "step": 2643} +{"train_info/time_between_train_steps": 0.0039615631103515625, "step": 2643} +{"info/global_step": 2644, "train_info/time_within_train_step": 2.699920892715454, "step": 2644} +{"train_info/time_between_train_steps": 0.003856658935546875, "step": 2644} +{"info/global_step": 2645, "train_info/time_within_train_step": 2.717740535736084, "step": 2645} +{"train_info/time_between_train_steps": 0.003844022750854492, "step": 2645} +{"info/global_step": 2646, "train_info/time_within_train_step": 2.7767107486724854, "step": 2646} +{"train_info/time_between_train_steps": 0.0038869380950927734, "step": 2646} +{"info/global_step": 2647, "train_info/time_within_train_step": 2.7050535678863525, "step": 2647} +{"train_info/time_between_train_steps": 0.0039038658142089844, "step": 2647} +{"info/global_step": 2648, "train_info/time_within_train_step": 2.6999151706695557, "step": 2648} +{"train_info/time_between_train_steps": 0.004096508026123047, "step": 2648} +{"info/global_step": 2649, "train_info/time_within_train_step": 2.831120491027832, "step": 2649} +{"train_info/time_between_train_steps": 0.16573476791381836, "step": 2649} +{"info/global_step": 2650, "train_info/time_within_train_step": 2.698624849319458, "step": 2650} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746294198, "_runtime": 8220}, "step": 2650} +{"logs": {"train/loss": 4.4619, "train/learning_rate": 7.777777777777777e-05, "train/epoch": 3.13, "_timestamp": 1746294198, "_runtime": 8220}, "step": 2650} +{"train_info/time_between_train_steps": 0.02636575698852539, "step": 2650} +{"info/global_step": 2651, "train_info/time_within_train_step": 2.6989357471466064, "step": 2651} +{"train_info/time_between_train_steps": 0.0039010047912597656, "step": 2651} +{"info/global_step": 2652, "train_info/time_within_train_step": 2.706573247909546, "step": 2652} +{"train_info/time_between_train_steps": 0.003667593002319336, "step": 2652} +{"info/global_step": 2653, "train_info/time_within_train_step": 2.6987264156341553, "step": 2653} +{"train_info/time_between_train_steps": 0.0036830902099609375, "step": 2653} +{"info/global_step": 2654, "train_info/time_within_train_step": 2.6972153186798096, "step": 2654} +{"train_info/time_between_train_steps": 0.003749370574951172, "step": 2654} +{"info/global_step": 2655, "train_info/time_within_train_step": 2.69974422454834, "step": 2655} +{"train_info/time_between_train_steps": 0.0037364959716796875, "step": 2655} +{"info/global_step": 2656, "train_info/time_within_train_step": 2.698582887649536, "step": 2656} +{"train_info/time_between_train_steps": 0.0036847591400146484, "step": 2656} +{"info/global_step": 2657, "train_info/time_within_train_step": 2.697848320007324, "step": 2657} +{"train_info/time_between_train_steps": 0.003689289093017578, "step": 2657} +{"info/global_step": 2658, "train_info/time_within_train_step": 2.6983542442321777, "step": 2658} +{"train_info/time_between_train_steps": 0.0036194324493408203, "step": 2658} +{"info/global_step": 2659, "train_info/time_within_train_step": 2.6969046592712402, "step": 2659} +{"train_info/time_between_train_steps": 0.003638744354248047, "step": 2659} +{"info/global_step": 2660, "train_info/time_within_train_step": 2.6981704235076904, "step": 2660} +{"train_info/time_between_train_steps": 0.0037093162536621094, "step": 2660} +{"info/global_step": 2661, "train_info/time_within_train_step": 2.6994190216064453, "step": 2661} +{"train_info/time_between_train_steps": 0.003712177276611328, "step": 2661} +{"info/global_step": 2662, "train_info/time_within_train_step": 2.6991963386535645, "step": 2662} +{"train_info/time_between_train_steps": 0.0036852359771728516, "step": 2662} +{"info/global_step": 2663, "train_info/time_within_train_step": 2.6986286640167236, "step": 2663} +{"train_info/time_between_train_steps": 0.003707408905029297, "step": 2663} +{"info/global_step": 2664, "train_info/time_within_train_step": 2.7005202770233154, "step": 2664} +{"train_info/time_between_train_steps": 0.0037221908569335938, "step": 2664} +{"info/global_step": 2665, "train_info/time_within_train_step": 2.6977968215942383, "step": 2665} +{"train_info/time_between_train_steps": 0.003680706024169922, "step": 2665} +{"info/global_step": 2666, "train_info/time_within_train_step": 2.700437307357788, "step": 2666} +{"train_info/time_between_train_steps": 0.0036885738372802734, "step": 2666} +{"info/global_step": 2667, "train_info/time_within_train_step": 2.6981019973754883, "step": 2667} +{"train_info/time_between_train_steps": 0.0036470890045166016, "step": 2667} +{"info/global_step": 2668, "train_info/time_within_train_step": 2.6971638202667236, "step": 2668} +{"train_info/time_between_train_steps": 0.003756284713745117, "step": 2668} +{"info/global_step": 2669, "train_info/time_within_train_step": 2.7023305892944336, "step": 2669} +{"train_info/time_between_train_steps": 0.003757953643798828, "step": 2669} +{"info/global_step": 2670, "train_info/time_within_train_step": 2.702008008956909, "step": 2670} +{"train_info/time_between_train_steps": 0.003792285919189453, "step": 2670} +{"info/global_step": 2671, "train_info/time_within_train_step": 2.698683261871338, "step": 2671} +{"train_info/time_between_train_steps": 0.003751516342163086, "step": 2671} +{"info/global_step": 2672, "train_info/time_within_train_step": 2.697727918624878, "step": 2672} +{"train_info/time_between_train_steps": 0.0037488937377929688, "step": 2672} +{"info/global_step": 2673, "train_info/time_within_train_step": 3.062622547149658, "step": 2673} +{"train_info/time_between_train_steps": 0.0036551952362060547, "step": 2673} +{"info/global_step": 2674, "train_info/time_within_train_step": 2.696915626525879, "step": 2674} +{"train_info/time_between_train_steps": 0.003847837448120117, "step": 2674} +{"info/global_step": 2675, "train_info/time_within_train_step": 2.695770502090454, "step": 2675} +{"train_info/time_between_train_steps": 0.003822803497314453, "step": 2675} +{"info/global_step": 2676, "train_info/time_within_train_step": 2.6971435546875, "step": 2676} +{"train_info/time_between_train_steps": 0.003912448883056641, "step": 2676} +{"info/global_step": 2677, "train_info/time_within_train_step": 2.696390151977539, "step": 2677} +{"train_info/time_between_train_steps": 0.003817319869995117, "step": 2677} +{"info/global_step": 2678, "train_info/time_within_train_step": 2.695021629333496, "step": 2678} +{"train_info/time_between_train_steps": 0.0038733482360839844, "step": 2678} +{"info/global_step": 2679, "train_info/time_within_train_step": 2.697976589202881, "step": 2679} +{"train_info/time_between_train_steps": 0.003880739212036133, "step": 2679} +{"info/global_step": 2680, "train_info/time_within_train_step": 2.6982429027557373, "step": 2680} +{"train_info/time_between_train_steps": 0.0038444995880126953, "step": 2680} +{"info/global_step": 2681, "train_info/time_within_train_step": 2.6976428031921387, "step": 2681} +{"train_info/time_between_train_steps": 0.004063606262207031, "step": 2681} +{"info/global_step": 2682, "train_info/time_within_train_step": 2.6985023021698, "step": 2682} +{"train_info/time_between_train_steps": 0.003859996795654297, "step": 2682} +{"info/global_step": 2683, "train_info/time_within_train_step": 2.7001543045043945, "step": 2683} +{"train_info/time_between_train_steps": 0.0038568973541259766, "step": 2683} +{"info/global_step": 2684, "train_info/time_within_train_step": 2.697840690612793, "step": 2684} +{"train_info/time_between_train_steps": 0.0038404464721679688, "step": 2684} +{"info/global_step": 2685, "train_info/time_within_train_step": 2.6980059146881104, "step": 2685} +{"train_info/time_between_train_steps": 0.0038204193115234375, "step": 2685} +{"info/global_step": 2686, "train_info/time_within_train_step": 2.6992344856262207, "step": 2686} +{"train_info/time_between_train_steps": 0.003904104232788086, "step": 2686} +{"info/global_step": 2687, "train_info/time_within_train_step": 2.6979918479919434, "step": 2687} +{"train_info/time_between_train_steps": 0.003793954849243164, "step": 2687} +{"info/global_step": 2688, "train_info/time_within_train_step": 2.697284460067749, "step": 2688} +{"train_info/time_between_train_steps": 0.0038547515869140625, "step": 2688} +{"info/global_step": 2689, "train_info/time_within_train_step": 2.698714256286621, "step": 2689} +{"train_info/time_between_train_steps": 0.0038840770721435547, "step": 2689} +{"info/global_step": 2690, "train_info/time_within_train_step": 2.698847770690918, "step": 2690} +{"train_info/time_between_train_steps": 0.003823518753051758, "step": 2690} +{"info/global_step": 2691, "train_info/time_within_train_step": 2.70015811920166, "step": 2691} +{"train_info/time_between_train_steps": 0.0038187503814697266, "step": 2691} +{"info/global_step": 2692, "train_info/time_within_train_step": 2.6991043090820312, "step": 2692} +{"train_info/time_between_train_steps": 0.003832578659057617, "step": 2692} +{"info/global_step": 2693, "train_info/time_within_train_step": 2.698659896850586, "step": 2693} +{"train_info/time_between_train_steps": 0.003915309906005859, "step": 2693} +{"info/global_step": 2694, "train_info/time_within_train_step": 2.7005701065063477, "step": 2694} +{"train_info/time_between_train_steps": 0.0038590431213378906, "step": 2694} +{"info/global_step": 2695, "train_info/time_within_train_step": 2.700439929962158, "step": 2695} +{"train_info/time_between_train_steps": 0.0038280487060546875, "step": 2695} +{"info/global_step": 2696, "train_info/time_within_train_step": 2.703282117843628, "step": 2696} +{"train_info/time_between_train_steps": 0.0039556026458740234, "step": 2696} +{"info/global_step": 2697, "train_info/time_within_train_step": 2.7012863159179688, "step": 2697} +{"train_info/time_between_train_steps": 0.003954410552978516, "step": 2697} +{"info/global_step": 2698, "train_info/time_within_train_step": 2.701399087905884, "step": 2698} +{"train_info/time_between_train_steps": 0.0038661956787109375, "step": 2698} +{"info/global_step": 2699, "train_info/time_within_train_step": 2.7011468410491943, "step": 2699} +{"train_info/time_between_train_steps": 0.0038747787475585938, "step": 2699} +{"info/global_step": 2700, "train_info/time_within_train_step": 2.70137882232666, "step": 2700} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746294339, "_runtime": 8361}, "step": 2700} +{"logs": {"train/loss": 4.4552, "train/learning_rate": 6.666666666666666e-05, "train/epoch": 3.14, "_timestamp": 1746294339, "_runtime": 8361}, "step": 2700} +{"train_info/time_between_train_steps": 17.319241285324097, "step": 2700} +{"info/global_step": 2701, "train_info/time_within_train_step": 2.486294746398926, "step": 2701} +{"train_info/time_between_train_steps": 0.004061222076416016, "step": 2701} +{"info/global_step": 2702, "train_info/time_within_train_step": 2.514594078063965, "step": 2702} +{"train_info/time_between_train_steps": 0.004963874816894531, "step": 2702} +{"info/global_step": 2703, "train_info/time_within_train_step": 2.694093704223633, "step": 2703} +{"train_info/time_between_train_steps": 0.004048824310302734, "step": 2703} +{"info/global_step": 2704, "train_info/time_within_train_step": 2.7012786865234375, "step": 2704} +{"train_info/time_between_train_steps": 0.004052877426147461, "step": 2704} +{"info/global_step": 2705, "train_info/time_within_train_step": 2.697345495223999, "step": 2705} +{"train_info/time_between_train_steps": 0.004071474075317383, "step": 2705} +{"info/global_step": 2706, "train_info/time_within_train_step": 2.6981215476989746, "step": 2706} +{"train_info/time_between_train_steps": 0.003996610641479492, "step": 2706} +{"info/global_step": 2707, "train_info/time_within_train_step": 2.7157227993011475, "step": 2707} +{"train_info/time_between_train_steps": 0.004129171371459961, "step": 2707} +{"info/global_step": 2708, "train_info/time_within_train_step": 2.6990625858306885, "step": 2708} +{"train_info/time_between_train_steps": 0.0038690567016601562, "step": 2708} +{"info/global_step": 2709, "train_info/time_within_train_step": 2.822066068649292, "step": 2709} +{"train_info/time_between_train_steps": 0.0038623809814453125, "step": 2709} +{"info/global_step": 2710, "train_info/time_within_train_step": 2.90641450881958, "step": 2710} +{"train_info/time_between_train_steps": 0.003900289535522461, "step": 2710} +{"info/global_step": 2711, "train_info/time_within_train_step": 3.02780818939209, "step": 2711} +{"train_info/time_between_train_steps": 0.004143714904785156, "step": 2711} +{"info/global_step": 2712, "train_info/time_within_train_step": 2.7820491790771484, "step": 2712} +{"train_info/time_between_train_steps": 0.0039806365966796875, "step": 2712} +{"info/global_step": 2713, "train_info/time_within_train_step": 2.6988110542297363, "step": 2713} +{"train_info/time_between_train_steps": 0.00380706787109375, "step": 2713} +{"info/global_step": 2714, "train_info/time_within_train_step": 2.701030731201172, "step": 2714} +{"train_info/time_between_train_steps": 0.0041654109954833984, "step": 2714} +{"info/global_step": 2715, "train_info/time_within_train_step": 2.703688144683838, "step": 2715} +{"train_info/time_between_train_steps": 0.0045163631439208984, "step": 2715} +{"info/global_step": 2716, "train_info/time_within_train_step": 2.7014472484588623, "step": 2716} +{"train_info/time_between_train_steps": 0.0041730403900146484, "step": 2716} +{"info/global_step": 2717, "train_info/time_within_train_step": 3.087721347808838, "step": 2717} +{"train_info/time_between_train_steps": 0.004132270812988281, "step": 2717} +{"info/global_step": 2718, "train_info/time_within_train_step": 2.7026963233947754, "step": 2718} +{"train_info/time_between_train_steps": 0.004228830337524414, "step": 2718} +{"info/global_step": 2719, "train_info/time_within_train_step": 2.7007784843444824, "step": 2719} +{"train_info/time_between_train_steps": 0.00407719612121582, "step": 2719} +{"info/global_step": 2720, "train_info/time_within_train_step": 2.7119193077087402, "step": 2720} +{"train_info/time_between_train_steps": 0.003846883773803711, "step": 2720} +{"info/global_step": 2721, "train_info/time_within_train_step": 2.6986653804779053, "step": 2721} +{"train_info/time_between_train_steps": 0.00351715087890625, "step": 2721} +{"info/global_step": 2722, "train_info/time_within_train_step": 2.702880382537842, "step": 2722} +{"train_info/time_between_train_steps": 0.003657817840576172, "step": 2722} +{"info/global_step": 2723, "train_info/time_within_train_step": 2.7008166313171387, "step": 2723} +{"train_info/time_between_train_steps": 0.003660917282104492, "step": 2723} +{"info/global_step": 2724, "train_info/time_within_train_step": 2.6999804973602295, "step": 2724} +{"train_info/time_between_train_steps": 0.0035827159881591797, "step": 2724} +{"info/global_step": 2725, "train_info/time_within_train_step": 2.7011008262634277, "step": 2725} +{"train_info/time_between_train_steps": 0.0036439895629882812, "step": 2725} +{"info/global_step": 2726, "train_info/time_within_train_step": 2.70048451423645, "step": 2726} +{"train_info/time_between_train_steps": 0.0036187171936035156, "step": 2726} +{"info/global_step": 2727, "train_info/time_within_train_step": 2.701775550842285, "step": 2727} +{"train_info/time_between_train_steps": 0.0036017894744873047, "step": 2727} +{"info/global_step": 2728, "train_info/time_within_train_step": 2.7082016468048096, "step": 2728} +{"train_info/time_between_train_steps": 0.0035600662231445312, "step": 2728} +{"info/global_step": 2729, "train_info/time_within_train_step": 2.8299925327301025, "step": 2729} +{"train_info/time_between_train_steps": 0.0036215782165527344, "step": 2729} +{"info/global_step": 2730, "train_info/time_within_train_step": 2.945618152618408, "step": 2730} +{"train_info/time_between_train_steps": 0.0035812854766845703, "step": 2730} +{"info/global_step": 2731, "train_info/time_within_train_step": 2.7035207748413086, "step": 2731} +{"train_info/time_between_train_steps": 0.0036208629608154297, "step": 2731} +{"info/global_step": 2732, "train_info/time_within_train_step": 2.700378894805908, "step": 2732} +{"train_info/time_between_train_steps": 0.003609895706176758, "step": 2732} +{"info/global_step": 2733, "train_info/time_within_train_step": 2.6987884044647217, "step": 2733} +{"train_info/time_between_train_steps": 0.0035600662231445312, "step": 2733} +{"info/global_step": 2734, "train_info/time_within_train_step": 2.6999826431274414, "step": 2734} +{"train_info/time_between_train_steps": 0.003570556640625, "step": 2734} +{"info/global_step": 2735, "train_info/time_within_train_step": 2.699453830718994, "step": 2735} +{"train_info/time_between_train_steps": 0.0035605430603027344, "step": 2735} +{"info/global_step": 2736, "train_info/time_within_train_step": 2.6989691257476807, "step": 2736} +{"train_info/time_between_train_steps": 0.003529787063598633, "step": 2736} +{"info/global_step": 2737, "train_info/time_within_train_step": 2.699925422668457, "step": 2737} +{"train_info/time_between_train_steps": 0.0035164356231689453, "step": 2737} +{"info/global_step": 2738, "train_info/time_within_train_step": 2.701430082321167, "step": 2738} +{"train_info/time_between_train_steps": 0.008895158767700195, "step": 2738} +{"info/global_step": 2739, "train_info/time_within_train_step": 2.701154947280884, "step": 2739} +{"train_info/time_between_train_steps": 0.0034945011138916016, "step": 2739} +{"info/global_step": 2740, "train_info/time_within_train_step": 2.6995651721954346, "step": 2740} +{"train_info/time_between_train_steps": 0.0035691261291503906, "step": 2740} +{"info/global_step": 2741, "train_info/time_within_train_step": 2.700835943222046, "step": 2741} +{"train_info/time_between_train_steps": 0.0035338401794433594, "step": 2741} +{"info/global_step": 2742, "train_info/time_within_train_step": 2.7619102001190186, "step": 2742} +{"train_info/time_between_train_steps": 0.0035812854766845703, "step": 2742} +{"info/global_step": 2743, "train_info/time_within_train_step": 2.9163601398468018, "step": 2743} +{"train_info/time_between_train_steps": 0.009817361831665039, "step": 2743} +{"info/global_step": 2744, "train_info/time_within_train_step": 2.745415449142456, "step": 2744} +{"train_info/time_between_train_steps": 0.008738517761230469, "step": 2744} +{"info/global_step": 2745, "train_info/time_within_train_step": 2.7017428874969482, "step": 2745} +{"train_info/time_between_train_steps": 0.00899362564086914, "step": 2745} +{"info/global_step": 2746, "train_info/time_within_train_step": 2.713602304458618, "step": 2746} +{"train_info/time_between_train_steps": 0.003581523895263672, "step": 2746} +{"info/global_step": 2747, "train_info/time_within_train_step": 2.705481767654419, "step": 2747} +{"train_info/time_between_train_steps": 0.003509044647216797, "step": 2747} +{"info/global_step": 2748, "train_info/time_within_train_step": 2.7020230293273926, "step": 2748} +{"train_info/time_between_train_steps": 0.00842142105102539, "step": 2748} +{"info/global_step": 2749, "train_info/time_within_train_step": 3.2469732761383057, "step": 2749} +{"train_info/time_between_train_steps": 0.00363922119140625, "step": 2749} +{"info/global_step": 2750, "train_info/time_within_train_step": 2.7021591663360596, "step": 2750} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746294495, "_runtime": 8517}, "step": 2750} +{"logs": {"train/loss": 4.4394, "train/learning_rate": 5.5555555555555545e-05, "train/epoch": 3.16, "_timestamp": 1746294495, "_runtime": 8517}, "step": 2750} +{"train_info/time_between_train_steps": 0.11502504348754883, "step": 2750} +{"info/global_step": 2751, "train_info/time_within_train_step": 2.701700210571289, "step": 2751} +{"train_info/time_between_train_steps": 0.0036211013793945312, "step": 2751} +{"info/global_step": 2752, "train_info/time_within_train_step": 2.7014355659484863, "step": 2752} +{"train_info/time_between_train_steps": 0.008742094039916992, "step": 2752} +{"info/global_step": 2753, "train_info/time_within_train_step": 2.7001636028289795, "step": 2753} +{"train_info/time_between_train_steps": 0.008496522903442383, "step": 2753} +{"info/global_step": 2754, "train_info/time_within_train_step": 2.7010295391082764, "step": 2754} +{"train_info/time_between_train_steps": 0.008965492248535156, "step": 2754} +{"info/global_step": 2755, "train_info/time_within_train_step": 2.6994519233703613, "step": 2755} +{"train_info/time_between_train_steps": 0.007296085357666016, "step": 2755} +{"info/global_step": 2756, "train_info/time_within_train_step": 2.700756549835205, "step": 2756} +{"train_info/time_between_train_steps": 0.008656024932861328, "step": 2756} +{"info/global_step": 2757, "train_info/time_within_train_step": 2.6991443634033203, "step": 2757} +{"train_info/time_between_train_steps": 0.0035429000854492188, "step": 2757} +{"info/global_step": 2758, "train_info/time_within_train_step": 2.700054168701172, "step": 2758} +{"train_info/time_between_train_steps": 0.0036602020263671875, "step": 2758} +{"info/global_step": 2759, "train_info/time_within_train_step": 2.700451374053955, "step": 2759} +{"train_info/time_between_train_steps": 0.008822202682495117, "step": 2759} +{"info/global_step": 2760, "train_info/time_within_train_step": 2.701150894165039, "step": 2760} +{"train_info/time_between_train_steps": 0.008613348007202148, "step": 2760} +{"info/global_step": 2761, "train_info/time_within_train_step": 2.6999638080596924, "step": 2761} +{"train_info/time_between_train_steps": 0.008435964584350586, "step": 2761} +{"info/global_step": 2762, "train_info/time_within_train_step": 2.7000699043273926, "step": 2762} +{"train_info/time_between_train_steps": 0.003515958786010742, "step": 2762} +{"info/global_step": 2763, "train_info/time_within_train_step": 2.698577404022217, "step": 2763} +{"train_info/time_between_train_steps": 0.0034723281860351562, "step": 2763} +{"info/global_step": 2764, "train_info/time_within_train_step": 2.6998138427734375, "step": 2764} +{"train_info/time_between_train_steps": 0.003707408905029297, "step": 2764} +{"info/global_step": 2765, "train_info/time_within_train_step": 2.7279396057128906, "step": 2765} +{"train_info/time_between_train_steps": 0.0035505294799804688, "step": 2765} +{"info/global_step": 2766, "train_info/time_within_train_step": 2.789806842803955, "step": 2766} +{"train_info/time_between_train_steps": 0.003554821014404297, "step": 2766} +{"info/global_step": 2767, "train_info/time_within_train_step": 2.7074174880981445, "step": 2767} +{"train_info/time_between_train_steps": 0.0035886764526367188, "step": 2767} +{"info/global_step": 2768, "train_info/time_within_train_step": 2.700852394104004, "step": 2768} +{"train_info/time_between_train_steps": 0.0035560131072998047, "step": 2768} +{"info/global_step": 2769, "train_info/time_within_train_step": 2.7037723064422607, "step": 2769} +{"train_info/time_between_train_steps": 0.008802175521850586, "step": 2769} +{"info/global_step": 2770, "train_info/time_within_train_step": 2.751777410507202, "step": 2770} +{"train_info/time_between_train_steps": 0.008633613586425781, "step": 2770} +{"info/global_step": 2771, "train_info/time_within_train_step": 2.733048915863037, "step": 2771} +{"train_info/time_between_train_steps": 0.00894021987915039, "step": 2771} +{"info/global_step": 2772, "train_info/time_within_train_step": 2.7018251419067383, "step": 2772} +{"train_info/time_between_train_steps": 0.0038328170776367188, "step": 2772} +{"info/global_step": 2773, "train_info/time_within_train_step": 2.702462673187256, "step": 2773} +{"train_info/time_between_train_steps": 0.009083986282348633, "step": 2773} +{"info/global_step": 2774, "train_info/time_within_train_step": 2.700709104537964, "step": 2774} +{"train_info/time_between_train_steps": 0.0035963058471679688, "step": 2774} +{"info/global_step": 2775, "train_info/time_within_train_step": 2.7004964351654053, "step": 2775} +{"train_info/time_between_train_steps": 0.0035429000854492188, "step": 2775} +{"info/global_step": 2776, "train_info/time_within_train_step": 2.6994996070861816, "step": 2776} +{"train_info/time_between_train_steps": 0.0037567615509033203, "step": 2776} +{"info/global_step": 2777, "train_info/time_within_train_step": 2.701206684112549, "step": 2777} +{"train_info/time_between_train_steps": 0.0035440921783447266, "step": 2777} +{"info/global_step": 2778, "train_info/time_within_train_step": 3.0279996395111084, "step": 2778} +{"train_info/time_between_train_steps": 0.003328084945678711, "step": 2778} +{"info/global_step": 2779, "train_info/time_within_train_step": 2.6981072425842285, "step": 2779} +{"train_info/time_between_train_steps": 0.003505706787109375, "step": 2779} +{"info/global_step": 2780, "train_info/time_within_train_step": 2.698184013366699, "step": 2780} +{"train_info/time_between_train_steps": 0.003286123275756836, "step": 2780} +{"info/global_step": 2781, "train_info/time_within_train_step": 2.698254108428955, "step": 2781} +{"train_info/time_between_train_steps": 0.0033223628997802734, "step": 2781} +{"info/global_step": 2782, "train_info/time_within_train_step": 2.6987879276275635, "step": 2782} +{"train_info/time_between_train_steps": 0.0033369064331054688, "step": 2782} +{"info/global_step": 2783, "train_info/time_within_train_step": 2.697781801223755, "step": 2783} +{"train_info/time_between_train_steps": 0.00341796875, "step": 2783} +{"info/global_step": 2784, "train_info/time_within_train_step": 2.69913649559021, "step": 2784} +{"train_info/time_between_train_steps": 0.0033528804779052734, "step": 2784} +{"info/global_step": 2785, "train_info/time_within_train_step": 2.705251932144165, "step": 2785} +{"train_info/time_between_train_steps": 0.0036344528198242188, "step": 2785} +{"info/global_step": 2786, "train_info/time_within_train_step": 2.6996402740478516, "step": 2786} +{"train_info/time_between_train_steps": 0.003587961196899414, "step": 2786} +{"info/global_step": 2787, "train_info/time_within_train_step": 2.700744152069092, "step": 2787} +{"train_info/time_between_train_steps": 0.0036170482635498047, "step": 2787} +{"info/global_step": 2788, "train_info/time_within_train_step": 2.703246831893921, "step": 2788} +{"train_info/time_between_train_steps": 0.0034978389739990234, "step": 2788} +{"info/global_step": 2789, "train_info/time_within_train_step": 2.698901653289795, "step": 2789} +{"train_info/time_between_train_steps": 0.0034978389739990234, "step": 2789} +{"info/global_step": 2790, "train_info/time_within_train_step": 2.6982338428497314, "step": 2790} +{"train_info/time_between_train_steps": 0.003592967987060547, "step": 2790} +{"info/global_step": 2791, "train_info/time_within_train_step": 2.698880672454834, "step": 2791} +{"train_info/time_between_train_steps": 0.003595113754272461, "step": 2791} +{"info/global_step": 2792, "train_info/time_within_train_step": 2.700216054916382, "step": 2792} +{"train_info/time_between_train_steps": 0.003876209259033203, "step": 2792} +{"info/global_step": 2793, "train_info/time_within_train_step": 2.7008957862854004, "step": 2793} +{"train_info/time_between_train_steps": 0.0037059783935546875, "step": 2793} +{"info/global_step": 2794, "train_info/time_within_train_step": 2.701359748840332, "step": 2794} +{"train_info/time_between_train_steps": 0.0036046504974365234, "step": 2794} +{"info/global_step": 2795, "train_info/time_within_train_step": 2.700146198272705, "step": 2795} +{"train_info/time_between_train_steps": 0.0035886764526367188, "step": 2795} +{"info/global_step": 2796, "train_info/time_within_train_step": 2.6993701457977295, "step": 2796} +{"train_info/time_between_train_steps": 0.003530263900756836, "step": 2796} +{"info/global_step": 2797, "train_info/time_within_train_step": 2.7002246379852295, "step": 2797} +{"train_info/time_between_train_steps": 0.0037240982055664062, "step": 2797} +{"info/global_step": 2798, "train_info/time_within_train_step": 2.698880910873413, "step": 2798} +{"train_info/time_between_train_steps": 0.0037653446197509766, "step": 2798} +{"info/global_step": 2799, "train_info/time_within_train_step": 2.699525833129883, "step": 2799} +{"train_info/time_between_train_steps": 0.003589153289794922, "step": 2799} +{"info/global_step": 2800, "train_info/time_within_train_step": 2.699836015701294, "step": 2800} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746294634, "_runtime": 8656}, "step": 2800} +{"logs": {"train/loss": 4.4219, "train/learning_rate": 4.444444444444444e-05, "train/epoch": 3.18, "_timestamp": 1746294634, "_runtime": 8656}, "step": 2800} +{"train_info/time_between_train_steps": 13.779573202133179, "step": 2800} +{"info/global_step": 2801, "train_info/time_within_train_step": 2.491846799850464, "step": 2801} +{"train_info/time_between_train_steps": 0.0036034584045410156, "step": 2801} +{"info/global_step": 2802, "train_info/time_within_train_step": 2.499162197113037, "step": 2802} +{"train_info/time_between_train_steps": 0.003529071807861328, "step": 2802} +{"info/global_step": 2803, "train_info/time_within_train_step": 2.6858534812927246, "step": 2803} +{"train_info/time_between_train_steps": 0.0037870407104492188, "step": 2803} +{"info/global_step": 2804, "train_info/time_within_train_step": 2.6942858695983887, "step": 2804} +{"train_info/time_between_train_steps": 0.0038225650787353516, "step": 2804} +{"info/global_step": 2805, "train_info/time_within_train_step": 2.6948673725128174, "step": 2805} +{"train_info/time_between_train_steps": 0.0036306381225585938, "step": 2805} +{"info/global_step": 2806, "train_info/time_within_train_step": 2.699026107788086, "step": 2806} +{"train_info/time_between_train_steps": 0.003656148910522461, "step": 2806} +{"info/global_step": 2807, "train_info/time_within_train_step": 2.6977460384368896, "step": 2807} +{"train_info/time_between_train_steps": 0.0037851333618164062, "step": 2807} +{"info/global_step": 2808, "train_info/time_within_train_step": 2.6990621089935303, "step": 2808} +{"train_info/time_between_train_steps": 0.0038602352142333984, "step": 2808} +{"info/global_step": 2809, "train_info/time_within_train_step": 2.798896551132202, "step": 2809} +{"train_info/time_between_train_steps": 0.003622770309448242, "step": 2809} +{"info/global_step": 2810, "train_info/time_within_train_step": 2.73656964302063, "step": 2810} +{"train_info/time_between_train_steps": 0.0036215782165527344, "step": 2810} +{"info/global_step": 2811, "train_info/time_within_train_step": 2.8641748428344727, "step": 2811} +{"train_info/time_between_train_steps": 0.003558635711669922, "step": 2811} +{"info/global_step": 2812, "train_info/time_within_train_step": 2.7096729278564453, "step": 2812} +{"train_info/time_between_train_steps": 0.003650188446044922, "step": 2812} +{"info/global_step": 2813, "train_info/time_within_train_step": 2.700838804244995, "step": 2813} +{"train_info/time_between_train_steps": 0.003556489944458008, "step": 2813} +{"info/global_step": 2814, "train_info/time_within_train_step": 2.700815439224243, "step": 2814} +{"train_info/time_between_train_steps": 0.0035538673400878906, "step": 2814} +{"info/global_step": 2815, "train_info/time_within_train_step": 2.69917893409729, "step": 2815} +{"train_info/time_between_train_steps": 0.003621816635131836, "step": 2815} +{"info/global_step": 2816, "train_info/time_within_train_step": 2.700223207473755, "step": 2816} +{"train_info/time_between_train_steps": 0.003543376922607422, "step": 2816} +{"info/global_step": 2817, "train_info/time_within_train_step": 2.698831796646118, "step": 2817} +{"train_info/time_between_train_steps": 0.00706791877746582, "step": 2817} +{"info/global_step": 2818, "train_info/time_within_train_step": 2.7011778354644775, "step": 2818} +{"train_info/time_between_train_steps": 0.003731966018676758, "step": 2818} +{"info/global_step": 2819, "train_info/time_within_train_step": 2.720651388168335, "step": 2819} +{"train_info/time_between_train_steps": 0.003609180450439453, "step": 2819} +{"info/global_step": 2820, "train_info/time_within_train_step": 2.8844056129455566, "step": 2820} +{"train_info/time_between_train_steps": 0.003733396530151367, "step": 2820} +{"info/global_step": 2821, "train_info/time_within_train_step": 2.77014422416687, "step": 2821} +{"train_info/time_between_train_steps": 0.003682851791381836, "step": 2821} +{"info/global_step": 2822, "train_info/time_within_train_step": 2.7024831771850586, "step": 2822} +{"train_info/time_between_train_steps": 0.003610372543334961, "step": 2822} +{"info/global_step": 2823, "train_info/time_within_train_step": 2.698361396789551, "step": 2823} +{"train_info/time_between_train_steps": 0.0036232471466064453, "step": 2823} +{"info/global_step": 2824, "train_info/time_within_train_step": 2.6989665031433105, "step": 2824} +{"train_info/time_between_train_steps": 0.003694772720336914, "step": 2824} +{"info/global_step": 2825, "train_info/time_within_train_step": 2.9803643226623535, "step": 2825} +{"train_info/time_between_train_steps": 0.003269195556640625, "step": 2825} +{"info/global_step": 2826, "train_info/time_within_train_step": 2.6986589431762695, "step": 2826} +{"train_info/time_between_train_steps": 0.003328084945678711, "step": 2826} +{"info/global_step": 2827, "train_info/time_within_train_step": 2.698848247528076, "step": 2827} +{"train_info/time_between_train_steps": 0.003426074981689453, "step": 2827} +{"info/global_step": 2828, "train_info/time_within_train_step": 2.6986989974975586, "step": 2828} +{"train_info/time_between_train_steps": 0.0033783912658691406, "step": 2828} +{"info/global_step": 2829, "train_info/time_within_train_step": 2.699425220489502, "step": 2829} +{"train_info/time_between_train_steps": 0.003317594528198242, "step": 2829} +{"info/global_step": 2830, "train_info/time_within_train_step": 2.699086904525757, "step": 2830} +{"train_info/time_between_train_steps": 0.003293275833129883, "step": 2830} +{"info/global_step": 2831, "train_info/time_within_train_step": 2.698442220687866, "step": 2831} +{"train_info/time_between_train_steps": 0.0033125877380371094, "step": 2831} +{"info/global_step": 2832, "train_info/time_within_train_step": 2.882535219192505, "step": 2832} +{"train_info/time_between_train_steps": 0.003290891647338867, "step": 2832} +{"info/global_step": 2833, "train_info/time_within_train_step": 2.739391803741455, "step": 2833} +{"train_info/time_between_train_steps": 0.0033044815063476562, "step": 2833} +{"info/global_step": 2834, "train_info/time_within_train_step": 2.698935031890869, "step": 2834} +{"train_info/time_between_train_steps": 0.003297090530395508, "step": 2834} +{"info/global_step": 2835, "train_info/time_within_train_step": 2.6985716819763184, "step": 2835} +{"train_info/time_between_train_steps": 0.003320932388305664, "step": 2835} +{"info/global_step": 2836, "train_info/time_within_train_step": 2.6994547843933105, "step": 2836} +{"train_info/time_between_train_steps": 0.003331899642944336, "step": 2836} +{"info/global_step": 2837, "train_info/time_within_train_step": 2.7004942893981934, "step": 2837} +{"train_info/time_between_train_steps": 0.0066814422607421875, "step": 2837} +{"info/global_step": 2838, "train_info/time_within_train_step": 2.735650062561035, "step": 2838} +{"train_info/time_between_train_steps": 0.005011558532714844, "step": 2838} +{"info/global_step": 2839, "train_info/time_within_train_step": 2.7091732025146484, "step": 2839} +{"train_info/time_between_train_steps": 0.006671428680419922, "step": 2839} +{"info/global_step": 2840, "train_info/time_within_train_step": 2.7211906909942627, "step": 2840} +{"train_info/time_between_train_steps": 0.0033278465270996094, "step": 2840} +{"info/global_step": 2841, "train_info/time_within_train_step": 2.7159245014190674, "step": 2841} +{"train_info/time_between_train_steps": 0.00331878662109375, "step": 2841} +{"info/global_step": 2842, "train_info/time_within_train_step": 2.698244571685791, "step": 2842} +{"train_info/time_between_train_steps": 0.003412008285522461, "step": 2842} +{"info/global_step": 2843, "train_info/time_within_train_step": 2.6986284255981445, "step": 2843} +{"train_info/time_between_train_steps": 0.0033066272735595703, "step": 2843} +{"info/global_step": 2844, "train_info/time_within_train_step": 2.6972131729125977, "step": 2844} +{"train_info/time_between_train_steps": 0.006580352783203125, "step": 2844} +{"info/global_step": 2845, "train_info/time_within_train_step": 2.697641372680664, "step": 2845} +{"train_info/time_between_train_steps": 0.006718873977661133, "step": 2845} +{"info/global_step": 2846, "train_info/time_within_train_step": 2.698138952255249, "step": 2846} +{"train_info/time_between_train_steps": 0.00681757926940918, "step": 2846} +{"info/global_step": 2847, "train_info/time_within_train_step": 2.69754958152771, "step": 2847} +{"train_info/time_between_train_steps": 0.0033185482025146484, "step": 2847} +{"info/global_step": 2848, "train_info/time_within_train_step": 2.6985085010528564, "step": 2848} +{"train_info/time_between_train_steps": 0.0032901763916015625, "step": 2848} +{"info/global_step": 2849, "train_info/time_within_train_step": 2.7004683017730713, "step": 2849} +{"train_info/time_between_train_steps": 0.003751039505004883, "step": 2849} +{"info/global_step": 2850, "train_info/time_within_train_step": 2.69978928565979, "step": 2850} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746294788, "_runtime": 8810}, "step": 2850} +{"logs": {"train/loss": 4.4073, "train/learning_rate": 3.333333333333333e-05, "train/epoch": 3.19, "_timestamp": 1746294788, "_runtime": 8810}, "step": 2850} +{"train_info/time_between_train_steps": 0.9197735786437988, "step": 2850} +{"info/global_step": 2851, "train_info/time_within_train_step": 2.6967434883117676, "step": 2851} +{"train_info/time_between_train_steps": 0.0036156177520751953, "step": 2851} +{"info/global_step": 2852, "train_info/time_within_train_step": 2.6948790550231934, "step": 2852} +{"train_info/time_between_train_steps": 0.003388643264770508, "step": 2852} +{"info/global_step": 2853, "train_info/time_within_train_step": 2.694523572921753, "step": 2853} +{"train_info/time_between_train_steps": 0.003475666046142578, "step": 2853} +{"info/global_step": 2854, "train_info/time_within_train_step": 2.695708751678467, "step": 2854} +{"train_info/time_between_train_steps": 0.0035848617553710938, "step": 2854} +{"info/global_step": 2855, "train_info/time_within_train_step": 2.693779230117798, "step": 2855} +{"train_info/time_between_train_steps": 0.0034554004669189453, "step": 2855} +{"info/global_step": 2856, "train_info/time_within_train_step": 2.6962008476257324, "step": 2856} +{"train_info/time_between_train_steps": 0.003614664077758789, "step": 2856} +{"info/global_step": 2857, "train_info/time_within_train_step": 2.694744110107422, "step": 2857} +{"train_info/time_between_train_steps": 0.003656148910522461, "step": 2857} +{"info/global_step": 2858, "train_info/time_within_train_step": 2.696587562561035, "step": 2858} +{"train_info/time_between_train_steps": 0.0038542747497558594, "step": 2858} +{"info/global_step": 2859, "train_info/time_within_train_step": 2.696601152420044, "step": 2859} +{"train_info/time_between_train_steps": 0.003670930862426758, "step": 2859} +{"info/global_step": 2860, "train_info/time_within_train_step": 2.6976118087768555, "step": 2860} +{"train_info/time_between_train_steps": 0.003633737564086914, "step": 2860} +{"info/global_step": 2861, "train_info/time_within_train_step": 2.6966888904571533, "step": 2861} +{"train_info/time_between_train_steps": 0.003588438034057617, "step": 2861} +{"info/global_step": 2862, "train_info/time_within_train_step": 2.694178819656372, "step": 2862} +{"train_info/time_between_train_steps": 0.0036249160766601562, "step": 2862} +{"info/global_step": 2863, "train_info/time_within_train_step": 2.69755482673645, "step": 2863} +{"train_info/time_between_train_steps": 0.0035507678985595703, "step": 2863} +{"info/global_step": 2864, "train_info/time_within_train_step": 2.694889783859253, "step": 2864} +{"train_info/time_between_train_steps": 0.003541707992553711, "step": 2864} +{"info/global_step": 2865, "train_info/time_within_train_step": 2.6953346729278564, "step": 2865} +{"train_info/time_between_train_steps": 0.0035555362701416016, "step": 2865} +{"info/global_step": 2866, "train_info/time_within_train_step": 2.6952459812164307, "step": 2866} +{"train_info/time_between_train_steps": 0.0036194324493408203, "step": 2866} +{"info/global_step": 2867, "train_info/time_within_train_step": 2.697070360183716, "step": 2867} +{"train_info/time_between_train_steps": 0.0035333633422851562, "step": 2867} +{"info/global_step": 2868, "train_info/time_within_train_step": 2.6971797943115234, "step": 2868} +{"train_info/time_between_train_steps": 0.003602266311645508, "step": 2868} +{"info/global_step": 2869, "train_info/time_within_train_step": 2.697553873062134, "step": 2869} +{"train_info/time_between_train_steps": 0.0035369396209716797, "step": 2869} +{"info/global_step": 2870, "train_info/time_within_train_step": 2.6952381134033203, "step": 2870} +{"train_info/time_between_train_steps": 0.0036830902099609375, "step": 2870} +{"info/global_step": 2871, "train_info/time_within_train_step": 2.694918632507324, "step": 2871} +{"train_info/time_between_train_steps": 0.0038111209869384766, "step": 2871} +{"info/global_step": 2872, "train_info/time_within_train_step": 2.695892095565796, "step": 2872} +{"train_info/time_between_train_steps": 0.0035245418548583984, "step": 2872} +{"info/global_step": 2873, "train_info/time_within_train_step": 2.732851982116699, "step": 2873} +{"train_info/time_between_train_steps": 0.0035505294799804688, "step": 2873} +{"info/global_step": 2874, "train_info/time_within_train_step": 2.695134162902832, "step": 2874} +{"train_info/time_between_train_steps": 0.003629446029663086, "step": 2874} +{"info/global_step": 2875, "train_info/time_within_train_step": 2.6968142986297607, "step": 2875} +{"train_info/time_between_train_steps": 0.0035521984100341797, "step": 2875} +{"info/global_step": 2876, "train_info/time_within_train_step": 2.6962873935699463, "step": 2876} +{"train_info/time_between_train_steps": 0.0037949085235595703, "step": 2876} +{"info/global_step": 2877, "train_info/time_within_train_step": 2.6956424713134766, "step": 2877} +{"train_info/time_between_train_steps": 0.0034842491149902344, "step": 2877} +{"info/global_step": 2878, "train_info/time_within_train_step": 2.696347713470459, "step": 2878} +{"train_info/time_between_train_steps": 0.003670215606689453, "step": 2878} +{"info/global_step": 2879, "train_info/time_within_train_step": 2.6964476108551025, "step": 2879} +{"train_info/time_between_train_steps": 0.0035178661346435547, "step": 2879} +{"info/global_step": 2880, "train_info/time_within_train_step": 2.695136070251465, "step": 2880} +{"train_info/time_between_train_steps": 0.0036864280700683594, "step": 2880} +{"info/global_step": 2881, "train_info/time_within_train_step": 2.6976559162139893, "step": 2881} +{"train_info/time_between_train_steps": 0.0036361217498779297, "step": 2881} +{"info/global_step": 2882, "train_info/time_within_train_step": 2.6984822750091553, "step": 2882} +{"train_info/time_between_train_steps": 0.003720521926879883, "step": 2882} +{"info/global_step": 2883, "train_info/time_within_train_step": 2.697143793106079, "step": 2883} +{"train_info/time_between_train_steps": 0.003668546676635742, "step": 2883} +{"info/global_step": 2884, "train_info/time_within_train_step": 2.6977033615112305, "step": 2884} +{"train_info/time_between_train_steps": 0.0036509037017822266, "step": 2884} +{"info/global_step": 2885, "train_info/time_within_train_step": 2.696523666381836, "step": 2885} +{"train_info/time_between_train_steps": 0.00354766845703125, "step": 2885} +{"info/global_step": 2886, "train_info/time_within_train_step": 2.69903302192688, "step": 2886} +{"train_info/time_between_train_steps": 0.0037724971771240234, "step": 2886} +{"info/global_step": 2887, "train_info/time_within_train_step": 2.696043014526367, "step": 2887} +{"train_info/time_between_train_steps": 0.00383758544921875, "step": 2887} +{"info/global_step": 2888, "train_info/time_within_train_step": 2.6866791248321533, "step": 2888} +{"train_info/time_between_train_steps": 0.003673076629638672, "step": 2888} +{"info/global_step": 2889, "train_info/time_within_train_step": 2.6941418647766113, "step": 2889} +{"train_info/time_between_train_steps": 0.003637552261352539, "step": 2889} +{"info/global_step": 2890, "train_info/time_within_train_step": 2.695479393005371, "step": 2890} +{"train_info/time_between_train_steps": 0.003574848175048828, "step": 2890} +{"info/global_step": 2891, "train_info/time_within_train_step": 2.6940252780914307, "step": 2891} +{"train_info/time_between_train_steps": 0.0036873817443847656, "step": 2891} +{"info/global_step": 2892, "train_info/time_within_train_step": 2.696028470993042, "step": 2892} +{"train_info/time_between_train_steps": 0.00356292724609375, "step": 2892} +{"info/global_step": 2893, "train_info/time_within_train_step": 2.696375608444214, "step": 2893} +{"train_info/time_between_train_steps": 0.0036618709564208984, "step": 2893} +{"info/global_step": 2894, "train_info/time_within_train_step": 2.696453332901001, "step": 2894} +{"train_info/time_between_train_steps": 0.003805875778198242, "step": 2894} +{"info/global_step": 2895, "train_info/time_within_train_step": 2.697061777114868, "step": 2895} +{"train_info/time_between_train_steps": 0.004647493362426758, "step": 2895} +{"info/global_step": 2896, "train_info/time_within_train_step": 2.6974496841430664, "step": 2896} +{"train_info/time_between_train_steps": 0.0038573741912841797, "step": 2896} +{"info/global_step": 2897, "train_info/time_within_train_step": 2.695897340774536, "step": 2897} +{"train_info/time_between_train_steps": 0.003681659698486328, "step": 2897} +{"info/global_step": 2898, "train_info/time_within_train_step": 2.696734666824341, "step": 2898} +{"train_info/time_between_train_steps": 0.003517627716064453, "step": 2898} +{"info/global_step": 2899, "train_info/time_within_train_step": 2.697262763977051, "step": 2899} +{"train_info/time_between_train_steps": 0.0035619735717773438, "step": 2899} +{"info/global_step": 2900, "train_info/time_within_train_step": 2.6973876953125, "step": 2900} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746294940, "_runtime": 8962}, "step": 2900} +{"logs": {"train/loss": 4.393, "train/learning_rate": 2.222222222222222e-05, "train/epoch": 3.21, "_timestamp": 1746294940, "_runtime": 8962}, "step": 2900} +{"train_info/time_between_train_steps": 37.261958837509155, "step": 2900} +{"info/global_step": 2901, "train_info/time_within_train_step": 2.47627854347229, "step": 2901} +{"train_info/time_between_train_steps": 0.003815889358520508, "step": 2901} +{"info/global_step": 2902, "train_info/time_within_train_step": 2.469827890396118, "step": 2902} +{"train_info/time_between_train_steps": 0.0036172866821289062, "step": 2902} +{"info/global_step": 2903, "train_info/time_within_train_step": 2.6225180625915527, "step": 2903} +{"train_info/time_between_train_steps": 0.0036978721618652344, "step": 2903} +{"info/global_step": 2904, "train_info/time_within_train_step": 2.693209648132324, "step": 2904} +{"train_info/time_between_train_steps": 0.003972053527832031, "step": 2904} +{"info/global_step": 2905, "train_info/time_within_train_step": 2.6930954456329346, "step": 2905} +{"train_info/time_between_train_steps": 0.003645181655883789, "step": 2905} +{"info/global_step": 2906, "train_info/time_within_train_step": 2.693941354751587, "step": 2906} +{"train_info/time_between_train_steps": 0.003653287887573242, "step": 2906} +{"info/global_step": 2907, "train_info/time_within_train_step": 2.6952600479125977, "step": 2907} +{"train_info/time_between_train_steps": 0.0037055015563964844, "step": 2907} +{"info/global_step": 2908, "train_info/time_within_train_step": 2.6961724758148193, "step": 2908} +{"train_info/time_between_train_steps": 0.003652811050415039, "step": 2908} +{"info/global_step": 2909, "train_info/time_within_train_step": 2.695579767227173, "step": 2909} +{"train_info/time_between_train_steps": 0.0036470890045166016, "step": 2909} +{"info/global_step": 2910, "train_info/time_within_train_step": 2.891692638397217, "step": 2910} +{"train_info/time_between_train_steps": 0.003442525863647461, "step": 2910} +{"info/global_step": 2911, "train_info/time_within_train_step": 2.697723627090454, "step": 2911} +{"train_info/time_between_train_steps": 0.0036268234252929688, "step": 2911} +{"info/global_step": 2912, "train_info/time_within_train_step": 2.6974222660064697, "step": 2912} +{"train_info/time_between_train_steps": 0.003660917282104492, "step": 2912} +{"info/global_step": 2913, "train_info/time_within_train_step": 2.7328567504882812, "step": 2913} +{"train_info/time_between_train_steps": 0.0036344528198242188, "step": 2913} +{"info/global_step": 2914, "train_info/time_within_train_step": 2.6971421241760254, "step": 2914} +{"train_info/time_between_train_steps": 0.0038776397705078125, "step": 2914} +{"info/global_step": 2915, "train_info/time_within_train_step": 2.6972296237945557, "step": 2915} +{"train_info/time_between_train_steps": 0.0036025047302246094, "step": 2915} +{"info/global_step": 2916, "train_info/time_within_train_step": 2.694591999053955, "step": 2916} +{"train_info/time_between_train_steps": 0.003584623336791992, "step": 2916} +{"info/global_step": 2917, "train_info/time_within_train_step": 2.6941657066345215, "step": 2917} +{"train_info/time_between_train_steps": 0.003755331039428711, "step": 2917} +{"info/global_step": 2918, "train_info/time_within_train_step": 2.6966779232025146, "step": 2918} +{"train_info/time_between_train_steps": 0.009210348129272461, "step": 2918} +{"info/global_step": 2919, "train_info/time_within_train_step": 2.7001569271087646, "step": 2919} +{"train_info/time_between_train_steps": 0.003732442855834961, "step": 2919} +{"info/global_step": 2920, "train_info/time_within_train_step": 2.70013165473938, "step": 2920} +{"train_info/time_between_train_steps": 0.0035550594329833984, "step": 2920} +{"info/global_step": 2921, "train_info/time_within_train_step": 2.696650743484497, "step": 2921} +{"train_info/time_between_train_steps": 0.0036706924438476562, "step": 2921} +{"info/global_step": 2922, "train_info/time_within_train_step": 2.6990623474121094, "step": 2922} +{"train_info/time_between_train_steps": 0.003709554672241211, "step": 2922} +{"info/global_step": 2923, "train_info/time_within_train_step": 2.701042652130127, "step": 2923} +{"train_info/time_between_train_steps": 0.004005908966064453, "step": 2923} +{"info/global_step": 2924, "train_info/time_within_train_step": 2.699929714202881, "step": 2924} +{"train_info/time_between_train_steps": 0.0037441253662109375, "step": 2924} +{"info/global_step": 2925, "train_info/time_within_train_step": 2.6987287998199463, "step": 2925} +{"train_info/time_between_train_steps": 0.0037794113159179688, "step": 2925} +{"info/global_step": 2926, "train_info/time_within_train_step": 2.70021653175354, "step": 2926} +{"train_info/time_between_train_steps": 0.003819704055786133, "step": 2926} +{"info/global_step": 2927, "train_info/time_within_train_step": 2.718172073364258, "step": 2927} +{"train_info/time_between_train_steps": 0.0035791397094726562, "step": 2927} +{"info/global_step": 2928, "train_info/time_within_train_step": 2.6963000297546387, "step": 2928} +{"train_info/time_between_train_steps": 0.0037376880645751953, "step": 2928} +{"info/global_step": 2929, "train_info/time_within_train_step": 2.693824529647827, "step": 2929} +{"train_info/time_between_train_steps": 0.003659486770629883, "step": 2929} +{"info/global_step": 2930, "train_info/time_within_train_step": 2.6953516006469727, "step": 2930} +{"train_info/time_between_train_steps": 0.0036406517028808594, "step": 2930} +{"info/global_step": 2931, "train_info/time_within_train_step": 2.694432258605957, "step": 2931} +{"train_info/time_between_train_steps": 0.0037772655487060547, "step": 2931} +{"info/global_step": 2932, "train_info/time_within_train_step": 2.6945111751556396, "step": 2932} +{"train_info/time_between_train_steps": 0.003638744354248047, "step": 2932} +{"info/global_step": 2933, "train_info/time_within_train_step": 2.696012020111084, "step": 2933} +{"train_info/time_between_train_steps": 0.003606557846069336, "step": 2933} +{"info/global_step": 2934, "train_info/time_within_train_step": 2.6979596614837646, "step": 2934} +{"train_info/time_between_train_steps": 0.0037834644317626953, "step": 2934} +{"info/global_step": 2935, "train_info/time_within_train_step": 2.695598840713501, "step": 2935} +{"train_info/time_between_train_steps": 0.003604888916015625, "step": 2935} +{"info/global_step": 2936, "train_info/time_within_train_step": 2.6964993476867676, "step": 2936} +{"train_info/time_between_train_steps": 0.003657817840576172, "step": 2936} +{"info/global_step": 2937, "train_info/time_within_train_step": 2.6969101428985596, "step": 2937} +{"train_info/time_between_train_steps": 0.003667593002319336, "step": 2937} +{"info/global_step": 2938, "train_info/time_within_train_step": 2.694889783859253, "step": 2938} +{"train_info/time_between_train_steps": 0.0037670135498046875, "step": 2938} +{"info/global_step": 2939, "train_info/time_within_train_step": 2.697927236557007, "step": 2939} +{"train_info/time_between_train_steps": 0.0037994384765625, "step": 2939} +{"info/global_step": 2940, "train_info/time_within_train_step": 2.6976094245910645, "step": 2940} +{"train_info/time_between_train_steps": 0.0037622451782226562, "step": 2940} +{"info/global_step": 2941, "train_info/time_within_train_step": 2.696906566619873, "step": 2941} +{"train_info/time_between_train_steps": 0.006234645843505859, "step": 2941} +{"info/global_step": 2942, "train_info/time_within_train_step": 2.7018885612487793, "step": 2942} +{"train_info/time_between_train_steps": 0.0037152767181396484, "step": 2942} +{"info/global_step": 2943, "train_info/time_within_train_step": 2.6967079639434814, "step": 2943} +{"train_info/time_between_train_steps": 0.0036973953247070312, "step": 2943} +{"info/global_step": 2944, "train_info/time_within_train_step": 2.6967101097106934, "step": 2944} +{"train_info/time_between_train_steps": 0.003705739974975586, "step": 2944} +{"info/global_step": 2945, "train_info/time_within_train_step": 2.700014591217041, "step": 2945} +{"train_info/time_between_train_steps": 0.003673076629638672, "step": 2945} +{"info/global_step": 2946, "train_info/time_within_train_step": 2.6972451210021973, "step": 2946} +{"train_info/time_between_train_steps": 0.003686189651489258, "step": 2946} +{"info/global_step": 2947, "train_info/time_within_train_step": 2.6966326236724854, "step": 2947} +{"train_info/time_between_train_steps": 0.003628253936767578, "step": 2947} +{"info/global_step": 2948, "train_info/time_within_train_step": 2.6960020065307617, "step": 2948} +{"train_info/time_between_train_steps": 0.0037467479705810547, "step": 2948} +{"info/global_step": 2949, "train_info/time_within_train_step": 2.6971073150634766, "step": 2949} +{"train_info/time_between_train_steps": 0.0036504268646240234, "step": 2949} +{"info/global_step": 2950, "train_info/time_within_train_step": 2.6969356536865234, "step": 2950} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746295126, "_runtime": 9148}, "step": 2950} +{"logs": {"train/loss": 4.3941, "train/learning_rate": 1.111111111111111e-05, "train/epoch": 3.23, "_timestamp": 1746295126, "_runtime": 9148}, "step": 2950} +{"train_info/time_between_train_steps": 0.026326656341552734, "step": 2950} +{"info/global_step": 2951, "train_info/time_within_train_step": 2.6974382400512695, "step": 2951} +{"train_info/time_between_train_steps": 0.0035805702209472656, "step": 2951} +{"info/global_step": 2952, "train_info/time_within_train_step": 2.6981465816497803, "step": 2952} +{"train_info/time_between_train_steps": 0.0035436153411865234, "step": 2952} +{"info/global_step": 2953, "train_info/time_within_train_step": 2.6975691318511963, "step": 2953} +{"train_info/time_between_train_steps": 0.0035469532012939453, "step": 2953} +{"info/global_step": 2954, "train_info/time_within_train_step": 2.698058843612671, "step": 2954} +{"train_info/time_between_train_steps": 0.003686189651489258, "step": 2954} +{"info/global_step": 2955, "train_info/time_within_train_step": 2.6959362030029297, "step": 2955} +{"train_info/time_between_train_steps": 0.0036003589630126953, "step": 2955} +{"info/global_step": 2956, "train_info/time_within_train_step": 2.6955316066741943, "step": 2956} +{"train_info/time_between_train_steps": 0.0035772323608398438, "step": 2956} +{"info/global_step": 2957, "train_info/time_within_train_step": 2.696877956390381, "step": 2957} +{"train_info/time_between_train_steps": 0.0035572052001953125, "step": 2957} +{"info/global_step": 2958, "train_info/time_within_train_step": 2.6961491107940674, "step": 2958} +{"train_info/time_between_train_steps": 0.0035719871520996094, "step": 2958} +{"info/global_step": 2959, "train_info/time_within_train_step": 2.696579933166504, "step": 2959} +{"train_info/time_between_train_steps": 0.0035483837127685547, "step": 2959} +{"info/global_step": 2960, "train_info/time_within_train_step": 2.6975409984588623, "step": 2960} +{"train_info/time_between_train_steps": 0.0037059783935546875, "step": 2960} +{"info/global_step": 2961, "train_info/time_within_train_step": 2.69889235496521, "step": 2961} +{"train_info/time_between_train_steps": 0.0036721229553222656, "step": 2961} +{"info/global_step": 2962, "train_info/time_within_train_step": 2.699061870574951, "step": 2962} +{"train_info/time_between_train_steps": 0.0037190914154052734, "step": 2962} +{"info/global_step": 2963, "train_info/time_within_train_step": 2.699542999267578, "step": 2963} +{"train_info/time_between_train_steps": 0.0035707950592041016, "step": 2963} +{"info/global_step": 2964, "train_info/time_within_train_step": 2.6988914012908936, "step": 2964} +{"train_info/time_between_train_steps": 0.003720521926879883, "step": 2964} +{"info/global_step": 2965, "train_info/time_within_train_step": 2.7396490573883057, "step": 2965} +{"train_info/time_between_train_steps": 0.003846406936645508, "step": 2965} +{"info/global_step": 2966, "train_info/time_within_train_step": 2.695678234100342, "step": 2966} +{"train_info/time_between_train_steps": 0.003600597381591797, "step": 2966} +{"info/global_step": 2967, "train_info/time_within_train_step": 2.6958415508270264, "step": 2967} +{"train_info/time_between_train_steps": 0.003612041473388672, "step": 2967} +{"info/global_step": 2968, "train_info/time_within_train_step": 2.692958116531372, "step": 2968} +{"train_info/time_between_train_steps": 0.0035266876220703125, "step": 2968} +{"info/global_step": 2969, "train_info/time_within_train_step": 2.6948904991149902, "step": 2969} +{"train_info/time_between_train_steps": 0.0036101341247558594, "step": 2969} +{"info/global_step": 2970, "train_info/time_within_train_step": 2.6944282054901123, "step": 2970} +{"train_info/time_between_train_steps": 0.003920793533325195, "step": 2970} +{"info/global_step": 2971, "train_info/time_within_train_step": 2.694117307662964, "step": 2971} +{"train_info/time_between_train_steps": 0.0036165714263916016, "step": 2971} +{"info/global_step": 2972, "train_info/time_within_train_step": 2.6952710151672363, "step": 2972} +{"train_info/time_between_train_steps": 0.003576040267944336, "step": 2972} +{"info/global_step": 2973, "train_info/time_within_train_step": 2.6941869258880615, "step": 2973} +{"train_info/time_between_train_steps": 0.0035810470581054688, "step": 2973} +{"info/global_step": 2974, "train_info/time_within_train_step": 2.6944003105163574, "step": 2974} +{"train_info/time_between_train_steps": 0.003500223159790039, "step": 2974} +{"info/global_step": 2975, "train_info/time_within_train_step": 2.692911148071289, "step": 2975} +{"train_info/time_between_train_steps": 0.003449678421020508, "step": 2975} +{"info/global_step": 2976, "train_info/time_within_train_step": 2.6959469318389893, "step": 2976} +{"train_info/time_between_train_steps": 0.003609180450439453, "step": 2976} +{"info/global_step": 2977, "train_info/time_within_train_step": 2.6959006786346436, "step": 2977} +{"train_info/time_between_train_steps": 0.003512144088745117, "step": 2977} +{"info/global_step": 2978, "train_info/time_within_train_step": 2.6946792602539062, "step": 2978} +{"train_info/time_between_train_steps": 0.0036695003509521484, "step": 2978} +{"info/global_step": 2979, "train_info/time_within_train_step": 2.6953365802764893, "step": 2979} +{"train_info/time_between_train_steps": 0.003442049026489258, "step": 2979} +{"info/global_step": 2980, "train_info/time_within_train_step": 2.694146156311035, "step": 2980} +{"train_info/time_between_train_steps": 0.0035562515258789062, "step": 2980} +{"info/global_step": 2981, "train_info/time_within_train_step": 2.6943750381469727, "step": 2981} +{"train_info/time_between_train_steps": 0.003543376922607422, "step": 2981} +{"info/global_step": 2982, "train_info/time_within_train_step": 2.696923017501831, "step": 2982} +{"train_info/time_between_train_steps": 0.0035278797149658203, "step": 2982} +{"info/global_step": 2983, "train_info/time_within_train_step": 2.695021152496338, "step": 2983} +{"train_info/time_between_train_steps": 0.0034775733947753906, "step": 2983} +{"info/global_step": 2984, "train_info/time_within_train_step": 2.6941018104553223, "step": 2984} +{"train_info/time_between_train_steps": 0.003475666046142578, "step": 2984} +{"info/global_step": 2985, "train_info/time_within_train_step": 2.6968467235565186, "step": 2985} +{"train_info/time_between_train_steps": 0.003572225570678711, "step": 2985} +{"info/global_step": 2986, "train_info/time_within_train_step": 2.695321559906006, "step": 2986} +{"train_info/time_between_train_steps": 0.0035305023193359375, "step": 2986} +{"info/global_step": 2987, "train_info/time_within_train_step": 2.6958296298980713, "step": 2987} +{"train_info/time_between_train_steps": 0.0035707950592041016, "step": 2987} +{"info/global_step": 2988, "train_info/time_within_train_step": 2.6959969997406006, "step": 2988} +{"train_info/time_between_train_steps": 0.003448963165283203, "step": 2988} +{"info/global_step": 2989, "train_info/time_within_train_step": 2.695791482925415, "step": 2989} +{"train_info/time_between_train_steps": 0.003505706787109375, "step": 2989} +{"info/global_step": 2990, "train_info/time_within_train_step": 2.6956841945648193, "step": 2990} +{"train_info/time_between_train_steps": 0.003564119338989258, "step": 2990} +{"info/global_step": 2991, "train_info/time_within_train_step": 2.697103500366211, "step": 2991} +{"train_info/time_between_train_steps": 0.003576993942260742, "step": 2991} +{"info/global_step": 2992, "train_info/time_within_train_step": 2.695838451385498, "step": 2992} +{"train_info/time_between_train_steps": 0.0034799575805664062, "step": 2992} +{"info/global_step": 2993, "train_info/time_within_train_step": 2.6954708099365234, "step": 2993} +{"train_info/time_between_train_steps": 0.0035436153411865234, "step": 2993} +{"info/global_step": 2994, "train_info/time_within_train_step": 2.6944427490234375, "step": 2994} +{"train_info/time_between_train_steps": 0.0034737586975097656, "step": 2994} +{"info/global_step": 2995, "train_info/time_within_train_step": 2.6956655979156494, "step": 2995} +{"train_info/time_between_train_steps": 0.003418445587158203, "step": 2995} +{"info/global_step": 2996, "train_info/time_within_train_step": 2.696093797683716, "step": 2996} +{"train_info/time_between_train_steps": 0.0036096572875976562, "step": 2996} +{"info/global_step": 2997, "train_info/time_within_train_step": 2.694183826446533, "step": 2997} +{"train_info/time_between_train_steps": 0.0035157203674316406, "step": 2997} +{"info/global_step": 2998, "train_info/time_within_train_step": 2.697103500366211, "step": 2998} +{"train_info/time_between_train_steps": 0.0034754276275634766, "step": 2998} +{"info/global_step": 2999, "train_info/time_within_train_step": 3.242354393005371, "step": 2999} +{"train_info/time_between_train_steps": 0.0034666061401367188, "step": 2999} +{"info/global_step": 3000, "train_info/time_within_train_step": 2.6978392601013184, "step": 3000} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746295276, "_runtime": 9298}, "step": 3000} +{"logs": {"train/loss": 4.3732, "train/learning_rate": 0.0, "train/epoch": 3.24, "_timestamp": 1746295276, "_runtime": 9298}, "step": 3000} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746295281, "_runtime": 9303}, "step": 3000} +{"logs": {"eval/loss": 4.9404401779174805, "eval/runtime": 5.1695, "eval/samples_per_second": 35.207, "eval/steps_per_second": 1.161, "train/epoch": 3.24, "_timestamp": 1746295281, "_runtime": 9303}, "step": 3000} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746295281, "_runtime": 9303}, "step": 3000} +{"logs": {"eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_loss": 4.9404401779174805, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_ppl": 139.8317868800711, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_runtime": 5.1695, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_samples_per_second": 35.207, "train/epoch": 3.24, "_timestamp": 1746295281, "_runtime": 9303}, "step": 3000} +{"train_info": {"train_info/memory_allocated": 1681.7724609375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746295313, "_runtime": 9335}, "step": 3000} +{"logs": {"train/train_runtime": 9335.7007, "train/train_samples_per_second": 20.566, "train/train_steps_per_second": 0.321, "train/total_flos": 2.5095009337344e+16, "train/train_loss": 5.1549069751103715, "train/epoch": 3.24, "_timestamp": 1746295313, "_runtime": 9335}, "step": 3000} +{"train_info": {"train_info/memory_allocated": 1681.771484375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746295336, "_runtime": 9358}, "step": 3000} +{"logs": {"eval/loss": 4.9404401779174805, "eval/runtime": 4.6542, "eval/samples_per_second": 39.104, "eval/steps_per_second": 1.289, "train/epoch": 3.24, "_timestamp": 1746295336, "_runtime": 9358}, "step": 3000} +{"train_info": {"train_info/memory_allocated": 1681.771484375, "train_info/memory_max_allocated": 5246.67626953125, "train_info/memory_reserved": 8746.0, "train_info/memory_max_reserved": 8746.0, "_timestamp": 1746295336, "_runtime": 9358}, "step": 3000} +{"logs": {"eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_loss": 4.9404401779174805, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_ppl": 139.8317868800711, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_runtime": 4.6542, "eval//scratch/xiulyang/multilingual-LM/training/multilingual_dataset.py_samples_per_second": 39.104, "train/epoch": 3.24, "_timestamp": 1746295336, "_runtime": 9358}, "step": 3000}