diff --git "a/trainer_log.jsonl" "b/trainer_log.jsonl" --- "a/trainer_log.jsonl" +++ "b/trainer_log.jsonl" @@ -17082,3 +17082,897 @@ {"current_steps": 85315, "total_steps": 89790, "loss": 0.4636, "lr": 3.7753119997054054e-07, "epoch": 9.50161487916249, "percentage": 95.02, "elapsed_time": "6:42:23", "remaining_time": "0:21:06", "throughput": 4286.68, "total_tokens": 103497232} {"current_steps": 85320, "total_steps": 89790, "loss": 0.4589, "lr": 3.766903377901698e-07, "epoch": 9.502171734046108, "percentage": 95.02, "elapsed_time": "6:42:25", "remaining_time": "0:21:04", "throughput": 4286.7, "total_tokens": 103503152} {"current_steps": 85325, "total_steps": 89790, "loss": 0.4676, "lr": 3.758504059573509e-07, "epoch": 9.502728588929726, "percentage": 95.03, "elapsed_time": "6:42:26", "remaining_time": "0:21:03", "throughput": 4286.73, "total_tokens": 103509264} +{"current_steps": 85330, "total_steps": 89790, "loss": 0.4662, "lr": 3.750114045038139e-07, "epoch": 9.503285443813342, "percentage": 95.03, "elapsed_time": "6:42:27", "remaining_time": "0:21:02", "throughput": 4286.75, "total_tokens": 103515376} +{"current_steps": 85335, "total_steps": 89790, "loss": 0.448, "lr": 3.7417333346126126e-07, "epoch": 9.50384229869696, "percentage": 95.04, "elapsed_time": "6:42:29", "remaining_time": "0:21:00", "throughput": 4286.77, "total_tokens": 103521488} +{"current_steps": 85340, "total_steps": 89790, "loss": 0.4623, "lr": 3.7333619286135933e-07, "epoch": 9.504399153580577, "percentage": 95.04, "elapsed_time": "6:42:30", "remaining_time": "0:20:59", "throughput": 4286.8, "total_tokens": 103527728} +{"current_steps": 85345, "total_steps": 89790, "loss": 0.448, "lr": 3.7249998273573284e-07, "epoch": 9.504956008464195, "percentage": 95.05, "elapsed_time": "6:42:31", "remaining_time": "0:20:57", "throughput": 4286.82, "total_tokens": 103533648} +{"current_steps": 85350, "total_steps": 89790, "loss": 0.4578, "lr": 3.7166470311598146e-07, "epoch": 9.505512863347812, "percentage": 95.06, "elapsed_time": "6:42:32", "remaining_time": "0:20:56", "throughput": 4286.85, "total_tokens": 103539952} +{"current_steps": 85355, "total_steps": 89790, "loss": 0.473, "lr": 3.7083035403366327e-07, "epoch": 9.506069718231428, "percentage": 95.06, "elapsed_time": "6:42:34", "remaining_time": "0:20:55", "throughput": 4286.87, "total_tokens": 103546224} +{"current_steps": 85360, "total_steps": 89790, "loss": 0.454, "lr": 3.6999693552030037e-07, "epoch": 9.506626573115046, "percentage": 95.07, "elapsed_time": "6:42:35", "remaining_time": "0:20:53", "throughput": 4286.89, "total_tokens": 103552560} +{"current_steps": 85365, "total_steps": 89790, "loss": 0.4622, "lr": 3.691644476073869e-07, "epoch": 9.507183427998664, "percentage": 95.07, "elapsed_time": "6:42:36", "remaining_time": "0:20:52", "throughput": 4286.92, "total_tokens": 103558288} +{"current_steps": 85370, "total_steps": 89790, "loss": 0.4726, "lr": 3.6833289032637277e-07, "epoch": 9.507740282882281, "percentage": 95.08, "elapsed_time": "6:42:38", "remaining_time": "0:20:50", "throughput": 4286.94, "total_tokens": 103564368} +{"current_steps": 85375, "total_steps": 89790, "loss": 0.4591, "lr": 3.6750226370867724e-07, "epoch": 9.508297137765899, "percentage": 95.08, "elapsed_time": "6:42:39", "remaining_time": "0:20:49", "throughput": 4286.96, "total_tokens": 103570512} +{"current_steps": 85380, "total_steps": 89790, "loss": 0.4589, "lr": 3.666725677856836e-07, "epoch": 9.508853992649515, "percentage": 95.09, "elapsed_time": "6:42:40", "remaining_time": "0:20:47", "throughput": 4286.98, "total_tokens": 103576592} +{"current_steps": 85385, "total_steps": 89790, "loss": 0.4649, "lr": 3.658438025887445e-07, "epoch": 9.509410847533132, "percentage": 95.09, "elapsed_time": "6:42:42", "remaining_time": "0:20:46", "throughput": 4287.01, "total_tokens": 103582736} +{"current_steps": 85390, "total_steps": 89790, "loss": 0.4653, "lr": 3.6501596814917103e-07, "epoch": 9.50996770241675, "percentage": 95.1, "elapsed_time": "6:42:43", "remaining_time": "0:20:45", "throughput": 4287.03, "total_tokens": 103588752} +{"current_steps": 85395, "total_steps": 89790, "loss": 0.4579, "lr": 3.641890644982382e-07, "epoch": 9.510524557300368, "percentage": 95.11, "elapsed_time": "6:42:44", "remaining_time": "0:20:43", "throughput": 4287.06, "total_tokens": 103594736} +{"current_steps": 85400, "total_steps": 89790, "loss": 0.4821, "lr": 3.6336309166719317e-07, "epoch": 9.511081412183986, "percentage": 95.11, "elapsed_time": "6:42:45", "remaining_time": "0:20:42", "throughput": 4287.08, "total_tokens": 103600880} +{"current_steps": 85405, "total_steps": 89790, "loss": 0.4605, "lr": 3.625380496872416e-07, "epoch": 9.511638267067601, "percentage": 95.12, "elapsed_time": "6:42:47", "remaining_time": "0:20:40", "throughput": 4287.11, "total_tokens": 103607312} +{"current_steps": 85410, "total_steps": 89790, "loss": 0.4587, "lr": 3.6171393858956126e-07, "epoch": 9.512195121951219, "percentage": 95.12, "elapsed_time": "6:42:48", "remaining_time": "0:20:39", "throughput": 4287.13, "total_tokens": 103613392} +{"current_steps": 85415, "total_steps": 89790, "loss": 0.4548, "lr": 3.6089075840528006e-07, "epoch": 9.512751976834837, "percentage": 95.13, "elapsed_time": "6:42:49", "remaining_time": "0:20:37", "throughput": 4287.16, "total_tokens": 103619536} +{"current_steps": 85420, "total_steps": 89790, "loss": 0.4609, "lr": 3.600685091655093e-07, "epoch": 9.513308831718454, "percentage": 95.13, "elapsed_time": "6:42:51", "remaining_time": "0:20:36", "throughput": 4287.18, "total_tokens": 103625872} +{"current_steps": 85425, "total_steps": 89790, "loss": 0.4694, "lr": 3.5924719090131285e-07, "epoch": 9.513865686602072, "percentage": 95.14, "elapsed_time": "6:42:52", "remaining_time": "0:20:35", "throughput": 4287.21, "total_tokens": 103632016} +{"current_steps": 85430, "total_steps": 89790, "loss": 0.4509, "lr": 3.5842680364371885e-07, "epoch": 9.514422541485688, "percentage": 95.14, "elapsed_time": "6:42:53", "remaining_time": "0:20:33", "throughput": 4287.23, "total_tokens": 103638256} +{"current_steps": 85435, "total_steps": 89790, "loss": 0.45, "lr": 3.5760734742373294e-07, "epoch": 9.514979396369306, "percentage": 95.15, "elapsed_time": "6:42:54", "remaining_time": "0:20:32", "throughput": 4287.25, "total_tokens": 103644240} +{"current_steps": 85440, "total_steps": 89790, "loss": 0.4543, "lr": 3.5678882227230814e-07, "epoch": 9.515536251252923, "percentage": 95.16, "elapsed_time": "6:42:56", "remaining_time": "0:20:30", "throughput": 4287.27, "total_tokens": 103650448} +{"current_steps": 85445, "total_steps": 89790, "loss": 0.4599, "lr": 3.559712282203781e-07, "epoch": 9.516093106136541, "percentage": 95.16, "elapsed_time": "6:42:57", "remaining_time": "0:20:29", "throughput": 4287.29, "total_tokens": 103656336} +{"current_steps": 85450, "total_steps": 89790, "loss": 0.461, "lr": 3.551545652988292e-07, "epoch": 9.516649961020159, "percentage": 95.17, "elapsed_time": "6:42:58", "remaining_time": "0:20:28", "throughput": 4287.32, "total_tokens": 103662448} +{"current_steps": 85455, "total_steps": 89790, "loss": 0.4642, "lr": 3.543388335385173e-07, "epoch": 9.517206815903776, "percentage": 95.17, "elapsed_time": "6:43:00", "remaining_time": "0:20:26", "throughput": 4287.34, "total_tokens": 103668528} +{"current_steps": 85460, "total_steps": 89790, "loss": 0.4729, "lr": 3.535240329702677e-07, "epoch": 9.517763670787392, "percentage": 95.18, "elapsed_time": "6:43:01", "remaining_time": "0:20:25", "throughput": 4287.37, "total_tokens": 103674800} +{"current_steps": 85465, "total_steps": 89790, "loss": 0.4618, "lr": 3.5271016362486144e-07, "epoch": 9.51832052567101, "percentage": 95.18, "elapsed_time": "6:43:02", "remaining_time": "0:20:23", "throughput": 4287.39, "total_tokens": 103681168} +{"current_steps": 85470, "total_steps": 89790, "loss": 0.4561, "lr": 3.5189722553305436e-07, "epoch": 9.518877380554628, "percentage": 95.19, "elapsed_time": "6:43:04", "remaining_time": "0:20:22", "throughput": 4287.42, "total_tokens": 103687440} +{"current_steps": 85475, "total_steps": 89790, "loss": 0.4672, "lr": 3.510852187255553e-07, "epoch": 9.519434235438245, "percentage": 95.19, "elapsed_time": "6:43:05", "remaining_time": "0:20:20", "throughput": 4287.44, "total_tokens": 103693360} +{"current_steps": 85480, "total_steps": 89790, "loss": 0.4554, "lr": 3.5027414323304806e-07, "epoch": 9.519991090321863, "percentage": 95.2, "elapsed_time": "6:43:06", "remaining_time": "0:20:19", "throughput": 4287.46, "total_tokens": 103699376} +{"current_steps": 85485, "total_steps": 89790, "loss": 0.4572, "lr": 3.494639990861803e-07, "epoch": 9.520547945205479, "percentage": 95.21, "elapsed_time": "6:43:07", "remaining_time": "0:20:18", "throughput": 4287.48, "total_tokens": 103704752} +{"current_steps": 85490, "total_steps": 89790, "loss": 0.4568, "lr": 3.4865478631555814e-07, "epoch": 9.521104800089097, "percentage": 95.21, "elapsed_time": "6:43:09", "remaining_time": "0:20:16", "throughput": 4287.5, "total_tokens": 103711024} +{"current_steps": 85495, "total_steps": 89790, "loss": 0.4514, "lr": 3.478465049517571e-07, "epoch": 9.521661654972714, "percentage": 95.22, "elapsed_time": "6:43:10", "remaining_time": "0:20:15", "throughput": 4287.53, "total_tokens": 103717168} +{"current_steps": 85500, "total_steps": 89790, "loss": 0.4652, "lr": 3.4703915502531657e-07, "epoch": 9.522218509856332, "percentage": 95.22, "elapsed_time": "6:43:11", "remaining_time": "0:20:13", "throughput": 4287.55, "total_tokens": 103723312} +{"current_steps": 85505, "total_steps": 89790, "loss": 0.4634, "lr": 3.4623273656674283e-07, "epoch": 9.52277536473995, "percentage": 95.23, "elapsed_time": "6:43:13", "remaining_time": "0:20:12", "throughput": 4287.58, "total_tokens": 103729552} +{"current_steps": 85510, "total_steps": 89790, "loss": 0.4624, "lr": 3.454272496065003e-07, "epoch": 9.523332219623565, "percentage": 95.23, "elapsed_time": "6:43:14", "remaining_time": "0:20:10", "throughput": 4287.6, "total_tokens": 103735568} +{"current_steps": 85515, "total_steps": 89790, "loss": 0.4764, "lr": 3.4462269417502856e-07, "epoch": 9.523889074507183, "percentage": 95.24, "elapsed_time": "6:43:15", "remaining_time": "0:20:09", "throughput": 4287.62, "total_tokens": 103741520} +{"current_steps": 85520, "total_steps": 89790, "loss": 0.4629, "lr": 3.438190703027228e-07, "epoch": 9.5244459293908, "percentage": 95.24, "elapsed_time": "6:43:16", "remaining_time": "0:20:08", "throughput": 4287.65, "total_tokens": 103747888} +{"current_steps": 85525, "total_steps": 89790, "loss": 0.4693, "lr": 3.4301637801994466e-07, "epoch": 9.525002784274418, "percentage": 95.25, "elapsed_time": "6:43:18", "remaining_time": "0:20:06", "throughput": 4287.67, "total_tokens": 103753648} +{"current_steps": 85530, "total_steps": 89790, "loss": 0.467, "lr": 3.422146173570284e-07, "epoch": 9.525559639158036, "percentage": 95.26, "elapsed_time": "6:43:19", "remaining_time": "0:20:05", "throughput": 4287.69, "total_tokens": 103759856} +{"current_steps": 85535, "total_steps": 89790, "loss": 0.4614, "lr": 3.4141378834426083e-07, "epoch": 9.526116494041652, "percentage": 95.26, "elapsed_time": "6:43:20", "remaining_time": "0:20:03", "throughput": 4287.72, "total_tokens": 103766064} +{"current_steps": 85540, "total_steps": 89790, "loss": 0.4475, "lr": 3.406138910119039e-07, "epoch": 9.52667334892527, "percentage": 95.27, "elapsed_time": "6:43:21", "remaining_time": "0:20:02", "throughput": 4287.74, "total_tokens": 103771568} +{"current_steps": 85545, "total_steps": 89790, "loss": 0.4453, "lr": 3.398149253901778e-07, "epoch": 9.527230203808887, "percentage": 95.27, "elapsed_time": "6:43:23", "remaining_time": "0:20:01", "throughput": 4287.76, "total_tokens": 103777584} +{"current_steps": 85550, "total_steps": 89790, "loss": 0.4625, "lr": 3.390168915092723e-07, "epoch": 9.527787058692505, "percentage": 95.28, "elapsed_time": "6:43:24", "remaining_time": "0:19:59", "throughput": 4287.78, "total_tokens": 103783920} +{"current_steps": 85555, "total_steps": 89790, "loss": 0.4577, "lr": 3.382197893993411e-07, "epoch": 9.528343913576123, "percentage": 95.28, "elapsed_time": "6:43:25", "remaining_time": "0:19:58", "throughput": 4287.8, "total_tokens": 103790032} +{"current_steps": 85560, "total_steps": 89790, "loss": 0.4569, "lr": 3.374236190904961e-07, "epoch": 9.528900768459739, "percentage": 95.29, "elapsed_time": "6:43:27", "remaining_time": "0:19:56", "throughput": 4287.83, "total_tokens": 103796144} +{"current_steps": 85565, "total_steps": 89790, "loss": 0.4687, "lr": 3.3662838061282174e-07, "epoch": 9.529457623343356, "percentage": 95.29, "elapsed_time": "6:43:28", "remaining_time": "0:19:55", "throughput": 4287.85, "total_tokens": 103802288} +{"current_steps": 85570, "total_steps": 89790, "loss": 0.4669, "lr": 3.3583407399636614e-07, "epoch": 9.530014478226974, "percentage": 95.3, "elapsed_time": "6:43:29", "remaining_time": "0:19:53", "throughput": 4287.87, "total_tokens": 103808240} +{"current_steps": 85575, "total_steps": 89790, "loss": 0.4711, "lr": 3.350406992711358e-07, "epoch": 9.530571333110592, "percentage": 95.31, "elapsed_time": "6:43:31", "remaining_time": "0:19:52", "throughput": 4287.89, "total_tokens": 103814352} +{"current_steps": 85580, "total_steps": 89790, "loss": 0.4544, "lr": 3.342482564671151e-07, "epoch": 9.53112818799421, "percentage": 95.31, "elapsed_time": "6:43:32", "remaining_time": "0:19:51", "throughput": 4287.92, "total_tokens": 103820528} +{"current_steps": 85585, "total_steps": 89790, "loss": 0.464, "lr": 3.3345674561423846e-07, "epoch": 9.531685042877825, "percentage": 95.32, "elapsed_time": "6:43:33", "remaining_time": "0:19:49", "throughput": 4287.94, "total_tokens": 103826672} +{"current_steps": 85590, "total_steps": 89790, "loss": 0.4622, "lr": 3.3266616674241526e-07, "epoch": 9.532241897761443, "percentage": 95.32, "elapsed_time": "6:43:34", "remaining_time": "0:19:48", "throughput": 4287.96, "total_tokens": 103832912} +{"current_steps": 85595, "total_steps": 89790, "loss": 0.4627, "lr": 3.3187651988151323e-07, "epoch": 9.53279875264506, "percentage": 95.33, "elapsed_time": "6:43:36", "remaining_time": "0:19:46", "throughput": 4287.98, "total_tokens": 103838928} +{"current_steps": 85600, "total_steps": 89790, "loss": 0.4695, "lr": 3.310878050613697e-07, "epoch": 9.533355607528678, "percentage": 95.33, "elapsed_time": "6:43:37", "remaining_time": "0:19:45", "throughput": 4288.0, "total_tokens": 103844816} +{"current_steps": 85605, "total_steps": 89790, "loss": 0.4702, "lr": 3.3030002231178305e-07, "epoch": 9.533912462412296, "percentage": 95.34, "elapsed_time": "6:43:38", "remaining_time": "0:19:43", "throughput": 4288.03, "total_tokens": 103850928} +{"current_steps": 85610, "total_steps": 89790, "loss": 0.4647, "lr": 3.2951317166252107e-07, "epoch": 9.534469317295912, "percentage": 95.34, "elapsed_time": "6:43:40", "remaining_time": "0:19:42", "throughput": 4288.05, "total_tokens": 103856912} +{"current_steps": 85615, "total_steps": 89790, "loss": 0.4498, "lr": 3.287272531433128e-07, "epoch": 9.53502617217953, "percentage": 95.35, "elapsed_time": "6:43:41", "remaining_time": "0:19:41", "throughput": 4288.07, "total_tokens": 103862768} +{"current_steps": 85620, "total_steps": 89790, "loss": 0.4568, "lr": 3.2794226678384834e-07, "epoch": 9.535583027063147, "percentage": 95.36, "elapsed_time": "6:43:42", "remaining_time": "0:19:39", "throughput": 4288.09, "total_tokens": 103869008} +{"current_steps": 85625, "total_steps": 89790, "loss": 0.4614, "lr": 3.271582126137929e-07, "epoch": 9.536139881946765, "percentage": 95.36, "elapsed_time": "6:43:43", "remaining_time": "0:19:38", "throughput": 4288.11, "total_tokens": 103875024} +{"current_steps": 85630, "total_steps": 89790, "loss": 0.4755, "lr": 3.263750906627672e-07, "epoch": 9.536696736830383, "percentage": 95.37, "elapsed_time": "6:43:45", "remaining_time": "0:19:36", "throughput": 4288.14, "total_tokens": 103881328} +{"current_steps": 85635, "total_steps": 89790, "loss": 0.4624, "lr": 3.255929009603642e-07, "epoch": 9.537253591713998, "percentage": 95.37, "elapsed_time": "6:43:46", "remaining_time": "0:19:35", "throughput": 4288.16, "total_tokens": 103887504} +{"current_steps": 85640, "total_steps": 89790, "loss": 0.4503, "lr": 3.2481164353613256e-07, "epoch": 9.537810446597616, "percentage": 95.38, "elapsed_time": "6:43:47", "remaining_time": "0:19:34", "throughput": 4288.19, "total_tokens": 103893872} +{"current_steps": 85645, "total_steps": 89790, "loss": 0.4564, "lr": 3.2403131841959036e-07, "epoch": 9.538367301481234, "percentage": 95.38, "elapsed_time": "6:43:49", "remaining_time": "0:19:32", "throughput": 4288.21, "total_tokens": 103899888} +{"current_steps": 85650, "total_steps": 89790, "loss": 0.4625, "lr": 3.2325192564022777e-07, "epoch": 9.538924156364851, "percentage": 95.39, "elapsed_time": "6:43:50", "remaining_time": "0:19:31", "throughput": 4288.23, "total_tokens": 103905616} +{"current_steps": 85655, "total_steps": 89790, "loss": 0.4521, "lr": 3.224734652274825e-07, "epoch": 9.53948101124847, "percentage": 95.39, "elapsed_time": "6:43:51", "remaining_time": "0:19:29", "throughput": 4288.26, "total_tokens": 103911888} +{"current_steps": 85660, "total_steps": 89790, "loss": 0.4569, "lr": 3.216959372107753e-07, "epoch": 9.540037866132085, "percentage": 95.4, "elapsed_time": "6:43:53", "remaining_time": "0:19:28", "throughput": 4288.28, "total_tokens": 103918000} +{"current_steps": 85665, "total_steps": 89790, "loss": 0.4561, "lr": 3.2091934161948277e-07, "epoch": 9.540594721015703, "percentage": 95.41, "elapsed_time": "6:43:54", "remaining_time": "0:19:26", "throughput": 4288.3, "total_tokens": 103923952} +{"current_steps": 85670, "total_steps": 89790, "loss": 0.4558, "lr": 3.2014367848294257e-07, "epoch": 9.54115157589932, "percentage": 95.41, "elapsed_time": "6:43:55", "remaining_time": "0:19:25", "throughput": 4288.33, "total_tokens": 103929872} +{"current_steps": 85675, "total_steps": 89790, "loss": 0.4563, "lr": 3.193689478304646e-07, "epoch": 9.541708430782938, "percentage": 95.42, "elapsed_time": "6:43:56", "remaining_time": "0:19:24", "throughput": 4288.35, "total_tokens": 103936176} +{"current_steps": 85680, "total_steps": 89790, "loss": 0.4617, "lr": 3.1859514969132255e-07, "epoch": 9.542265285666556, "percentage": 95.42, "elapsed_time": "6:43:58", "remaining_time": "0:19:22", "throughput": 4288.38, "total_tokens": 103942704} +{"current_steps": 85685, "total_steps": 89790, "loss": 0.4589, "lr": 3.1782228409475143e-07, "epoch": 9.542822140550173, "percentage": 95.43, "elapsed_time": "6:43:59", "remaining_time": "0:19:21", "throughput": 4288.41, "total_tokens": 103948976} +{"current_steps": 85690, "total_steps": 89790, "loss": 0.4513, "lr": 3.170503510699502e-07, "epoch": 9.54337899543379, "percentage": 95.43, "elapsed_time": "6:44:00", "remaining_time": "0:19:19", "throughput": 4288.43, "total_tokens": 103955184} +{"current_steps": 85695, "total_steps": 89790, "loss": 0.4561, "lr": 3.1627935064608703e-07, "epoch": 9.543935850317407, "percentage": 95.44, "elapsed_time": "6:44:02", "remaining_time": "0:19:18", "throughput": 4288.46, "total_tokens": 103961616} +{"current_steps": 85700, "total_steps": 89790, "loss": 0.4543, "lr": 3.155092828522971e-07, "epoch": 9.544492705201025, "percentage": 95.44, "elapsed_time": "6:44:03", "remaining_time": "0:19:17", "throughput": 4288.48, "total_tokens": 103967088} +{"current_steps": 85705, "total_steps": 89790, "loss": 0.4496, "lr": 3.147401477176681e-07, "epoch": 9.545049560084642, "percentage": 95.45, "elapsed_time": "6:44:04", "remaining_time": "0:19:15", "throughput": 4288.5, "total_tokens": 103972944} +{"current_steps": 85710, "total_steps": 89790, "loss": 0.4486, "lr": 3.139719452712658e-07, "epoch": 9.54560641496826, "percentage": 95.46, "elapsed_time": "6:44:05", "remaining_time": "0:19:14", "throughput": 4288.51, "total_tokens": 103978064} +{"current_steps": 85715, "total_steps": 89790, "loss": 0.4498, "lr": 3.132046755421114e-07, "epoch": 9.546163269851876, "percentage": 95.46, "elapsed_time": "6:44:06", "remaining_time": "0:19:12", "throughput": 4288.53, "total_tokens": 103984016} +{"current_steps": 85720, "total_steps": 89790, "loss": 0.4661, "lr": 3.1243833855919836e-07, "epoch": 9.546720124735494, "percentage": 95.47, "elapsed_time": "6:44:08", "remaining_time": "0:19:11", "throughput": 4288.56, "total_tokens": 103990000} +{"current_steps": 85725, "total_steps": 89790, "loss": 0.4558, "lr": 3.116729343514785e-07, "epoch": 9.547276979619111, "percentage": 95.47, "elapsed_time": "6:44:09", "remaining_time": "0:19:09", "throughput": 4288.58, "total_tokens": 103995920} +{"current_steps": 85730, "total_steps": 89790, "loss": 0.4601, "lr": 3.109084629478759e-07, "epoch": 9.547833834502729, "percentage": 95.48, "elapsed_time": "6:44:10", "remaining_time": "0:19:08", "throughput": 4288.61, "total_tokens": 104002128} +{"current_steps": 85735, "total_steps": 89790, "loss": 0.4628, "lr": 3.101449243772703e-07, "epoch": 9.548390689386347, "percentage": 95.48, "elapsed_time": "6:44:12", "remaining_time": "0:19:07", "throughput": 4288.63, "total_tokens": 104008080} +{"current_steps": 85740, "total_steps": 89790, "loss": 0.4613, "lr": 3.093823186685108e-07, "epoch": 9.548947544269963, "percentage": 95.49, "elapsed_time": "6:44:13", "remaining_time": "0:19:05", "throughput": 4288.66, "total_tokens": 104014576} +{"current_steps": 85745, "total_steps": 89790, "loss": 0.4535, "lr": 3.086206458504159e-07, "epoch": 9.54950439915358, "percentage": 95.5, "elapsed_time": "6:44:14", "remaining_time": "0:19:04", "throughput": 4288.68, "total_tokens": 104020528} +{"current_steps": 85750, "total_steps": 89790, "loss": 0.4498, "lr": 3.078599059517545e-07, "epoch": 9.550061254037198, "percentage": 95.5, "elapsed_time": "6:44:15", "remaining_time": "0:19:02", "throughput": 4288.7, "total_tokens": 104026544} +{"current_steps": 85755, "total_steps": 89790, "loss": 0.4748, "lr": 3.0710009900127847e-07, "epoch": 9.550618108920816, "percentage": 95.51, "elapsed_time": "6:44:17", "remaining_time": "0:19:01", "throughput": 4288.72, "total_tokens": 104032752} +{"current_steps": 85760, "total_steps": 89790, "loss": 0.4538, "lr": 3.0634122502769536e-07, "epoch": 9.551174963804433, "percentage": 95.51, "elapsed_time": "6:44:18", "remaining_time": "0:18:59", "throughput": 4288.75, "total_tokens": 104038992} +{"current_steps": 85765, "total_steps": 89790, "loss": 0.4495, "lr": 3.0558328405967396e-07, "epoch": 9.551731818688049, "percentage": 95.52, "elapsed_time": "6:44:19", "remaining_time": "0:18:58", "throughput": 4288.77, "total_tokens": 104045488} +{"current_steps": 85770, "total_steps": 89790, "loss": 0.4681, "lr": 3.048262761258525e-07, "epoch": 9.552288673571667, "percentage": 95.52, "elapsed_time": "6:44:21", "remaining_time": "0:18:57", "throughput": 4288.8, "total_tokens": 104051568} +{"current_steps": 85775, "total_steps": 89790, "loss": 0.4737, "lr": 3.0407020125483297e-07, "epoch": 9.552845528455284, "percentage": 95.53, "elapsed_time": "6:44:22", "remaining_time": "0:18:55", "throughput": 4288.82, "total_tokens": 104057616} +{"current_steps": 85780, "total_steps": 89790, "loss": 0.4628, "lr": 3.0331505947518714e-07, "epoch": 9.553402383338902, "percentage": 95.53, "elapsed_time": "6:44:23", "remaining_time": "0:18:54", "throughput": 4288.83, "total_tokens": 104063248} +{"current_steps": 85785, "total_steps": 89790, "loss": 0.4671, "lr": 3.025608508154393e-07, "epoch": 9.55395923822252, "percentage": 95.54, "elapsed_time": "6:44:25", "remaining_time": "0:18:52", "throughput": 4288.86, "total_tokens": 104069488} +{"current_steps": 85790, "total_steps": 89790, "loss": 0.4593, "lr": 3.0180757530408887e-07, "epoch": 9.554516093106137, "percentage": 95.55, "elapsed_time": "6:44:26", "remaining_time": "0:18:51", "throughput": 4288.88, "total_tokens": 104075792} +{"current_steps": 85795, "total_steps": 89790, "loss": 0.4657, "lr": 3.0105523296959924e-07, "epoch": 9.555072947989753, "percentage": 95.55, "elapsed_time": "6:44:27", "remaining_time": "0:18:50", "throughput": 4288.9, "total_tokens": 104081648} +{"current_steps": 85800, "total_steps": 89790, "loss": 0.4713, "lr": 3.003038238403949e-07, "epoch": 9.555629802873371, "percentage": 95.56, "elapsed_time": "6:44:28", "remaining_time": "0:18:48", "throughput": 4288.92, "total_tokens": 104087632} +{"current_steps": 85805, "total_steps": 89790, "loss": 0.4513, "lr": 2.99553347944867e-07, "epoch": 9.556186657756989, "percentage": 95.56, "elapsed_time": "6:44:30", "remaining_time": "0:18:47", "throughput": 4288.95, "total_tokens": 104093936} +{"current_steps": 85810, "total_steps": 89790, "loss": 0.4618, "lr": 2.9880380531136787e-07, "epoch": 9.556743512640606, "percentage": 95.57, "elapsed_time": "6:44:31", "remaining_time": "0:18:45", "throughput": 4288.97, "total_tokens": 104100304} +{"current_steps": 85815, "total_steps": 89790, "loss": 0.4587, "lr": 2.980551959682221e-07, "epoch": 9.557300367524224, "percentage": 95.57, "elapsed_time": "6:44:32", "remaining_time": "0:18:44", "throughput": 4288.99, "total_tokens": 104106416} +{"current_steps": 85820, "total_steps": 89790, "loss": 0.4623, "lr": 2.9730751994370975e-07, "epoch": 9.55785722240784, "percentage": 95.58, "elapsed_time": "6:44:34", "remaining_time": "0:18:42", "throughput": 4289.01, "total_tokens": 104112304} +{"current_steps": 85825, "total_steps": 89790, "loss": 0.466, "lr": 2.9656077726608335e-07, "epoch": 9.558414077291458, "percentage": 95.58, "elapsed_time": "6:44:35", "remaining_time": "0:18:41", "throughput": 4289.03, "total_tokens": 104118320} +{"current_steps": 85830, "total_steps": 89790, "loss": 0.4574, "lr": 2.958149679635563e-07, "epoch": 9.558970932175075, "percentage": 95.59, "elapsed_time": "6:44:36", "remaining_time": "0:18:40", "throughput": 4289.06, "total_tokens": 104124496} +{"current_steps": 85835, "total_steps": 89790, "loss": 0.4599, "lr": 2.9507009206430904e-07, "epoch": 9.559527787058693, "percentage": 95.6, "elapsed_time": "6:44:38", "remaining_time": "0:18:38", "throughput": 4289.08, "total_tokens": 104130416} +{"current_steps": 85840, "total_steps": 89790, "loss": 0.4564, "lr": 2.9432614959648555e-07, "epoch": 9.56008464194231, "percentage": 95.6, "elapsed_time": "6:44:39", "remaining_time": "0:18:37", "throughput": 4289.1, "total_tokens": 104136400} +{"current_steps": 85845, "total_steps": 89790, "loss": 0.4571, "lr": 2.9358314058819394e-07, "epoch": 9.560641496825927, "percentage": 95.61, "elapsed_time": "6:44:40", "remaining_time": "0:18:35", "throughput": 4289.13, "total_tokens": 104142608} +{"current_steps": 85850, "total_steps": 89790, "loss": 0.4701, "lr": 2.928410650675034e-07, "epoch": 9.561198351709544, "percentage": 95.61, "elapsed_time": "6:44:41", "remaining_time": "0:18:34", "throughput": 4289.15, "total_tokens": 104148304} +{"current_steps": 85855, "total_steps": 89790, "loss": 0.4571, "lr": 2.9209992306245826e-07, "epoch": 9.561755206593162, "percentage": 95.62, "elapsed_time": "6:44:43", "remaining_time": "0:18:32", "throughput": 4289.17, "total_tokens": 104154384} +{"current_steps": 85860, "total_steps": 89790, "loss": 0.4709, "lr": 2.913597146010583e-07, "epoch": 9.56231206147678, "percentage": 95.62, "elapsed_time": "6:44:44", "remaining_time": "0:18:31", "throughput": 4289.19, "total_tokens": 104160720} +{"current_steps": 85865, "total_steps": 89790, "loss": 0.4574, "lr": 2.9062043971126997e-07, "epoch": 9.562868916360397, "percentage": 95.63, "elapsed_time": "6:44:45", "remaining_time": "0:18:30", "throughput": 4289.22, "total_tokens": 104166928} +{"current_steps": 85870, "total_steps": 89790, "loss": 0.4533, "lr": 2.8988209842102655e-07, "epoch": 9.563425771244013, "percentage": 95.63, "elapsed_time": "6:44:47", "remaining_time": "0:18:28", "throughput": 4289.24, "total_tokens": 104173072} +{"current_steps": 85875, "total_steps": 89790, "loss": 0.4663, "lr": 2.8914469075822517e-07, "epoch": 9.56398262612763, "percentage": 95.64, "elapsed_time": "6:44:48", "remaining_time": "0:18:27", "throughput": 4289.26, "total_tokens": 104178992} +{"current_steps": 85880, "total_steps": 89790, "loss": 0.4793, "lr": 2.884082167507268e-07, "epoch": 9.564539481011249, "percentage": 95.65, "elapsed_time": "6:44:49", "remaining_time": "0:18:25", "throughput": 4289.28, "total_tokens": 104185008} +{"current_steps": 85885, "total_steps": 89790, "loss": 0.4697, "lr": 2.8767267642635933e-07, "epoch": 9.565096335894866, "percentage": 95.65, "elapsed_time": "6:44:50", "remaining_time": "0:18:24", "throughput": 4289.31, "total_tokens": 104191184} +{"current_steps": 85890, "total_steps": 89790, "loss": 0.4646, "lr": 2.869380698129143e-07, "epoch": 9.565653190778484, "percentage": 95.66, "elapsed_time": "6:44:52", "remaining_time": "0:18:23", "throughput": 4289.33, "total_tokens": 104197360} +{"current_steps": 85895, "total_steps": 89790, "loss": 0.4572, "lr": 2.8620439693814174e-07, "epoch": 9.5662100456621, "percentage": 95.66, "elapsed_time": "6:44:53", "remaining_time": "0:18:21", "throughput": 4289.35, "total_tokens": 104202992} +{"current_steps": 85900, "total_steps": 89790, "loss": 0.4662, "lr": 2.8547165782976947e-07, "epoch": 9.566766900545717, "percentage": 95.67, "elapsed_time": "6:44:54", "remaining_time": "0:18:20", "throughput": 4289.38, "total_tokens": 104208976} +{"current_steps": 85905, "total_steps": 89790, "loss": 0.4624, "lr": 2.847398525154782e-07, "epoch": 9.567323755429335, "percentage": 95.67, "elapsed_time": "6:44:55", "remaining_time": "0:18:18", "throughput": 4289.4, "total_tokens": 104214960} +{"current_steps": 85910, "total_steps": 89790, "loss": 0.4604, "lr": 2.8400898102292073e-07, "epoch": 9.567880610312953, "percentage": 95.68, "elapsed_time": "6:44:57", "remaining_time": "0:18:17", "throughput": 4289.42, "total_tokens": 104221136} +{"current_steps": 85915, "total_steps": 89790, "loss": 0.4578, "lr": 2.8327904337970555e-07, "epoch": 9.56843746519657, "percentage": 95.68, "elapsed_time": "6:44:58", "remaining_time": "0:18:15", "throughput": 4289.45, "total_tokens": 104227344} +{"current_steps": 85920, "total_steps": 89790, "loss": 0.47, "lr": 2.8255003961342177e-07, "epoch": 9.568994320080186, "percentage": 95.69, "elapsed_time": "6:44:59", "remaining_time": "0:18:14", "throughput": 4289.47, "total_tokens": 104233520} +{"current_steps": 85925, "total_steps": 89790, "loss": 0.4534, "lr": 2.818219697516056e-07, "epoch": 9.569551174963804, "percentage": 95.7, "elapsed_time": "6:45:01", "remaining_time": "0:18:13", "throughput": 4289.49, "total_tokens": 104239824} +{"current_steps": 85930, "total_steps": 89790, "loss": 0.4639, "lr": 2.8109483382177114e-07, "epoch": 9.570108029847422, "percentage": 95.7, "elapsed_time": "6:45:02", "remaining_time": "0:18:11", "throughput": 4289.52, "total_tokens": 104246352} +{"current_steps": 85935, "total_steps": 89790, "loss": 0.4663, "lr": 2.8036863185138815e-07, "epoch": 9.57066488473104, "percentage": 95.71, "elapsed_time": "6:45:03", "remaining_time": "0:18:10", "throughput": 4289.55, "total_tokens": 104252720} +{"current_steps": 85940, "total_steps": 89790, "loss": 0.4489, "lr": 2.796433638678958e-07, "epoch": 9.571221739614657, "percentage": 95.71, "elapsed_time": "6:45:05", "remaining_time": "0:18:08", "throughput": 4289.57, "total_tokens": 104258896} +{"current_steps": 85945, "total_steps": 89790, "loss": 0.4689, "lr": 2.789190298986999e-07, "epoch": 9.571778594498273, "percentage": 95.72, "elapsed_time": "6:45:06", "remaining_time": "0:18:07", "throughput": 4289.6, "total_tokens": 104265072} +{"current_steps": 85950, "total_steps": 89790, "loss": 0.4608, "lr": 2.781956299711619e-07, "epoch": 9.57233544938189, "percentage": 95.72, "elapsed_time": "6:45:07", "remaining_time": "0:18:06", "throughput": 4289.62, "total_tokens": 104271088} +{"current_steps": 85955, "total_steps": 89790, "loss": 0.4612, "lr": 2.7747316411261827e-07, "epoch": 9.572892304265508, "percentage": 95.73, "elapsed_time": "6:45:08", "remaining_time": "0:18:04", "throughput": 4289.64, "total_tokens": 104276656} +{"current_steps": 85960, "total_steps": 89790, "loss": 0.4716, "lr": 2.767516323503694e-07, "epoch": 9.573449159149126, "percentage": 95.73, "elapsed_time": "6:45:10", "remaining_time": "0:18:03", "throughput": 4289.66, "total_tokens": 104282800} +{"current_steps": 85965, "total_steps": 89790, "loss": 0.4574, "lr": 2.7603103471166846e-07, "epoch": 9.574006014032744, "percentage": 95.74, "elapsed_time": "6:45:11", "remaining_time": "0:18:01", "throughput": 4289.68, "total_tokens": 104288656} +{"current_steps": 85970, "total_steps": 89790, "loss": 0.4692, "lr": 2.7531137122375206e-07, "epoch": 9.57456286891636, "percentage": 95.75, "elapsed_time": "6:45:12", "remaining_time": "0:18:00", "throughput": 4289.7, "total_tokens": 104294704} +{"current_steps": 85975, "total_steps": 89790, "loss": 0.4602, "lr": 2.745926419138012e-07, "epoch": 9.575119723799977, "percentage": 95.75, "elapsed_time": "6:45:14", "remaining_time": "0:17:58", "throughput": 4289.73, "total_tokens": 104301168} +{"current_steps": 85980, "total_steps": 89790, "loss": 0.4519, "lr": 2.738748468089802e-07, "epoch": 9.575676578683595, "percentage": 95.76, "elapsed_time": "6:45:15", "remaining_time": "0:17:57", "throughput": 4289.75, "total_tokens": 104307376} +{"current_steps": 85985, "total_steps": 89790, "loss": 0.4614, "lr": 2.731579859364064e-07, "epoch": 9.576233433567213, "percentage": 95.76, "elapsed_time": "6:45:16", "remaining_time": "0:17:56", "throughput": 4289.78, "total_tokens": 104313904} +{"current_steps": 85990, "total_steps": 89790, "loss": 0.4668, "lr": 2.724420593231636e-07, "epoch": 9.57679028845083, "percentage": 95.77, "elapsed_time": "6:45:18", "remaining_time": "0:17:54", "throughput": 4289.8, "total_tokens": 104320016} +{"current_steps": 85995, "total_steps": 89790, "loss": 0.4668, "lr": 2.7172706699630234e-07, "epoch": 9.577347143334446, "percentage": 95.77, "elapsed_time": "6:45:19", "remaining_time": "0:17:53", "throughput": 4289.83, "total_tokens": 104326224} +{"current_steps": 86000, "total_steps": 89790, "loss": 0.4569, "lr": 2.7101300898284e-07, "epoch": 9.577903998218064, "percentage": 95.78, "elapsed_time": "6:45:20", "remaining_time": "0:17:51", "throughput": 4289.85, "total_tokens": 104332656} +{"current_steps": 86005, "total_steps": 89790, "loss": 0.4647, "lr": 2.702998853097549e-07, "epoch": 9.578460853101681, "percentage": 95.78, "elapsed_time": "6:45:22", "remaining_time": "0:17:50", "throughput": 4289.88, "total_tokens": 104338768} +{"current_steps": 86010, "total_steps": 89790, "loss": 0.4636, "lr": 2.695876960039867e-07, "epoch": 9.5790177079853, "percentage": 95.79, "elapsed_time": "6:45:23", "remaining_time": "0:17:48", "throughput": 4289.89, "total_tokens": 104344400} +{"current_steps": 86015, "total_steps": 89790, "loss": 0.457, "lr": 2.688764410924499e-07, "epoch": 9.579574562868917, "percentage": 95.8, "elapsed_time": "6:45:24", "remaining_time": "0:17:47", "throughput": 4289.92, "total_tokens": 104350384} +{"current_steps": 86020, "total_steps": 89790, "loss": 0.4763, "lr": 2.681661206020175e-07, "epoch": 9.580131417752535, "percentage": 95.8, "elapsed_time": "6:45:25", "remaining_time": "0:17:46", "throughput": 4289.93, "total_tokens": 104355728} +{"current_steps": 86025, "total_steps": 89790, "loss": 0.4601, "lr": 2.674567345595236e-07, "epoch": 9.58068827263615, "percentage": 95.81, "elapsed_time": "6:45:27", "remaining_time": "0:17:44", "throughput": 4289.95, "total_tokens": 104362096} +{"current_steps": 86030, "total_steps": 89790, "loss": 0.4505, "lr": 2.6674828299177446e-07, "epoch": 9.581245127519768, "percentage": 95.81, "elapsed_time": "6:45:28", "remaining_time": "0:17:43", "throughput": 4289.97, "total_tokens": 104367984} +{"current_steps": 86035, "total_steps": 89790, "loss": 0.4651, "lr": 2.6604076592553764e-07, "epoch": 9.581801982403386, "percentage": 95.82, "elapsed_time": "6:45:29", "remaining_time": "0:17:41", "throughput": 4290.0, "total_tokens": 104374096} +{"current_steps": 86040, "total_steps": 89790, "loss": 0.4513, "lr": 2.6533418338754445e-07, "epoch": 9.582358837287003, "percentage": 95.82, "elapsed_time": "6:45:30", "remaining_time": "0:17:40", "throughput": 4290.02, "total_tokens": 104380304} +{"current_steps": 86045, "total_steps": 89790, "loss": 0.4583, "lr": 2.646285354044903e-07, "epoch": 9.582915692170621, "percentage": 95.83, "elapsed_time": "6:45:32", "remaining_time": "0:17:39", "throughput": 4290.04, "total_tokens": 104386288} +{"current_steps": 86050, "total_steps": 89790, "loss": 0.4584, "lr": 2.6392382200303713e-07, "epoch": 9.583472547054237, "percentage": 95.83, "elapsed_time": "6:45:33", "remaining_time": "0:17:37", "throughput": 4290.07, "total_tokens": 104392560} +{"current_steps": 86055, "total_steps": 89790, "loss": 0.4672, "lr": 2.632200432098192e-07, "epoch": 9.584029401937855, "percentage": 95.84, "elapsed_time": "6:45:34", "remaining_time": "0:17:36", "throughput": 4290.09, "total_tokens": 104398960} +{"current_steps": 86060, "total_steps": 89790, "loss": 0.4602, "lr": 2.6251719905141527e-07, "epoch": 9.584586256821472, "percentage": 95.85, "elapsed_time": "6:45:36", "remaining_time": "0:17:34", "throughput": 4290.12, "total_tokens": 104405072} +{"current_steps": 86065, "total_steps": 89790, "loss": 0.4473, "lr": 2.618152895543874e-07, "epoch": 9.58514311170509, "percentage": 95.85, "elapsed_time": "6:45:37", "remaining_time": "0:17:33", "throughput": 4290.14, "total_tokens": 104411376} +{"current_steps": 86070, "total_steps": 89790, "loss": 0.4698, "lr": 2.6111431474525603e-07, "epoch": 9.585699966588708, "percentage": 95.86, "elapsed_time": "6:45:38", "remaining_time": "0:17:31", "throughput": 4290.17, "total_tokens": 104417712} +{"current_steps": 86075, "total_steps": 89790, "loss": 0.4524, "lr": 2.604142746505056e-07, "epoch": 9.586256821472324, "percentage": 95.86, "elapsed_time": "6:45:40", "remaining_time": "0:17:30", "throughput": 4290.19, "total_tokens": 104423920} +{"current_steps": 86080, "total_steps": 89790, "loss": 0.4524, "lr": 2.597151692965871e-07, "epoch": 9.586813676355941, "percentage": 95.87, "elapsed_time": "6:45:41", "remaining_time": "0:17:29", "throughput": 4290.21, "total_tokens": 104429680} +{"current_steps": 86085, "total_steps": 89790, "loss": 0.4645, "lr": 2.5901699870991003e-07, "epoch": 9.587370531239559, "percentage": 95.87, "elapsed_time": "6:45:42", "remaining_time": "0:17:27", "throughput": 4290.23, "total_tokens": 104435920} +{"current_steps": 86090, "total_steps": 89790, "loss": 0.4562, "lr": 2.5831976291686153e-07, "epoch": 9.587927386123177, "percentage": 95.88, "elapsed_time": "6:45:43", "remaining_time": "0:17:26", "throughput": 4290.26, "total_tokens": 104441936} +{"current_steps": 86095, "total_steps": 89790, "loss": 0.4524, "lr": 2.576234619437762e-07, "epoch": 9.588484241006794, "percentage": 95.88, "elapsed_time": "6:45:45", "remaining_time": "0:17:24", "throughput": 4290.27, "total_tokens": 104447312} +{"current_steps": 86100, "total_steps": 89790, "loss": 0.4667, "lr": 2.56928095816969e-07, "epoch": 9.58904109589041, "percentage": 95.89, "elapsed_time": "6:45:46", "remaining_time": "0:17:23", "throughput": 4290.3, "total_tokens": 104453424} +{"current_steps": 86105, "total_steps": 89790, "loss": 0.4507, "lr": 2.562336645627134e-07, "epoch": 9.589597950774028, "percentage": 95.9, "elapsed_time": "6:45:47", "remaining_time": "0:17:22", "throughput": 4290.33, "total_tokens": 104460144} +{"current_steps": 86110, "total_steps": 89790, "loss": 0.465, "lr": 2.555401682072439e-07, "epoch": 9.590154805657646, "percentage": 95.9, "elapsed_time": "6:45:49", "remaining_time": "0:17:20", "throughput": 4290.35, "total_tokens": 104466128} +{"current_steps": 86115, "total_steps": 89790, "loss": 0.4469, "lr": 2.5484760677676466e-07, "epoch": 9.590711660541263, "percentage": 95.91, "elapsed_time": "6:45:50", "remaining_time": "0:17:19", "throughput": 4290.37, "total_tokens": 104471600} +{"current_steps": 86120, "total_steps": 89790, "loss": 0.4592, "lr": 2.541559802974436e-07, "epoch": 9.591268515424881, "percentage": 95.91, "elapsed_time": "6:45:51", "remaining_time": "0:17:17", "throughput": 4290.39, "total_tokens": 104477552} +{"current_steps": 86125, "total_steps": 89790, "loss": 0.446, "lr": 2.5346528879540974e-07, "epoch": 9.591825370308497, "percentage": 95.92, "elapsed_time": "6:45:52", "remaining_time": "0:17:16", "throughput": 4290.41, "total_tokens": 104483760} +{"current_steps": 86130, "total_steps": 89790, "loss": 0.4597, "lr": 2.5277553229676176e-07, "epoch": 9.592382225192114, "percentage": 95.92, "elapsed_time": "6:45:54", "remaining_time": "0:17:14", "throughput": 4290.44, "total_tokens": 104490192} +{"current_steps": 86135, "total_steps": 89790, "loss": 0.4557, "lr": 2.520867108275621e-07, "epoch": 9.592939080075732, "percentage": 95.93, "elapsed_time": "6:45:55", "remaining_time": "0:17:13", "throughput": 4290.46, "total_tokens": 104495600} +{"current_steps": 86140, "total_steps": 89790, "loss": 0.455, "lr": 2.513988244138343e-07, "epoch": 9.59349593495935, "percentage": 95.93, "elapsed_time": "6:45:56", "remaining_time": "0:17:12", "throughput": 4290.48, "total_tokens": 104501328} +{"current_steps": 86145, "total_steps": 89790, "loss": 0.465, "lr": 2.5071187308156887e-07, "epoch": 9.594052789842967, "percentage": 95.94, "elapsed_time": "6:45:57", "remaining_time": "0:17:10", "throughput": 4290.5, "total_tokens": 104507312} +{"current_steps": 86150, "total_steps": 89790, "loss": 0.4679, "lr": 2.5002585685672266e-07, "epoch": 9.594609644726585, "percentage": 95.95, "elapsed_time": "6:45:59", "remaining_time": "0:17:09", "throughput": 4290.51, "total_tokens": 104513008} +{"current_steps": 86155, "total_steps": 89790, "loss": 0.457, "lr": 2.4934077576521384e-07, "epoch": 9.595166499610201, "percentage": 95.95, "elapsed_time": "6:46:00", "remaining_time": "0:17:07", "throughput": 4290.54, "total_tokens": 104518800} +{"current_steps": 86160, "total_steps": 89790, "loss": 0.4593, "lr": 2.4865662983292737e-07, "epoch": 9.595723354493819, "percentage": 95.96, "elapsed_time": "6:46:01", "remaining_time": "0:17:06", "throughput": 4290.56, "total_tokens": 104524656} +{"current_steps": 86165, "total_steps": 89790, "loss": 0.459, "lr": 2.479734190857147e-07, "epoch": 9.596280209377436, "percentage": 95.96, "elapsed_time": "6:46:02", "remaining_time": "0:17:04", "throughput": 4290.58, "total_tokens": 104530736} +{"current_steps": 86170, "total_steps": 89790, "loss": 0.4732, "lr": 2.472911435493858e-07, "epoch": 9.596837064261054, "percentage": 95.97, "elapsed_time": "6:46:04", "remaining_time": "0:17:03", "throughput": 4290.61, "total_tokens": 104536848} +{"current_steps": 86175, "total_steps": 89790, "loss": 0.4478, "lr": 2.4660980324972547e-07, "epoch": 9.597393919144672, "percentage": 95.97, "elapsed_time": "6:46:05", "remaining_time": "0:17:02", "throughput": 4290.63, "total_tokens": 104543024} +{"current_steps": 86180, "total_steps": 89790, "loss": 0.456, "lr": 2.4592939821246886e-07, "epoch": 9.597950774028288, "percentage": 95.98, "elapsed_time": "6:46:06", "remaining_time": "0:17:00", "throughput": 4290.66, "total_tokens": 104549232} +{"current_steps": 86185, "total_steps": 89790, "loss": 0.4489, "lr": 2.4524992846333137e-07, "epoch": 9.598507628911905, "percentage": 95.99, "elapsed_time": "6:46:08", "remaining_time": "0:16:59", "throughput": 4290.68, "total_tokens": 104555536} +{"current_steps": 86190, "total_steps": 89790, "loss": 0.4665, "lr": 2.4457139402797866e-07, "epoch": 9.599064483795523, "percentage": 95.99, "elapsed_time": "6:46:09", "remaining_time": "0:16:57", "throughput": 4290.7, "total_tokens": 104561520} +{"current_steps": 86195, "total_steps": 89790, "loss": 0.4569, "lr": 2.4389379493205133e-07, "epoch": 9.59962133867914, "percentage": 96.0, "elapsed_time": "6:46:10", "remaining_time": "0:16:56", "throughput": 4290.72, "total_tokens": 104567632} +{"current_steps": 86200, "total_steps": 89790, "loss": 0.4579, "lr": 2.4321713120115386e-07, "epoch": 9.600178193562758, "percentage": 96.0, "elapsed_time": "6:46:11", "remaining_time": "0:16:55", "throughput": 4290.74, "total_tokens": 104573552} +{"current_steps": 86205, "total_steps": 89790, "loss": 0.4603, "lr": 2.425414028608491e-07, "epoch": 9.600735048446374, "percentage": 96.01, "elapsed_time": "6:46:13", "remaining_time": "0:16:53", "throughput": 4290.77, "total_tokens": 104579760} +{"current_steps": 86210, "total_steps": 89790, "loss": 0.4618, "lr": 2.4186660993666954e-07, "epoch": 9.601291903329992, "percentage": 96.01, "elapsed_time": "6:46:14", "remaining_time": "0:16:52", "throughput": 4290.79, "total_tokens": 104586000} +{"current_steps": 86215, "total_steps": 89790, "loss": 0.4545, "lr": 2.4119275245411134e-07, "epoch": 9.60184875821361, "percentage": 96.02, "elapsed_time": "6:46:15", "remaining_time": "0:16:50", "throughput": 4290.81, "total_tokens": 104592048} +{"current_steps": 86220, "total_steps": 89790, "loss": 0.467, "lr": 2.405198304386347e-07, "epoch": 9.602405613097227, "percentage": 96.02, "elapsed_time": "6:46:17", "remaining_time": "0:16:49", "throughput": 4290.83, "total_tokens": 104598128} +{"current_steps": 86225, "total_steps": 89790, "loss": 0.457, "lr": 2.398478439156637e-07, "epoch": 9.602962467980845, "percentage": 96.03, "elapsed_time": "6:46:18", "remaining_time": "0:16:47", "throughput": 4290.86, "total_tokens": 104604368} +{"current_steps": 86230, "total_steps": 89790, "loss": 0.4716, "lr": 2.391767929105865e-07, "epoch": 9.60351932286446, "percentage": 96.04, "elapsed_time": "6:46:19", "remaining_time": "0:16:46", "throughput": 4290.88, "total_tokens": 104610544} +{"current_steps": 86235, "total_steps": 89790, "loss": 0.4663, "lr": 2.385066774487632e-07, "epoch": 9.604076177748079, "percentage": 96.04, "elapsed_time": "6:46:21", "remaining_time": "0:16:45", "throughput": 4290.91, "total_tokens": 104616944} +{"current_steps": 86240, "total_steps": 89790, "loss": 0.4744, "lr": 2.3783749755550977e-07, "epoch": 9.604633032631696, "percentage": 96.05, "elapsed_time": "6:46:22", "remaining_time": "0:16:43", "throughput": 4290.93, "total_tokens": 104623088} +{"current_steps": 86245, "total_steps": 89790, "loss": 0.46, "lr": 2.3716925325610874e-07, "epoch": 9.605189887515314, "percentage": 96.05, "elapsed_time": "6:46:23", "remaining_time": "0:16:42", "throughput": 4290.95, "total_tokens": 104629136} +{"current_steps": 86250, "total_steps": 89790, "loss": 0.4675, "lr": 2.365019445758093e-07, "epoch": 9.605746742398932, "percentage": 96.06, "elapsed_time": "6:46:24", "remaining_time": "0:16:40", "throughput": 4290.98, "total_tokens": 104635216} +{"current_steps": 86255, "total_steps": 89790, "loss": 0.4836, "lr": 2.358355715398247e-07, "epoch": 9.606303597282547, "percentage": 96.06, "elapsed_time": "6:46:26", "remaining_time": "0:16:39", "throughput": 4291.0, "total_tokens": 104641264} +{"current_steps": 86260, "total_steps": 89790, "loss": 0.4559, "lr": 2.3517013417333477e-07, "epoch": 9.606860452166165, "percentage": 96.07, "elapsed_time": "6:46:27", "remaining_time": "0:16:37", "throughput": 4291.01, "total_tokens": 104646576} +{"current_steps": 86265, "total_steps": 89790, "loss": 0.4469, "lr": 2.3450563250147771e-07, "epoch": 9.607417307049783, "percentage": 96.07, "elapsed_time": "6:46:28", "remaining_time": "0:16:36", "throughput": 4291.04, "total_tokens": 104652848} +{"current_steps": 86270, "total_steps": 89790, "loss": 0.4639, "lr": 2.3384206654936403e-07, "epoch": 9.6079741619334, "percentage": 96.08, "elapsed_time": "6:46:29", "remaining_time": "0:16:35", "throughput": 4291.06, "total_tokens": 104658960} +{"current_steps": 86275, "total_steps": 89790, "loss": 0.459, "lr": 2.331794363420653e-07, "epoch": 9.608531016817018, "percentage": 96.09, "elapsed_time": "6:46:31", "remaining_time": "0:16:33", "throughput": 4291.09, "total_tokens": 104665296} +{"current_steps": 86280, "total_steps": 89790, "loss": 0.4613, "lr": 2.3251774190461706e-07, "epoch": 9.609087871700634, "percentage": 96.09, "elapsed_time": "6:46:32", "remaining_time": "0:16:32", "throughput": 4291.11, "total_tokens": 104671504} +{"current_steps": 86285, "total_steps": 89790, "loss": 0.4675, "lr": 2.3185698326201598e-07, "epoch": 9.609644726584252, "percentage": 96.1, "elapsed_time": "6:46:33", "remaining_time": "0:16:30", "throughput": 4291.13, "total_tokens": 104677488} +{"current_steps": 86290, "total_steps": 89790, "loss": 0.4648, "lr": 2.3119716043923378e-07, "epoch": 9.61020158146787, "percentage": 96.1, "elapsed_time": "6:46:35", "remaining_time": "0:16:29", "throughput": 4291.15, "total_tokens": 104683472} +{"current_steps": 86295, "total_steps": 89790, "loss": 0.4616, "lr": 2.3053827346119772e-07, "epoch": 9.610758436351487, "percentage": 96.11, "elapsed_time": "6:46:36", "remaining_time": "0:16:28", "throughput": 4291.18, "total_tokens": 104689616} +{"current_steps": 86300, "total_steps": 89790, "loss": 0.4556, "lr": 2.2988032235280454e-07, "epoch": 9.611315291235105, "percentage": 96.11, "elapsed_time": "6:46:37", "remaining_time": "0:16:26", "throughput": 4291.2, "total_tokens": 104695408} +{"current_steps": 86305, "total_steps": 89790, "loss": 0.4648, "lr": 2.2922330713891215e-07, "epoch": 9.61187214611872, "percentage": 96.12, "elapsed_time": "6:46:38", "remaining_time": "0:16:25", "throughput": 4291.22, "total_tokens": 104701264} +{"current_steps": 86310, "total_steps": 89790, "loss": 0.4713, "lr": 2.2856722784434514e-07, "epoch": 9.612429001002338, "percentage": 96.12, "elapsed_time": "6:46:40", "remaining_time": "0:16:23", "throughput": 4291.24, "total_tokens": 104707344} +{"current_steps": 86315, "total_steps": 89790, "loss": 0.4601, "lr": 2.2791208449389202e-07, "epoch": 9.612985855885956, "percentage": 96.13, "elapsed_time": "6:46:41", "remaining_time": "0:16:22", "throughput": 4291.26, "total_tokens": 104712848} +{"current_steps": 86320, "total_steps": 89790, "loss": 0.4554, "lr": 2.2725787711230517e-07, "epoch": 9.613542710769574, "percentage": 96.14, "elapsed_time": "6:46:42", "remaining_time": "0:16:20", "throughput": 4291.28, "total_tokens": 104718704} +{"current_steps": 86325, "total_steps": 89790, "loss": 0.467, "lr": 2.2660460572430376e-07, "epoch": 9.614099565653191, "percentage": 96.14, "elapsed_time": "6:46:44", "remaining_time": "0:16:19", "throughput": 4291.3, "total_tokens": 104725008} +{"current_steps": 86330, "total_steps": 89790, "loss": 0.4637, "lr": 2.2595227035457356e-07, "epoch": 9.614656420536807, "percentage": 96.15, "elapsed_time": "6:46:45", "remaining_time": "0:16:18", "throughput": 4291.33, "total_tokens": 104731344} +{"current_steps": 86335, "total_steps": 89790, "loss": 0.4667, "lr": 2.25300871027756e-07, "epoch": 9.615213275420425, "percentage": 96.15, "elapsed_time": "6:46:46", "remaining_time": "0:16:16", "throughput": 4291.35, "total_tokens": 104737360} +{"current_steps": 86340, "total_steps": 89790, "loss": 0.4686, "lr": 2.2465040776846748e-07, "epoch": 9.615770130304043, "percentage": 96.16, "elapsed_time": "6:46:47", "remaining_time": "0:16:15", "throughput": 4291.37, "total_tokens": 104743376} +{"current_steps": 86345, "total_steps": 89790, "loss": 0.4705, "lr": 2.2400088060128276e-07, "epoch": 9.61632698518766, "percentage": 96.16, "elapsed_time": "6:46:49", "remaining_time": "0:16:13", "throughput": 4291.39, "total_tokens": 104749328} +{"current_steps": 86350, "total_steps": 89790, "loss": 0.4593, "lr": 2.2335228955074338e-07, "epoch": 9.616883840071278, "percentage": 96.17, "elapsed_time": "6:46:50", "remaining_time": "0:16:12", "throughput": 4291.41, "total_tokens": 104755184} +{"current_steps": 86355, "total_steps": 89790, "loss": 0.4685, "lr": 2.2270463464135472e-07, "epoch": 9.617440694954894, "percentage": 96.17, "elapsed_time": "6:46:51", "remaining_time": "0:16:11", "throughput": 4291.44, "total_tokens": 104761392} +{"current_steps": 86360, "total_steps": 89790, "loss": 0.4522, "lr": 2.2205791589758885e-07, "epoch": 9.617997549838512, "percentage": 96.18, "elapsed_time": "6:46:52", "remaining_time": "0:16:09", "throughput": 4291.46, "total_tokens": 104767024} +{"current_steps": 86365, "total_steps": 89790, "loss": 0.4671, "lr": 2.21412133343879e-07, "epoch": 9.61855440472213, "percentage": 96.19, "elapsed_time": "6:46:54", "remaining_time": "0:16:08", "throughput": 4291.48, "total_tokens": 104773040} +{"current_steps": 86370, "total_steps": 89790, "loss": 0.4504, "lr": 2.2076728700462513e-07, "epoch": 9.619111259605747, "percentage": 96.19, "elapsed_time": "6:46:55", "remaining_time": "0:16:06", "throughput": 4291.5, "total_tokens": 104778736} +{"current_steps": 86375, "total_steps": 89790, "loss": 0.4447, "lr": 2.2012337690419383e-07, "epoch": 9.619668114489365, "percentage": 96.2, "elapsed_time": "6:46:56", "remaining_time": "0:16:05", "throughput": 4291.52, "total_tokens": 104784848} +{"current_steps": 86380, "total_steps": 89790, "loss": 0.4602, "lr": 2.1948040306691008e-07, "epoch": 9.620224969372982, "percentage": 96.2, "elapsed_time": "6:46:58", "remaining_time": "0:16:03", "throughput": 4291.54, "total_tokens": 104790928} +{"current_steps": 86385, "total_steps": 89790, "loss": 0.4591, "lr": 2.1883836551707115e-07, "epoch": 9.620781824256598, "percentage": 96.21, "elapsed_time": "6:46:59", "remaining_time": "0:16:02", "throughput": 4291.57, "total_tokens": 104797264} +{"current_steps": 86390, "total_steps": 89790, "loss": 0.4651, "lr": 2.1819726427893262e-07, "epoch": 9.621338679140216, "percentage": 96.21, "elapsed_time": "6:47:00", "remaining_time": "0:16:01", "throughput": 4291.59, "total_tokens": 104803600} +{"current_steps": 86395, "total_steps": 89790, "loss": 0.4661, "lr": 2.1755709937671953e-07, "epoch": 9.621895534023833, "percentage": 96.22, "elapsed_time": "6:47:02", "remaining_time": "0:15:59", "throughput": 4291.61, "total_tokens": 104809744} +{"current_steps": 86400, "total_steps": 89790, "loss": 0.4614, "lr": 2.1691787083462089e-07, "epoch": 9.622452388907451, "percentage": 96.22, "elapsed_time": "6:47:03", "remaining_time": "0:15:58", "throughput": 4291.64, "total_tokens": 104816016} +{"current_steps": 86405, "total_steps": 89790, "loss": 0.4613, "lr": 2.162795786767813e-07, "epoch": 9.623009243791069, "percentage": 96.23, "elapsed_time": "6:47:04", "remaining_time": "0:15:56", "throughput": 4291.66, "total_tokens": 104821840} +{"current_steps": 86410, "total_steps": 89790, "loss": 0.4643, "lr": 2.1564222292732583e-07, "epoch": 9.623566098674685, "percentage": 96.24, "elapsed_time": "6:47:05", "remaining_time": "0:15:55", "throughput": 4291.69, "total_tokens": 104828016} +{"current_steps": 86415, "total_steps": 89790, "loss": 0.4523, "lr": 2.1500580361033251e-07, "epoch": 9.624122953558302, "percentage": 96.24, "elapsed_time": "6:47:07", "remaining_time": "0:15:54", "throughput": 4291.7, "total_tokens": 104833680} +{"current_steps": 86420, "total_steps": 89790, "loss": 0.4551, "lr": 2.1437032074984598e-07, "epoch": 9.62467980844192, "percentage": 96.25, "elapsed_time": "6:47:08", "remaining_time": "0:15:52", "throughput": 4291.73, "total_tokens": 104839760} +{"current_steps": 86425, "total_steps": 89790, "loss": 0.4713, "lr": 2.1373577436988034e-07, "epoch": 9.625236663325538, "percentage": 96.25, "elapsed_time": "6:47:09", "remaining_time": "0:15:51", "throughput": 4291.75, "total_tokens": 104845872} +{"current_steps": 86430, "total_steps": 89790, "loss": 0.4703, "lr": 2.1310216449440533e-07, "epoch": 9.625793518209155, "percentage": 96.26, "elapsed_time": "6:47:10", "remaining_time": "0:15:49", "throughput": 4291.77, "total_tokens": 104851984} +{"current_steps": 86435, "total_steps": 89790, "loss": 0.4526, "lr": 2.1246949114736846e-07, "epoch": 9.626350373092771, "percentage": 96.26, "elapsed_time": "6:47:12", "remaining_time": "0:15:48", "throughput": 4291.8, "total_tokens": 104858288} +{"current_steps": 86440, "total_steps": 89790, "loss": 0.456, "lr": 2.1183775435266728e-07, "epoch": 9.626907227976389, "percentage": 96.27, "elapsed_time": "6:47:13", "remaining_time": "0:15:46", "throughput": 4291.82, "total_tokens": 104864528} +{"current_steps": 86445, "total_steps": 89790, "loss": 0.4631, "lr": 2.1120695413417157e-07, "epoch": 9.627464082860007, "percentage": 96.27, "elapsed_time": "6:47:14", "remaining_time": "0:15:45", "throughput": 4291.85, "total_tokens": 104870576} +{"current_steps": 86450, "total_steps": 89790, "loss": 0.4531, "lr": 2.1057709051571784e-07, "epoch": 9.628020937743624, "percentage": 96.28, "elapsed_time": "6:47:16", "remaining_time": "0:15:44", "throughput": 4291.86, "total_tokens": 104876368} +{"current_steps": 86455, "total_steps": 89790, "loss": 0.4661, "lr": 2.099481635211037e-07, "epoch": 9.628577792627242, "percentage": 96.29, "elapsed_time": "6:47:17", "remaining_time": "0:15:42", "throughput": 4291.88, "total_tokens": 104881776} +{"current_steps": 86460, "total_steps": 89790, "loss": 0.4631, "lr": 2.0932017317409348e-07, "epoch": 9.629134647510858, "percentage": 96.29, "elapsed_time": "6:47:18", "remaining_time": "0:15:41", "throughput": 4291.9, "total_tokens": 104887888} +{"current_steps": 86465, "total_steps": 89790, "loss": 0.4754, "lr": 2.0869311949841265e-07, "epoch": 9.629691502394476, "percentage": 96.3, "elapsed_time": "6:47:19", "remaining_time": "0:15:39", "throughput": 4291.92, "total_tokens": 104893872} +{"current_steps": 86470, "total_steps": 89790, "loss": 0.4583, "lr": 2.0806700251775057e-07, "epoch": 9.630248357278093, "percentage": 96.3, "elapsed_time": "6:47:21", "remaining_time": "0:15:38", "throughput": 4291.94, "total_tokens": 104899888} +{"current_steps": 86475, "total_steps": 89790, "loss": 0.4606, "lr": 2.074418222557689e-07, "epoch": 9.630805212161711, "percentage": 96.31, "elapsed_time": "6:47:22", "remaining_time": "0:15:36", "throughput": 4291.96, "total_tokens": 104906032} +{"current_steps": 86480, "total_steps": 89790, "loss": 0.4552, "lr": 2.0681757873608486e-07, "epoch": 9.631362067045329, "percentage": 96.31, "elapsed_time": "6:47:23", "remaining_time": "0:15:35", "throughput": 4291.98, "total_tokens": 104912016} +{"current_steps": 86485, "total_steps": 89790, "loss": 0.4643, "lr": 2.061942719822879e-07, "epoch": 9.631918921928944, "percentage": 96.32, "elapsed_time": "6:47:25", "remaining_time": "0:15:34", "throughput": 4292.01, "total_tokens": 104918224} +{"current_steps": 86490, "total_steps": 89790, "loss": 0.458, "lr": 2.0557190201792586e-07, "epoch": 9.632475776812562, "percentage": 96.32, "elapsed_time": "6:47:26", "remaining_time": "0:15:32", "throughput": 4292.03, "total_tokens": 104923728} +{"current_steps": 86495, "total_steps": 89790, "loss": 0.4597, "lr": 2.0495046886651602e-07, "epoch": 9.63303263169618, "percentage": 96.33, "elapsed_time": "6:47:27", "remaining_time": "0:15:31", "throughput": 4292.05, "total_tokens": 104929648} +{"current_steps": 86500, "total_steps": 89790, "loss": 0.454, "lr": 2.0432997255153686e-07, "epoch": 9.633589486579798, "percentage": 96.34, "elapsed_time": "6:47:28", "remaining_time": "0:15:29", "throughput": 4292.07, "total_tokens": 104935728} +{"current_steps": 86505, "total_steps": 89790, "loss": 0.4577, "lr": 2.0371041309643346e-07, "epoch": 9.634146341463415, "percentage": 96.34, "elapsed_time": "6:47:30", "remaining_time": "0:15:28", "throughput": 4292.09, "total_tokens": 104942032} +{"current_steps": 86510, "total_steps": 89790, "loss": 0.4586, "lr": 2.0309179052461214e-07, "epoch": 9.634703196347033, "percentage": 96.35, "elapsed_time": "6:47:31", "remaining_time": "0:15:27", "throughput": 4292.11, "total_tokens": 104948240} +{"current_steps": 86515, "total_steps": 89790, "loss": 0.4513, "lr": 2.024741048594514e-07, "epoch": 9.635260051230649, "percentage": 96.35, "elapsed_time": "6:47:32", "remaining_time": "0:15:25", "throughput": 4292.14, "total_tokens": 104954352} +{"current_steps": 86520, "total_steps": 89790, "loss": 0.4575, "lr": 2.0185735612428536e-07, "epoch": 9.635816906114266, "percentage": 96.36, "elapsed_time": "6:47:34", "remaining_time": "0:15:24", "throughput": 4292.16, "total_tokens": 104960432} +{"current_steps": 86525, "total_steps": 89790, "loss": 0.4526, "lr": 2.012415443424176e-07, "epoch": 9.636373760997884, "percentage": 96.36, "elapsed_time": "6:47:35", "remaining_time": "0:15:22", "throughput": 4292.18, "total_tokens": 104966160} +{"current_steps": 86530, "total_steps": 89790, "loss": 0.4504, "lr": 2.0062666953711561e-07, "epoch": 9.636930615881502, "percentage": 96.37, "elapsed_time": "6:47:36", "remaining_time": "0:15:21", "throughput": 4292.2, "total_tokens": 104972208} +{"current_steps": 86535, "total_steps": 89790, "loss": 0.453, "lr": 2.0001273173161085e-07, "epoch": 9.63748747076512, "percentage": 96.37, "elapsed_time": "6:47:37", "remaining_time": "0:15:19", "throughput": 4292.22, "total_tokens": 104978128} +{"current_steps": 86540, "total_steps": 89790, "loss": 0.4661, "lr": 1.9939973094910137e-07, "epoch": 9.638044325648735, "percentage": 96.38, "elapsed_time": "6:47:39", "remaining_time": "0:15:18", "throughput": 4292.25, "total_tokens": 104984432} +{"current_steps": 86545, "total_steps": 89790, "loss": 0.4584, "lr": 1.9878766721274922e-07, "epoch": 9.638601180532353, "percentage": 96.39, "elapsed_time": "6:47:40", "remaining_time": "0:15:17", "throughput": 4292.27, "total_tokens": 104990928} +{"current_steps": 86550, "total_steps": 89790, "loss": 0.473, "lr": 1.981765405456776e-07, "epoch": 9.63915803541597, "percentage": 96.39, "elapsed_time": "6:47:41", "remaining_time": "0:15:15", "throughput": 4292.29, "total_tokens": 104997072} +{"current_steps": 86555, "total_steps": 89790, "loss": 0.4493, "lr": 1.9756635097097632e-07, "epoch": 9.639714890299588, "percentage": 96.4, "elapsed_time": "6:47:42", "remaining_time": "0:15:14", "throughput": 4292.31, "total_tokens": 105002704} +{"current_steps": 86560, "total_steps": 89790, "loss": 0.4615, "lr": 1.9695709851170197e-07, "epoch": 9.640271745183206, "percentage": 96.4, "elapsed_time": "6:47:44", "remaining_time": "0:15:12", "throughput": 4292.33, "total_tokens": 105008816} +{"current_steps": 86565, "total_steps": 89790, "loss": 0.4617, "lr": 1.9634878319087224e-07, "epoch": 9.640828600066822, "percentage": 96.41, "elapsed_time": "6:47:45", "remaining_time": "0:15:11", "throughput": 4292.36, "total_tokens": 105015312} +{"current_steps": 86570, "total_steps": 89790, "loss": 0.4562, "lr": 1.9574140503147709e-07, "epoch": 9.64138545495044, "percentage": 96.41, "elapsed_time": "6:47:46", "remaining_time": "0:15:10", "throughput": 4292.38, "total_tokens": 105021392} +{"current_steps": 86575, "total_steps": 89790, "loss": 0.4578, "lr": 1.9513496405645647e-07, "epoch": 9.641942309834057, "percentage": 96.42, "elapsed_time": "6:47:48", "remaining_time": "0:15:08", "throughput": 4292.4, "total_tokens": 105027440} +{"current_steps": 86580, "total_steps": 89790, "loss": 0.4623, "lr": 1.94529460288731e-07, "epoch": 9.642499164717675, "percentage": 96.42, "elapsed_time": "6:47:49", "remaining_time": "0:15:07", "throughput": 4292.43, "total_tokens": 105033840} +{"current_steps": 86585, "total_steps": 89790, "loss": 0.4677, "lr": 1.9392489375117396e-07, "epoch": 9.643056019601293, "percentage": 96.43, "elapsed_time": "6:47:50", "remaining_time": "0:15:05", "throughput": 4292.45, "total_tokens": 105039984} +{"current_steps": 86590, "total_steps": 89790, "loss": 0.4523, "lr": 1.9332126446663103e-07, "epoch": 9.643612874484909, "percentage": 96.44, "elapsed_time": "6:47:52", "remaining_time": "0:15:04", "throughput": 4292.47, "total_tokens": 105046480} +{"current_steps": 86595, "total_steps": 89790, "loss": 0.4586, "lr": 1.9271857245790337e-07, "epoch": 9.644169729368526, "percentage": 96.44, "elapsed_time": "6:47:53", "remaining_time": "0:15:02", "throughput": 4292.49, "total_tokens": 105052400} +{"current_steps": 86600, "total_steps": 89790, "loss": 0.4689, "lr": 1.9211681774777003e-07, "epoch": 9.644726584252144, "percentage": 96.45, "elapsed_time": "6:47:54", "remaining_time": "0:15:01", "throughput": 4292.52, "total_tokens": 105058448} +{"current_steps": 86605, "total_steps": 89790, "loss": 0.4532, "lr": 1.9151600035896555e-07, "epoch": 9.645283439135762, "percentage": 96.45, "elapsed_time": "6:47:56", "remaining_time": "0:15:00", "throughput": 4292.54, "total_tokens": 105064624} +{"current_steps": 86610, "total_steps": 89790, "loss": 0.4686, "lr": 1.9091612031418572e-07, "epoch": 9.64584029401938, "percentage": 96.46, "elapsed_time": "6:47:57", "remaining_time": "0:14:58", "throughput": 4292.56, "total_tokens": 105070864} +{"current_steps": 86615, "total_steps": 89790, "loss": 0.4585, "lr": 1.9031717763610123e-07, "epoch": 9.646397148902995, "percentage": 96.46, "elapsed_time": "6:47:58", "remaining_time": "0:14:57", "throughput": 4292.59, "total_tokens": 105076912} +{"current_steps": 86620, "total_steps": 89790, "loss": 0.4539, "lr": 1.8971917234734126e-07, "epoch": 9.646954003786613, "percentage": 96.47, "elapsed_time": "6:48:00", "remaining_time": "0:14:55", "throughput": 4292.61, "total_tokens": 105083280} +{"current_steps": 86625, "total_steps": 89790, "loss": 0.4823, "lr": 1.8912210447049882e-07, "epoch": 9.64751085867023, "percentage": 96.48, "elapsed_time": "6:48:01", "remaining_time": "0:14:54", "throughput": 4292.63, "total_tokens": 105088784} +{"current_steps": 86630, "total_steps": 89790, "loss": 0.468, "lr": 1.8852597402813366e-07, "epoch": 9.648067713553848, "percentage": 96.48, "elapsed_time": "6:48:02", "remaining_time": "0:14:53", "throughput": 4292.66, "total_tokens": 105095536} +{"current_steps": 86635, "total_steps": 89790, "loss": 0.4593, "lr": 1.8793078104276663e-07, "epoch": 9.648624568437466, "percentage": 96.49, "elapsed_time": "6:48:03", "remaining_time": "0:14:51", "throughput": 4292.69, "total_tokens": 105101968} +{"current_steps": 86640, "total_steps": 89790, "loss": 0.4695, "lr": 1.8733652553689364e-07, "epoch": 9.649181423321082, "percentage": 96.49, "elapsed_time": "6:48:05", "remaining_time": "0:14:50", "throughput": 4292.71, "total_tokens": 105108336} +{"current_steps": 86645, "total_steps": 89790, "loss": 0.4547, "lr": 1.867432075329606e-07, "epoch": 9.6497382782047, "percentage": 96.5, "elapsed_time": "6:48:06", "remaining_time": "0:14:48", "throughput": 4292.73, "total_tokens": 105113936} +{"current_steps": 86650, "total_steps": 89790, "loss": 0.4651, "lr": 1.8615082705338573e-07, "epoch": 9.650295133088317, "percentage": 96.5, "elapsed_time": "6:48:07", "remaining_time": "0:14:47", "throughput": 4292.75, "total_tokens": 105119888} +{"current_steps": 86655, "total_steps": 89790, "loss": 0.4591, "lr": 1.8555938412055385e-07, "epoch": 9.650851987971935, "percentage": 96.51, "elapsed_time": "6:48:09", "remaining_time": "0:14:45", "throughput": 4292.77, "total_tokens": 105126064} +{"current_steps": 86660, "total_steps": 89790, "loss": 0.4588, "lr": 1.8496887875681102e-07, "epoch": 9.651408842855552, "percentage": 96.51, "elapsed_time": "6:48:10", "remaining_time": "0:14:44", "throughput": 4292.79, "total_tokens": 105132336} +{"current_steps": 86665, "total_steps": 89790, "loss": 0.4646, "lr": 1.8437931098446714e-07, "epoch": 9.651965697739168, "percentage": 96.52, "elapsed_time": "6:48:11", "remaining_time": "0:14:43", "throughput": 4292.82, "total_tokens": 105138544} +{"current_steps": 86670, "total_steps": 89790, "loss": 0.4539, "lr": 1.837906808257961e-07, "epoch": 9.652522552622786, "percentage": 96.53, "elapsed_time": "6:48:13", "remaining_time": "0:14:41", "throughput": 4292.84, "total_tokens": 105144528} +{"current_steps": 86675, "total_steps": 89790, "loss": 0.4627, "lr": 1.8320298830304394e-07, "epoch": 9.653079407506404, "percentage": 96.53, "elapsed_time": "6:48:14", "remaining_time": "0:14:40", "throughput": 4292.86, "total_tokens": 105150704} +{"current_steps": 86680, "total_steps": 89790, "loss": 0.4609, "lr": 1.826162334384096e-07, "epoch": 9.653636262390021, "percentage": 96.54, "elapsed_time": "6:48:15", "remaining_time": "0:14:38", "throughput": 4292.89, "total_tokens": 105156752} +{"current_steps": 86685, "total_steps": 89790, "loss": 0.4706, "lr": 1.820304162540698e-07, "epoch": 9.654193117273639, "percentage": 96.54, "elapsed_time": "6:48:16", "remaining_time": "0:14:37", "throughput": 4292.91, "total_tokens": 105163088} +{"current_steps": 86690, "total_steps": 89790, "loss": 0.4561, "lr": 1.814455367721485e-07, "epoch": 9.654749972157255, "percentage": 96.55, "elapsed_time": "6:48:18", "remaining_time": "0:14:36", "throughput": 4292.93, "total_tokens": 105169136} +{"current_steps": 86695, "total_steps": 89790, "loss": 0.4547, "lr": 1.8086159501475297e-07, "epoch": 9.655306827040873, "percentage": 96.55, "elapsed_time": "6:48:19", "remaining_time": "0:14:34", "throughput": 4292.95, "total_tokens": 105174480} +{"current_steps": 86700, "total_steps": 89790, "loss": 0.4663, "lr": 1.8027859100394063e-07, "epoch": 9.65586368192449, "percentage": 96.56, "elapsed_time": "6:48:20", "remaining_time": "0:14:33", "throughput": 4292.98, "total_tokens": 105180912} +{"current_steps": 86705, "total_steps": 89790, "loss": 0.4757, "lr": 1.7969652476174381e-07, "epoch": 9.656420536808108, "percentage": 96.56, "elapsed_time": "6:48:21", "remaining_time": "0:14:31", "throughput": 4293.0, "total_tokens": 105186928} +{"current_steps": 86710, "total_steps": 89790, "loss": 0.4548, "lr": 1.7911539631015327e-07, "epoch": 9.656977391691726, "percentage": 96.57, "elapsed_time": "6:48:23", "remaining_time": "0:14:30", "throughput": 4293.02, "total_tokens": 105193104} +{"current_steps": 86715, "total_steps": 89790, "loss": 0.4559, "lr": 1.785352056711237e-07, "epoch": 9.657534246575342, "percentage": 96.58, "elapsed_time": "6:48:24", "remaining_time": "0:14:28", "throughput": 4293.05, "total_tokens": 105199344} +{"current_steps": 86720, "total_steps": 89790, "loss": 0.4526, "lr": 1.7795595286657918e-07, "epoch": 9.65809110145896, "percentage": 96.58, "elapsed_time": "6:48:25", "remaining_time": "0:14:27", "throughput": 4293.07, "total_tokens": 105205424} +{"current_steps": 86725, "total_steps": 89790, "loss": 0.459, "lr": 1.77377637918405e-07, "epoch": 9.658647956342577, "percentage": 96.59, "elapsed_time": "6:48:27", "remaining_time": "0:14:26", "throughput": 4293.09, "total_tokens": 105211920} +{"current_steps": 86730, "total_steps": 89790, "loss": 0.4622, "lr": 1.7680026084845036e-07, "epoch": 9.659204811226195, "percentage": 96.59, "elapsed_time": "6:48:28", "remaining_time": "0:14:24", "throughput": 4293.12, "total_tokens": 105217840} +{"current_steps": 86735, "total_steps": 89790, "loss": 0.4776, "lr": 1.7622382167853392e-07, "epoch": 9.659761666109812, "percentage": 96.6, "elapsed_time": "6:48:29", "remaining_time": "0:14:23", "throughput": 4293.14, "total_tokens": 105224208} +{"current_steps": 86740, "total_steps": 89790, "loss": 0.4563, "lr": 1.7564832043043266e-07, "epoch": 9.66031852099343, "percentage": 96.6, "elapsed_time": "6:48:31", "remaining_time": "0:14:21", "throughput": 4293.17, "total_tokens": 105230416} +{"current_steps": 86745, "total_steps": 89790, "loss": 0.4609, "lr": 1.7507375712589037e-07, "epoch": 9.660875375877046, "percentage": 96.61, "elapsed_time": "6:48:32", "remaining_time": "0:14:20", "throughput": 4293.19, "total_tokens": 105236272} +{"current_steps": 86750, "total_steps": 89790, "loss": 0.453, "lr": 1.745001317866174e-07, "epoch": 9.661432230760663, "percentage": 96.61, "elapsed_time": "6:48:33", "remaining_time": "0:14:19", "throughput": 4293.21, "total_tokens": 105242416} +{"current_steps": 86755, "total_steps": 89790, "loss": 0.4517, "lr": 1.739274444342881e-07, "epoch": 9.661989085644281, "percentage": 96.62, "elapsed_time": "6:48:35", "remaining_time": "0:14:17", "throughput": 4293.23, "total_tokens": 105248720} +{"current_steps": 86760, "total_steps": 89790, "loss": 0.4553, "lr": 1.7335569509053796e-07, "epoch": 9.662545940527899, "percentage": 96.63, "elapsed_time": "6:48:36", "remaining_time": "0:14:16", "throughput": 4293.25, "total_tokens": 105254640} +{"current_steps": 86765, "total_steps": 89790, "loss": 0.461, "lr": 1.727848837769691e-07, "epoch": 9.663102795411517, "percentage": 96.63, "elapsed_time": "6:48:37", "remaining_time": "0:14:14", "throughput": 4293.27, "total_tokens": 105260848} +{"current_steps": 86770, "total_steps": 89790, "loss": 0.4699, "lr": 1.722150105151532e-07, "epoch": 9.663659650295132, "percentage": 96.64, "elapsed_time": "6:48:38", "remaining_time": "0:14:13", "throughput": 4293.3, "total_tokens": 105267152} +{"current_steps": 86775, "total_steps": 89790, "loss": 0.4656, "lr": 1.716460753266147e-07, "epoch": 9.66421650517875, "percentage": 96.64, "elapsed_time": "6:48:40", "remaining_time": "0:14:11", "throughput": 4293.32, "total_tokens": 105273552} +{"current_steps": 86780, "total_steps": 89790, "loss": 0.4699, "lr": 1.710780782328586e-07, "epoch": 9.664773360062368, "percentage": 96.65, "elapsed_time": "6:48:41", "remaining_time": "0:14:10", "throughput": 4293.35, "total_tokens": 105279440} +{"current_steps": 86785, "total_steps": 89790, "loss": 0.4765, "lr": 1.7051101925533718e-07, "epoch": 9.665330214945985, "percentage": 96.65, "elapsed_time": "6:48:42", "remaining_time": "0:14:09", "throughput": 4293.37, "total_tokens": 105285648} +{"current_steps": 86790, "total_steps": 89790, "loss": 0.4765, "lr": 1.699448984154778e-07, "epoch": 9.665887069829603, "percentage": 96.66, "elapsed_time": "6:48:44", "remaining_time": "0:14:07", "throughput": 4293.39, "total_tokens": 105291824} +{"current_steps": 86795, "total_steps": 89790, "loss": 0.4541, "lr": 1.6937971573467715e-07, "epoch": 9.666443924713219, "percentage": 96.66, "elapsed_time": "6:48:45", "remaining_time": "0:14:06", "throughput": 4293.42, "total_tokens": 105298224} +{"current_steps": 86800, "total_steps": 89790, "loss": 0.4603, "lr": 1.688154712342821e-07, "epoch": 9.667000779596837, "percentage": 96.67, "elapsed_time": "6:48:46", "remaining_time": "0:14:04", "throughput": 4293.44, "total_tokens": 105303312} +{"current_steps": 86805, "total_steps": 89790, "loss": 0.455, "lr": 1.6825216493561446e-07, "epoch": 9.667557634480454, "percentage": 96.68, "elapsed_time": "6:48:47", "remaining_time": "0:14:03", "throughput": 4293.46, "total_tokens": 105309264} +{"current_steps": 86810, "total_steps": 89790, "loss": 0.4569, "lr": 1.6768979685995445e-07, "epoch": 9.668114489364072, "percentage": 96.68, "elapsed_time": "6:48:49", "remaining_time": "0:14:02", "throughput": 4293.47, "total_tokens": 105315280} +{"current_steps": 86815, "total_steps": 89790, "loss": 0.4522, "lr": 1.6712836702855729e-07, "epoch": 9.66867134424769, "percentage": 96.69, "elapsed_time": "6:48:50", "remaining_time": "0:14:00", "throughput": 4293.5, "total_tokens": 105321776} +{"current_steps": 86820, "total_steps": 89790, "loss": 0.4627, "lr": 1.665678754626282e-07, "epoch": 9.669228199131306, "percentage": 96.69, "elapsed_time": "6:48:51", "remaining_time": "0:13:59", "throughput": 4293.52, "total_tokens": 105327728} +{"current_steps": 86825, "total_steps": 89790, "loss": 0.453, "lr": 1.660083221833475e-07, "epoch": 9.669785054014923, "percentage": 96.7, "elapsed_time": "6:48:53", "remaining_time": "0:13:57", "throughput": 4293.55, "total_tokens": 105334128} +{"current_steps": 86830, "total_steps": 89790, "loss": 0.4523, "lr": 1.6544970721185936e-07, "epoch": 9.670341908898541, "percentage": 96.7, "elapsed_time": "6:48:54", "remaining_time": "0:13:56", "throughput": 4293.57, "total_tokens": 105340368} +{"current_steps": 86835, "total_steps": 89790, "loss": 0.4743, "lr": 1.648920305692636e-07, "epoch": 9.670898763782159, "percentage": 96.71, "elapsed_time": "6:48:55", "remaining_time": "0:13:54", "throughput": 4293.59, "total_tokens": 105346416} +{"current_steps": 86840, "total_steps": 89790, "loss": 0.4535, "lr": 1.643352922766378e-07, "epoch": 9.671455618665776, "percentage": 96.71, "elapsed_time": "6:48:56", "remaining_time": "0:13:53", "throughput": 4293.62, "total_tokens": 105352432} +{"current_steps": 86845, "total_steps": 89790, "loss": 0.4603, "lr": 1.637794923550151e-07, "epoch": 9.672012473549392, "percentage": 96.72, "elapsed_time": "6:48:58", "remaining_time": "0:13:52", "throughput": 4293.64, "total_tokens": 105358800} +{"current_steps": 86850, "total_steps": 89790, "loss": 0.4642, "lr": 1.6322463082539262e-07, "epoch": 9.67256932843301, "percentage": 96.73, "elapsed_time": "6:48:59", "remaining_time": "0:13:50", "throughput": 4293.66, "total_tokens": 105364816} +{"current_steps": 86855, "total_steps": 89790, "loss": 0.4747, "lr": 1.6267070770873971e-07, "epoch": 9.673126183316628, "percentage": 96.73, "elapsed_time": "6:49:00", "remaining_time": "0:13:49", "throughput": 4293.69, "total_tokens": 105371280} +{"current_steps": 86860, "total_steps": 89790, "loss": 0.4677, "lr": 1.621177230259785e-07, "epoch": 9.673683038200245, "percentage": 96.74, "elapsed_time": "6:49:02", "remaining_time": "0:13:47", "throughput": 4293.71, "total_tokens": 105377456} +{"current_steps": 86865, "total_steps": 89790, "loss": 0.4469, "lr": 1.6156567679800893e-07, "epoch": 9.674239893083863, "percentage": 96.74, "elapsed_time": "6:49:03", "remaining_time": "0:13:46", "throughput": 4293.74, "total_tokens": 105383824} +{"current_steps": 86870, "total_steps": 89790, "loss": 0.4693, "lr": 1.6101456904568656e-07, "epoch": 9.67479674796748, "percentage": 96.75, "elapsed_time": "6:49:04", "remaining_time": "0:13:45", "throughput": 4293.76, "total_tokens": 105389680} +{"current_steps": 86875, "total_steps": 89790, "loss": 0.4559, "lr": 1.604643997898364e-07, "epoch": 9.675353602851096, "percentage": 96.75, "elapsed_time": "6:49:06", "remaining_time": "0:13:43", "throughput": 4293.78, "total_tokens": 105396080} +{"current_steps": 86880, "total_steps": 89790, "loss": 0.4637, "lr": 1.5991516905124183e-07, "epoch": 9.675910457734714, "percentage": 96.76, "elapsed_time": "6:49:07", "remaining_time": "0:13:42", "throughput": 4293.8, "total_tokens": 105402128} +{"current_steps": 86885, "total_steps": 89790, "loss": 0.4558, "lr": 1.5936687685065565e-07, "epoch": 9.676467312618332, "percentage": 96.76, "elapsed_time": "6:49:08", "remaining_time": "0:13:40", "throughput": 4293.83, "total_tokens": 105408560} +{"current_steps": 86890, "total_steps": 89790, "loss": 0.446, "lr": 1.5881952320879469e-07, "epoch": 9.67702416750195, "percentage": 96.77, "elapsed_time": "6:49:10", "remaining_time": "0:13:39", "throughput": 4293.85, "total_tokens": 105415024} +{"current_steps": 86895, "total_steps": 89790, "loss": 0.464, "lr": 1.5827310814633955e-07, "epoch": 9.677581022385567, "percentage": 96.78, "elapsed_time": "6:49:11", "remaining_time": "0:13:37", "throughput": 4293.88, "total_tokens": 105421168} +{"current_steps": 86900, "total_steps": 89790, "loss": 0.4506, "lr": 1.577276316839349e-07, "epoch": 9.678137877269183, "percentage": 96.78, "elapsed_time": "6:49:12", "remaining_time": "0:13:36", "throughput": 4293.9, "total_tokens": 105427376} +{"current_steps": 86905, "total_steps": 89790, "loss": 0.4721, "lr": 1.5718309384219197e-07, "epoch": 9.6786947321528, "percentage": 96.79, "elapsed_time": "6:49:14", "remaining_time": "0:13:35", "throughput": 4293.92, "total_tokens": 105433392} +{"current_steps": 86910, "total_steps": 89790, "loss": 0.4681, "lr": 1.5663949464168325e-07, "epoch": 9.679251587036418, "percentage": 96.79, "elapsed_time": "6:49:15", "remaining_time": "0:13:33", "throughput": 4293.95, "total_tokens": 105439344} +{"current_steps": 86915, "total_steps": 89790, "loss": 0.465, "lr": 1.560968341029506e-07, "epoch": 9.679808441920036, "percentage": 96.8, "elapsed_time": "6:49:16", "remaining_time": "0:13:32", "throughput": 4293.97, "total_tokens": 105445520} +{"current_steps": 86920, "total_steps": 89790, "loss": 0.4646, "lr": 1.5555511224649432e-07, "epoch": 9.680365296803654, "percentage": 96.8, "elapsed_time": "6:49:17", "remaining_time": "0:13:30", "throughput": 4293.99, "total_tokens": 105451472} +{"current_steps": 86925, "total_steps": 89790, "loss": 0.4577, "lr": 1.550143290927869e-07, "epoch": 9.68092215168727, "percentage": 96.81, "elapsed_time": "6:49:19", "remaining_time": "0:13:29", "throughput": 4294.01, "total_tokens": 105457584} +{"current_steps": 86930, "total_steps": 89790, "loss": 0.4659, "lr": 1.5447448466225368e-07, "epoch": 9.681479006570887, "percentage": 96.81, "elapsed_time": "6:49:20", "remaining_time": "0:13:28", "throughput": 4294.04, "total_tokens": 105463664} +{"current_steps": 86935, "total_steps": 89790, "loss": 0.4657, "lr": 1.5393557897529776e-07, "epoch": 9.682035861454505, "percentage": 96.82, "elapsed_time": "6:49:21", "remaining_time": "0:13:26", "throughput": 4294.06, "total_tokens": 105469872} +{"current_steps": 86940, "total_steps": 89790, "loss": 0.4577, "lr": 1.5339761205228065e-07, "epoch": 9.682592716338123, "percentage": 96.83, "elapsed_time": "6:49:23", "remaining_time": "0:13:25", "throughput": 4294.08, "total_tokens": 105476080} +{"current_steps": 86945, "total_steps": 89790, "loss": 0.4658, "lr": 1.528605839135222e-07, "epoch": 9.68314957122174, "percentage": 96.83, "elapsed_time": "6:49:24", "remaining_time": "0:13:23", "throughput": 4294.1, "total_tokens": 105481968} +{"current_steps": 86950, "total_steps": 89790, "loss": 0.4531, "lr": 1.5232449457932286e-07, "epoch": 9.683706426105356, "percentage": 96.84, "elapsed_time": "6:49:25", "remaining_time": "0:13:22", "throughput": 4294.12, "total_tokens": 105488144} +{"current_steps": 86955, "total_steps": 89790, "loss": 0.468, "lr": 1.517893440699275e-07, "epoch": 9.684263280988974, "percentage": 96.84, "elapsed_time": "6:49:26", "remaining_time": "0:13:20", "throughput": 4294.14, "total_tokens": 105493680} +{"current_steps": 86960, "total_steps": 89790, "loss": 0.4573, "lr": 1.5125513240556445e-07, "epoch": 9.684820135872592, "percentage": 96.85, "elapsed_time": "6:49:28", "remaining_time": "0:13:19", "throughput": 4294.16, "total_tokens": 105499696} +{"current_steps": 86965, "total_steps": 89790, "loss": 0.4661, "lr": 1.5072185960641194e-07, "epoch": 9.68537699075621, "percentage": 96.85, "elapsed_time": "6:49:29", "remaining_time": "0:13:18", "throughput": 4294.18, "total_tokens": 105505712} +{"current_steps": 86970, "total_steps": 89790, "loss": 0.4423, "lr": 1.5018952569262058e-07, "epoch": 9.685933845639827, "percentage": 96.86, "elapsed_time": "6:49:30", "remaining_time": "0:13:16", "throughput": 4294.21, "total_tokens": 105512048} +{"current_steps": 86975, "total_steps": 89790, "loss": 0.4573, "lr": 1.4965813068430479e-07, "epoch": 9.686490700523443, "percentage": 96.86, "elapsed_time": "6:49:32", "remaining_time": "0:13:15", "throughput": 4294.23, "total_tokens": 105518096} +{"current_steps": 86980, "total_steps": 89790, "loss": 0.4569, "lr": 1.4912767460154297e-07, "epoch": 9.68704755540706, "percentage": 96.87, "elapsed_time": "6:49:33", "remaining_time": "0:13:13", "throughput": 4294.25, "total_tokens": 105524144} +{"current_steps": 86985, "total_steps": 89790, "loss": 0.4627, "lr": 1.4859815746437467e-07, "epoch": 9.687604410290678, "percentage": 96.88, "elapsed_time": "6:49:34", "remaining_time": "0:13:12", "throughput": 4294.27, "total_tokens": 105530448} +{"current_steps": 86990, "total_steps": 89790, "loss": 0.4652, "lr": 1.4806957929280884e-07, "epoch": 9.688161265174296, "percentage": 96.88, "elapsed_time": "6:49:35", "remaining_time": "0:13:11", "throughput": 4294.3, "total_tokens": 105536368} +{"current_steps": 86995, "total_steps": 89790, "loss": 0.4488, "lr": 1.4754194010681565e-07, "epoch": 9.688718120057914, "percentage": 96.89, "elapsed_time": "6:49:37", "remaining_time": "0:13:09", "throughput": 4294.32, "total_tokens": 105542416} +{"current_steps": 87000, "total_steps": 89790, "loss": 0.4578, "lr": 1.4701523992633192e-07, "epoch": 9.68927497494153, "percentage": 96.89, "elapsed_time": "6:49:38", "remaining_time": "0:13:08", "throughput": 4294.34, "total_tokens": 105548464} +{"current_steps": 87005, "total_steps": 89790, "loss": 0.4515, "lr": 1.464894787712584e-07, "epoch": 9.689831829825147, "percentage": 96.9, "elapsed_time": "6:49:39", "remaining_time": "0:13:06", "throughput": 4294.36, "total_tokens": 105554544} +{"current_steps": 87010, "total_steps": 89790, "loss": 0.4599, "lr": 1.4596465666145975e-07, "epoch": 9.690388684708765, "percentage": 96.9, "elapsed_time": "6:49:41", "remaining_time": "0:13:05", "throughput": 4294.38, "total_tokens": 105560464} +{"current_steps": 87015, "total_steps": 89790, "loss": 0.4574, "lr": 1.4544077361676178e-07, "epoch": 9.690945539592382, "percentage": 96.91, "elapsed_time": "6:49:42", "remaining_time": "0:13:03", "throughput": 4294.4, "total_tokens": 105566608} +{"current_steps": 87020, "total_steps": 89790, "loss": 0.4672, "lr": 1.449178296569653e-07, "epoch": 9.691502394476, "percentage": 96.92, "elapsed_time": "6:49:43", "remaining_time": "0:13:02", "throughput": 4294.42, "total_tokens": 105572336} +{"current_steps": 87025, "total_steps": 89790, "loss": 0.462, "lr": 1.44395824801824e-07, "epoch": 9.692059249359616, "percentage": 96.92, "elapsed_time": "6:49:44", "remaining_time": "0:13:01", "throughput": 4294.44, "total_tokens": 105578480} +{"current_steps": 87030, "total_steps": 89790, "loss": 0.4634, "lr": 1.4387475907106096e-07, "epoch": 9.692616104243234, "percentage": 96.93, "elapsed_time": "6:49:46", "remaining_time": "0:12:59", "throughput": 4294.46, "total_tokens": 105584496} +{"current_steps": 87035, "total_steps": 89790, "loss": 0.4564, "lr": 1.43354632484366e-07, "epoch": 9.693172959126851, "percentage": 96.93, "elapsed_time": "6:49:47", "remaining_time": "0:12:58", "throughput": 4294.48, "total_tokens": 105590256} +{"current_steps": 87040, "total_steps": 89790, "loss": 0.4677, "lr": 1.4283544506139e-07, "epoch": 9.693729814010469, "percentage": 96.94, "elapsed_time": "6:49:48", "remaining_time": "0:12:56", "throughput": 4294.5, "total_tokens": 105596272} +{"current_steps": 87045, "total_steps": 89790, "loss": 0.4535, "lr": 1.4231719682175072e-07, "epoch": 9.694286668894087, "percentage": 96.94, "elapsed_time": "6:49:50", "remaining_time": "0:12:55", "throughput": 4294.53, "total_tokens": 105602416} +{"current_steps": 87050, "total_steps": 89790, "loss": 0.4588, "lr": 1.4179988778502685e-07, "epoch": 9.694843523777703, "percentage": 96.95, "elapsed_time": "6:49:51", "remaining_time": "0:12:54", "throughput": 4294.55, "total_tokens": 105608112} +{"current_steps": 87055, "total_steps": 89790, "loss": 0.4582, "lr": 1.412835179707639e-07, "epoch": 9.69540037866132, "percentage": 96.95, "elapsed_time": "6:49:52", "remaining_time": "0:12:52", "throughput": 4294.57, "total_tokens": 105614224} +{"current_steps": 87060, "total_steps": 89790, "loss": 0.4697, "lr": 1.4076808739847403e-07, "epoch": 9.695957233544938, "percentage": 96.96, "elapsed_time": "6:49:53", "remaining_time": "0:12:51", "throughput": 4294.59, "total_tokens": 105620208} +{"current_steps": 87065, "total_steps": 89790, "loss": 0.4635, "lr": 1.4025359608763334e-07, "epoch": 9.696514088428556, "percentage": 96.97, "elapsed_time": "6:49:55", "remaining_time": "0:12:49", "throughput": 4294.61, "total_tokens": 105626352} +{"current_steps": 87070, "total_steps": 89790, "loss": 0.4545, "lr": 1.3974004405767628e-07, "epoch": 9.697070943312173, "percentage": 96.97, "elapsed_time": "6:49:56", "remaining_time": "0:12:48", "throughput": 4294.63, "total_tokens": 105631984} +{"current_steps": 87075, "total_steps": 89790, "loss": 0.4556, "lr": 1.3922743132800952e-07, "epoch": 9.69762779819579, "percentage": 96.98, "elapsed_time": "6:49:57", "remaining_time": "0:12:46", "throughput": 4294.66, "total_tokens": 105638192} +{"current_steps": 87080, "total_steps": 89790, "loss": 0.4561, "lr": 1.3871575791800372e-07, "epoch": 9.698184653079407, "percentage": 96.98, "elapsed_time": "6:49:58", "remaining_time": "0:12:45", "throughput": 4294.68, "total_tokens": 105644176} +{"current_steps": 87085, "total_steps": 89790, "loss": 0.464, "lr": 1.3820502384698508e-07, "epoch": 9.698741507963025, "percentage": 96.99, "elapsed_time": "6:50:00", "remaining_time": "0:12:44", "throughput": 4294.7, "total_tokens": 105650448} +{"current_steps": 87090, "total_steps": 89790, "loss": 0.4596, "lr": 1.376952291342548e-07, "epoch": 9.699298362846642, "percentage": 96.99, "elapsed_time": "6:50:01", "remaining_time": "0:12:42", "throughput": 4294.72, "total_tokens": 105656016} +{"current_steps": 87095, "total_steps": 89790, "loss": 0.4447, "lr": 1.371863737990725e-07, "epoch": 9.69985521773026, "percentage": 97.0, "elapsed_time": "6:50:02", "remaining_time": "0:12:41", "throughput": 4294.74, "total_tokens": 105662160} +{"current_steps": 87100, "total_steps": 89790, "loss": 0.4603, "lr": 1.3667845786066723e-07, "epoch": 9.700412072613878, "percentage": 97.0, "elapsed_time": "6:50:03", "remaining_time": "0:12:39", "throughput": 4294.76, "total_tokens": 105668272} +{"current_steps": 87105, "total_steps": 89790, "loss": 0.4605, "lr": 1.361714813382292e-07, "epoch": 9.700968927497494, "percentage": 97.01, "elapsed_time": "6:50:05", "remaining_time": "0:12:38", "throughput": 4294.78, "total_tokens": 105674160} +{"current_steps": 87110, "total_steps": 89790, "loss": 0.466, "lr": 1.3566544425091253e-07, "epoch": 9.701525782381111, "percentage": 97.02, "elapsed_time": "6:50:06", "remaining_time": "0:12:37", "throughput": 4294.8, "total_tokens": 105679984} +{"current_steps": 87115, "total_steps": 89790, "loss": 0.459, "lr": 1.3516034661783527e-07, "epoch": 9.702082637264729, "percentage": 97.02, "elapsed_time": "6:50:07", "remaining_time": "0:12:35", "throughput": 4294.83, "total_tokens": 105686320} +{"current_steps": 87120, "total_steps": 89790, "loss": 0.4733, "lr": 1.3465618845808493e-07, "epoch": 9.702639492148347, "percentage": 97.03, "elapsed_time": "6:50:09", "remaining_time": "0:12:34", "throughput": 4294.85, "total_tokens": 105692592} +{"current_steps": 87125, "total_steps": 89790, "loss": 0.4385, "lr": 1.3415296979071012e-07, "epoch": 9.703196347031964, "percentage": 97.03, "elapsed_time": "6:50:10", "remaining_time": "0:12:32", "throughput": 4294.88, "total_tokens": 105698928} +{"current_steps": 87130, "total_steps": 89790, "loss": 0.4672, "lr": 1.336506906347207e-07, "epoch": 9.70375320191558, "percentage": 97.04, "elapsed_time": "6:50:11", "remaining_time": "0:12:31", "throughput": 4294.89, "total_tokens": 105704176} +{"current_steps": 87135, "total_steps": 89790, "loss": 0.4639, "lr": 1.3314935100909586e-07, "epoch": 9.704310056799198, "percentage": 97.04, "elapsed_time": "6:50:12", "remaining_time": "0:12:29", "throughput": 4294.92, "total_tokens": 105710512} +{"current_steps": 87140, "total_steps": 89790, "loss": 0.4676, "lr": 1.3264895093277885e-07, "epoch": 9.704866911682815, "percentage": 97.05, "elapsed_time": "6:50:14", "remaining_time": "0:12:28", "throughput": 4294.94, "total_tokens": 105716784} +{"current_steps": 87145, "total_steps": 89790, "loss": 0.464, "lr": 1.3214949042467395e-07, "epoch": 9.705423766566433, "percentage": 97.05, "elapsed_time": "6:50:15", "remaining_time": "0:12:27", "throughput": 4294.96, "total_tokens": 105722544} +{"current_steps": 87150, "total_steps": 89790, "loss": 0.4509, "lr": 1.3165096950365774e-07, "epoch": 9.70598062145005, "percentage": 97.06, "elapsed_time": "6:50:16", "remaining_time": "0:12:25", "throughput": 4294.98, "total_tokens": 105728752} +{"current_steps": 87155, "total_steps": 89790, "loss": 0.4641, "lr": 1.311533881885596e-07, "epoch": 9.706537476333667, "percentage": 97.07, "elapsed_time": "6:50:18", "remaining_time": "0:12:24", "throughput": 4295.0, "total_tokens": 105734640} +{"current_steps": 87160, "total_steps": 89790, "loss": 0.4612, "lr": 1.3065674649818395e-07, "epoch": 9.707094331217284, "percentage": 97.07, "elapsed_time": "6:50:19", "remaining_time": "0:12:22", "throughput": 4295.02, "total_tokens": 105740752} +{"current_steps": 87165, "total_steps": 89790, "loss": 0.472, "lr": 1.3016104445129351e-07, "epoch": 9.707651186100902, "percentage": 97.08, "elapsed_time": "6:50:20", "remaining_time": "0:12:21", "throughput": 4295.04, "total_tokens": 105746992} +{"current_steps": 87170, "total_steps": 89790, "loss": 0.4626, "lr": 1.296662820666178e-07, "epoch": 9.70820804098452, "percentage": 97.08, "elapsed_time": "6:50:21", "remaining_time": "0:12:20", "throughput": 4295.06, "total_tokens": 105752560} +{"current_steps": 87175, "total_steps": 89790, "loss": 0.4485, "lr": 1.2917245936285294e-07, "epoch": 9.708764895868137, "percentage": 97.09, "elapsed_time": "6:50:23", "remaining_time": "0:12:18", "throughput": 4295.08, "total_tokens": 105758800} +{"current_steps": 87180, "total_steps": 89790, "loss": 0.4577, "lr": 1.2867957635865345e-07, "epoch": 9.709321750751753, "percentage": 97.09, "elapsed_time": "6:50:24", "remaining_time": "0:12:17", "throughput": 4295.1, "total_tokens": 105764688} +{"current_steps": 87185, "total_steps": 89790, "loss": 0.462, "lr": 1.2818763307264337e-07, "epoch": 9.709878605635371, "percentage": 97.1, "elapsed_time": "6:50:25", "remaining_time": "0:12:15", "throughput": 4295.13, "total_tokens": 105770896} +{"current_steps": 87190, "total_steps": 89790, "loss": 0.4497, "lr": 1.2769662952341055e-07, "epoch": 9.710435460518989, "percentage": 97.1, "elapsed_time": "6:50:27", "remaining_time": "0:12:14", "throughput": 4295.15, "total_tokens": 105777072} +{"current_steps": 87195, "total_steps": 89790, "loss": 0.4589, "lr": 1.2720656572950685e-07, "epoch": 9.710992315402606, "percentage": 97.11, "elapsed_time": "6:50:28", "remaining_time": "0:12:12", "throughput": 4295.18, "total_tokens": 105783440} +{"current_steps": 87200, "total_steps": 89790, "loss": 0.4534, "lr": 1.26717441709448e-07, "epoch": 9.711549170286224, "percentage": 97.12, "elapsed_time": "6:50:29", "remaining_time": "0:12:11", "throughput": 4295.2, "total_tokens": 105789200} +{"current_steps": 87205, "total_steps": 89790, "loss": 0.4635, "lr": 1.2622925748171366e-07, "epoch": 9.712106025169842, "percentage": 97.12, "elapsed_time": "6:50:30", "remaining_time": "0:12:10", "throughput": 4295.22, "total_tokens": 105795248} +{"current_steps": 87210, "total_steps": 89790, "loss": 0.4663, "lr": 1.257420130647502e-07, "epoch": 9.712662880053458, "percentage": 97.13, "elapsed_time": "6:50:32", "remaining_time": "0:12:08", "throughput": 4295.23, "total_tokens": 105801104} +{"current_steps": 87215, "total_steps": 89790, "loss": 0.4545, "lr": 1.2525570847696787e-07, "epoch": 9.713219734937075, "percentage": 97.13, "elapsed_time": "6:50:33", "remaining_time": "0:12:07", "throughput": 4295.26, "total_tokens": 105807120} +{"current_steps": 87220, "total_steps": 89790, "loss": 0.4584, "lr": 1.2477034373673814e-07, "epoch": 9.713776589820693, "percentage": 97.14, "elapsed_time": "6:50:34", "remaining_time": "0:12:05", "throughput": 4295.28, "total_tokens": 105813104} +{"current_steps": 87225, "total_steps": 89790, "loss": 0.4591, "lr": 1.2428591886240183e-07, "epoch": 9.71433344470431, "percentage": 97.14, "elapsed_time": "6:50:36", "remaining_time": "0:12:04", "throughput": 4295.31, "total_tokens": 105819280} +{"current_steps": 87230, "total_steps": 89790, "loss": 0.4709, "lr": 1.2380243387226097e-07, "epoch": 9.714890299587928, "percentage": 97.15, "elapsed_time": "6:50:37", "remaining_time": "0:12:03", "throughput": 4295.33, "total_tokens": 105825296} +{"current_steps": 87235, "total_steps": 89790, "loss": 0.471, "lr": 1.2331988878458712e-07, "epoch": 9.715447154471544, "percentage": 97.15, "elapsed_time": "6:50:38", "remaining_time": "0:12:01", "throughput": 4295.35, "total_tokens": 105831120} +{"current_steps": 87240, "total_steps": 89790, "loss": 0.4637, "lr": 1.2283828361760452e-07, "epoch": 9.716004009355162, "percentage": 97.16, "elapsed_time": "6:50:39", "remaining_time": "0:12:00", "throughput": 4295.37, "total_tokens": 105837136} +{"current_steps": 87245, "total_steps": 89790, "loss": 0.467, "lr": 1.2235761838951809e-07, "epoch": 9.71656086423878, "percentage": 97.17, "elapsed_time": "6:50:41", "remaining_time": "0:11:58", "throughput": 4295.39, "total_tokens": 105843152} +{"current_steps": 87250, "total_steps": 89790, "loss": 0.4781, "lr": 1.2187789311848274e-07, "epoch": 9.717117719122397, "percentage": 97.17, "elapsed_time": "6:50:42", "remaining_time": "0:11:57", "throughput": 4295.42, "total_tokens": 105849136} +{"current_steps": 87255, "total_steps": 89790, "loss": 0.4597, "lr": 1.2139910782262842e-07, "epoch": 9.717674574006015, "percentage": 97.18, "elapsed_time": "6:50:43", "remaining_time": "0:11:55", "throughput": 4295.44, "total_tokens": 105855472} +{"current_steps": 87260, "total_steps": 89790, "loss": 0.466, "lr": 1.2092126252004342e-07, "epoch": 9.71823142888963, "percentage": 97.18, "elapsed_time": "6:50:44", "remaining_time": "0:11:54", "throughput": 4295.46, "total_tokens": 105860976} +{"current_steps": 87265, "total_steps": 89790, "loss": 0.4763, "lr": 1.2044435722878001e-07, "epoch": 9.718788283773248, "percentage": 97.19, "elapsed_time": "6:50:46", "remaining_time": "0:11:53", "throughput": 4295.48, "total_tokens": 105867280} +{"current_steps": 87270, "total_steps": 89790, "loss": 0.4594, "lr": 1.1996839196685983e-07, "epoch": 9.719345138656866, "percentage": 97.19, "elapsed_time": "6:50:47", "remaining_time": "0:11:51", "throughput": 4295.5, "total_tokens": 105872752} +{"current_steps": 87275, "total_steps": 89790, "loss": 0.4527, "lr": 1.1949336675226574e-07, "epoch": 9.719901993540484, "percentage": 97.2, "elapsed_time": "6:50:48", "remaining_time": "0:11:50", "throughput": 4295.52, "total_tokens": 105878704} +{"current_steps": 87280, "total_steps": 89790, "loss": 0.4633, "lr": 1.1901928160294729e-07, "epoch": 9.720458848424101, "percentage": 97.2, "elapsed_time": "6:50:49", "remaining_time": "0:11:48", "throughput": 4295.55, "total_tokens": 105885008} +{"current_steps": 87285, "total_steps": 89790, "loss": 0.4705, "lr": 1.1854613653681512e-07, "epoch": 9.721015703307717, "percentage": 97.21, "elapsed_time": "6:50:51", "remaining_time": "0:11:47", "throughput": 4295.56, "total_tokens": 105890512} +{"current_steps": 87290, "total_steps": 89790, "loss": 0.4668, "lr": 1.1807393157174384e-07, "epoch": 9.721572558191335, "percentage": 97.22, "elapsed_time": "6:50:52", "remaining_time": "0:11:46", "throughput": 4295.59, "total_tokens": 105896688} +{"current_steps": 87295, "total_steps": 89790, "loss": 0.4592, "lr": 1.1760266672558028e-07, "epoch": 9.722129413074953, "percentage": 97.22, "elapsed_time": "6:50:53", "remaining_time": "0:11:44", "throughput": 4295.61, "total_tokens": 105902512} +{"current_steps": 87300, "total_steps": 89790, "loss": 0.4497, "lr": 1.1713234201612689e-07, "epoch": 9.72268626795857, "percentage": 97.23, "elapsed_time": "6:50:54", "remaining_time": "0:11:43", "throughput": 4295.63, "total_tokens": 105908496} +{"current_steps": 87305, "total_steps": 89790, "loss": 0.4626, "lr": 1.1666295746115275e-07, "epoch": 9.723243122842188, "percentage": 97.23, "elapsed_time": "6:50:56", "remaining_time": "0:11:41", "throughput": 4295.65, "total_tokens": 105914576} +{"current_steps": 87310, "total_steps": 89790, "loss": 0.471, "lr": 1.1619451307839646e-07, "epoch": 9.723799977725804, "percentage": 97.24, "elapsed_time": "6:50:57", "remaining_time": "0:11:40", "throughput": 4295.68, "total_tokens": 105921072} +{"current_steps": 87315, "total_steps": 89790, "loss": 0.4557, "lr": 1.1572700888555499e-07, "epoch": 9.724356832609422, "percentage": 97.24, "elapsed_time": "6:50:58", "remaining_time": "0:11:38", "throughput": 4295.7, "total_tokens": 105927120} +{"current_steps": 87320, "total_steps": 89790, "loss": 0.4485, "lr": 1.1526044490029475e-07, "epoch": 9.72491368749304, "percentage": 97.25, "elapsed_time": "6:51:00", "remaining_time": "0:11:37", "throughput": 4295.72, "total_tokens": 105933200} +{"current_steps": 87325, "total_steps": 89790, "loss": 0.4548, "lr": 1.1479482114023777e-07, "epoch": 9.725470542376657, "percentage": 97.25, "elapsed_time": "6:51:01", "remaining_time": "0:11:36", "throughput": 4295.74, "total_tokens": 105939248} +{"current_steps": 87330, "total_steps": 89790, "loss": 0.4652, "lr": 1.1433013762298384e-07, "epoch": 9.726027397260275, "percentage": 97.26, "elapsed_time": "6:51:02", "remaining_time": "0:11:34", "throughput": 4295.77, "total_tokens": 105945296} +{"current_steps": 87335, "total_steps": 89790, "loss": 0.4713, "lr": 1.1386639436608836e-07, "epoch": 9.72658425214389, "percentage": 97.27, "elapsed_time": "6:51:03", "remaining_time": "0:11:33", "throughput": 4295.79, "total_tokens": 105951216} +{"current_steps": 87340, "total_steps": 89790, "loss": 0.4508, "lr": 1.1340359138707068e-07, "epoch": 9.727141107027508, "percentage": 97.27, "elapsed_time": "6:51:05", "remaining_time": "0:11:31", "throughput": 4295.81, "total_tokens": 105957392} +{"current_steps": 87345, "total_steps": 89790, "loss": 0.449, "lr": 1.1294172870341679e-07, "epoch": 9.727697961911126, "percentage": 97.28, "elapsed_time": "6:51:06", "remaining_time": "0:11:30", "throughput": 4295.83, "total_tokens": 105963504} +{"current_steps": 87350, "total_steps": 89790, "loss": 0.4597, "lr": 1.124808063325794e-07, "epoch": 9.728254816794744, "percentage": 97.28, "elapsed_time": "6:51:07", "remaining_time": "0:11:29", "throughput": 4295.85, "total_tokens": 105969296} +{"current_steps": 87355, "total_steps": 89790, "loss": 0.4635, "lr": 1.1202082429197513e-07, "epoch": 9.728811671678361, "percentage": 97.29, "elapsed_time": "6:51:09", "remaining_time": "0:11:27", "throughput": 4295.88, "total_tokens": 105975472} +{"current_steps": 87360, "total_steps": 89790, "loss": 0.4615, "lr": 1.1156178259898175e-07, "epoch": 9.729368526561977, "percentage": 97.29, "elapsed_time": "6:51:10", "remaining_time": "0:11:26", "throughput": 4295.9, "total_tokens": 105981520} +{"current_steps": 87365, "total_steps": 89790, "loss": 0.4701, "lr": 1.1110368127094095e-07, "epoch": 9.729925381445595, "percentage": 97.3, "elapsed_time": "6:51:11", "remaining_time": "0:11:24", "throughput": 4295.92, "total_tokens": 105987088} +{"current_steps": 87370, "total_steps": 89790, "loss": 0.4651, "lr": 1.1064652032516387e-07, "epoch": 9.730482236329212, "percentage": 97.3, "elapsed_time": "6:51:12", "remaining_time": "0:11:23", "throughput": 4295.94, "total_tokens": 105992944} +{"current_steps": 87375, "total_steps": 89790, "loss": 0.4712, "lr": 1.1019029977892281e-07, "epoch": 9.73103909121283, "percentage": 97.31, "elapsed_time": "6:51:14", "remaining_time": "0:11:21", "throughput": 4295.96, "total_tokens": 105998832} +{"current_steps": 87380, "total_steps": 89790, "loss": 0.4641, "lr": 1.0973501964945675e-07, "epoch": 9.731595946096448, "percentage": 97.32, "elapsed_time": "6:51:15", "remaining_time": "0:11:20", "throughput": 4295.98, "total_tokens": 106004976} +{"current_steps": 87385, "total_steps": 89790, "loss": 0.4634, "lr": 1.0928067995396585e-07, "epoch": 9.732152800980064, "percentage": 97.32, "elapsed_time": "6:51:16", "remaining_time": "0:11:19", "throughput": 4296.01, "total_tokens": 106010768} +{"current_steps": 87390, "total_steps": 89790, "loss": 0.4655, "lr": 1.088272807096169e-07, "epoch": 9.732709655863681, "percentage": 97.33, "elapsed_time": "6:51:17", "remaining_time": "0:11:17", "throughput": 4296.03, "total_tokens": 106017040} +{"current_steps": 87395, "total_steps": 89790, "loss": 0.4496, "lr": 1.0837482193354065e-07, "epoch": 9.733266510747299, "percentage": 97.33, "elapsed_time": "6:51:19", "remaining_time": "0:11:16", "throughput": 4296.05, "total_tokens": 106022576} +{"current_steps": 87400, "total_steps": 89790, "loss": 0.4602, "lr": 1.0792330364283454e-07, "epoch": 9.733823365630917, "percentage": 97.34, "elapsed_time": "6:51:20", "remaining_time": "0:11:14", "throughput": 4296.07, "total_tokens": 106028368} +{"current_steps": 87405, "total_steps": 89790, "loss": 0.4588, "lr": 1.0747272585455437e-07, "epoch": 9.734380220514534, "percentage": 97.34, "elapsed_time": "6:51:21", "remaining_time": "0:11:13", "throughput": 4296.09, "total_tokens": 106034672} +{"current_steps": 87410, "total_steps": 89790, "loss": 0.4641, "lr": 1.0702308858572819e-07, "epoch": 9.73493707539815, "percentage": 97.35, "elapsed_time": "6:51:22", "remaining_time": "0:11:12", "throughput": 4296.11, "total_tokens": 106040816} +{"current_steps": 87415, "total_steps": 89790, "loss": 0.4601, "lr": 1.0657439185334239e-07, "epoch": 9.735493930281768, "percentage": 97.35, "elapsed_time": "6:51:24", "remaining_time": "0:11:10", "throughput": 4296.14, "total_tokens": 106047152} +{"current_steps": 87420, "total_steps": 89790, "loss": 0.4627, "lr": 1.0612663567435289e-07, "epoch": 9.736050785165386, "percentage": 97.36, "elapsed_time": "6:51:25", "remaining_time": "0:11:09", "throughput": 4296.16, "total_tokens": 106053232} +{"current_steps": 87425, "total_steps": 89790, "loss": 0.4673, "lr": 1.0567982006567389e-07, "epoch": 9.736607640049003, "percentage": 97.37, "elapsed_time": "6:51:26", "remaining_time": "0:11:07", "throughput": 4296.18, "total_tokens": 106059376} +{"current_steps": 87430, "total_steps": 89790, "loss": 0.4701, "lr": 1.0523394504418915e-07, "epoch": 9.737164494932621, "percentage": 97.37, "elapsed_time": "6:51:28", "remaining_time": "0:11:06", "throughput": 4296.21, "total_tokens": 106065584} +{"current_steps": 87435, "total_steps": 89790, "loss": 0.4583, "lr": 1.0478901062674351e-07, "epoch": 9.737721349816239, "percentage": 97.38, "elapsed_time": "6:51:29", "remaining_time": "0:11:04", "throughput": 4296.22, "total_tokens": 106071088} +{"current_steps": 87440, "total_steps": 89790, "loss": 0.4673, "lr": 1.043450168301513e-07, "epoch": 9.738278204699855, "percentage": 97.38, "elapsed_time": "6:51:30", "remaining_time": "0:11:03", "throughput": 4296.25, "total_tokens": 106077392} +{"current_steps": 87445, "total_steps": 89790, "loss": 0.4689, "lr": 1.0390196367118521e-07, "epoch": 9.738835059583472, "percentage": 97.39, "elapsed_time": "6:51:31", "remaining_time": "0:11:02", "throughput": 4296.27, "total_tokens": 106083344} +{"current_steps": 87450, "total_steps": 89790, "loss": 0.468, "lr": 1.034598511665874e-07, "epoch": 9.73939191446709, "percentage": 97.39, "elapsed_time": "6:51:33", "remaining_time": "0:11:00", "throughput": 4296.29, "total_tokens": 106089328} +{"current_steps": 87455, "total_steps": 89790, "loss": 0.4481, "lr": 1.030186793330612e-07, "epoch": 9.739948769350708, "percentage": 97.4, "elapsed_time": "6:51:34", "remaining_time": "0:10:59", "throughput": 4296.31, "total_tokens": 106094928} +{"current_steps": 87460, "total_steps": 89790, "loss": 0.4539, "lr": 1.0257844818727658e-07, "epoch": 9.740505624234325, "percentage": 97.41, "elapsed_time": "6:51:35", "remaining_time": "0:10:57", "throughput": 4296.33, "total_tokens": 106101040} +{"current_steps": 87465, "total_steps": 89790, "loss": 0.4399, "lr": 1.021391577458647e-07, "epoch": 9.741062479117941, "percentage": 97.41, "elapsed_time": "6:51:37", "remaining_time": "0:10:56", "throughput": 4296.36, "total_tokens": 106107632} +{"current_steps": 87470, "total_steps": 89790, "loss": 0.4601, "lr": 1.0170080802542336e-07, "epoch": 9.741619334001559, "percentage": 97.42, "elapsed_time": "6:51:38", "remaining_time": "0:10:55", "throughput": 4296.37, "total_tokens": 106113328} +{"current_steps": 87475, "total_steps": 89790, "loss": 0.4551, "lr": 1.0126339904251992e-07, "epoch": 9.742176188885177, "percentage": 97.42, "elapsed_time": "6:51:40", "remaining_time": "0:10:53", "throughput": 4296.32, "total_tokens": 106119344} +{"current_steps": 87480, "total_steps": 89790, "loss": 0.462, "lr": 1.0082693081367445e-07, "epoch": 9.742733043768794, "percentage": 97.43, "elapsed_time": "6:51:41", "remaining_time": "0:10:52", "throughput": 4296.34, "total_tokens": 106125584} +{"current_steps": 87485, "total_steps": 89790, "loss": 0.4531, "lr": 1.003914033553821e-07, "epoch": 9.743289898652412, "percentage": 97.43, "elapsed_time": "6:51:42", "remaining_time": "0:10:50", "throughput": 4296.36, "total_tokens": 106131568} +{"current_steps": 87490, "total_steps": 89790, "loss": 0.4723, "lr": 9.995681668409362e-08, "epoch": 9.743846753536028, "percentage": 97.44, "elapsed_time": "6:51:43", "remaining_time": "0:10:49", "throughput": 4296.39, "total_tokens": 106137168} +{"current_steps": 87495, "total_steps": 89790, "loss": 0.4571, "lr": 9.952317081623752e-08, "epoch": 9.744403608419645, "percentage": 97.44, "elapsed_time": "6:51:45", "remaining_time": "0:10:48", "throughput": 4296.41, "total_tokens": 106143440} +{"current_steps": 87500, "total_steps": 89790, "loss": 0.4702, "lr": 9.909046576818959e-08, "epoch": 9.744960463303263, "percentage": 97.45, "elapsed_time": "6:51:46", "remaining_time": "0:10:46", "throughput": 4296.43, "total_tokens": 106149840} +{"current_steps": 87505, "total_steps": 89790, "loss": 0.4723, "lr": 9.865870155630618e-08, "epoch": 9.74551731818688, "percentage": 97.46, "elapsed_time": "6:51:47", "remaining_time": "0:10:45", "throughput": 4296.45, "total_tokens": 106155344} +{"current_steps": 87510, "total_steps": 89790, "loss": 0.4529, "lr": 9.822787819689371e-08, "epoch": 9.746074173070499, "percentage": 97.46, "elapsed_time": "6:51:48", "remaining_time": "0:10:43", "throughput": 4296.47, "total_tokens": 106161392} +{"current_steps": 87515, "total_steps": 89790, "loss": 0.4614, "lr": 9.779799570623637e-08, "epoch": 9.746631027954114, "percentage": 97.47, "elapsed_time": "6:51:50", "remaining_time": "0:10:42", "throughput": 4296.5, "total_tokens": 106167376} +{"current_steps": 87520, "total_steps": 89790, "loss": 0.4595, "lr": 9.736905410057395e-08, "epoch": 9.747187882837732, "percentage": 97.47, "elapsed_time": "6:51:51", "remaining_time": "0:10:40", "throughput": 4296.52, "total_tokens": 106173520} +{"current_steps": 87525, "total_steps": 89790, "loss": 0.4676, "lr": 9.694105339611015e-08, "epoch": 9.74774473772135, "percentage": 97.48, "elapsed_time": "6:51:52", "remaining_time": "0:10:39", "throughput": 4296.54, "total_tokens": 106179280} +{"current_steps": 87530, "total_steps": 89790, "loss": 0.4654, "lr": 9.651399360902091e-08, "epoch": 9.748301592604967, "percentage": 97.48, "elapsed_time": "6:51:54", "remaining_time": "0:10:38", "throughput": 4296.56, "total_tokens": 106185264} +{"current_steps": 87535, "total_steps": 89790, "loss": 0.4573, "lr": 9.608787475544056e-08, "epoch": 9.748858447488585, "percentage": 97.49, "elapsed_time": "6:51:55", "remaining_time": "0:10:36", "throughput": 4296.59, "total_tokens": 106191568} +{"current_steps": 87540, "total_steps": 89790, "loss": 0.4536, "lr": 9.566269685147011e-08, "epoch": 9.749415302372201, "percentage": 97.49, "elapsed_time": "6:51:56", "remaining_time": "0:10:35", "throughput": 4296.61, "total_tokens": 106197616} +{"current_steps": 87545, "total_steps": 89790, "loss": 0.4597, "lr": 9.523845991317171e-08, "epoch": 9.749972157255819, "percentage": 97.5, "elapsed_time": "6:51:57", "remaining_time": "0:10:33", "throughput": 4296.63, "total_tokens": 106204016} +{"current_steps": 87550, "total_steps": 89790, "loss": 0.4541, "lr": 9.481516395657419e-08, "epoch": 9.750529012139436, "percentage": 97.51, "elapsed_time": "6:51:59", "remaining_time": "0:10:32", "throughput": 4296.65, "total_tokens": 106209808} +{"current_steps": 87555, "total_steps": 89790, "loss": 0.4622, "lr": 9.439280899767311e-08, "epoch": 9.751085867023054, "percentage": 97.51, "elapsed_time": "6:52:00", "remaining_time": "0:10:31", "throughput": 4296.67, "total_tokens": 106215824} +{"current_steps": 87560, "total_steps": 89790, "loss": 0.4555, "lr": 9.397139505242514e-08, "epoch": 9.751642721906672, "percentage": 97.52, "elapsed_time": "6:52:01", "remaining_time": "0:10:29", "throughput": 4296.69, "total_tokens": 106221936} +{"current_steps": 87565, "total_steps": 89790, "loss": 0.4597, "lr": 9.355092213675365e-08, "epoch": 9.75219957679029, "percentage": 97.52, "elapsed_time": "6:52:02", "remaining_time": "0:10:28", "throughput": 4296.71, "total_tokens": 106227472} +{"current_steps": 87570, "total_steps": 89790, "loss": 0.4471, "lr": 9.313139026654594e-08, "epoch": 9.752756431673905, "percentage": 97.53, "elapsed_time": "6:52:04", "remaining_time": "0:10:26", "throughput": 4296.74, "total_tokens": 106233680} +{"current_steps": 87575, "total_steps": 89790, "loss": 0.4645, "lr": 9.271279945765044e-08, "epoch": 9.753313286557523, "percentage": 97.53, "elapsed_time": "6:52:05", "remaining_time": "0:10:25", "throughput": 4296.76, "total_tokens": 106239600} +{"current_steps": 87580, "total_steps": 89790, "loss": 0.4679, "lr": 9.229514972588782e-08, "epoch": 9.75387014144114, "percentage": 97.54, "elapsed_time": "6:52:06", "remaining_time": "0:10:23", "throughput": 4296.78, "total_tokens": 106245648} +{"current_steps": 87585, "total_steps": 89790, "loss": 0.4592, "lr": 9.187844108703159e-08, "epoch": 9.754426996324758, "percentage": 97.54, "elapsed_time": "6:52:08", "remaining_time": "0:10:22", "throughput": 4296.8, "total_tokens": 106251952} +{"current_steps": 87590, "total_steps": 89790, "loss": 0.4612, "lr": 9.146267355683302e-08, "epoch": 9.754983851208376, "percentage": 97.55, "elapsed_time": "6:52:09", "remaining_time": "0:10:21", "throughput": 4296.82, "total_tokens": 106258032} +{"current_steps": 87595, "total_steps": 89790, "loss": 0.4672, "lr": 9.104784715099623e-08, "epoch": 9.755540706091992, "percentage": 97.56, "elapsed_time": "6:52:10", "remaining_time": "0:10:19", "throughput": 4296.85, "total_tokens": 106264304} +{"current_steps": 87600, "total_steps": 89790, "loss": 0.4572, "lr": 9.063396188519479e-08, "epoch": 9.75609756097561, "percentage": 97.56, "elapsed_time": "6:52:12", "remaining_time": "0:10:18", "throughput": 4296.87, "total_tokens": 106270352} +{"current_steps": 87605, "total_steps": 89790, "loss": 0.4621, "lr": 9.022101777506897e-08, "epoch": 9.756654415859227, "percentage": 97.57, "elapsed_time": "6:52:13", "remaining_time": "0:10:16", "throughput": 4296.89, "total_tokens": 106276624} +{"current_steps": 87610, "total_steps": 89790, "loss": 0.4598, "lr": 8.980901483622295e-08, "epoch": 9.757211270742845, "percentage": 97.57, "elapsed_time": "6:52:14", "remaining_time": "0:10:15", "throughput": 4296.92, "total_tokens": 106282544} +{"current_steps": 87615, "total_steps": 89790, "loss": 0.4549, "lr": 8.939795308421927e-08, "epoch": 9.757768125626463, "percentage": 97.58, "elapsed_time": "6:52:15", "remaining_time": "0:10:14", "throughput": 4296.93, "total_tokens": 106288336} +{"current_steps": 87620, "total_steps": 89790, "loss": 0.4653, "lr": 8.898783253458997e-08, "epoch": 9.758324980510078, "percentage": 97.58, "elapsed_time": "6:52:17", "remaining_time": "0:10:12", "throughput": 4296.95, "total_tokens": 106294608} +{"current_steps": 87625, "total_steps": 89790, "loss": 0.4643, "lr": 8.857865320283377e-08, "epoch": 9.758881835393696, "percentage": 97.59, "elapsed_time": "6:52:18", "remaining_time": "0:10:11", "throughput": 4296.98, "total_tokens": 106300464} +{"current_steps": 87630, "total_steps": 89790, "loss": 0.4604, "lr": 8.817041510440771e-08, "epoch": 9.759438690277314, "percentage": 97.59, "elapsed_time": "6:52:19", "remaining_time": "0:10:09", "throughput": 4297.0, "total_tokens": 106306192} +{"current_steps": 87635, "total_steps": 89790, "loss": 0.4579, "lr": 8.77631182547356e-08, "epoch": 9.759995545160931, "percentage": 97.6, "elapsed_time": "6:52:20", "remaining_time": "0:10:08", "throughput": 4297.02, "total_tokens": 106312432} +{"current_steps": 87640, "total_steps": 89790, "loss": 0.4595, "lr": 8.735676266921066e-08, "epoch": 9.76055240004455, "percentage": 97.61, "elapsed_time": "6:52:22", "remaining_time": "0:10:06", "throughput": 4297.04, "total_tokens": 106318672} +{"current_steps": 87645, "total_steps": 89790, "loss": 0.4515, "lr": 8.695134836318175e-08, "epoch": 9.761109254928165, "percentage": 97.61, "elapsed_time": "6:52:23", "remaining_time": "0:10:05", "throughput": 4297.07, "total_tokens": 106324848} +{"current_steps": 87650, "total_steps": 89790, "loss": 0.4657, "lr": 8.654687535196993e-08, "epoch": 9.761666109811783, "percentage": 97.62, "elapsed_time": "6:52:24", "remaining_time": "0:10:04", "throughput": 4297.09, "total_tokens": 106330864} +{"current_steps": 87655, "total_steps": 89790, "loss": 0.4493, "lr": 8.614334365085463e-08, "epoch": 9.7622229646954, "percentage": 97.62, "elapsed_time": "6:52:26", "remaining_time": "0:10:02", "throughput": 4297.11, "total_tokens": 106336976} +{"current_steps": 87660, "total_steps": 89790, "loss": 0.4566, "lr": 8.574075327508479e-08, "epoch": 9.762779819579018, "percentage": 97.63, "elapsed_time": "6:52:27", "remaining_time": "0:10:01", "throughput": 4297.13, "total_tokens": 106342960} +{"current_steps": 87665, "total_steps": 89790, "loss": 0.4755, "lr": 8.533910423987323e-08, "epoch": 9.763336674462636, "percentage": 97.63, "elapsed_time": "6:52:28", "remaining_time": "0:09:59", "throughput": 4297.16, "total_tokens": 106349008} +{"current_steps": 87670, "total_steps": 89790, "loss": 0.4523, "lr": 8.493839656039116e-08, "epoch": 9.763893529346252, "percentage": 97.64, "elapsed_time": "6:52:30", "remaining_time": "0:09:58", "throughput": 4297.18, "total_tokens": 106355216} +{"current_steps": 87675, "total_steps": 89790, "loss": 0.4487, "lr": 8.453863025177921e-08, "epoch": 9.76445038422987, "percentage": 97.64, "elapsed_time": "6:52:31", "remaining_time": "0:09:57", "throughput": 4297.2, "total_tokens": 106361360} +{"current_steps": 87680, "total_steps": 89790, "loss": 0.4638, "lr": 8.413980532914478e-08, "epoch": 9.765007239113487, "percentage": 97.65, "elapsed_time": "6:52:32", "remaining_time": "0:09:55", "throughput": 4297.23, "total_tokens": 106367536} +{"current_steps": 87685, "total_steps": 89790, "loss": 0.4613, "lr": 8.374192180755636e-08, "epoch": 9.765564093997105, "percentage": 97.66, "elapsed_time": "6:52:33", "remaining_time": "0:09:54", "throughput": 4297.25, "total_tokens": 106374032} +{"current_steps": 87690, "total_steps": 89790, "loss": 0.4677, "lr": 8.334497970204636e-08, "epoch": 9.766120948880722, "percentage": 97.66, "elapsed_time": "6:52:35", "remaining_time": "0:09:52", "throughput": 4297.27, "total_tokens": 106379600} +{"current_steps": 87695, "total_steps": 89790, "loss": 0.4565, "lr": 8.294897902761112e-08, "epoch": 9.766677803764338, "percentage": 97.67, "elapsed_time": "6:52:36", "remaining_time": "0:09:51", "throughput": 4297.29, "total_tokens": 106385552} +{"current_steps": 87700, "total_steps": 89790, "loss": 0.4626, "lr": 8.255391979921645e-08, "epoch": 9.767234658647956, "percentage": 97.67, "elapsed_time": "6:52:37", "remaining_time": "0:09:50", "throughput": 4297.31, "total_tokens": 106391056} +{"current_steps": 87705, "total_steps": 89790, "loss": 0.4492, "lr": 8.215980203178375e-08, "epoch": 9.767791513531574, "percentage": 97.68, "elapsed_time": "6:52:38", "remaining_time": "0:09:48", "throughput": 4297.34, "total_tokens": 106397456} +{"current_steps": 87710, "total_steps": 89790, "loss": 0.4608, "lr": 8.176662574020666e-08, "epoch": 9.768348368415191, "percentage": 97.68, "elapsed_time": "6:52:40", "remaining_time": "0:09:47", "throughput": 4297.36, "total_tokens": 106403600} +{"current_steps": 87715, "total_steps": 89790, "loss": 0.459, "lr": 8.137439093934274e-08, "epoch": 9.768905223298809, "percentage": 97.69, "elapsed_time": "6:52:41", "remaining_time": "0:09:45", "throughput": 4297.38, "total_tokens": 106409648} +{"current_steps": 87720, "total_steps": 89790, "loss": 0.453, "lr": 8.098309764400791e-08, "epoch": 9.769462078182425, "percentage": 97.69, "elapsed_time": "6:52:42", "remaining_time": "0:09:44", "throughput": 4297.4, "total_tokens": 106415728} +{"current_steps": 87725, "total_steps": 89790, "loss": 0.4515, "lr": 8.059274586899034e-08, "epoch": 9.770018933066043, "percentage": 97.7, "elapsed_time": "6:52:44", "remaining_time": "0:09:42", "throughput": 4297.42, "total_tokens": 106421584} +{"current_steps": 87730, "total_steps": 89790, "loss": 0.45, "lr": 8.02033356290366e-08, "epoch": 9.77057578794966, "percentage": 97.71, "elapsed_time": "6:52:45", "remaining_time": "0:09:41", "throughput": 4297.44, "total_tokens": 106427088} +{"current_steps": 87735, "total_steps": 89790, "loss": 0.4784, "lr": 7.981486693885986e-08, "epoch": 9.771132642833278, "percentage": 97.71, "elapsed_time": "6:52:46", "remaining_time": "0:09:40", "throughput": 4297.46, "total_tokens": 106433040} +{"current_steps": 87740, "total_steps": 89790, "loss": 0.4551, "lr": 7.942733981313732e-08, "epoch": 9.771689497716896, "percentage": 97.72, "elapsed_time": "6:52:47", "remaining_time": "0:09:38", "throughput": 4297.48, "total_tokens": 106439088} +{"current_steps": 87745, "total_steps": 89790, "loss": 0.4694, "lr": 7.904075426651281e-08, "epoch": 9.772246352600511, "percentage": 97.72, "elapsed_time": "6:52:49", "remaining_time": "0:09:37", "throughput": 4297.5, "total_tokens": 106445136} +{"current_steps": 87750, "total_steps": 89790, "loss": 0.4549, "lr": 7.865511031359129e-08, "epoch": 9.77280320748413, "percentage": 97.73, "elapsed_time": "6:52:50", "remaining_time": "0:09:35", "throughput": 4297.53, "total_tokens": 106451408} +{"current_steps": 87755, "total_steps": 89790, "loss": 0.4616, "lr": 7.827040796894447e-08, "epoch": 9.773360062367747, "percentage": 97.73, "elapsed_time": "6:52:51", "remaining_time": "0:09:34", "throughput": 4297.55, "total_tokens": 106457520} +{"current_steps": 87760, "total_steps": 89790, "loss": 0.4723, "lr": 7.788664724710793e-08, "epoch": 9.773916917251364, "percentage": 97.74, "elapsed_time": "6:52:52", "remaining_time": "0:09:33", "throughput": 4297.58, "total_tokens": 106463824} +{"current_steps": 87765, "total_steps": 89790, "loss": 0.4629, "lr": 7.750382816258117e-08, "epoch": 9.774473772134982, "percentage": 97.74, "elapsed_time": "6:52:54", "remaining_time": "0:09:31", "throughput": 4297.6, "total_tokens": 106469616} +{"current_steps": 87770, "total_steps": 89790, "loss": 0.4505, "lr": 7.712195072982487e-08, "epoch": 9.775030627018598, "percentage": 97.75, "elapsed_time": "6:52:55", "remaining_time": "0:09:30", "throughput": 4297.62, "total_tokens": 106475664} +{"current_steps": 87775, "total_steps": 89790, "loss": 0.4645, "lr": 7.674101496327191e-08, "epoch": 9.775587481902216, "percentage": 97.76, "elapsed_time": "6:52:56", "remaining_time": "0:09:28", "throughput": 4297.64, "total_tokens": 106481616} +{"current_steps": 87780, "total_steps": 89790, "loss": 0.4679, "lr": 7.636102087731633e-08, "epoch": 9.776144336785833, "percentage": 97.76, "elapsed_time": "6:52:58", "remaining_time": "0:09:27", "throughput": 4297.66, "total_tokens": 106487632} +{"current_steps": 87785, "total_steps": 89790, "loss": 0.454, "lr": 7.598196848631056e-08, "epoch": 9.776701191669451, "percentage": 97.77, "elapsed_time": "6:52:59", "remaining_time": "0:09:25", "throughput": 4297.68, "total_tokens": 106493712} +{"current_steps": 87790, "total_steps": 89790, "loss": 0.465, "lr": 7.560385780457924e-08, "epoch": 9.777258046553069, "percentage": 97.77, "elapsed_time": "6:53:00", "remaining_time": "0:09:24", "throughput": 4297.71, "total_tokens": 106500048} +{"current_steps": 87795, "total_steps": 89790, "loss": 0.4461, "lr": 7.522668884640815e-08, "epoch": 9.777814901436686, "percentage": 97.78, "elapsed_time": "6:53:02", "remaining_time": "0:09:23", "throughput": 4297.73, "total_tokens": 106506512} +{"current_steps": 87800, "total_steps": 89790, "loss": 0.4661, "lr": 7.485046162604981e-08, "epoch": 9.778371756320302, "percentage": 97.78, "elapsed_time": "6:53:03", "remaining_time": "0:09:21", "throughput": 4297.76, "total_tokens": 106512976} +{"current_steps": 87805, "total_steps": 89790, "loss": 0.4646, "lr": 7.447517615771505e-08, "epoch": 9.77892861120392, "percentage": 97.79, "elapsed_time": "6:53:04", "remaining_time": "0:09:20", "throughput": 4297.78, "total_tokens": 106519216} +{"current_steps": 87810, "total_steps": 89790, "loss": 0.4503, "lr": 7.410083245558696e-08, "epoch": 9.779485466087538, "percentage": 97.79, "elapsed_time": "6:53:06", "remaining_time": "0:09:18", "throughput": 4297.81, "total_tokens": 106525456} +{"current_steps": 87815, "total_steps": 89790, "loss": 0.4613, "lr": 7.372743053380982e-08, "epoch": 9.780042320971155, "percentage": 97.8, "elapsed_time": "6:53:07", "remaining_time": "0:09:17", "throughput": 4297.83, "total_tokens": 106531888} +{"current_steps": 87820, "total_steps": 89790, "loss": 0.4564, "lr": 7.335497040648898e-08, "epoch": 9.780599175854773, "percentage": 97.81, "elapsed_time": "6:53:08", "remaining_time": "0:09:16", "throughput": 4297.85, "total_tokens": 106537712} +{"current_steps": 87825, "total_steps": 89790, "loss": 0.4536, "lr": 7.29834520876993e-08, "epoch": 9.781156030738389, "percentage": 97.81, "elapsed_time": "6:53:09", "remaining_time": "0:09:14", "throughput": 4297.88, "total_tokens": 106543728} +{"current_steps": 87830, "total_steps": 89790, "loss": 0.4651, "lr": 7.261287559147678e-08, "epoch": 9.781712885622007, "percentage": 97.82, "elapsed_time": "6:53:11", "remaining_time": "0:09:13", "throughput": 4297.9, "total_tokens": 106549840} +{"current_steps": 87835, "total_steps": 89790, "loss": 0.4666, "lr": 7.224324093182411e-08, "epoch": 9.782269740505624, "percentage": 97.82, "elapsed_time": "6:53:12", "remaining_time": "0:09:11", "throughput": 4297.92, "total_tokens": 106555664} +{"current_steps": 87840, "total_steps": 89790, "loss": 0.4642, "lr": 7.187454812270511e-08, "epoch": 9.782826595389242, "percentage": 97.83, "elapsed_time": "6:53:13", "remaining_time": "0:09:10", "throughput": 4297.94, "total_tokens": 106561872} +{"current_steps": 87845, "total_steps": 89790, "loss": 0.4571, "lr": 7.150679717805309e-08, "epoch": 9.78338345027286, "percentage": 97.83, "elapsed_time": "6:53:14", "remaining_time": "0:09:08", "throughput": 4297.96, "total_tokens": 106567472} +{"current_steps": 87850, "total_steps": 89790, "loss": 0.4448, "lr": 7.113998811176247e-08, "epoch": 9.783940305156476, "percentage": 97.84, "elapsed_time": "6:53:16", "remaining_time": "0:09:07", "throughput": 4297.99, "total_tokens": 106574032} +{"current_steps": 87855, "total_steps": 89790, "loss": 0.4584, "lr": 7.077412093769165e-08, "epoch": 9.784497160040093, "percentage": 97.84, "elapsed_time": "6:53:17", "remaining_time": "0:09:06", "throughput": 4298.01, "total_tokens": 106580624} +{"current_steps": 87860, "total_steps": 89790, "loss": 0.4537, "lr": 7.040919566966287e-08, "epoch": 9.78505401492371, "percentage": 97.85, "elapsed_time": "6:53:18", "remaining_time": "0:09:04", "throughput": 4298.03, "total_tokens": 106586576} +{"current_steps": 87865, "total_steps": 89790, "loss": 0.4616, "lr": 7.00452123214651e-08, "epoch": 9.785610869807329, "percentage": 97.86, "elapsed_time": "6:53:20", "remaining_time": "0:09:03", "throughput": 4298.05, "total_tokens": 106592496} +{"current_steps": 87870, "total_steps": 89790, "loss": 0.4594, "lr": 6.968217090685126e-08, "epoch": 9.786167724690946, "percentage": 97.86, "elapsed_time": "6:53:21", "remaining_time": "0:09:01", "throughput": 4298.08, "total_tokens": 106598544} +{"current_steps": 87875, "total_steps": 89790, "loss": 0.4606, "lr": 6.932007143953811e-08, "epoch": 9.786724579574562, "percentage": 97.87, "elapsed_time": "6:53:22", "remaining_time": "0:09:00", "throughput": 4298.1, "total_tokens": 106604624} +{"current_steps": 87880, "total_steps": 89790, "loss": 0.4601, "lr": 6.89589139332092e-08, "epoch": 9.78728143445818, "percentage": 97.87, "elapsed_time": "6:53:23", "remaining_time": "0:08:59", "throughput": 4298.12, "total_tokens": 106610416} +{"current_steps": 87885, "total_steps": 89790, "loss": 0.4547, "lr": 6.859869840150634e-08, "epoch": 9.787838289341797, "percentage": 97.88, "elapsed_time": "6:53:25", "remaining_time": "0:08:57", "throughput": 4298.15, "total_tokens": 106617040} +{"current_steps": 87890, "total_steps": 89790, "loss": 0.4584, "lr": 6.823942485804092e-08, "epoch": 9.788395144225415, "percentage": 97.88, "elapsed_time": "6:53:26", "remaining_time": "0:08:56", "throughput": 4298.17, "total_tokens": 106623152} +{"current_steps": 87895, "total_steps": 89790, "loss": 0.4686, "lr": 6.788109331638814e-08, "epoch": 9.788951999109033, "percentage": 97.89, "elapsed_time": "6:53:27", "remaining_time": "0:08:54", "throughput": 4298.2, "total_tokens": 106629360} +{"current_steps": 87900, "total_steps": 89790, "loss": 0.4512, "lr": 6.752370379008721e-08, "epoch": 9.789508853992649, "percentage": 97.9, "elapsed_time": "6:53:29", "remaining_time": "0:08:53", "throughput": 4298.21, "total_tokens": 106634928} +{"current_steps": 87905, "total_steps": 89790, "loss": 0.4716, "lr": 6.716725629263842e-08, "epoch": 9.790065708876266, "percentage": 97.9, "elapsed_time": "6:53:30", "remaining_time": "0:08:52", "throughput": 4298.24, "total_tokens": 106641264} +{"current_steps": 87910, "total_steps": 89790, "loss": 0.4586, "lr": 6.681175083751434e-08, "epoch": 9.790622563759884, "percentage": 97.91, "elapsed_time": "6:53:31", "remaining_time": "0:08:50", "throughput": 4298.26, "total_tokens": 106647440} +{"current_steps": 87915, "total_steps": 89790, "loss": 0.4567, "lr": 6.64571874381431e-08, "epoch": 9.791179418643502, "percentage": 97.91, "elapsed_time": "6:53:33", "remaining_time": "0:08:49", "throughput": 4298.28, "total_tokens": 106653520} +{"current_steps": 87920, "total_steps": 89790, "loss": 0.4509, "lr": 6.610356610792512e-08, "epoch": 9.79173627352712, "percentage": 97.92, "elapsed_time": "6:53:34", "remaining_time": "0:08:47", "throughput": 4298.3, "total_tokens": 106659504} +{"current_steps": 87925, "total_steps": 89790, "loss": 0.4742, "lr": 6.575088686021635e-08, "epoch": 9.792293128410737, "percentage": 97.92, "elapsed_time": "6:53:35", "remaining_time": "0:08:46", "throughput": 4298.33, "total_tokens": 106665776} +{"current_steps": 87930, "total_steps": 89790, "loss": 0.4651, "lr": 6.539914970834504e-08, "epoch": 9.792849983294353, "percentage": 97.93, "elapsed_time": "6:53:36", "remaining_time": "0:08:44", "throughput": 4298.35, "total_tokens": 106671952} +{"current_steps": 87935, "total_steps": 89790, "loss": 0.4579, "lr": 6.504835466560332e-08, "epoch": 9.79340683817797, "percentage": 97.93, "elapsed_time": "6:53:38", "remaining_time": "0:08:43", "throughput": 4298.38, "total_tokens": 106678000} +{"current_steps": 87940, "total_steps": 89790, "loss": 0.4528, "lr": 6.469850174524172e-08, "epoch": 9.793963693061588, "percentage": 97.94, "elapsed_time": "6:53:39", "remaining_time": "0:08:42", "throughput": 4298.4, "total_tokens": 106683888} +{"current_steps": 87945, "total_steps": 89790, "loss": 0.4515, "lr": 6.434959096047743e-08, "epoch": 9.794520547945206, "percentage": 97.95, "elapsed_time": "6:53:40", "remaining_time": "0:08:40", "throughput": 4298.42, "total_tokens": 106689712} +{"current_steps": 87950, "total_steps": 89790, "loss": 0.4583, "lr": 6.400162232449713e-08, "epoch": 9.795077402828824, "percentage": 97.95, "elapsed_time": "6:53:42", "remaining_time": "0:08:39", "throughput": 4298.44, "total_tokens": 106696016} +{"current_steps": 87955, "total_steps": 89790, "loss": 0.4577, "lr": 6.365459585044864e-08, "epoch": 9.79563425771244, "percentage": 97.96, "elapsed_time": "6:53:43", "remaining_time": "0:08:37", "throughput": 4298.46, "total_tokens": 106702192} +{"current_steps": 87960, "total_steps": 89790, "loss": 0.4537, "lr": 6.330851155144091e-08, "epoch": 9.796191112596057, "percentage": 97.96, "elapsed_time": "6:53:44", "remaining_time": "0:08:36", "throughput": 4298.49, "total_tokens": 106708400} +{"current_steps": 87965, "total_steps": 89790, "loss": 0.4765, "lr": 6.296336944054959e-08, "epoch": 9.796747967479675, "percentage": 97.97, "elapsed_time": "6:53:45", "remaining_time": "0:08:35", "throughput": 4298.51, "total_tokens": 106714480} +{"current_steps": 87970, "total_steps": 89790, "loss": 0.4554, "lr": 6.261916953081704e-08, "epoch": 9.797304822363293, "percentage": 97.97, "elapsed_time": "6:53:47", "remaining_time": "0:08:33", "throughput": 4298.53, "total_tokens": 106720720} +{"current_steps": 87975, "total_steps": 89790, "loss": 0.4526, "lr": 6.22759118352495e-08, "epoch": 9.79786167724691, "percentage": 97.98, "elapsed_time": "6:53:48", "remaining_time": "0:08:32", "throughput": 4298.55, "total_tokens": 106726864} +{"current_steps": 87980, "total_steps": 89790, "loss": 0.4576, "lr": 6.193359636681439e-08, "epoch": 9.798418532130526, "percentage": 97.98, "elapsed_time": "6:53:49", "remaining_time": "0:08:30", "throughput": 4298.58, "total_tokens": 106733040} +{"current_steps": 87985, "total_steps": 89790, "loss": 0.4525, "lr": 6.159222313844582e-08, "epoch": 9.798975387014144, "percentage": 97.99, "elapsed_time": "6:53:51", "remaining_time": "0:08:29", "throughput": 4298.6, "total_tokens": 106739184} +{"current_steps": 87990, "total_steps": 89790, "loss": 0.4588, "lr": 6.125179216304178e-08, "epoch": 9.799532241897762, "percentage": 98.0, "elapsed_time": "6:53:52", "remaining_time": "0:08:27", "throughput": 4298.62, "total_tokens": 106745392} +{"current_steps": 87995, "total_steps": 89790, "loss": 0.4589, "lr": 6.091230345346699e-08, "epoch": 9.80008909678138, "percentage": 98.0, "elapsed_time": "6:53:53", "remaining_time": "0:08:26", "throughput": 4298.65, "total_tokens": 106751792} +{"current_steps": 88000, "total_steps": 89790, "loss": 0.4629, "lr": 6.057375702254453e-08, "epoch": 9.800645951664997, "percentage": 98.01, "elapsed_time": "6:53:55", "remaining_time": "0:08:25", "throughput": 4298.67, "total_tokens": 106757968} +{"current_steps": 88005, "total_steps": 89790, "loss": 0.4584, "lr": 6.023615288306694e-08, "epoch": 9.801202806548613, "percentage": 98.01, "elapsed_time": "6:53:56", "remaining_time": "0:08:23", "throughput": 4298.69, "total_tokens": 106764176} +{"current_steps": 88010, "total_steps": 89790, "loss": 0.4638, "lr": 5.989949104779347e-08, "epoch": 9.80175966143223, "percentage": 98.02, "elapsed_time": "6:53:57", "remaining_time": "0:08:22", "throughput": 4298.71, "total_tokens": 106770384} +{"current_steps": 88015, "total_steps": 89790, "loss": 0.4597, "lr": 5.95637715294417e-08, "epoch": 9.802316516315848, "percentage": 98.02, "elapsed_time": "6:53:59", "remaining_time": "0:08:20", "throughput": 4298.73, "total_tokens": 106776240} +{"current_steps": 88020, "total_steps": 89790, "loss": 0.462, "lr": 5.922899434069595e-08, "epoch": 9.802873371199466, "percentage": 98.03, "elapsed_time": "6:54:00", "remaining_time": "0:08:19", "throughput": 4298.75, "total_tokens": 106782128} +{"current_steps": 88025, "total_steps": 89790, "loss": 0.4679, "lr": 5.889515949420443e-08, "epoch": 9.803430226083083, "percentage": 98.03, "elapsed_time": "6:54:01", "remaining_time": "0:08:18", "throughput": 4298.78, "total_tokens": 106788208} +{"current_steps": 88030, "total_steps": 89790, "loss": 0.4595, "lr": 5.8562267002579276e-08, "epoch": 9.8039870809667, "percentage": 98.04, "elapsed_time": "6:54:02", "remaining_time": "0:08:16", "throughput": 4298.8, "total_tokens": 106794416} +{"current_steps": 88035, "total_steps": 89790, "loss": 0.4529, "lr": 5.823031687840486e-08, "epoch": 9.804543935850317, "percentage": 98.05, "elapsed_time": "6:54:04", "remaining_time": "0:08:15", "throughput": 4298.82, "total_tokens": 106800656} +{"current_steps": 88040, "total_steps": 89790, "loss": 0.4655, "lr": 5.78993091342156e-08, "epoch": 9.805100790733935, "percentage": 98.05, "elapsed_time": "6:54:05", "remaining_time": "0:08:13", "throughput": 4298.84, "total_tokens": 106806224} +{"current_steps": 88045, "total_steps": 89790, "loss": 0.4568, "lr": 5.7569243782523704e-08, "epoch": 9.805657645617552, "percentage": 98.06, "elapsed_time": "6:54:06", "remaining_time": "0:08:12", "throughput": 4298.86, "total_tokens": 106811984} +{"current_steps": 88050, "total_steps": 89790, "loss": 0.4573, "lr": 5.7240120835796996e-08, "epoch": 9.80621450050117, "percentage": 98.06, "elapsed_time": "6:54:07", "remaining_time": "0:08:11", "throughput": 4298.88, "total_tokens": 106818160} +{"current_steps": 88055, "total_steps": 89790, "loss": 0.4549, "lr": 5.6911940306469955e-08, "epoch": 9.806771355384786, "percentage": 98.07, "elapsed_time": "6:54:09", "remaining_time": "0:08:09", "throughput": 4298.9, "total_tokens": 106824208} +{"current_steps": 88060, "total_steps": 89790, "loss": 0.4516, "lr": 5.658470220694656e-08, "epoch": 9.807328210268404, "percentage": 98.07, "elapsed_time": "6:54:10", "remaining_time": "0:08:08", "throughput": 4298.92, "total_tokens": 106830064} +{"current_steps": 88065, "total_steps": 89790, "loss": 0.4536, "lr": 5.625840654958636e-08, "epoch": 9.807885065152021, "percentage": 98.08, "elapsed_time": "6:54:11", "remaining_time": "0:08:06", "throughput": 4298.95, "total_tokens": 106836304} +{"current_steps": 88070, "total_steps": 89790, "loss": 0.4614, "lr": 5.593305334671839e-08, "epoch": 9.808441920035639, "percentage": 98.08, "elapsed_time": "6:54:13", "remaining_time": "0:08:05", "throughput": 4298.96, "total_tokens": 106842224} +{"current_steps": 88075, "total_steps": 89790, "loss": 0.463, "lr": 5.5608642610638364e-08, "epoch": 9.808998774919257, "percentage": 98.09, "elapsed_time": "6:54:14", "remaining_time": "0:08:03", "throughput": 4298.99, "total_tokens": 106848240} +{"current_steps": 88080, "total_steps": 89790, "loss": 0.462, "lr": 5.528517435360314e-08, "epoch": 9.809555629802873, "percentage": 98.1, "elapsed_time": "6:54:15", "remaining_time": "0:08:02", "throughput": 4299.01, "total_tokens": 106854416} +{"current_steps": 88085, "total_steps": 89790, "loss": 0.4594, "lr": 5.496264858783351e-08, "epoch": 9.81011248468649, "percentage": 98.1, "elapsed_time": "6:54:16", "remaining_time": "0:08:01", "throughput": 4299.03, "total_tokens": 106860528} +{"current_steps": 88090, "total_steps": 89790, "loss": 0.4553, "lr": 5.464106532551416e-08, "epoch": 9.810669339570108, "percentage": 98.11, "elapsed_time": "6:54:18", "remaining_time": "0:07:59", "throughput": 4299.05, "total_tokens": 106866608} +{"current_steps": 88095, "total_steps": 89790, "loss": 0.4599, "lr": 5.4320424578796495e-08, "epoch": 9.811226194453726, "percentage": 98.11, "elapsed_time": "6:54:19", "remaining_time": "0:07:58", "throughput": 4299.07, "total_tokens": 106872912} +{"current_steps": 88100, "total_steps": 89790, "loss": 0.4532, "lr": 5.4000726359795807e-08, "epoch": 9.811783049337343, "percentage": 98.12, "elapsed_time": "6:54:20", "remaining_time": "0:07:56", "throughput": 4299.09, "total_tokens": 106878512} +{"current_steps": 88105, "total_steps": 89790, "loss": 0.4648, "lr": 5.368197068059133e-08, "epoch": 9.81233990422096, "percentage": 98.12, "elapsed_time": "6:54:21", "remaining_time": "0:07:55", "throughput": 4299.11, "total_tokens": 106884432} +{"current_steps": 88110, "total_steps": 89790, "loss": 0.4631, "lr": 5.336415755322621e-08, "epoch": 9.812896759104577, "percentage": 98.13, "elapsed_time": "6:54:23", "remaining_time": "0:07:54", "throughput": 4299.13, "total_tokens": 106889904} +{"current_steps": 88115, "total_steps": 89790, "loss": 0.4562, "lr": 5.304728698970751e-08, "epoch": 9.813453613988194, "percentage": 98.13, "elapsed_time": "6:54:24", "remaining_time": "0:07:52", "throughput": 4299.15, "total_tokens": 106896112} +{"current_steps": 88120, "total_steps": 89790, "loss": 0.4695, "lr": 5.273135900201176e-08, "epoch": 9.814010468871812, "percentage": 98.14, "elapsed_time": "6:54:25", "remaining_time": "0:07:51", "throughput": 4299.18, "total_tokens": 106901904} +{"current_steps": 88125, "total_steps": 89790, "loss": 0.4772, "lr": 5.24163736020683e-08, "epoch": 9.81456732375543, "percentage": 98.15, "elapsed_time": "6:54:26", "remaining_time": "0:07:49", "throughput": 4299.2, "total_tokens": 106907920} +{"current_steps": 88130, "total_steps": 89790, "loss": 0.4678, "lr": 5.210233080178706e-08, "epoch": 9.815124178639046, "percentage": 98.15, "elapsed_time": "6:54:28", "remaining_time": "0:07:48", "throughput": 4299.22, "total_tokens": 106914064} +{"current_steps": 88135, "total_steps": 89790, "loss": 0.464, "lr": 5.178923061302521e-08, "epoch": 9.815681033522663, "percentage": 98.16, "elapsed_time": "6:54:29", "remaining_time": "0:07:46", "throughput": 4299.24, "total_tokens": 106919920} +{"current_steps": 88140, "total_steps": 89790, "loss": 0.4599, "lr": 5.147707304762051e-08, "epoch": 9.816237888406281, "percentage": 98.16, "elapsed_time": "6:54:30", "remaining_time": "0:07:45", "throughput": 4299.27, "total_tokens": 106926224} +{"current_steps": 88145, "total_steps": 89790, "loss": 0.4534, "lr": 5.116585811736074e-08, "epoch": 9.816794743289899, "percentage": 98.17, "elapsed_time": "6:54:32", "remaining_time": "0:07:44", "throughput": 4299.29, "total_tokens": 106932400} +{"current_steps": 88150, "total_steps": 89790, "loss": 0.4631, "lr": 5.0855585834008736e-08, "epoch": 9.817351598173516, "percentage": 98.17, "elapsed_time": "6:54:33", "remaining_time": "0:07:42", "throughput": 4299.31, "total_tokens": 106938576} +{"current_steps": 88155, "total_steps": 89790, "loss": 0.4562, "lr": 5.054625620928566e-08, "epoch": 9.817908453057134, "percentage": 98.18, "elapsed_time": "6:54:34", "remaining_time": "0:07:41", "throughput": 4299.34, "total_tokens": 106944752} +{"current_steps": 88160, "total_steps": 89790, "loss": 0.4517, "lr": 5.023786925487939e-08, "epoch": 9.81846530794075, "percentage": 98.18, "elapsed_time": "6:54:36", "remaining_time": "0:07:39", "throughput": 4299.36, "total_tokens": 106950800} +{"current_steps": 88165, "total_steps": 89790, "loss": 0.4481, "lr": 4.993042498244171e-08, "epoch": 9.819022162824368, "percentage": 98.19, "elapsed_time": "6:54:37", "remaining_time": "0:07:38", "throughput": 4299.38, "total_tokens": 106956944} +{"current_steps": 88170, "total_steps": 89790, "loss": 0.4517, "lr": 4.962392340358834e-08, "epoch": 9.819579017707985, "percentage": 98.2, "elapsed_time": "6:54:38", "remaining_time": "0:07:37", "throughput": 4299.4, "total_tokens": 106963120} +{"current_steps": 88175, "total_steps": 89790, "loss": 0.4638, "lr": 4.931836452990168e-08, "epoch": 9.820135872591603, "percentage": 98.2, "elapsed_time": "6:54:39", "remaining_time": "0:07:35", "throughput": 4299.43, "total_tokens": 106969552} +{"current_steps": 88180, "total_steps": 89790, "loss": 0.4491, "lr": 4.901374837292527e-08, "epoch": 9.82069272747522, "percentage": 98.21, "elapsed_time": "6:54:41", "remaining_time": "0:07:34", "throughput": 4299.45, "total_tokens": 106975696} +{"current_steps": 88185, "total_steps": 89790, "loss": 0.4701, "lr": 4.871007494416935e-08, "epoch": 9.821249582358837, "percentage": 98.21, "elapsed_time": "6:54:42", "remaining_time": "0:07:32", "throughput": 4299.47, "total_tokens": 106982000} +{"current_steps": 88190, "total_steps": 89790, "loss": 0.4538, "lr": 4.840734425510807e-08, "epoch": 9.821806437242454, "percentage": 98.22, "elapsed_time": "6:54:43", "remaining_time": "0:07:31", "throughput": 4299.5, "total_tokens": 106988240} +{"current_steps": 88195, "total_steps": 89790, "loss": 0.4615, "lr": 4.8105556317176726e-08, "epoch": 9.822363292126072, "percentage": 98.22, "elapsed_time": "6:54:45", "remaining_time": "0:07:30", "throughput": 4299.52, "total_tokens": 106994288} +{"current_steps": 88200, "total_steps": 89790, "loss": 0.4569, "lr": 4.780471114178009e-08, "epoch": 9.82292014700969, "percentage": 98.23, "elapsed_time": "6:54:46", "remaining_time": "0:07:28", "throughput": 4299.55, "total_tokens": 107000656} +{"current_steps": 88205, "total_steps": 89790, "loss": 0.4651, "lr": 4.750480874028407e-08, "epoch": 9.823477001893307, "percentage": 98.23, "elapsed_time": "6:54:47", "remaining_time": "0:07:27", "throughput": 4299.57, "total_tokens": 107006576} +{"current_steps": 88210, "total_steps": 89790, "loss": 0.4578, "lr": 4.720584912402126e-08, "epoch": 9.824033856776923, "percentage": 98.24, "elapsed_time": "6:54:49", "remaining_time": "0:07:25", "throughput": 4299.6, "total_tokens": 107013008} +{"current_steps": 88215, "total_steps": 89790, "loss": 0.4638, "lr": 4.6907832304288194e-08, "epoch": 9.82459071166054, "percentage": 98.25, "elapsed_time": "6:54:50", "remaining_time": "0:07:24", "throughput": 4299.62, "total_tokens": 107018736} +{"current_steps": 88220, "total_steps": 89790, "loss": 0.4494, "lr": 4.661075829233974e-08, "epoch": 9.825147566544159, "percentage": 98.25, "elapsed_time": "6:54:51", "remaining_time": "0:07:22", "throughput": 4299.63, "total_tokens": 107024752} +{"current_steps": 88225, "total_steps": 89790, "loss": 0.4533, "lr": 4.631462709940859e-08, "epoch": 9.825704421427776, "percentage": 98.26, "elapsed_time": "6:54:52", "remaining_time": "0:07:21", "throughput": 4299.66, "total_tokens": 107030672} +{"current_steps": 88230, "total_steps": 89790, "loss": 0.4496, "lr": 4.601943873667469e-08, "epoch": 9.826261276311394, "percentage": 98.26, "elapsed_time": "6:54:53", "remaining_time": "0:07:20", "throughput": 4299.67, "total_tokens": 107035568} +{"current_steps": 88235, "total_steps": 89790, "loss": 0.4409, "lr": 4.5725193215298556e-08, "epoch": 9.82681813119501, "percentage": 98.27, "elapsed_time": "6:54:55", "remaining_time": "0:07:18", "throughput": 4299.69, "total_tokens": 107041520} +{"current_steps": 88240, "total_steps": 89790, "loss": 0.4661, "lr": 4.543189054639074e-08, "epoch": 9.827374986078627, "percentage": 98.27, "elapsed_time": "6:54:56", "remaining_time": "0:07:17", "throughput": 4299.71, "total_tokens": 107047696} +{"current_steps": 88245, "total_steps": 89790, "loss": 0.474, "lr": 4.513953074103961e-08, "epoch": 9.827931840962245, "percentage": 98.28, "elapsed_time": "6:54:57", "remaining_time": "0:07:15", "throughput": 4299.73, "total_tokens": 107053296} +{"current_steps": 88250, "total_steps": 89790, "loss": 0.4592, "lr": 4.484811381028908e-08, "epoch": 9.828488695845863, "percentage": 98.28, "elapsed_time": "6:54:58", "remaining_time": "0:07:14", "throughput": 4299.75, "total_tokens": 107059216} +{"current_steps": 88255, "total_steps": 89790, "loss": 0.4562, "lr": 4.455763976514982e-08, "epoch": 9.82904555072948, "percentage": 98.29, "elapsed_time": "6:55:00", "remaining_time": "0:07:13", "throughput": 4299.77, "total_tokens": 107065424} +{"current_steps": 88260, "total_steps": 89790, "loss": 0.4581, "lr": 4.426810861659358e-08, "epoch": 9.829602405613098, "percentage": 98.3, "elapsed_time": "6:55:01", "remaining_time": "0:07:11", "throughput": 4299.79, "total_tokens": 107071504} +{"current_steps": 88265, "total_steps": 89790, "loss": 0.4576, "lr": 4.397952037556441e-08, "epoch": 9.830159260496714, "percentage": 98.3, "elapsed_time": "6:55:02", "remaining_time": "0:07:10", "throughput": 4299.81, "total_tokens": 107077584} +{"current_steps": 88270, "total_steps": 89790, "loss": 0.4484, "lr": 4.369187505296468e-08, "epoch": 9.830716115380332, "percentage": 98.31, "elapsed_time": "6:55:04", "remaining_time": "0:07:08", "throughput": 4299.83, "total_tokens": 107083408} +{"current_steps": 88275, "total_steps": 89790, "loss": 0.4557, "lr": 4.340517265966348e-08, "epoch": 9.83127297026395, "percentage": 98.31, "elapsed_time": "6:55:05", "remaining_time": "0:07:07", "throughput": 4299.86, "total_tokens": 107089424} +{"current_steps": 88280, "total_steps": 89790, "loss": 0.4511, "lr": 4.311941320649104e-08, "epoch": 9.831829825147567, "percentage": 98.32, "elapsed_time": "6:55:06", "remaining_time": "0:07:06", "throughput": 4299.88, "total_tokens": 107095952} +{"current_steps": 88285, "total_steps": 89790, "loss": 0.4578, "lr": 4.283459670424428e-08, "epoch": 9.832386680031185, "percentage": 98.32, "elapsed_time": "6:55:07", "remaining_time": "0:07:04", "throughput": 4299.91, "total_tokens": 107102064} +{"current_steps": 88290, "total_steps": 89790, "loss": 0.4597, "lr": 4.2550723163686804e-08, "epoch": 9.8329435349148, "percentage": 98.33, "elapsed_time": "6:55:09", "remaining_time": "0:07:03", "throughput": 4299.93, "total_tokens": 107107792} +{"current_steps": 88295, "total_steps": 89790, "loss": 0.4549, "lr": 4.2267792595543364e-08, "epoch": 9.833500389798418, "percentage": 98.34, "elapsed_time": "6:55:10", "remaining_time": "0:07:01", "throughput": 4299.95, "total_tokens": 107113904} +{"current_steps": 88300, "total_steps": 89790, "loss": 0.4346, "lr": 4.1985805010505416e-08, "epoch": 9.834057244682036, "percentage": 98.34, "elapsed_time": "6:55:11", "remaining_time": "0:07:00", "throughput": 4299.97, "total_tokens": 107119856} +{"current_steps": 88305, "total_steps": 89790, "loss": 0.4677, "lr": 4.1704760419222776e-08, "epoch": 9.834614099565654, "percentage": 98.35, "elapsed_time": "6:55:13", "remaining_time": "0:06:58", "throughput": 4299.99, "total_tokens": 107126320} +{"current_steps": 88310, "total_steps": 89790, "loss": 0.4388, "lr": 4.1424658832317496e-08, "epoch": 9.835170954449271, "percentage": 98.35, "elapsed_time": "6:55:14", "remaining_time": "0:06:57", "throughput": 4300.02, "total_tokens": 107132752} +{"current_steps": 88315, "total_steps": 89790, "loss": 0.4569, "lr": 4.114550026037278e-08, "epoch": 9.835727809332887, "percentage": 98.36, "elapsed_time": "6:55:15", "remaining_time": "0:06:56", "throughput": 4300.04, "total_tokens": 107138928} +{"current_steps": 88320, "total_steps": 89790, "loss": 0.4591, "lr": 4.086728471393575e-08, "epoch": 9.836284664216505, "percentage": 98.36, "elapsed_time": "6:55:17", "remaining_time": "0:06:54", "throughput": 4300.06, "total_tokens": 107145136} +{"current_steps": 88325, "total_steps": 89790, "loss": 0.4419, "lr": 4.059001220351744e-08, "epoch": 9.836841519100123, "percentage": 98.37, "elapsed_time": "6:55:18", "remaining_time": "0:06:53", "throughput": 4300.08, "total_tokens": 107151440} +{"current_steps": 88330, "total_steps": 89790, "loss": 0.4508, "lr": 4.031368273959557e-08, "epoch": 9.83739837398374, "percentage": 98.37, "elapsed_time": "6:55:19", "remaining_time": "0:06:51", "throughput": 4300.1, "total_tokens": 107157680} +{"current_steps": 88335, "total_steps": 89790, "loss": 0.4553, "lr": 4.0038296332609026e-08, "epoch": 9.837955228867358, "percentage": 98.38, "elapsed_time": "6:55:21", "remaining_time": "0:06:50", "throughput": 4300.12, "total_tokens": 107163632} +{"current_steps": 88340, "total_steps": 89790, "loss": 0.461, "lr": 3.9763852992966146e-08, "epoch": 9.838512083750974, "percentage": 98.39, "elapsed_time": "6:55:22", "remaining_time": "0:06:49", "throughput": 4300.14, "total_tokens": 107169776} +{"current_steps": 88345, "total_steps": 89790, "loss": 0.4536, "lr": 3.9490352731030857e-08, "epoch": 9.839068938634592, "percentage": 98.39, "elapsed_time": "6:55:23", "remaining_time": "0:06:47", "throughput": 4300.16, "total_tokens": 107175312} +{"current_steps": 88350, "total_steps": 89790, "loss": 0.4669, "lr": 3.9217795557142113e-08, "epoch": 9.83962579351821, "percentage": 98.4, "elapsed_time": "6:55:24", "remaining_time": "0:06:46", "throughput": 4300.19, "total_tokens": 107181488} +{"current_steps": 88355, "total_steps": 89790, "loss": 0.4624, "lr": 3.894618148159446e-08, "epoch": 9.840182648401827, "percentage": 98.4, "elapsed_time": "6:55:26", "remaining_time": "0:06:44", "throughput": 4300.21, "total_tokens": 107187632} +{"current_steps": 88360, "total_steps": 89790, "loss": 0.4575, "lr": 3.86755105146519e-08, "epoch": 9.840739503285445, "percentage": 98.41, "elapsed_time": "6:55:27", "remaining_time": "0:06:43", "throughput": 4300.23, "total_tokens": 107194064} +{"current_steps": 88365, "total_steps": 89790, "loss": 0.4514, "lr": 3.840578266654238e-08, "epoch": 9.84129635816906, "percentage": 98.41, "elapsed_time": "6:55:28", "remaining_time": "0:06:42", "throughput": 4300.26, "total_tokens": 107200176} +{"current_steps": 88370, "total_steps": 89790, "loss": 0.4609, "lr": 3.813699794745496e-08, "epoch": 9.841853213052678, "percentage": 98.42, "elapsed_time": "6:55:30", "remaining_time": "0:06:40", "throughput": 4300.28, "total_tokens": 107206256} +{"current_steps": 88375, "total_steps": 89790, "loss": 0.4606, "lr": 3.78691563675454e-08, "epoch": 9.842410067936296, "percentage": 98.42, "elapsed_time": "6:55:31", "remaining_time": "0:06:39", "throughput": 4300.3, "total_tokens": 107212688} +{"current_steps": 88380, "total_steps": 89790, "loss": 0.4636, "lr": 3.760225793693617e-08, "epoch": 9.842966922819913, "percentage": 98.43, "elapsed_time": "6:55:32", "remaining_time": "0:06:37", "throughput": 4300.32, "total_tokens": 107218512} +{"current_steps": 88385, "total_steps": 89790, "loss": 0.4581, "lr": 3.733630266570809e-08, "epoch": 9.843523777703531, "percentage": 98.44, "elapsed_time": "6:55:33", "remaining_time": "0:06:36", "throughput": 4300.34, "total_tokens": 107224784} +{"current_steps": 88390, "total_steps": 89790, "loss": 0.4676, "lr": 3.707129056391145e-08, "epoch": 9.844080632587147, "percentage": 98.44, "elapsed_time": "6:55:35", "remaining_time": "0:06:34", "throughput": 4300.36, "total_tokens": 107230768} +{"current_steps": 88395, "total_steps": 89790, "loss": 0.4615, "lr": 3.68072216415577e-08, "epoch": 9.844637487470765, "percentage": 98.45, "elapsed_time": "6:55:36", "remaining_time": "0:06:33", "throughput": 4300.39, "total_tokens": 107236944} +{"current_steps": 88400, "total_steps": 89790, "loss": 0.4571, "lr": 3.654409590862773e-08, "epoch": 9.845194342354382, "percentage": 98.45, "elapsed_time": "6:55:37", "remaining_time": "0:06:32", "throughput": 4300.41, "total_tokens": 107242768} +{"current_steps": 88405, "total_steps": 89790, "loss": 0.4514, "lr": 3.628191337505804e-08, "epoch": 9.845751197238, "percentage": 98.46, "elapsed_time": "6:55:39", "remaining_time": "0:06:30", "throughput": 4300.43, "total_tokens": 107249104} +{"current_steps": 88410, "total_steps": 89790, "loss": 0.4593, "lr": 3.602067405076015e-08, "epoch": 9.846308052121618, "percentage": 98.46, "elapsed_time": "6:55:40", "remaining_time": "0:06:29", "throughput": 4300.45, "total_tokens": 107255024} +{"current_steps": 88415, "total_steps": 89790, "loss": 0.4567, "lr": 3.576037794560394e-08, "epoch": 9.846864907005234, "percentage": 98.47, "elapsed_time": "6:55:41", "remaining_time": "0:06:27", "throughput": 4300.47, "total_tokens": 107260240} +{"current_steps": 88420, "total_steps": 89790, "loss": 0.4763, "lr": 3.550102506942044e-08, "epoch": 9.847421761888851, "percentage": 98.47, "elapsed_time": "6:55:42", "remaining_time": "0:06:26", "throughput": 4300.49, "total_tokens": 107266512} +{"current_steps": 88425, "total_steps": 89790, "loss": 0.4615, "lr": 3.524261543201013e-08, "epoch": 9.847978616772469, "percentage": 98.48, "elapsed_time": "6:55:44", "remaining_time": "0:06:25", "throughput": 4300.51, "total_tokens": 107272816} +{"current_steps": 88430, "total_steps": 89790, "loss": 0.4594, "lr": 3.498514904313743e-08, "epoch": 9.848535471656087, "percentage": 98.49, "elapsed_time": "6:55:45", "remaining_time": "0:06:23", "throughput": 4300.53, "total_tokens": 107278608} +{"current_steps": 88435, "total_steps": 89790, "loss": 0.4695, "lr": 3.472862591253068e-08, "epoch": 9.849092326539704, "percentage": 98.49, "elapsed_time": "6:55:46", "remaining_time": "0:06:22", "throughput": 4300.55, "total_tokens": 107284624} +{"current_steps": 88440, "total_steps": 89790, "loss": 0.4621, "lr": 3.447304604988211e-08, "epoch": 9.84964918142332, "percentage": 98.5, "elapsed_time": "6:55:48", "remaining_time": "0:06:20", "throughput": 4300.58, "total_tokens": 107290928} +{"current_steps": 88445, "total_steps": 89790, "loss": 0.4453, "lr": 3.421840946484789e-08, "epoch": 9.850206036306938, "percentage": 98.5, "elapsed_time": "6:55:49", "remaining_time": "0:06:19", "throughput": 4300.6, "total_tokens": 107296976} +{"current_steps": 88450, "total_steps": 89790, "loss": 0.4654, "lr": 3.396471616704811e-08, "epoch": 9.850762891190556, "percentage": 98.51, "elapsed_time": "6:55:50", "remaining_time": "0:06:17", "throughput": 4300.62, "total_tokens": 107303024} +{"current_steps": 88455, "total_steps": 89790, "loss": 0.4742, "lr": 3.371196616606953e-08, "epoch": 9.851319746074173, "percentage": 98.51, "elapsed_time": "6:55:51", "remaining_time": "0:06:16", "throughput": 4300.64, "total_tokens": 107309200} +{"current_steps": 88460, "total_steps": 89790, "loss": 0.4618, "lr": 3.3460159471460085e-08, "epoch": 9.851876600957791, "percentage": 98.52, "elapsed_time": "6:55:53", "remaining_time": "0:06:15", "throughput": 4300.66, "total_tokens": 107315056} +{"current_steps": 88465, "total_steps": 89790, "loss": 0.4577, "lr": 3.320929609273715e-08, "epoch": 9.852433455841407, "percentage": 98.52, "elapsed_time": "6:55:54", "remaining_time": "0:06:13", "throughput": 4300.68, "total_tokens": 107321232} +{"current_steps": 88470, "total_steps": 89790, "loss": 0.4573, "lr": 3.2959376039373716e-08, "epoch": 9.852990310725025, "percentage": 98.53, "elapsed_time": "6:55:55", "remaining_time": "0:06:12", "throughput": 4300.71, "total_tokens": 107327920} +{"current_steps": 88475, "total_steps": 89790, "loss": 0.4614, "lr": 3.271039932082054e-08, "epoch": 9.853547165608642, "percentage": 98.54, "elapsed_time": "6:55:57", "remaining_time": "0:06:10", "throughput": 4300.73, "total_tokens": 107333648} +{"current_steps": 88480, "total_steps": 89790, "loss": 0.4673, "lr": 3.246236594647567e-08, "epoch": 9.85410402049226, "percentage": 98.54, "elapsed_time": "6:55:58", "remaining_time": "0:06:09", "throughput": 4300.75, "total_tokens": 107338864} +{"current_steps": 88485, "total_steps": 89790, "loss": 0.481, "lr": 3.2215275925717715e-08, "epoch": 9.854660875375878, "percentage": 98.55, "elapsed_time": "6:55:59", "remaining_time": "0:06:08", "throughput": 4300.77, "total_tokens": 107344496} +{"current_steps": 88490, "total_steps": 89790, "loss": 0.4688, "lr": 3.19691292678781e-08, "epoch": 9.855217730259493, "percentage": 98.55, "elapsed_time": "6:56:00", "remaining_time": "0:06:06", "throughput": 4300.79, "total_tokens": 107350576} +{"current_steps": 88495, "total_steps": 89790, "loss": 0.4552, "lr": 3.1723925982260486e-08, "epoch": 9.855774585143111, "percentage": 98.56, "elapsed_time": "6:56:01", "remaining_time": "0:06:05", "throughput": 4300.81, "total_tokens": 107356208} +{"current_steps": 88500, "total_steps": 89790, "loss": 0.4497, "lr": 3.147966607812691e-08, "epoch": 9.856331440026729, "percentage": 98.56, "elapsed_time": "6:56:03", "remaining_time": "0:06:03", "throughput": 4300.83, "total_tokens": 107361904} +{"current_steps": 88505, "total_steps": 89790, "loss": 0.4621, "lr": 3.123634956470611e-08, "epoch": 9.856888294910346, "percentage": 98.57, "elapsed_time": "6:56:04", "remaining_time": "0:06:02", "throughput": 4300.85, "total_tokens": 107367984} +{"current_steps": 88510, "total_steps": 89790, "loss": 0.4624, "lr": 3.0993976451193505e-08, "epoch": 9.857445149793964, "percentage": 98.57, "elapsed_time": "6:56:05", "remaining_time": "0:06:01", "throughput": 4300.88, "total_tokens": 107374128} +{"current_steps": 88515, "total_steps": 89790, "loss": 0.4666, "lr": 3.075254674674566e-08, "epoch": 9.858002004677582, "percentage": 98.58, "elapsed_time": "6:56:06", "remaining_time": "0:05:59", "throughput": 4300.9, "total_tokens": 107379856} +{"current_steps": 88520, "total_steps": 89790, "loss": 0.4378, "lr": 3.0512060460485824e-08, "epoch": 9.858558859561198, "percentage": 98.59, "elapsed_time": "6:56:08", "remaining_time": "0:05:58", "throughput": 4300.92, "total_tokens": 107385904} +{"current_steps": 88525, "total_steps": 89790, "loss": 0.4589, "lr": 3.027251760149563e-08, "epoch": 9.859115714444815, "percentage": 98.59, "elapsed_time": "6:56:09", "remaining_time": "0:05:56", "throughput": 4300.94, "total_tokens": 107392048} +{"current_steps": 88530, "total_steps": 89790, "loss": 0.4465, "lr": 3.003391817883172e-08, "epoch": 9.859672569328433, "percentage": 98.6, "elapsed_time": "6:56:10", "remaining_time": "0:05:55", "throughput": 4300.96, "total_tokens": 107397616} +{"current_steps": 88535, "total_steps": 89790, "loss": 0.4634, "lr": 2.979626220150633e-08, "epoch": 9.86022942421205, "percentage": 98.6, "elapsed_time": "6:56:11", "remaining_time": "0:05:53", "throughput": 4300.98, "total_tokens": 107403824} +{"current_steps": 88540, "total_steps": 89790, "loss": 0.4591, "lr": 2.9559549678498388e-08, "epoch": 9.860786279095668, "percentage": 98.61, "elapsed_time": "6:56:13", "remaining_time": "0:05:52", "throughput": 4301.0, "total_tokens": 107409840} +{"current_steps": 88545, "total_steps": 89790, "loss": 0.4537, "lr": 2.9323780618753516e-08, "epoch": 9.861343133979284, "percentage": 98.61, "elapsed_time": "6:56:14", "remaining_time": "0:05:51", "throughput": 4301.02, "total_tokens": 107415952} +{"current_steps": 88550, "total_steps": 89790, "loss": 0.4679, "lr": 2.90889550311757e-08, "epoch": 9.861899988862902, "percentage": 98.62, "elapsed_time": "6:56:15", "remaining_time": "0:05:49", "throughput": 4301.05, "total_tokens": 107422320} +{"current_steps": 88555, "total_steps": 89790, "loss": 0.4556, "lr": 2.8855072924643955e-08, "epoch": 9.86245684374652, "percentage": 98.62, "elapsed_time": "6:56:17", "remaining_time": "0:05:48", "throughput": 4301.06, "total_tokens": 107428240} +{"current_steps": 88560, "total_steps": 89790, "loss": 0.4613, "lr": 2.86221343079901e-08, "epoch": 9.863013698630137, "percentage": 98.63, "elapsed_time": "6:56:18", "remaining_time": "0:05:46", "throughput": 4301.08, "total_tokens": 107433648} +{"current_steps": 88565, "total_steps": 89790, "loss": 0.4532, "lr": 2.839013919001543e-08, "epoch": 9.863570553513755, "percentage": 98.64, "elapsed_time": "6:56:19", "remaining_time": "0:05:45", "throughput": 4301.1, "total_tokens": 107439728} +{"current_steps": 88570, "total_steps": 89790, "loss": 0.456, "lr": 2.815908757948793e-08, "epoch": 9.864127408397371, "percentage": 98.64, "elapsed_time": "6:56:20", "remaining_time": "0:05:44", "throughput": 4301.12, "total_tokens": 107445872} +{"current_steps": 88575, "total_steps": 89790, "loss": 0.4607, "lr": 2.792897948513673e-08, "epoch": 9.864684263280989, "percentage": 98.65, "elapsed_time": "6:56:22", "remaining_time": "0:05:42", "throughput": 4301.14, "total_tokens": 107451600} +{"current_steps": 88580, "total_steps": 89790, "loss": 0.4679, "lr": 2.7699814915654875e-08, "epoch": 9.865241118164606, "percentage": 98.65, "elapsed_time": "6:56:23", "remaining_time": "0:05:41", "throughput": 4301.16, "total_tokens": 107457648} +{"current_steps": 88585, "total_steps": 89790, "loss": 0.4652, "lr": 2.7471593879702107e-08, "epoch": 9.865797973048224, "percentage": 98.66, "elapsed_time": "6:56:24", "remaining_time": "0:05:39", "throughput": 4301.19, "total_tokens": 107463824} +{"current_steps": 88590, "total_steps": 89790, "loss": 0.4549, "lr": 2.7244316385899304e-08, "epoch": 9.866354827931842, "percentage": 98.66, "elapsed_time": "6:56:25", "remaining_time": "0:05:38", "throughput": 4301.21, "total_tokens": 107469904} +{"current_steps": 88595, "total_steps": 89790, "loss": 0.4647, "lr": 2.701798244283682e-08, "epoch": 9.866911682815457, "percentage": 98.67, "elapsed_time": "6:56:27", "remaining_time": "0:05:37", "throughput": 4301.23, "total_tokens": 107475888} +{"current_steps": 88600, "total_steps": 89790, "loss": 0.4574, "lr": 2.6792592059066145e-08, "epoch": 9.867468537699075, "percentage": 98.67, "elapsed_time": "6:56:28", "remaining_time": "0:05:35", "throughput": 4301.25, "total_tokens": 107482032} +{"current_steps": 88605, "total_steps": 89790, "loss": 0.4499, "lr": 2.6568145243099918e-08, "epoch": 9.868025392582693, "percentage": 98.68, "elapsed_time": "6:56:29", "remaining_time": "0:05:34", "throughput": 4301.27, "total_tokens": 107488016} +{"current_steps": 88610, "total_steps": 89790, "loss": 0.4586, "lr": 2.634464200342024e-08, "epoch": 9.86858224746631, "percentage": 98.69, "elapsed_time": "6:56:31", "remaining_time": "0:05:32", "throughput": 4301.29, "total_tokens": 107493840} +{"current_steps": 88615, "total_steps": 89790, "loss": 0.4624, "lr": 2.612208234847313e-08, "epoch": 9.869139102349928, "percentage": 98.69, "elapsed_time": "6:56:32", "remaining_time": "0:05:31", "throughput": 4301.31, "total_tokens": 107499952} +{"current_steps": 88620, "total_steps": 89790, "loss": 0.4668, "lr": 2.5900466286665758e-08, "epoch": 9.869695957233546, "percentage": 98.7, "elapsed_time": "6:56:33", "remaining_time": "0:05:29", "throughput": 4301.33, "total_tokens": 107506128} +{"current_steps": 88625, "total_steps": 89790, "loss": 0.4653, "lr": 2.567979382637198e-08, "epoch": 9.870252812117162, "percentage": 98.7, "elapsed_time": "6:56:35", "remaining_time": "0:05:28", "throughput": 4301.35, "total_tokens": 107512400} +{"current_steps": 88630, "total_steps": 89790, "loss": 0.4646, "lr": 2.546006497593234e-08, "epoch": 9.87080966700078, "percentage": 98.71, "elapsed_time": "6:56:36", "remaining_time": "0:05:27", "throughput": 4301.38, "total_tokens": 107518544} +{"current_steps": 88635, "total_steps": 89790, "loss": 0.4577, "lr": 2.5241279743642988e-08, "epoch": 9.871366521884397, "percentage": 98.71, "elapsed_time": "6:56:37", "remaining_time": "0:05:25", "throughput": 4301.4, "total_tokens": 107524528} +{"current_steps": 88640, "total_steps": 89790, "loss": 0.4543, "lr": 2.502343813777508e-08, "epoch": 9.871923376768015, "percentage": 98.72, "elapsed_time": "6:56:38", "remaining_time": "0:05:24", "throughput": 4301.42, "total_tokens": 107530480} +{"current_steps": 88645, "total_steps": 89790, "loss": 0.4647, "lr": 2.4806540166558144e-08, "epoch": 9.872480231651632, "percentage": 98.72, "elapsed_time": "6:56:40", "remaining_time": "0:05:22", "throughput": 4301.44, "total_tokens": 107536560} +{"current_steps": 88650, "total_steps": 89790, "loss": 0.4382, "lr": 2.459058583818563e-08, "epoch": 9.873037086535248, "percentage": 98.73, "elapsed_time": "6:56:41", "remaining_time": "0:05:21", "throughput": 4301.46, "total_tokens": 107542320} +{"current_steps": 88655, "total_steps": 89790, "loss": 0.4692, "lr": 2.437557516082045e-08, "epoch": 9.873593941418866, "percentage": 98.74, "elapsed_time": "6:56:42", "remaining_time": "0:05:20", "throughput": 4301.48, "total_tokens": 107548336} +{"current_steps": 88660, "total_steps": 89790, "loss": 0.4616, "lr": 2.416150814258389e-08, "epoch": 9.874150796302484, "percentage": 98.74, "elapsed_time": "6:56:43", "remaining_time": "0:05:18", "throughput": 4301.5, "total_tokens": 107554448} +{"current_steps": 88665, "total_steps": 89790, "loss": 0.4672, "lr": 2.3948384791563916e-08, "epoch": 9.874707651186101, "percentage": 98.75, "elapsed_time": "6:56:45", "remaining_time": "0:05:17", "throughput": 4301.52, "total_tokens": 107560432} +{"current_steps": 88670, "total_steps": 89790, "loss": 0.4682, "lr": 2.3736205115812427e-08, "epoch": 9.875264506069719, "percentage": 98.75, "elapsed_time": "6:56:46", "remaining_time": "0:05:15", "throughput": 4301.54, "total_tokens": 107566768} +{"current_steps": 88675, "total_steps": 89790, "loss": 0.454, "lr": 2.352496912335078e-08, "epoch": 9.875821360953335, "percentage": 98.76, "elapsed_time": "6:56:47", "remaining_time": "0:05:14", "throughput": 4301.57, "total_tokens": 107573296} +{"current_steps": 88680, "total_steps": 89790, "loss": 0.4681, "lr": 2.3314676822153158e-08, "epoch": 9.876378215836953, "percentage": 98.76, "elapsed_time": "6:56:49", "remaining_time": "0:05:13", "throughput": 4301.59, "total_tokens": 107579504} +{"current_steps": 88685, "total_steps": 89790, "loss": 0.4544, "lr": 2.310532822017153e-08, "epoch": 9.87693507072057, "percentage": 98.77, "elapsed_time": "6:56:50", "remaining_time": "0:05:11", "throughput": 4301.61, "total_tokens": 107585584} +{"current_steps": 88690, "total_steps": 89790, "loss": 0.4547, "lr": 2.289692332531068e-08, "epoch": 9.877491925604188, "percentage": 98.77, "elapsed_time": "6:56:51", "remaining_time": "0:05:10", "throughput": 4301.63, "total_tokens": 107591472} +{"current_steps": 88695, "total_steps": 89790, "loss": 0.4667, "lr": 2.2689462145450424e-08, "epoch": 9.878048780487806, "percentage": 98.78, "elapsed_time": "6:56:53", "remaining_time": "0:05:08", "throughput": 4301.65, "total_tokens": 107597616} +{"current_steps": 88700, "total_steps": 89790, "loss": 0.4622, "lr": 2.248294468842338e-08, "epoch": 9.878605635371422, "percentage": 98.79, "elapsed_time": "6:56:54", "remaining_time": "0:05:07", "throughput": 4301.68, "total_tokens": 107604048} +{"current_steps": 88705, "total_steps": 89790, "loss": 0.4573, "lr": 2.2277370962034416e-08, "epoch": 9.87916249025504, "percentage": 98.79, "elapsed_time": "6:56:55", "remaining_time": "0:05:05", "throughput": 4301.7, "total_tokens": 107610096} +{"current_steps": 88710, "total_steps": 89790, "loss": 0.454, "lr": 2.207274097405232e-08, "epoch": 9.879719345138657, "percentage": 98.8, "elapsed_time": "6:56:57", "remaining_time": "0:05:04", "throughput": 4301.72, "total_tokens": 107616336} +{"current_steps": 88715, "total_steps": 89790, "loss": 0.4537, "lr": 2.1869054732209792e-08, "epoch": 9.880276200022275, "percentage": 98.8, "elapsed_time": "6:56:58", "remaining_time": "0:05:03", "throughput": 4301.74, "total_tokens": 107622416} +{"current_steps": 88720, "total_steps": 89790, "loss": 0.4599, "lr": 2.1666312244197905e-08, "epoch": 9.880833054905892, "percentage": 98.81, "elapsed_time": "6:56:59", "remaining_time": "0:05:01", "throughput": 4301.77, "total_tokens": 107628624} +{"current_steps": 88725, "total_steps": 89790, "loss": 0.4711, "lr": 2.146451351768275e-08, "epoch": 9.881389909789508, "percentage": 98.81, "elapsed_time": "6:57:00", "remaining_time": "0:05:00", "throughput": 4301.78, "total_tokens": 107634608} +{"current_steps": 88730, "total_steps": 89790, "loss": 0.4595, "lr": 2.126365856028323e-08, "epoch": 9.881946764673126, "percentage": 98.82, "elapsed_time": "6:57:02", "remaining_time": "0:04:58", "throughput": 4301.8, "total_tokens": 107640464} +{"current_steps": 88735, "total_steps": 89790, "loss": 0.4535, "lr": 2.106374737959049e-08, "epoch": 9.882503619556744, "percentage": 98.83, "elapsed_time": "6:57:03", "remaining_time": "0:04:57", "throughput": 4301.83, "total_tokens": 107646928} +{"current_steps": 88740, "total_steps": 89790, "loss": 0.4653, "lr": 2.086477998315961e-08, "epoch": 9.883060474440361, "percentage": 98.83, "elapsed_time": "6:57:04", "remaining_time": "0:04:56", "throughput": 4301.85, "total_tokens": 107652816} +{"current_steps": 88745, "total_steps": 89790, "loss": 0.4476, "lr": 2.066675637850679e-08, "epoch": 9.883617329323979, "percentage": 98.84, "elapsed_time": "6:57:06", "remaining_time": "0:04:54", "throughput": 4301.87, "total_tokens": 107658992} +{"current_steps": 88750, "total_steps": 89790, "loss": 0.4585, "lr": 2.0469676573114936e-08, "epoch": 9.884174184207595, "percentage": 98.84, "elapsed_time": "6:57:07", "remaining_time": "0:04:53", "throughput": 4301.9, "total_tokens": 107665296} +{"current_steps": 88755, "total_steps": 89790, "loss": 0.444, "lr": 2.0273540574428094e-08, "epoch": 9.884731039091212, "percentage": 98.85, "elapsed_time": "6:57:08", "remaining_time": "0:04:51", "throughput": 4301.92, "total_tokens": 107671856} +{"current_steps": 88760, "total_steps": 89790, "loss": 0.4563, "lr": 2.007834838985978e-08, "epoch": 9.88528789397483, "percentage": 98.85, "elapsed_time": "6:57:10", "remaining_time": "0:04:50", "throughput": 4301.94, "total_tokens": 107677968} +{"current_steps": 88765, "total_steps": 89790, "loss": 0.4566, "lr": 1.988410002678187e-08, "epoch": 9.885844748858448, "percentage": 98.86, "elapsed_time": "6:57:11", "remaining_time": "0:04:49", "throughput": 4301.96, "total_tokens": 107683696} +{"current_steps": 88770, "total_steps": 89790, "loss": 0.4645, "lr": 1.9690795492538493e-08, "epoch": 9.886401603742065, "percentage": 98.86, "elapsed_time": "6:57:12", "remaining_time": "0:04:47", "throughput": 4301.98, "total_tokens": 107689680} +{"current_steps": 88775, "total_steps": 89790, "loss": 0.4731, "lr": 1.949843479442659e-08, "epoch": 9.886958458625681, "percentage": 98.87, "elapsed_time": "6:57:13", "remaining_time": "0:04:46", "throughput": 4302.0, "total_tokens": 107695952} +{"current_steps": 88780, "total_steps": 89790, "loss": 0.4638, "lr": 1.9307017939720895e-08, "epoch": 9.887515313509299, "percentage": 98.88, "elapsed_time": "6:57:15", "remaining_time": "0:04:44", "throughput": 4302.03, "total_tokens": 107702160} +{"current_steps": 88785, "total_steps": 89790, "loss": 0.4399, "lr": 1.911654493564896e-08, "epoch": 9.888072168392917, "percentage": 98.88, "elapsed_time": "6:57:16", "remaining_time": "0:04:43", "throughput": 4302.05, "total_tokens": 107708336} +{"current_steps": 88790, "total_steps": 89790, "loss": 0.46, "lr": 1.892701578940781e-08, "epoch": 9.888629023276534, "percentage": 98.89, "elapsed_time": "6:57:17", "remaining_time": "0:04:41", "throughput": 4302.07, "total_tokens": 107714032} +{"current_steps": 88795, "total_steps": 89790, "loss": 0.4665, "lr": 1.8738430508161155e-08, "epoch": 9.889185878160152, "percentage": 98.89, "elapsed_time": "6:57:18", "remaining_time": "0:04:40", "throughput": 4302.09, "total_tokens": 107719728} +{"current_steps": 88800, "total_steps": 89790, "loss": 0.4647, "lr": 1.855078909903385e-08, "epoch": 9.889742733043768, "percentage": 98.9, "elapsed_time": "6:57:20", "remaining_time": "0:04:39", "throughput": 4302.11, "total_tokens": 107726032} +{"current_steps": 88805, "total_steps": 89790, "loss": 0.4529, "lr": 1.8364091569114672e-08, "epoch": 9.890299587927386, "percentage": 98.9, "elapsed_time": "6:57:21", "remaining_time": "0:04:37", "throughput": 4302.13, "total_tokens": 107731888} +{"current_steps": 88810, "total_steps": 89790, "loss": 0.4577, "lr": 1.8178337925456314e-08, "epoch": 9.890856442811003, "percentage": 98.91, "elapsed_time": "6:57:22", "remaining_time": "0:04:36", "throughput": 4302.15, "total_tokens": 107738160} +{"current_steps": 88815, "total_steps": 89790, "loss": 0.4567, "lr": 1.7993528175078157e-08, "epoch": 9.891413297694621, "percentage": 98.91, "elapsed_time": "6:57:24", "remaining_time": "0:04:34", "throughput": 4302.17, "total_tokens": 107744304} +{"current_steps": 88820, "total_steps": 89790, "loss": 0.4516, "lr": 1.7809662324963505e-08, "epoch": 9.891970152578239, "percentage": 98.92, "elapsed_time": "6:57:25", "remaining_time": "0:04:33", "throughput": 4302.19, "total_tokens": 107750448} +{"current_steps": 88825, "total_steps": 89790, "loss": 0.4524, "lr": 1.762674038205958e-08, "epoch": 9.892527007461855, "percentage": 98.93, "elapsed_time": "6:57:26", "remaining_time": "0:04:32", "throughput": 4302.21, "total_tokens": 107756144} +{"current_steps": 88830, "total_steps": 89790, "loss": 0.4623, "lr": 1.7444762353277522e-08, "epoch": 9.893083862345472, "percentage": 98.93, "elapsed_time": "6:57:27", "remaining_time": "0:04:30", "throughput": 4302.24, "total_tokens": 107762256} +{"current_steps": 88835, "total_steps": 89790, "loss": 0.4601, "lr": 1.726372824549516e-08, "epoch": 9.89364071722909, "percentage": 98.94, "elapsed_time": "6:57:29", "remaining_time": "0:04:29", "throughput": 4302.25, "total_tokens": 107768176} +{"current_steps": 88840, "total_steps": 89790, "loss": 0.461, "lr": 1.7083638065545914e-08, "epoch": 9.894197572112708, "percentage": 98.94, "elapsed_time": "6:57:30", "remaining_time": "0:04:27", "throughput": 4302.27, "total_tokens": 107774224} +{"current_steps": 88845, "total_steps": 89790, "loss": 0.4633, "lr": 1.690449182024101e-08, "epoch": 9.894754426996325, "percentage": 98.95, "elapsed_time": "6:57:31", "remaining_time": "0:04:26", "throughput": 4302.29, "total_tokens": 107780400} +{"current_steps": 88850, "total_steps": 89790, "loss": 0.4582, "lr": 1.6726289516347248e-08, "epoch": 9.895311281879943, "percentage": 98.95, "elapsed_time": "6:57:33", "remaining_time": "0:04:25", "throughput": 4302.32, "total_tokens": 107786512} +{"current_steps": 88855, "total_steps": 89790, "loss": 0.4566, "lr": 1.6549031160595364e-08, "epoch": 9.895868136763559, "percentage": 98.96, "elapsed_time": "6:57:34", "remaining_time": "0:04:23", "throughput": 4302.34, "total_tokens": 107792624} +{"current_steps": 88860, "total_steps": 89790, "loss": 0.4559, "lr": 1.6372716759685546e-08, "epoch": 9.896424991647176, "percentage": 98.96, "elapsed_time": "6:57:35", "remaining_time": "0:04:22", "throughput": 4302.36, "total_tokens": 107798736} +{"current_steps": 88865, "total_steps": 89790, "loss": 0.4593, "lr": 1.619734632027914e-08, "epoch": 9.896981846530794, "percentage": 98.97, "elapsed_time": "6:57:36", "remaining_time": "0:04:20", "throughput": 4302.39, "total_tokens": 107804848} +{"current_steps": 88870, "total_steps": 89790, "loss": 0.4602, "lr": 1.6022919848998618e-08, "epoch": 9.897538701414412, "percentage": 98.98, "elapsed_time": "6:57:38", "remaining_time": "0:04:19", "throughput": 4302.4, "total_tokens": 107810672} +{"current_steps": 88875, "total_steps": 89790, "loss": 0.4567, "lr": 1.5849437352438712e-08, "epoch": 9.89809555629803, "percentage": 98.98, "elapsed_time": "6:57:39", "remaining_time": "0:04:17", "throughput": 4302.42, "total_tokens": 107816528} +{"current_steps": 88880, "total_steps": 89790, "loss": 0.4687, "lr": 1.5676898837155285e-08, "epoch": 9.898652411181645, "percentage": 98.99, "elapsed_time": "6:57:40", "remaining_time": "0:04:16", "throughput": 4302.44, "total_tokens": 107822480} +{"current_steps": 88885, "total_steps": 89790, "loss": 0.4673, "lr": 1.5505304309662573e-08, "epoch": 9.899209266065263, "percentage": 98.99, "elapsed_time": "6:57:42", "remaining_time": "0:04:15", "throughput": 4302.47, "total_tokens": 107828720} +{"current_steps": 88890, "total_steps": 89790, "loss": 0.4493, "lr": 1.533465377644705e-08, "epoch": 9.89976612094888, "percentage": 99.0, "elapsed_time": "6:57:43", "remaining_time": "0:04:13", "throughput": 4302.49, "total_tokens": 107834896} +{"current_steps": 88895, "total_steps": 89790, "loss": 0.4503, "lr": 1.5164947243953566e-08, "epoch": 9.900322975832498, "percentage": 99.0, "elapsed_time": "6:57:44", "remaining_time": "0:04:12", "throughput": 4302.52, "total_tokens": 107840752} +{"current_steps": 88900, "total_steps": 89790, "loss": 0.4738, "lr": 1.4996184718599204e-08, "epoch": 9.900879830716116, "percentage": 99.01, "elapsed_time": "6:57:45", "remaining_time": "0:04:10", "throughput": 4302.54, "total_tokens": 107846768} +{"current_steps": 88905, "total_steps": 89790, "loss": 0.4596, "lr": 1.4828366206753875e-08, "epoch": 9.901436685599732, "percentage": 99.01, "elapsed_time": "6:57:47", "remaining_time": "0:04:09", "throughput": 4302.56, "total_tokens": 107852848} +{"current_steps": 88910, "total_steps": 89790, "loss": 0.455, "lr": 1.4661491714762498e-08, "epoch": 9.90199354048335, "percentage": 99.02, "elapsed_time": "6:57:48", "remaining_time": "0:04:08", "throughput": 4302.58, "total_tokens": 107859056} +{"current_steps": 88915, "total_steps": 89790, "loss": 0.4593, "lr": 1.4495561248931145e-08, "epoch": 9.902550395366967, "percentage": 99.03, "elapsed_time": "6:57:49", "remaining_time": "0:04:06", "throughput": 4302.6, "total_tokens": 107865104} +{"current_steps": 88920, "total_steps": 89790, "loss": 0.4633, "lr": 1.433057481552702e-08, "epoch": 9.903107250250585, "percentage": 99.03, "elapsed_time": "6:57:50", "remaining_time": "0:04:05", "throughput": 4302.62, "total_tokens": 107870896} +{"current_steps": 88925, "total_steps": 89790, "loss": 0.4675, "lr": 1.4166532420784028e-08, "epoch": 9.903664105134203, "percentage": 99.04, "elapsed_time": "6:57:52", "remaining_time": "0:04:03", "throughput": 4302.64, "total_tokens": 107877104} +{"current_steps": 88930, "total_steps": 89790, "loss": 0.4626, "lr": 1.4003434070902766e-08, "epoch": 9.904220960017819, "percentage": 99.04, "elapsed_time": "6:57:53", "remaining_time": "0:04:02", "throughput": 4302.66, "total_tokens": 107882640} +{"current_steps": 88935, "total_steps": 89790, "loss": 0.4564, "lr": 1.3841279772039417e-08, "epoch": 9.904777814901436, "percentage": 99.05, "elapsed_time": "6:57:54", "remaining_time": "0:04:01", "throughput": 4302.68, "total_tokens": 107888688} +{"current_steps": 88940, "total_steps": 89790, "loss": 0.4665, "lr": 1.3680069530327966e-08, "epoch": 9.905334669785054, "percentage": 99.05, "elapsed_time": "6:57:56", "remaining_time": "0:03:59", "throughput": 4302.71, "total_tokens": 107894864} +{"current_steps": 88945, "total_steps": 89790, "loss": 0.4736, "lr": 1.3519803351852434e-08, "epoch": 9.905891524668672, "percentage": 99.06, "elapsed_time": "6:57:57", "remaining_time": "0:03:58", "throughput": 4302.73, "total_tokens": 107900912} +{"current_steps": 88950, "total_steps": 89790, "loss": 0.4648, "lr": 1.3360481242674638e-08, "epoch": 9.90644837955229, "percentage": 99.06, "elapsed_time": "6:57:58", "remaining_time": "0:03:56", "throughput": 4302.75, "total_tokens": 107907120} +{"current_steps": 88955, "total_steps": 89790, "loss": 0.4568, "lr": 1.3202103208809213e-08, "epoch": 9.907005234435905, "percentage": 99.07, "elapsed_time": "6:57:59", "remaining_time": "0:03:55", "throughput": 4302.77, "total_tokens": 107913200} +{"current_steps": 88960, "total_steps": 89790, "loss": 0.464, "lr": 1.3044669256245812e-08, "epoch": 9.907562089319523, "percentage": 99.08, "elapsed_time": "6:58:01", "remaining_time": "0:03:54", "throughput": 4302.79, "total_tokens": 107919088} +{"current_steps": 88965, "total_steps": 89790, "loss": 0.4652, "lr": 1.2888179390926903e-08, "epoch": 9.90811894420314, "percentage": 99.08, "elapsed_time": "6:58:02", "remaining_time": "0:03:52", "throughput": 4302.81, "total_tokens": 107925168} +{"current_steps": 88970, "total_steps": 89790, "loss": 0.4493, "lr": 1.2732633618767197e-08, "epoch": 9.908675799086758, "percentage": 99.09, "elapsed_time": "6:58:03", "remaining_time": "0:03:51", "throughput": 4302.83, "total_tokens": 107931440} +{"current_steps": 88975, "total_steps": 89790, "loss": 0.4634, "lr": 1.257803194564533e-08, "epoch": 9.909232653970376, "percentage": 99.09, "elapsed_time": "6:58:04", "remaining_time": "0:03:49", "throughput": 4302.85, "total_tokens": 107936496} +{"current_steps": 88980, "total_steps": 89790, "loss": 0.4611, "lr": 1.2424374377403847e-08, "epoch": 9.909789508853994, "percentage": 99.1, "elapsed_time": "6:58:06", "remaining_time": "0:03:48", "throughput": 4302.87, "total_tokens": 107942640} +{"current_steps": 88985, "total_steps": 89790, "loss": 0.4579, "lr": 1.2271660919843664e-08, "epoch": 9.91034636373761, "percentage": 99.1, "elapsed_time": "6:58:07", "remaining_time": "0:03:46", "throughput": 4302.89, "total_tokens": 107948912} +{"current_steps": 88990, "total_steps": 89790, "loss": 0.4636, "lr": 1.2119891578735166e-08, "epoch": 9.910903218621227, "percentage": 99.11, "elapsed_time": "6:58:08", "remaining_time": "0:03:45", "throughput": 4302.91, "total_tokens": 107955056} +{"current_steps": 88995, "total_steps": 89790, "loss": 0.4624, "lr": 1.1969066359818204e-08, "epoch": 9.911460073504845, "percentage": 99.11, "elapsed_time": "6:58:10", "remaining_time": "0:03:44", "throughput": 4302.93, "total_tokens": 107960464} +{"current_steps": 89000, "total_steps": 89790, "loss": 0.4698, "lr": 1.1819185268788225e-08, "epoch": 9.912016928388462, "percentage": 99.12, "elapsed_time": "6:58:11", "remaining_time": "0:03:42", "throughput": 4302.95, "total_tokens": 107966736} +{"current_steps": 89005, "total_steps": 89790, "loss": 0.4686, "lr": 1.1670248311304589e-08, "epoch": 9.91257378327208, "percentage": 99.13, "elapsed_time": "6:58:12", "remaining_time": "0:03:41", "throughput": 4302.97, "total_tokens": 107972752} +{"current_steps": 89010, "total_steps": 89790, "loss": 0.4577, "lr": 1.1522255493001677e-08, "epoch": 9.913130638155696, "percentage": 99.13, "elapsed_time": "6:58:13", "remaining_time": "0:03:39", "throughput": 4302.99, "total_tokens": 107979088} +{"current_steps": 89015, "total_steps": 89790, "loss": 0.4536, "lr": 1.1375206819463913e-08, "epoch": 9.913687493039314, "percentage": 99.14, "elapsed_time": "6:58:15", "remaining_time": "0:03:38", "throughput": 4303.02, "total_tokens": 107985200} +{"current_steps": 89020, "total_steps": 89790, "loss": 0.4635, "lr": 1.1229102296253512e-08, "epoch": 9.914244347922931, "percentage": 99.14, "elapsed_time": "6:58:16", "remaining_time": "0:03:37", "throughput": 4303.04, "total_tokens": 107991216} +{"current_steps": 89025, "total_steps": 89790, "loss": 0.4637, "lr": 1.1083941928888287e-08, "epoch": 9.914801202806549, "percentage": 99.15, "elapsed_time": "6:58:17", "remaining_time": "0:03:35", "throughput": 4303.06, "total_tokens": 107997104} +{"current_steps": 89030, "total_steps": 89790, "loss": 0.4577, "lr": 1.0939725722849959e-08, "epoch": 9.915358057690167, "percentage": 99.15, "elapsed_time": "6:58:19", "remaining_time": "0:03:34", "throughput": 4303.08, "total_tokens": 108003056} +{"current_steps": 89035, "total_steps": 89790, "loss": 0.4629, "lr": 1.07964536835925e-08, "epoch": 9.915914912573783, "percentage": 99.16, "elapsed_time": "6:58:20", "remaining_time": "0:03:32", "throughput": 4303.1, "total_tokens": 108009264} +{"current_steps": 89040, "total_steps": 89790, "loss": 0.4562, "lr": 1.0654125816525473e-08, "epoch": 9.9164717674574, "percentage": 99.16, "elapsed_time": "6:58:21", "remaining_time": "0:03:31", "throughput": 4303.12, "total_tokens": 108015504} +{"current_steps": 89045, "total_steps": 89790, "loss": 0.4702, "lr": 1.0512742127027908e-08, "epoch": 9.917028622341018, "percentage": 99.17, "elapsed_time": "6:58:22", "remaining_time": "0:03:30", "throughput": 4303.15, "total_tokens": 108021488} +{"current_steps": 89050, "total_steps": 89790, "loss": 0.4576, "lr": 1.0372302620442754e-08, "epoch": 9.917585477224636, "percentage": 99.18, "elapsed_time": "6:58:24", "remaining_time": "0:03:28", "throughput": 4303.17, "total_tokens": 108027696} +{"current_steps": 89055, "total_steps": 89790, "loss": 0.4578, "lr": 1.0232807302074099e-08, "epoch": 9.918142332108253, "percentage": 99.18, "elapsed_time": "6:58:25", "remaining_time": "0:03:27", "throughput": 4303.19, "total_tokens": 108033872} +{"current_steps": 89060, "total_steps": 89790, "loss": 0.4556, "lr": 1.0094256177195504e-08, "epoch": 9.91869918699187, "percentage": 99.19, "elapsed_time": "6:58:26", "remaining_time": "0:03:25", "throughput": 4303.2, "total_tokens": 108039728} +{"current_steps": 89065, "total_steps": 89790, "loss": 0.4641, "lr": 9.956649251038897e-09, "epoch": 9.919256041875487, "percentage": 99.19, "elapsed_time": "6:58:27", "remaining_time": "0:03:24", "throughput": 4303.22, "total_tokens": 108045168} +{"current_steps": 89070, "total_steps": 89790, "loss": 0.4524, "lr": 9.819986528802894e-09, "epoch": 9.919812896759105, "percentage": 99.2, "elapsed_time": "6:58:29", "remaining_time": "0:03:22", "throughput": 4303.24, "total_tokens": 108051248} +{"current_steps": 89075, "total_steps": 89790, "loss": 0.4551, "lr": 9.684268015655585e-09, "epoch": 9.920369751642722, "percentage": 99.2, "elapsed_time": "6:58:30", "remaining_time": "0:03:21", "throughput": 4303.26, "total_tokens": 108057136} +{"current_steps": 89080, "total_steps": 89790, "loss": 0.4475, "lr": 9.549493716720647e-09, "epoch": 9.92092660652634, "percentage": 99.21, "elapsed_time": "6:58:31", "remaining_time": "0:03:20", "throughput": 4303.28, "total_tokens": 108062864} +{"current_steps": 89085, "total_steps": 89790, "loss": 0.4637, "lr": 9.415663637091232e-09, "epoch": 9.921483461409956, "percentage": 99.21, "elapsed_time": "6:58:33", "remaining_time": "0:03:18", "throughput": 4303.3, "total_tokens": 108069200} +{"current_steps": 89090, "total_steps": 89790, "loss": 0.4449, "lr": 9.282777781824403e-09, "epoch": 9.922040316293574, "percentage": 99.22, "elapsed_time": "6:58:34", "remaining_time": "0:03:17", "throughput": 4303.32, "total_tokens": 108075600} +{"current_steps": 89095, "total_steps": 89790, "loss": 0.457, "lr": 9.150836155941146e-09, "epoch": 9.922597171177191, "percentage": 99.23, "elapsed_time": "6:58:35", "remaining_time": "0:03:15", "throughput": 4303.35, "total_tokens": 108081776} +{"current_steps": 89100, "total_steps": 89790, "loss": 0.464, "lr": 9.019838764429133e-09, "epoch": 9.923154026060809, "percentage": 99.23, "elapsed_time": "6:58:37", "remaining_time": "0:03:14", "throughput": 4303.37, "total_tokens": 108087952} +{"current_steps": 89105, "total_steps": 89790, "loss": 0.4671, "lr": 8.889785612231639e-09, "epoch": 9.923710880944427, "percentage": 99.24, "elapsed_time": "6:58:38", "remaining_time": "0:03:13", "throughput": 4303.39, "total_tokens": 108093840} +{"current_steps": 89110, "total_steps": 89790, "loss": 0.4555, "lr": 8.760676704266946e-09, "epoch": 9.924267735828042, "percentage": 99.24, "elapsed_time": "6:58:39", "remaining_time": "0:03:11", "throughput": 4303.41, "total_tokens": 108099728} +{"current_steps": 89115, "total_steps": 89790, "loss": 0.4564, "lr": 8.632512045411711e-09, "epoch": 9.92482459071166, "percentage": 99.25, "elapsed_time": "6:58:40", "remaining_time": "0:03:10", "throughput": 4303.43, "total_tokens": 108106128} +{"current_steps": 89120, "total_steps": 89790, "loss": 0.4603, "lr": 8.505291640509282e-09, "epoch": 9.925381445595278, "percentage": 99.25, "elapsed_time": "6:58:42", "remaining_time": "0:03:08", "throughput": 4303.45, "total_tokens": 108112080} +{"current_steps": 89125, "total_steps": 89790, "loss": 0.4723, "lr": 8.379015494366927e-09, "epoch": 9.925938300478895, "percentage": 99.26, "elapsed_time": "6:58:43", "remaining_time": "0:03:07", "throughput": 4303.47, "total_tokens": 108118256} +{"current_steps": 89130, "total_steps": 89790, "loss": 0.4689, "lr": 8.253683611755825e-09, "epoch": 9.926495155362513, "percentage": 99.26, "elapsed_time": "6:58:44", "remaining_time": "0:03:06", "throughput": 4303.5, "total_tokens": 108124752} +{"current_steps": 89135, "total_steps": 89790, "loss": 0.4521, "lr": 8.129295997408304e-09, "epoch": 9.927052010246129, "percentage": 99.27, "elapsed_time": "6:58:46", "remaining_time": "0:03:04", "throughput": 4303.52, "total_tokens": 108131056} +{"current_steps": 89140, "total_steps": 89790, "loss": 0.4618, "lr": 8.005852656026159e-09, "epoch": 9.927608865129747, "percentage": 99.28, "elapsed_time": "6:58:47", "remaining_time": "0:03:03", "throughput": 4303.54, "total_tokens": 108136816} +{"current_steps": 89145, "total_steps": 89790, "loss": 0.4631, "lr": 7.8833535922751e-09, "epoch": 9.928165720013364, "percentage": 99.28, "elapsed_time": "6:58:48", "remaining_time": "0:03:01", "throughput": 4303.56, "total_tokens": 108143024} +{"current_steps": 89150, "total_steps": 89790, "loss": 0.4549, "lr": 7.761798810781984e-09, "epoch": 9.928722574896982, "percentage": 99.29, "elapsed_time": "6:58:50", "remaining_time": "0:03:00", "throughput": 4303.59, "total_tokens": 108149392} +{"current_steps": 89155, "total_steps": 89790, "loss": 0.4675, "lr": 7.641188316140358e-09, "epoch": 9.9292794297806, "percentage": 99.29, "elapsed_time": "6:58:51", "remaining_time": "0:02:58", "throughput": 4303.61, "total_tokens": 108155728} +{"current_steps": 89160, "total_steps": 89790, "loss": 0.4595, "lr": 7.52152211290491e-09, "epoch": 9.929836284664216, "percentage": 99.3, "elapsed_time": "6:58:52", "remaining_time": "0:02:57", "throughput": 4303.63, "total_tokens": 108161648} +{"current_steps": 89165, "total_steps": 89790, "loss": 0.4644, "lr": 7.402800205599803e-09, "epoch": 9.930393139547833, "percentage": 99.3, "elapsed_time": "6:58:53", "remaining_time": "0:02:56", "throughput": 4303.66, "total_tokens": 108168016} +{"current_steps": 89170, "total_steps": 89790, "loss": 0.4705, "lr": 7.2850225987075586e-09, "epoch": 9.930949994431451, "percentage": 99.31, "elapsed_time": "6:58:55", "remaining_time": "0:02:54", "throughput": 4303.68, "total_tokens": 108174416} +{"current_steps": 89175, "total_steps": 89790, "loss": 0.4396, "lr": 7.168189296682948e-09, "epoch": 9.931506849315069, "percentage": 99.32, "elapsed_time": "6:58:56", "remaining_time": "0:02:53", "throughput": 4303.71, "total_tokens": 108180720} +{"current_steps": 89180, "total_steps": 89790, "loss": 0.4562, "lr": 7.052300303936332e-09, "epoch": 9.932063704198686, "percentage": 99.32, "elapsed_time": "6:58:57", "remaining_time": "0:02:51", "throughput": 4303.73, "total_tokens": 108186800} +{"current_steps": 89185, "total_steps": 89790, "loss": 0.4682, "lr": 6.9373556248475415e-09, "epoch": 9.932620559082302, "percentage": 99.33, "elapsed_time": "6:58:59", "remaining_time": "0:02:50", "throughput": 4303.75, "total_tokens": 108192688} +{"current_steps": 89190, "total_steps": 89790, "loss": 0.4553, "lr": 6.823355263760322e-09, "epoch": 9.93317741396592, "percentage": 99.33, "elapsed_time": "6:59:00", "remaining_time": "0:02:49", "throughput": 4303.77, "total_tokens": 108198960} +{"current_steps": 89195, "total_steps": 89790, "loss": 0.4675, "lr": 6.710299224979566e-09, "epoch": 9.933734268849538, "percentage": 99.34, "elapsed_time": "6:59:01", "remaining_time": "0:02:47", "throughput": 4303.79, "total_tokens": 108205232} +{"current_steps": 89200, "total_steps": 89790, "loss": 0.4538, "lr": 6.5981875127824054e-09, "epoch": 9.934291123733155, "percentage": 99.34, "elapsed_time": "6:59:03", "remaining_time": "0:02:46", "throughput": 4303.82, "total_tokens": 108211408} +{"current_steps": 89205, "total_steps": 89790, "loss": 0.4638, "lr": 6.487020131396015e-09, "epoch": 9.934847978616773, "percentage": 99.35, "elapsed_time": "6:59:04", "remaining_time": "0:02:44", "throughput": 4303.84, "total_tokens": 108217680} +{"current_steps": 89210, "total_steps": 89790, "loss": 0.4628, "lr": 6.376797085028141e-09, "epoch": 9.93540483350039, "percentage": 99.35, "elapsed_time": "6:59:05", "remaining_time": "0:02:43", "throughput": 4303.86, "total_tokens": 108223760} +{"current_steps": 89215, "total_steps": 89790, "loss": 0.4583, "lr": 6.267518377842118e-09, "epoch": 9.935961688384007, "percentage": 99.36, "elapsed_time": "6:59:07", "remaining_time": "0:02:42", "throughput": 4303.88, "total_tokens": 108230032} +{"current_steps": 89220, "total_steps": 89790, "loss": 0.4604, "lr": 6.1591840139652025e-09, "epoch": 9.936518543267624, "percentage": 99.37, "elapsed_time": "6:59:08", "remaining_time": "0:02:40", "throughput": 4303.9, "total_tokens": 108235920} +{"current_steps": 89225, "total_steps": 89790, "loss": 0.4633, "lr": 6.051793997488564e-09, "epoch": 9.937075398151242, "percentage": 99.37, "elapsed_time": "6:59:09", "remaining_time": "0:02:39", "throughput": 4303.92, "total_tokens": 108242352} +{"current_steps": 89230, "total_steps": 89790, "loss": 0.4599, "lr": 5.94534833247562e-09, "epoch": 9.93763225303486, "percentage": 99.38, "elapsed_time": "6:59:10", "remaining_time": "0:02:37", "throughput": 4303.95, "total_tokens": 108248496} +{"current_steps": 89235, "total_steps": 89790, "loss": 0.4608, "lr": 5.839847022942602e-09, "epoch": 9.938189107918477, "percentage": 99.38, "elapsed_time": "6:59:12", "remaining_time": "0:02:36", "throughput": 4303.97, "total_tokens": 108254800} +{"current_steps": 89240, "total_steps": 89790, "loss": 0.4619, "lr": 5.7352900728779856e-09, "epoch": 9.938745962802093, "percentage": 99.39, "elapsed_time": "6:59:13", "remaining_time": "0:02:35", "throughput": 4303.98, "total_tokens": 108260528} +{"current_steps": 89245, "total_steps": 89790, "loss": 0.474, "lr": 5.63167748623139e-09, "epoch": 9.93930281768571, "percentage": 99.39, "elapsed_time": "6:59:14", "remaining_time": "0:02:33", "throughput": 4304.01, "total_tokens": 108266736} +{"current_steps": 89250, "total_steps": 89790, "loss": 0.4639, "lr": 5.5290092669219025e-09, "epoch": 9.939859672569328, "percentage": 99.4, "elapsed_time": "6:59:16", "remaining_time": "0:02:32", "throughput": 4304.03, "total_tokens": 108272336} +{"current_steps": 89255, "total_steps": 89790, "loss": 0.4635, "lr": 5.4272854188214265e-09, "epoch": 9.940416527452946, "percentage": 99.4, "elapsed_time": "6:59:17", "remaining_time": "0:02:30", "throughput": 4304.05, "total_tokens": 108278576} +{"current_steps": 89260, "total_steps": 89790, "loss": 0.4534, "lr": 5.326505945779658e-09, "epoch": 9.940973382336564, "percentage": 99.41, "elapsed_time": "6:59:18", "remaining_time": "0:02:29", "throughput": 4304.08, "total_tokens": 108284976} +{"current_steps": 89265, "total_steps": 89790, "loss": 0.4621, "lr": 5.226670851599113e-09, "epoch": 9.94153023722018, "percentage": 99.42, "elapsed_time": "6:59:20", "remaining_time": "0:02:27", "throughput": 4304.1, "total_tokens": 108291216} +{"current_steps": 89270, "total_steps": 89790, "loss": 0.452, "lr": 5.127780140057325e-09, "epoch": 9.942087092103797, "percentage": 99.42, "elapsed_time": "6:59:21", "remaining_time": "0:02:26", "throughput": 4304.12, "total_tokens": 108297328} +{"current_steps": 89275, "total_steps": 89790, "loss": 0.4686, "lr": 5.029833814887419e-09, "epoch": 9.942643946987415, "percentage": 99.43, "elapsed_time": "6:59:22", "remaining_time": "0:02:25", "throughput": 4304.14, "total_tokens": 108303536} +{"current_steps": 89280, "total_steps": 89790, "loss": 0.4521, "lr": 4.932831879789213e-09, "epoch": 9.943200801871033, "percentage": 99.43, "elapsed_time": "6:59:23", "remaining_time": "0:02:23", "throughput": 4304.16, "total_tokens": 108309712} +{"current_steps": 89285, "total_steps": 89790, "loss": 0.4536, "lr": 4.836774338429218e-09, "epoch": 9.94375765675465, "percentage": 99.44, "elapsed_time": "6:59:25", "remaining_time": "0:02:22", "throughput": 4304.18, "total_tokens": 108315568} +{"current_steps": 89290, "total_steps": 89790, "loss": 0.4685, "lr": 4.741661194437863e-09, "epoch": 9.944314511638266, "percentage": 99.44, "elapsed_time": "6:59:26", "remaining_time": "0:02:20", "throughput": 4304.21, "total_tokens": 108321744} +{"current_steps": 89295, "total_steps": 89790, "loss": 0.4615, "lr": 4.647492451409497e-09, "epoch": 9.944871366521884, "percentage": 99.45, "elapsed_time": "6:59:27", "remaining_time": "0:02:19", "throughput": 4304.22, "total_tokens": 108327632} +{"current_steps": 89300, "total_steps": 89790, "loss": 0.456, "lr": 4.554268112896831e-09, "epoch": 9.945428221405502, "percentage": 99.45, "elapsed_time": "6:59:29", "remaining_time": "0:02:18", "throughput": 4304.25, "total_tokens": 108334032} +{"current_steps": 89305, "total_steps": 89790, "loss": 0.4526, "lr": 4.461988182427601e-09, "epoch": 9.94598507628912, "percentage": 99.46, "elapsed_time": "6:59:30", "remaining_time": "0:02:16", "throughput": 4304.27, "total_tokens": 108340208} +{"current_steps": 89310, "total_steps": 89790, "loss": 0.4603, "lr": 4.370652663487906e-09, "epoch": 9.946541931172737, "percentage": 99.47, "elapsed_time": "6:59:31", "remaining_time": "0:02:15", "throughput": 4304.29, "total_tokens": 108346384} +{"current_steps": 89315, "total_steps": 89790, "loss": 0.4789, "lr": 4.28026155952499e-09, "epoch": 9.947098786056353, "percentage": 99.47, "elapsed_time": "6:59:33", "remaining_time": "0:02:13", "throughput": 4304.32, "total_tokens": 108352560} +{"current_steps": 89320, "total_steps": 89790, "loss": 0.4608, "lr": 4.1908148739583375e-09, "epoch": 9.94765564093997, "percentage": 99.48, "elapsed_time": "6:59:34", "remaining_time": "0:02:12", "throughput": 4304.34, "total_tokens": 108359056} +{"current_steps": 89325, "total_steps": 89790, "loss": 0.4573, "lr": 4.102312610165804e-09, "epoch": 9.948212495823588, "percentage": 99.48, "elapsed_time": "6:59:35", "remaining_time": "0:02:11", "throughput": 4304.36, "total_tokens": 108365264} +{"current_steps": 89330, "total_steps": 89790, "loss": 0.4632, "lr": 4.01475477148916e-09, "epoch": 9.948769350707206, "percentage": 99.49, "elapsed_time": "6:59:36", "remaining_time": "0:02:09", "throughput": 4304.39, "total_tokens": 108371344} +{"current_steps": 89335, "total_steps": 89790, "loss": 0.44, "lr": 3.928141361239646e-09, "epoch": 9.949326205590824, "percentage": 99.49, "elapsed_time": "6:59:38", "remaining_time": "0:02:08", "throughput": 4304.41, "total_tokens": 108377296} +{"current_steps": 89340, "total_steps": 89790, "loss": 0.4584, "lr": 3.842472382689643e-09, "epoch": 9.949883060474441, "percentage": 99.5, "elapsed_time": "6:59:39", "remaining_time": "0:02:06", "throughput": 4304.43, "total_tokens": 108383280} +{"current_steps": 89345, "total_steps": 89790, "loss": 0.4589, "lr": 3.757747839075454e-09, "epoch": 9.950439915358057, "percentage": 99.5, "elapsed_time": "6:59:40", "remaining_time": "0:02:05", "throughput": 4304.45, "total_tokens": 108389264} +{"current_steps": 89350, "total_steps": 89790, "loss": 0.4601, "lr": 3.673967733594519e-09, "epoch": 9.950996770241675, "percentage": 99.51, "elapsed_time": "6:59:42", "remaining_time": "0:02:04", "throughput": 4304.47, "total_tokens": 108395248} +{"current_steps": 89355, "total_steps": 89790, "loss": 0.4658, "lr": 3.5911320694193007e-09, "epoch": 9.951553625125293, "percentage": 99.52, "elapsed_time": "6:59:43", "remaining_time": "0:02:02", "throughput": 4304.49, "total_tokens": 108401200} +{"current_steps": 89360, "total_steps": 89790, "loss": 0.4584, "lr": 3.5092408496750773e-09, "epoch": 9.95211048000891, "percentage": 99.52, "elapsed_time": "6:59:44", "remaining_time": "0:02:01", "throughput": 4304.51, "total_tokens": 108407344} +{"current_steps": 89365, "total_steps": 89790, "loss": 0.4582, "lr": 3.4282940774565953e-09, "epoch": 9.952667334892528, "percentage": 99.53, "elapsed_time": "6:59:45", "remaining_time": "0:01:59", "throughput": 4304.53, "total_tokens": 108413680} +{"current_steps": 89370, "total_steps": 89790, "loss": 0.4633, "lr": 3.348291755822519e-09, "epoch": 9.953224189776144, "percentage": 99.53, "elapsed_time": "6:59:47", "remaining_time": "0:01:58", "throughput": 4304.56, "total_tokens": 108419760} +{"current_steps": 89375, "total_steps": 89790, "loss": 0.4442, "lr": 3.269233887795431e-09, "epoch": 9.953781044659761, "percentage": 99.54, "elapsed_time": "6:59:48", "remaining_time": "0:01:56", "throughput": 4304.58, "total_tokens": 108425808} +{"current_steps": 89380, "total_steps": 89790, "loss": 0.459, "lr": 3.1911204763646063e-09, "epoch": 9.954337899543379, "percentage": 99.54, "elapsed_time": "6:59:49", "remaining_time": "0:01:55", "throughput": 4304.59, "total_tokens": 108431632} +{"current_steps": 89385, "total_steps": 89790, "loss": 0.4781, "lr": 3.113951524477687e-09, "epoch": 9.954894754426997, "percentage": 99.55, "elapsed_time": "6:59:51", "remaining_time": "0:01:54", "throughput": 4304.61, "total_tokens": 108437808} +{"current_steps": 89390, "total_steps": 89790, "loss": 0.4724, "lr": 3.037727035051785e-09, "epoch": 9.955451609310614, "percentage": 99.55, "elapsed_time": "6:59:52", "remaining_time": "0:01:52", "throughput": 4304.64, "total_tokens": 108444016} +{"current_steps": 89395, "total_steps": 89790, "loss": 0.4603, "lr": 2.9624470109679282e-09, "epoch": 9.95600846419423, "percentage": 99.56, "elapsed_time": "6:59:53", "remaining_time": "0:01:51", "throughput": 4304.66, "total_tokens": 108450096} +{"current_steps": 89400, "total_steps": 89790, "loss": 0.4643, "lr": 2.888111455071063e-09, "epoch": 9.956565319077848, "percentage": 99.57, "elapsed_time": "6:59:54", "remaining_time": "0:01:49", "throughput": 4304.67, "total_tokens": 108455472} +{"current_steps": 89405, "total_steps": 89790, "loss": 0.4633, "lr": 2.8147203701672784e-09, "epoch": 9.957122173961466, "percentage": 99.57, "elapsed_time": "6:59:56", "remaining_time": "0:01:48", "throughput": 4304.69, "total_tokens": 108461712} +{"current_steps": 89410, "total_steps": 89790, "loss": 0.4594, "lr": 2.742273759029357e-09, "epoch": 9.957679028845083, "percentage": 99.58, "elapsed_time": "6:59:57", "remaining_time": "0:01:47", "throughput": 4304.71, "total_tokens": 108467792} +{"current_steps": 89415, "total_steps": 89790, "loss": 0.4687, "lr": 2.6707716243967727e-09, "epoch": 9.958235883728701, "percentage": 99.58, "elapsed_time": "6:59:58", "remaining_time": "0:01:45", "throughput": 4304.74, "total_tokens": 108473808} +{"current_steps": 89420, "total_steps": 89790, "loss": 0.4615, "lr": 2.6002139689729198e-09, "epoch": 9.958792738612317, "percentage": 99.59, "elapsed_time": "6:59:59", "remaining_time": "0:01:44", "throughput": 4304.75, "total_tokens": 108479760} +{"current_steps": 89425, "total_steps": 89790, "loss": 0.4655, "lr": 2.5306007954167822e-09, "epoch": 9.959349593495935, "percentage": 99.59, "elapsed_time": "7:00:01", "remaining_time": "0:01:42", "throughput": 4304.78, "total_tokens": 108485872} +{"current_steps": 89430, "total_steps": 89790, "loss": 0.4619, "lr": 2.461932106365139e-09, "epoch": 9.959906448379552, "percentage": 99.6, "elapsed_time": "7:00:02", "remaining_time": "0:01:41", "throughput": 4304.8, "total_tokens": 108491984} +{"current_steps": 89435, "total_steps": 89790, "loss": 0.4585, "lr": 2.3942079044103615e-09, "epoch": 9.96046330326317, "percentage": 99.6, "elapsed_time": "7:00:03", "remaining_time": "0:01:40", "throughput": 4304.82, "total_tokens": 108498096} +{"current_steps": 89440, "total_steps": 89790, "loss": 0.4694, "lr": 2.327428192111514e-09, "epoch": 9.961020158146788, "percentage": 99.61, "elapsed_time": "7:00:05", "remaining_time": "0:01:38", "throughput": 4304.84, "total_tokens": 108504176} +{"current_steps": 89445, "total_steps": 89790, "loss": 0.4615, "lr": 2.2615929719915776e-09, "epoch": 9.961577013030404, "percentage": 99.62, "elapsed_time": "7:00:06", "remaining_time": "0:01:37", "throughput": 4304.86, "total_tokens": 108510288} +{"current_steps": 89450, "total_steps": 89790, "loss": 0.4619, "lr": 2.196702246537452e-09, "epoch": 9.962133867914021, "percentage": 99.62, "elapsed_time": "7:00:07", "remaining_time": "0:01:35", "throughput": 4304.88, "total_tokens": 108516464} +{"current_steps": 89455, "total_steps": 89790, "loss": 0.4689, "lr": 2.132756018199955e-09, "epoch": 9.962690722797639, "percentage": 99.63, "elapsed_time": "7:00:09", "remaining_time": "0:01:34", "throughput": 4304.9, "total_tokens": 108522800} +{"current_steps": 89460, "total_steps": 89790, "loss": 0.4622, "lr": 2.0697542893993727e-09, "epoch": 9.963247577681257, "percentage": 99.63, "elapsed_time": "7:00:10", "remaining_time": "0:01:32", "throughput": 4304.92, "total_tokens": 108528944} +{"current_steps": 89465, "total_steps": 89790, "loss": 0.4656, "lr": 2.007697062511582e-09, "epoch": 9.963804432564874, "percentage": 99.64, "elapsed_time": "7:00:11", "remaining_time": "0:01:31", "throughput": 4304.95, "total_tokens": 108534640} +{"current_steps": 89470, "total_steps": 89790, "loss": 0.465, "lr": 1.9465843398819295e-09, "epoch": 9.96436128744849, "percentage": 99.64, "elapsed_time": "7:00:12", "remaining_time": "0:01:30", "throughput": 4304.96, "total_tokens": 108540624} +{"current_steps": 89475, "total_steps": 89790, "loss": 0.4553, "lr": 1.8864161238224544e-09, "epoch": 9.964918142332108, "percentage": 99.65, "elapsed_time": "7:00:14", "remaining_time": "0:01:28", "throughput": 4304.99, "total_tokens": 108547248} +{"current_steps": 89480, "total_steps": 89790, "loss": 0.4612, "lr": 1.8271924166035625e-09, "epoch": 9.965474997215725, "percentage": 99.65, "elapsed_time": "7:00:15", "remaining_time": "0:01:27", "throughput": 4305.02, "total_tokens": 108553488} +{"current_steps": 89485, "total_steps": 89790, "loss": 0.453, "lr": 1.7689132204623538e-09, "epoch": 9.966031852099343, "percentage": 99.66, "elapsed_time": "7:00:16", "remaining_time": "0:01:25", "throughput": 4305.04, "total_tokens": 108559760} +{"current_steps": 89490, "total_steps": 89790, "loss": 0.4675, "lr": 1.7115785376053962e-09, "epoch": 9.96658870698296, "percentage": 99.67, "elapsed_time": "7:00:18", "remaining_time": "0:01:24", "throughput": 4305.06, "total_tokens": 108565744} +{"current_steps": 89495, "total_steps": 89790, "loss": 0.4686, "lr": 1.655188370194849e-09, "epoch": 9.967145561866577, "percentage": 99.67, "elapsed_time": "7:00:19", "remaining_time": "0:01:23", "throughput": 4305.08, "total_tokens": 108572080} +{"current_steps": 89500, "total_steps": 89790, "loss": 0.4633, "lr": 1.5997427203595649e-09, "epoch": 9.967702416750194, "percentage": 99.68, "elapsed_time": "7:00:20", "remaining_time": "0:01:21", "throughput": 4305.1, "total_tokens": 108577968} +{"current_steps": 89505, "total_steps": 89790, "loss": 0.4725, "lr": 1.5452415902006411e-09, "epoch": 9.968259271633812, "percentage": 99.68, "elapsed_time": "7:00:22", "remaining_time": "0:01:20", "throughput": 4305.12, "total_tokens": 108583856} +{"current_steps": 89510, "total_steps": 89790, "loss": 0.4554, "lr": 1.4916849817747659e-09, "epoch": 9.96881612651743, "percentage": 99.69, "elapsed_time": "7:00:23", "remaining_time": "0:01:18", "throughput": 4305.14, "total_tokens": 108589744} +{"current_steps": 89515, "total_steps": 89790, "loss": 0.4623, "lr": 1.4390728971025447e-09, "epoch": 9.969372981401047, "percentage": 99.69, "elapsed_time": "7:00:24", "remaining_time": "0:01:17", "throughput": 4305.16, "total_tokens": 108595856} +{"current_steps": 89520, "total_steps": 89790, "loss": 0.4703, "lr": 1.3874053381740526e-09, "epoch": 9.969929836284663, "percentage": 99.7, "elapsed_time": "7:00:25", "remaining_time": "0:01:16", "throughput": 4305.18, "total_tokens": 108601808} +{"current_steps": 89525, "total_steps": 89790, "loss": 0.4621, "lr": 1.3366823069405066e-09, "epoch": 9.970486691168281, "percentage": 99.7, "elapsed_time": "7:00:27", "remaining_time": "0:01:14", "throughput": 4305.2, "total_tokens": 108607920} +{"current_steps": 89530, "total_steps": 89790, "loss": 0.4543, "lr": 1.2869038053225924e-09, "epoch": 9.971043546051899, "percentage": 99.71, "elapsed_time": "7:00:28", "remaining_time": "0:01:13", "throughput": 4305.22, "total_tokens": 108614000} +{"current_steps": 89535, "total_steps": 89790, "loss": 0.4546, "lr": 1.2380698351938113e-09, "epoch": 9.971600400935516, "percentage": 99.72, "elapsed_time": "7:00:29", "remaining_time": "0:01:11", "throughput": 4305.24, "total_tokens": 108619984} +{"current_steps": 89540, "total_steps": 89790, "loss": 0.4676, "lr": 1.1901803984054605e-09, "epoch": 9.972157255819134, "percentage": 99.72, "elapsed_time": "7:00:31", "remaining_time": "0:01:10", "throughput": 4305.27, "total_tokens": 108626352} +{"current_steps": 89545, "total_steps": 89790, "loss": 0.4583, "lr": 1.1432354967644277e-09, "epoch": 9.97271411070275, "percentage": 99.73, "elapsed_time": "7:00:32", "remaining_time": "0:01:09", "throughput": 4305.29, "total_tokens": 108632464} +{"current_steps": 89550, "total_steps": 89790, "loss": 0.4486, "lr": 1.0972351320442942e-09, "epoch": 9.973270965586368, "percentage": 99.73, "elapsed_time": "7:00:33", "remaining_time": "0:01:07", "throughput": 4305.31, "total_tokens": 108638544} +{"current_steps": 89555, "total_steps": 89790, "loss": 0.4593, "lr": 1.0521793059853347e-09, "epoch": 9.973827820469985, "percentage": 99.74, "elapsed_time": "7:00:34", "remaining_time": "0:01:06", "throughput": 4305.33, "total_tokens": 108644816} +{"current_steps": 89560, "total_steps": 89790, "loss": 0.4608, "lr": 1.0080680202861903e-09, "epoch": 9.974384675353603, "percentage": 99.74, "elapsed_time": "7:00:36", "remaining_time": "0:01:04", "throughput": 4305.35, "total_tokens": 108650896} +{"current_steps": 89565, "total_steps": 89790, "loss": 0.4729, "lr": 9.649012766177467e-10, "epoch": 9.97494153023722, "percentage": 99.75, "elapsed_time": "7:00:37", "remaining_time": "0:01:03", "throughput": 4305.37, "total_tokens": 108656944} +{"current_steps": 89570, "total_steps": 89790, "loss": 0.4586, "lr": 9.226790766064808e-10, "epoch": 9.975498385120838, "percentage": 99.75, "elapsed_time": "7:00:38", "remaining_time": "0:01:01", "throughput": 4305.4, "total_tokens": 108663088} +{"current_steps": 89575, "total_steps": 89790, "loss": 0.4563, "lr": 8.81401421848338e-10, "epoch": 9.976055240004454, "percentage": 99.76, "elapsed_time": "7:00:40", "remaining_time": "0:01:00", "throughput": 4305.42, "total_tokens": 108669456} +{"current_steps": 89580, "total_steps": 89790, "loss": 0.4595, "lr": 8.410683139087328e-10, "epoch": 9.976612094888072, "percentage": 99.77, "elapsed_time": "7:00:41", "remaining_time": "0:00:59", "throughput": 4305.44, "total_tokens": 108675632} +{"current_steps": 89585, "total_steps": 89790, "loss": 0.4724, "lr": 8.016797543031196e-10, "epoch": 9.97716894977169, "percentage": 99.77, "elapsed_time": "7:00:42", "remaining_time": "0:00:57", "throughput": 4305.47, "total_tokens": 108681776} +{"current_steps": 89590, "total_steps": 89790, "loss": 0.4525, "lr": 7.63235744527524e-10, "epoch": 9.977725804655307, "percentage": 99.78, "elapsed_time": "7:00:44", "remaining_time": "0:00:56", "throughput": 4305.49, "total_tokens": 108688016} +{"current_steps": 89595, "total_steps": 89790, "loss": 0.4657, "lr": 7.257362860280115e-10, "epoch": 9.978282659538925, "percentage": 99.78, "elapsed_time": "7:00:45", "remaining_time": "0:00:54", "throughput": 4305.52, "total_tokens": 108694384} +{"current_steps": 89600, "total_steps": 89790, "loss": 0.4527, "lr": 6.891813802256674e-10, "epoch": 9.97883951442254, "percentage": 99.79, "elapsed_time": "7:00:46", "remaining_time": "0:00:53", "throughput": 4305.54, "total_tokens": 108700624} +{"current_steps": 89605, "total_steps": 89790, "loss": 0.45, "lr": 6.535710284999441e-10, "epoch": 9.979396369306158, "percentage": 99.79, "elapsed_time": "7:00:47", "remaining_time": "0:00:52", "throughput": 4305.56, "total_tokens": 108706768} +{"current_steps": 89610, "total_steps": 89790, "loss": 0.4595, "lr": 6.189052321969868e-10, "epoch": 9.979953224189776, "percentage": 99.8, "elapsed_time": "7:00:49", "remaining_time": "0:00:50", "throughput": 4305.58, "total_tokens": 108712784} +{"current_steps": 89615, "total_steps": 89790, "loss": 0.4601, "lr": 5.851839926268588e-10, "epoch": 9.980510079073394, "percentage": 99.81, "elapsed_time": "7:00:50", "remaining_time": "0:00:49", "throughput": 4305.6, "total_tokens": 108718448} +{"current_steps": 89620, "total_steps": 89790, "loss": 0.4491, "lr": 5.524073110607652e-10, "epoch": 9.981066933957011, "percentage": 99.81, "elapsed_time": "7:00:51", "remaining_time": "0:00:47", "throughput": 4305.62, "total_tokens": 108724688} +{"current_steps": 89625, "total_steps": 89790, "loss": 0.4579, "lr": 5.205751887421561e-10, "epoch": 9.981623788840627, "percentage": 99.82, "elapsed_time": "7:00:53", "remaining_time": "0:00:46", "throughput": 4305.64, "total_tokens": 108730928} +{"current_steps": 89630, "total_steps": 89790, "loss": 0.4474, "lr": 4.896876268672967e-10, "epoch": 9.982180643724245, "percentage": 99.82, "elapsed_time": "7:00:54", "remaining_time": "0:00:45", "throughput": 4305.67, "total_tokens": 108737424} +{"current_steps": 89635, "total_steps": 89790, "loss": 0.466, "lr": 4.5974462661024787e-10, "epoch": 9.982737498607863, "percentage": 99.83, "elapsed_time": "7:00:55", "remaining_time": "0:00:43", "throughput": 4305.69, "total_tokens": 108743408} +{"current_steps": 89640, "total_steps": 89790, "loss": 0.4627, "lr": 4.307461890978859e-10, "epoch": 9.98329435349148, "percentage": 99.83, "elapsed_time": "7:00:57", "remaining_time": "0:00:42", "throughput": 4305.72, "total_tokens": 108749552} +{"current_steps": 89645, "total_steps": 89790, "loss": 0.4647, "lr": 4.0269231542655606e-10, "epoch": 9.983851208375098, "percentage": 99.84, "elapsed_time": "7:00:58", "remaining_time": "0:00:40", "throughput": 4305.74, "total_tokens": 108755760} +{"current_steps": 89650, "total_steps": 89790, "loss": 0.4657, "lr": 3.7558300665652136e-10, "epoch": 9.984408063258714, "percentage": 99.84, "elapsed_time": "7:00:59", "remaining_time": "0:00:39", "throughput": 4305.76, "total_tokens": 108761968} +{"current_steps": 89655, "total_steps": 89790, "loss": 0.4583, "lr": 3.4941826381473806e-10, "epoch": 9.984964918142332, "percentage": 99.85, "elapsed_time": "7:01:00", "remaining_time": "0:00:38", "throughput": 4305.79, "total_tokens": 108768144} +{"current_steps": 89660, "total_steps": 89790, "loss": 0.474, "lr": 3.2419808788375363e-10, "epoch": 9.98552177302595, "percentage": 99.86, "elapsed_time": "7:01:02", "remaining_time": "0:00:36", "throughput": 4305.81, "total_tokens": 108774352} +{"current_steps": 89665, "total_steps": 89790, "loss": 0.4426, "lr": 2.999224798211353e-10, "epoch": 9.986078627909567, "percentage": 99.86, "elapsed_time": "7:01:03", "remaining_time": "0:00:35", "throughput": 4305.83, "total_tokens": 108780272} +{"current_steps": 89670, "total_steps": 89790, "loss": 0.4631, "lr": 2.765914405455927e-10, "epoch": 9.986635482793185, "percentage": 99.87, "elapsed_time": "7:01:04", "remaining_time": "0:00:33", "throughput": 4305.85, "total_tokens": 108786576} +{"current_steps": 89675, "total_steps": 89790, "loss": 0.4732, "lr": 2.542049709314265e-10, "epoch": 9.987192337676802, "percentage": 99.87, "elapsed_time": "7:01:06", "remaining_time": "0:00:32", "throughput": 4305.87, "total_tokens": 108792752} +{"current_steps": 89680, "total_steps": 89790, "loss": 0.4682, "lr": 2.3276307183350831e-10, "epoch": 9.987749192560418, "percentage": 99.88, "elapsed_time": "7:01:07", "remaining_time": "0:00:30", "throughput": 4305.9, "total_tokens": 108798832} +{"current_steps": 89685, "total_steps": 89790, "loss": 0.4538, "lr": 2.1226574405397437e-10, "epoch": 9.988306047444036, "percentage": 99.88, "elapsed_time": "7:01:08", "remaining_time": "0:00:29", "throughput": 4305.92, "total_tokens": 108805200} +{"current_steps": 89690, "total_steps": 89790, "loss": 0.468, "lr": 1.9271298837275632e-10, "epoch": 9.988862902327654, "percentage": 99.89, "elapsed_time": "7:01:09", "remaining_time": "0:00:28", "throughput": 4305.94, "total_tokens": 108810960} +{"current_steps": 89695, "total_steps": 89790, "loss": 0.4597, "lr": 1.741048055253769e-10, "epoch": 9.989419757211271, "percentage": 99.89, "elapsed_time": "7:01:11", "remaining_time": "0:00:26", "throughput": 4305.96, "total_tokens": 108817040} +{"current_steps": 89700, "total_steps": 89790, "loss": 0.4685, "lr": 1.5644119621682774e-10, "epoch": 9.989976612094889, "percentage": 99.9, "elapsed_time": "7:01:12", "remaining_time": "0:00:25", "throughput": 4305.98, "total_tokens": 108822608} +{"current_steps": 89705, "total_steps": 89790, "loss": 0.4591, "lr": 1.3972216111324266e-10, "epoch": 9.990533466978505, "percentage": 99.91, "elapsed_time": "7:01:13", "remaining_time": "0:00:23", "throughput": 4306.0, "total_tokens": 108828912} +{"current_steps": 89710, "total_steps": 89790, "loss": 0.476, "lr": 1.2394770084744877e-10, "epoch": 9.991090321862123, "percentage": 99.91, "elapsed_time": "7:01:15", "remaining_time": "0:00:22", "throughput": 4306.02, "total_tokens": 108835024} +{"current_steps": 89715, "total_steps": 89790, "loss": 0.4745, "lr": 1.0911781601619097e-10, "epoch": 9.99164717674574, "percentage": 99.92, "elapsed_time": "7:01:16", "remaining_time": "0:00:21", "throughput": 4306.04, "total_tokens": 108841040} +{"current_steps": 89720, "total_steps": 89790, "loss": 0.4655, "lr": 9.523250717735632e-11, "epoch": 9.992204031629358, "percentage": 99.92, "elapsed_time": "7:01:17", "remaining_time": "0:00:19", "throughput": 4306.06, "total_tokens": 108847280} +{"current_steps": 89725, "total_steps": 89790, "loss": 0.4561, "lr": 8.22917748555252e-11, "epoch": 9.992760886512976, "percentage": 99.93, "elapsed_time": "7:01:18", "remaining_time": "0:00:18", "throughput": 4306.08, "total_tokens": 108853264} +{"current_steps": 89730, "total_steps": 89790, "loss": 0.4625, "lr": 7.029561954197129e-11, "epoch": 9.993317741396591, "percentage": 99.93, "elapsed_time": "7:01:20", "remaining_time": "0:00:16", "throughput": 4306.1, "total_tokens": 108859536} +{"current_steps": 89735, "total_steps": 89790, "loss": 0.4643, "lr": 5.924404168911046e-11, "epoch": 9.99387459628021, "percentage": 99.94, "elapsed_time": "7:01:21", "remaining_time": "0:00:15", "throughput": 4306.12, "total_tokens": 108865680} +{"current_steps": 89740, "total_steps": 89790, "loss": 0.4604, "lr": 4.9137041716051937e-11, "epoch": 9.994431451163827, "percentage": 99.94, "elapsed_time": "7:01:22", "remaining_time": "0:00:14", "throughput": 4306.15, "total_tokens": 108871696} +{"current_steps": 89745, "total_steps": 89790, "loss": 0.4624, "lr": 3.9974620000271525e-11, "epoch": 9.994988306047444, "percentage": 99.95, "elapsed_time": "7:01:24", "remaining_time": "0:00:12", "throughput": 4306.17, "total_tokens": 108877872} +{"current_steps": 89750, "total_steps": 89790, "loss": 0.4484, "lr": 3.175677689148948e-11, "epoch": 9.995545160931062, "percentage": 99.96, "elapsed_time": "7:01:25", "remaining_time": "0:00:11", "throughput": 4306.19, "total_tokens": 108883632} +{"current_steps": 89755, "total_steps": 89790, "loss": 0.4574, "lr": 2.44835126977927e-11, "epoch": 9.996102015814678, "percentage": 99.96, "elapsed_time": "7:01:26", "remaining_time": "0:00:09", "throughput": 4306.21, "total_tokens": 108889776} +{"current_steps": 89760, "total_steps": 89790, "loss": 0.4609, "lr": 1.8154827696736932e-11, "epoch": 9.996658870698296, "percentage": 99.97, "elapsed_time": "7:01:27", "remaining_time": "0:00:08", "throughput": 4306.23, "total_tokens": 108895760} +{"current_steps": 89765, "total_steps": 89790, "loss": 0.4617, "lr": 1.277072212702013e-11, "epoch": 9.997215725581913, "percentage": 99.97, "elapsed_time": "7:01:29", "remaining_time": "0:00:07", "throughput": 4306.25, "total_tokens": 108901776} +{"current_steps": 89770, "total_steps": 89790, "loss": 0.4514, "lr": 8.331196191257994e-12, "epoch": 9.997772580465531, "percentage": 99.98, "elapsed_time": "7:01:30", "remaining_time": "0:00:05", "throughput": 4306.27, "total_tokens": 108907728} +{"current_steps": 89775, "total_steps": 89790, "loss": 0.4576, "lr": 4.836250055983982e-12, "epoch": 9.998329435349149, "percentage": 99.98, "elapsed_time": "7:01:31", "remaining_time": "0:00:04", "throughput": 4306.29, "total_tokens": 108913840} +{"current_steps": 89780, "total_steps": 89790, "loss": 0.4598, "lr": 2.285883854424853e-12, "epoch": 9.998886290232765, "percentage": 99.99, "elapsed_time": "7:01:33", "remaining_time": "0:00:02", "throughput": 4306.31, "total_tokens": 108919824} +{"current_steps": 89785, "total_steps": 89790, "loss": 0.4595, "lr": 6.800976837251227e-13, "epoch": 9.999443145116382, "percentage": 99.99, "elapsed_time": "7:01:34", "remaining_time": "0:00:01", "throughput": 4306.33, "total_tokens": 108925200} +{"current_steps": 89790, "total_steps": 89790, "loss": 0.466, "lr": 1.889160217150021e-14, "epoch": 10.0, "percentage": 100.0, "elapsed_time": "7:01:35", "remaining_time": "0:00:00", "throughput": 4306.33, "total_tokens": 108930064} +{"current_steps": 89790, "total_steps": 89790, "epoch": 10.0, "percentage": 100.0, "elapsed_time": "7:01:36", "remaining_time": "0:00:00", "throughput": 4306.09, "total_tokens": 108930064}