diff --git "a/trainer_log.jsonl" "b/trainer_log.jsonl" --- "a/trainer_log.jsonl" +++ "b/trainer_log.jsonl" @@ -16183,3 +16183,902 @@ {"current_steps": 80825, "total_steps": 89790, "loss": 0.4789, "lr": 1.503366180478802e-06, "epoch": 9.001559193674128, "percentage": 90.02, "elapsed_time": "6:21:16", "remaining_time": "0:42:17", "throughput": 4286.31, "total_tokens": 98057264} {"current_steps": 80830, "total_steps": 89790, "loss": 0.4576, "lr": 1.5017068938524725e-06, "epoch": 9.002116048557745, "percentage": 90.02, "elapsed_time": "6:21:18", "remaining_time": "0:42:16", "throughput": 4286.33, "total_tokens": 98063056} {"current_steps": 80835, "total_steps": 89790, "loss": 0.4607, "lr": 1.5000484950669663e-06, "epoch": 9.002672903441363, "percentage": 90.03, "elapsed_time": "6:21:19", "remaining_time": "0:42:14", "throughput": 4286.34, "total_tokens": 98068432} +{"current_steps": 80840, "total_steps": 89790, "loss": 0.4705, "lr": 1.4983909841849332e-06, "epoch": 9.00322975832498, "percentage": 90.03, "elapsed_time": "6:21:20", "remaining_time": "0:42:13", "throughput": 4286.37, "total_tokens": 98074640} +{"current_steps": 80845, "total_steps": 89790, "loss": 0.4673, "lr": 1.4967343612690033e-06, "epoch": 9.003786613208598, "percentage": 90.04, "elapsed_time": "6:21:21", "remaining_time": "0:42:11", "throughput": 4286.4, "total_tokens": 98080560} +{"current_steps": 80850, "total_steps": 89790, "loss": 0.4593, "lr": 1.495078626381774e-06, "epoch": 9.004343468092214, "percentage": 90.04, "elapsed_time": "6:21:23", "remaining_time": "0:42:10", "throughput": 4286.42, "total_tokens": 98086096} +{"current_steps": 80855, "total_steps": 89790, "loss": 0.4745, "lr": 1.4934237795857952e-06, "epoch": 9.004900322975832, "percentage": 90.05, "elapsed_time": "6:21:24", "remaining_time": "0:42:08", "throughput": 4286.44, "total_tokens": 98092272} +{"current_steps": 80860, "total_steps": 89790, "loss": 0.4574, "lr": 1.4917698209435977e-06, "epoch": 9.00545717785945, "percentage": 90.05, "elapsed_time": "6:21:25", "remaining_time": "0:42:07", "throughput": 4286.47, "total_tokens": 98098480} +{"current_steps": 80865, "total_steps": 89790, "loss": 0.4531, "lr": 1.4901167505176728e-06, "epoch": 9.006014032743067, "percentage": 90.06, "elapsed_time": "6:21:26", "remaining_time": "0:42:06", "throughput": 4286.49, "total_tokens": 98104560} +{"current_steps": 80870, "total_steps": 89790, "loss": 0.4681, "lr": 1.488464568370479e-06, "epoch": 9.006570887626685, "percentage": 90.07, "elapsed_time": "6:21:28", "remaining_time": "0:42:04", "throughput": 4286.51, "total_tokens": 98110768} +{"current_steps": 80875, "total_steps": 89790, "loss": 0.4558, "lr": 1.4868132745644358e-06, "epoch": 9.007127742510303, "percentage": 90.07, "elapsed_time": "6:21:29", "remaining_time": "0:42:03", "throughput": 4286.54, "total_tokens": 98116880} +{"current_steps": 80880, "total_steps": 89790, "loss": 0.4669, "lr": 1.4851628691619407e-06, "epoch": 9.007684597393919, "percentage": 90.08, "elapsed_time": "6:21:30", "remaining_time": "0:42:01", "throughput": 4286.57, "total_tokens": 98122992} +{"current_steps": 80885, "total_steps": 89790, "loss": 0.4565, "lr": 1.4835133522253519e-06, "epoch": 9.008241452277536, "percentage": 90.08, "elapsed_time": "6:21:32", "remaining_time": "0:42:00", "throughput": 4286.59, "total_tokens": 98129168} +{"current_steps": 80890, "total_steps": 89790, "loss": 0.4643, "lr": 1.481864723816989e-06, "epoch": 9.008798307161154, "percentage": 90.09, "elapsed_time": "6:21:33", "remaining_time": "0:41:58", "throughput": 4286.62, "total_tokens": 98135472} +{"current_steps": 80895, "total_steps": 89790, "loss": 0.4756, "lr": 1.480216983999147e-06, "epoch": 9.009355162044772, "percentage": 90.09, "elapsed_time": "6:21:34", "remaining_time": "0:41:57", "throughput": 4286.65, "total_tokens": 98141904} +{"current_steps": 80900, "total_steps": 89790, "loss": 0.4554, "lr": 1.4785701328340757e-06, "epoch": 9.00991201692839, "percentage": 90.1, "elapsed_time": "6:21:35", "remaining_time": "0:41:56", "throughput": 4286.67, "total_tokens": 98147536} +{"current_steps": 80905, "total_steps": 89790, "loss": 0.4667, "lr": 1.4769241703840058e-06, "epoch": 9.010468871812005, "percentage": 90.1, "elapsed_time": "6:21:37", "remaining_time": "0:41:54", "throughput": 4286.7, "total_tokens": 98153680} +{"current_steps": 80910, "total_steps": 89790, "loss": 0.4686, "lr": 1.475279096711124e-06, "epoch": 9.011025726695623, "percentage": 90.11, "elapsed_time": "6:21:38", "remaining_time": "0:41:53", "throughput": 4286.72, "total_tokens": 98159824} +{"current_steps": 80915, "total_steps": 89790, "loss": 0.4615, "lr": 1.4736349118775834e-06, "epoch": 9.01158258157924, "percentage": 90.12, "elapsed_time": "6:21:39", "remaining_time": "0:41:51", "throughput": 4286.75, "total_tokens": 98165936} +{"current_steps": 80920, "total_steps": 89790, "loss": 0.4613, "lr": 1.4719916159455143e-06, "epoch": 9.012139436462858, "percentage": 90.12, "elapsed_time": "6:21:41", "remaining_time": "0:41:50", "throughput": 4286.77, "total_tokens": 98171984} +{"current_steps": 80925, "total_steps": 89790, "loss": 0.4688, "lr": 1.4703492089769982e-06, "epoch": 9.012696291346476, "percentage": 90.13, "elapsed_time": "6:21:42", "remaining_time": "0:41:48", "throughput": 4286.8, "total_tokens": 98178384} +{"current_steps": 80930, "total_steps": 89790, "loss": 0.4453, "lr": 1.4687076910340963e-06, "epoch": 9.013253146230092, "percentage": 90.13, "elapsed_time": "6:21:43", "remaining_time": "0:41:47", "throughput": 4286.82, "total_tokens": 98184656} +{"current_steps": 80935, "total_steps": 89790, "loss": 0.4622, "lr": 1.467067062178823e-06, "epoch": 9.01381000111371, "percentage": 90.14, "elapsed_time": "6:21:45", "remaining_time": "0:41:46", "throughput": 4286.85, "total_tokens": 98190672} +{"current_steps": 80940, "total_steps": 89790, "loss": 0.4703, "lr": 1.465427322473173e-06, "epoch": 9.014366855997327, "percentage": 90.14, "elapsed_time": "6:21:46", "remaining_time": "0:41:44", "throughput": 4286.87, "total_tokens": 98196688} +{"current_steps": 80945, "total_steps": 89790, "loss": 0.4612, "lr": 1.4637884719791024e-06, "epoch": 9.014923710880945, "percentage": 90.15, "elapsed_time": "6:21:47", "remaining_time": "0:41:43", "throughput": 4286.89, "total_tokens": 98202256} +{"current_steps": 80950, "total_steps": 89790, "loss": 0.456, "lr": 1.4621505107585254e-06, "epoch": 9.015480565764562, "percentage": 90.15, "elapsed_time": "6:21:48", "remaining_time": "0:41:41", "throughput": 4286.91, "total_tokens": 98208080} +{"current_steps": 80955, "total_steps": 89790, "loss": 0.4718, "lr": 1.4605134388733345e-06, "epoch": 9.016037420648178, "percentage": 90.16, "elapsed_time": "6:21:50", "remaining_time": "0:41:40", "throughput": 4286.93, "total_tokens": 98214192} +{"current_steps": 80960, "total_steps": 89790, "loss": 0.4584, "lr": 1.4588772563853797e-06, "epoch": 9.016594275531796, "percentage": 90.17, "elapsed_time": "6:21:51", "remaining_time": "0:41:38", "throughput": 4286.96, "total_tokens": 98220528} +{"current_steps": 80965, "total_steps": 89790, "loss": 0.4645, "lr": 1.457241963356487e-06, "epoch": 9.017151130415414, "percentage": 90.17, "elapsed_time": "6:21:52", "remaining_time": "0:41:37", "throughput": 4286.98, "total_tokens": 98226448} +{"current_steps": 80970, "total_steps": 89790, "loss": 0.4545, "lr": 1.4556075598484349e-06, "epoch": 9.017707985299031, "percentage": 90.18, "elapsed_time": "6:21:54", "remaining_time": "0:41:36", "throughput": 4287.01, "total_tokens": 98232656} +{"current_steps": 80975, "total_steps": 89790, "loss": 0.4524, "lr": 1.4539740459229817e-06, "epoch": 9.018264840182649, "percentage": 90.18, "elapsed_time": "6:21:55", "remaining_time": "0:41:34", "throughput": 4287.03, "total_tokens": 98238640} +{"current_steps": 80980, "total_steps": 89790, "loss": 0.4614, "lr": 1.4523414216418507e-06, "epoch": 9.018821695066265, "percentage": 90.19, "elapsed_time": "6:21:56", "remaining_time": "0:41:33", "throughput": 4287.06, "total_tokens": 98245136} +{"current_steps": 80985, "total_steps": 89790, "loss": 0.4735, "lr": 1.4507096870667174e-06, "epoch": 9.019378549949883, "percentage": 90.19, "elapsed_time": "6:21:58", "remaining_time": "0:41:31", "throughput": 4287.09, "total_tokens": 98251568} +{"current_steps": 80990, "total_steps": 89790, "loss": 0.4667, "lr": 1.449078842259244e-06, "epoch": 9.0199354048335, "percentage": 90.2, "elapsed_time": "6:21:59", "remaining_time": "0:41:30", "throughput": 4287.11, "total_tokens": 98257680} +{"current_steps": 80995, "total_steps": 89790, "loss": 0.4553, "lr": 1.4474488872810416e-06, "epoch": 9.020492259717118, "percentage": 90.2, "elapsed_time": "6:22:00", "remaining_time": "0:41:28", "throughput": 4287.13, "total_tokens": 98263760} +{"current_steps": 81000, "total_steps": 89790, "loss": 0.4531, "lr": 1.4458198221937002e-06, "epoch": 9.021049114600736, "percentage": 90.21, "elapsed_time": "6:22:01", "remaining_time": "0:41:27", "throughput": 4287.16, "total_tokens": 98269712} +{"current_steps": 81005, "total_steps": 89790, "loss": 0.4607, "lr": 1.444191647058768e-06, "epoch": 9.021605969484352, "percentage": 90.22, "elapsed_time": "6:22:03", "remaining_time": "0:41:26", "throughput": 4287.18, "total_tokens": 98275920} +{"current_steps": 81010, "total_steps": 89790, "loss": 0.4624, "lr": 1.4425643619377592e-06, "epoch": 9.02216282436797, "percentage": 90.22, "elapsed_time": "6:22:04", "remaining_time": "0:41:24", "throughput": 4287.2, "total_tokens": 98281456} +{"current_steps": 81015, "total_steps": 89790, "loss": 0.4642, "lr": 1.4409379668921696e-06, "epoch": 9.022719679251587, "percentage": 90.23, "elapsed_time": "6:22:05", "remaining_time": "0:41:23", "throughput": 4287.22, "total_tokens": 98287504} +{"current_steps": 81020, "total_steps": 89790, "loss": 0.4694, "lr": 1.4393124619834386e-06, "epoch": 9.023276534135205, "percentage": 90.23, "elapsed_time": "6:22:06", "remaining_time": "0:41:21", "throughput": 4287.25, "total_tokens": 98293744} +{"current_steps": 81025, "total_steps": 89790, "loss": 0.4792, "lr": 1.4376878472729893e-06, "epoch": 9.023833389018822, "percentage": 90.24, "elapsed_time": "6:22:08", "remaining_time": "0:41:20", "throughput": 4287.27, "total_tokens": 98299632} +{"current_steps": 81030, "total_steps": 89790, "loss": 0.4548, "lr": 1.4360641228221977e-06, "epoch": 9.024390243902438, "percentage": 90.24, "elapsed_time": "6:22:09", "remaining_time": "0:41:18", "throughput": 4287.3, "total_tokens": 98305776} +{"current_steps": 81035, "total_steps": 89790, "loss": 0.4593, "lr": 1.434441288692423e-06, "epoch": 9.024947098786056, "percentage": 90.25, "elapsed_time": "6:22:10", "remaining_time": "0:41:17", "throughput": 4287.32, "total_tokens": 98311856} +{"current_steps": 81040, "total_steps": 89790, "loss": 0.4651, "lr": 1.4328193449449717e-06, "epoch": 9.025503953669674, "percentage": 90.26, "elapsed_time": "6:22:12", "remaining_time": "0:41:16", "throughput": 4287.35, "total_tokens": 98318192} +{"current_steps": 81045, "total_steps": 89790, "loss": 0.4699, "lr": 1.4311982916411309e-06, "epoch": 9.026060808553291, "percentage": 90.26, "elapsed_time": "6:22:13", "remaining_time": "0:41:14", "throughput": 4287.38, "total_tokens": 98324368} +{"current_steps": 81050, "total_steps": 89790, "loss": 0.4667, "lr": 1.4295781288421516e-06, "epoch": 9.026617663436909, "percentage": 90.27, "elapsed_time": "6:22:14", "remaining_time": "0:41:13", "throughput": 4287.4, "total_tokens": 98330576} +{"current_steps": 81055, "total_steps": 89790, "loss": 0.4601, "lr": 1.4279588566092432e-06, "epoch": 9.027174518320527, "percentage": 90.27, "elapsed_time": "6:22:16", "remaining_time": "0:41:11", "throughput": 4287.43, "total_tokens": 98336624} +{"current_steps": 81060, "total_steps": 89790, "loss": 0.4615, "lr": 1.426340475003593e-06, "epoch": 9.027731373204142, "percentage": 90.28, "elapsed_time": "6:22:17", "remaining_time": "0:41:10", "throughput": 4287.44, "total_tokens": 98341904} +{"current_steps": 81065, "total_steps": 89790, "loss": 0.4631, "lr": 1.4247229840863406e-06, "epoch": 9.02828822808776, "percentage": 90.28, "elapsed_time": "6:22:18", "remaining_time": "0:41:08", "throughput": 4287.47, "total_tokens": 98348176} +{"current_steps": 81070, "total_steps": 89790, "loss": 0.4591, "lr": 1.4231063839186042e-06, "epoch": 9.028845082971378, "percentage": 90.29, "elapsed_time": "6:22:19", "remaining_time": "0:41:07", "throughput": 4287.49, "total_tokens": 98353840} +{"current_steps": 81075, "total_steps": 89790, "loss": 0.4633, "lr": 1.4214906745614682e-06, "epoch": 9.029401937854995, "percentage": 90.29, "elapsed_time": "6:22:21", "remaining_time": "0:41:05", "throughput": 4287.51, "total_tokens": 98359888} +{"current_steps": 81080, "total_steps": 89790, "loss": 0.4541, "lr": 1.4198758560759723e-06, "epoch": 9.029958792738613, "percentage": 90.3, "elapsed_time": "6:22:22", "remaining_time": "0:41:04", "throughput": 4287.53, "total_tokens": 98365904} +{"current_steps": 81085, "total_steps": 89790, "loss": 0.4617, "lr": 1.4182619285231375e-06, "epoch": 9.030515647622229, "percentage": 90.31, "elapsed_time": "6:22:23", "remaining_time": "0:41:03", "throughput": 4287.56, "total_tokens": 98371984} +{"current_steps": 81090, "total_steps": 89790, "loss": 0.4579, "lr": 1.4166488919639315e-06, "epoch": 9.031072502505847, "percentage": 90.31, "elapsed_time": "6:22:24", "remaining_time": "0:41:01", "throughput": 4287.58, "total_tokens": 98378032} +{"current_steps": 81095, "total_steps": 89790, "loss": 0.4546, "lr": 1.4150367464593139e-06, "epoch": 9.031629357389464, "percentage": 90.32, "elapsed_time": "6:22:26", "remaining_time": "0:41:00", "throughput": 4287.62, "total_tokens": 98384432} +{"current_steps": 81100, "total_steps": 89790, "loss": 0.4517, "lr": 1.4134254920701862e-06, "epoch": 9.032186212273082, "percentage": 90.32, "elapsed_time": "6:22:27", "remaining_time": "0:40:58", "throughput": 4287.64, "total_tokens": 98390608} +{"current_steps": 81105, "total_steps": 89790, "loss": 0.4664, "lr": 1.4118151288574271e-06, "epoch": 9.0327430671567, "percentage": 90.33, "elapsed_time": "6:22:28", "remaining_time": "0:40:57", "throughput": 4287.67, "total_tokens": 98397200} +{"current_steps": 81110, "total_steps": 89790, "loss": 0.4549, "lr": 1.4102056568818912e-06, "epoch": 9.033299922040316, "percentage": 90.33, "elapsed_time": "6:22:30", "remaining_time": "0:40:56", "throughput": 4287.69, "total_tokens": 98403216} +{"current_steps": 81115, "total_steps": 89790, "loss": 0.4616, "lr": 1.4085970762043765e-06, "epoch": 9.033856776923933, "percentage": 90.34, "elapsed_time": "6:22:31", "remaining_time": "0:40:54", "throughput": 4287.72, "total_tokens": 98409392} +{"current_steps": 81120, "total_steps": 89790, "loss": 0.4599, "lr": 1.4069893868856738e-06, "epoch": 9.034413631807551, "percentage": 90.34, "elapsed_time": "6:22:32", "remaining_time": "0:40:53", "throughput": 4287.74, "total_tokens": 98415504} +{"current_steps": 81125, "total_steps": 89790, "loss": 0.4532, "lr": 1.4053825889865173e-06, "epoch": 9.034970486691169, "percentage": 90.35, "elapsed_time": "6:22:34", "remaining_time": "0:40:51", "throughput": 4287.77, "total_tokens": 98421648} +{"current_steps": 81130, "total_steps": 89790, "loss": 0.4507, "lr": 1.4037766825676147e-06, "epoch": 9.035527341574786, "percentage": 90.36, "elapsed_time": "6:22:35", "remaining_time": "0:40:50", "throughput": 4287.8, "total_tokens": 98427792} +{"current_steps": 81135, "total_steps": 89790, "loss": 0.4776, "lr": 1.4021716676896529e-06, "epoch": 9.036084196458402, "percentage": 90.36, "elapsed_time": "6:22:36", "remaining_time": "0:40:48", "throughput": 4287.82, "total_tokens": 98433616} +{"current_steps": 81140, "total_steps": 89790, "loss": 0.4578, "lr": 1.4005675444132644e-06, "epoch": 9.03664105134202, "percentage": 90.37, "elapsed_time": "6:22:37", "remaining_time": "0:40:47", "throughput": 4287.84, "total_tokens": 98439760} +{"current_steps": 81145, "total_steps": 89790, "loss": 0.4694, "lr": 1.3989643127990642e-06, "epoch": 9.037197906225638, "percentage": 90.37, "elapsed_time": "6:22:39", "remaining_time": "0:40:46", "throughput": 4287.87, "total_tokens": 98445872} +{"current_steps": 81150, "total_steps": 89790, "loss": 0.4535, "lr": 1.3973619729076209e-06, "epoch": 9.037754761109255, "percentage": 90.38, "elapsed_time": "6:22:40", "remaining_time": "0:40:44", "throughput": 4287.89, "total_tokens": 98452176} +{"current_steps": 81155, "total_steps": 89790, "loss": 0.4485, "lr": 1.3957605247994833e-06, "epoch": 9.038311615992873, "percentage": 90.38, "elapsed_time": "6:22:41", "remaining_time": "0:40:43", "throughput": 4287.91, "total_tokens": 98457488} +{"current_steps": 81160, "total_steps": 89790, "loss": 0.4618, "lr": 1.394159968535161e-06, "epoch": 9.038868470876489, "percentage": 90.39, "elapsed_time": "6:22:42", "remaining_time": "0:40:41", "throughput": 4287.94, "total_tokens": 98463856} +{"current_steps": 81165, "total_steps": 89790, "loss": 0.4534, "lr": 1.3925603041751167e-06, "epoch": 9.039425325760106, "percentage": 90.39, "elapsed_time": "6:22:44", "remaining_time": "0:40:40", "throughput": 4287.96, "total_tokens": 98469744} +{"current_steps": 81170, "total_steps": 89790, "loss": 0.4642, "lr": 1.3909615317798025e-06, "epoch": 9.039982180643724, "percentage": 90.4, "elapsed_time": "6:22:45", "remaining_time": "0:40:38", "throughput": 4287.98, "total_tokens": 98475664} +{"current_steps": 81175, "total_steps": 89790, "loss": 0.4691, "lr": 1.3893636514096198e-06, "epoch": 9.040539035527342, "percentage": 90.41, "elapsed_time": "6:22:46", "remaining_time": "0:40:37", "throughput": 4288.0, "total_tokens": 98481712} +{"current_steps": 81180, "total_steps": 89790, "loss": 0.4541, "lr": 1.3877666631249426e-06, "epoch": 9.04109589041096, "percentage": 90.41, "elapsed_time": "6:22:48", "remaining_time": "0:40:36", "throughput": 4288.03, "total_tokens": 98488048} +{"current_steps": 81185, "total_steps": 89790, "loss": 0.4649, "lr": 1.3861705669861087e-06, "epoch": 9.041652745294575, "percentage": 90.42, "elapsed_time": "6:22:49", "remaining_time": "0:40:34", "throughput": 4288.05, "total_tokens": 98494032} +{"current_steps": 81190, "total_steps": 89790, "loss": 0.463, "lr": 1.3845753630534225e-06, "epoch": 9.042209600178193, "percentage": 90.42, "elapsed_time": "6:22:50", "remaining_time": "0:40:33", "throughput": 4288.07, "total_tokens": 98500112} +{"current_steps": 81195, "total_steps": 89790, "loss": 0.4558, "lr": 1.3829810513871638e-06, "epoch": 9.04276645506181, "percentage": 90.43, "elapsed_time": "6:22:51", "remaining_time": "0:40:31", "throughput": 4288.1, "total_tokens": 98506128} +{"current_steps": 81200, "total_steps": 89790, "loss": 0.4574, "lr": 1.3813876320475622e-06, "epoch": 9.043323309945428, "percentage": 90.43, "elapsed_time": "6:22:53", "remaining_time": "0:40:30", "throughput": 4288.12, "total_tokens": 98512432} +{"current_steps": 81205, "total_steps": 89790, "loss": 0.451, "lr": 1.3797951050948277e-06, "epoch": 9.043880164829046, "percentage": 90.44, "elapsed_time": "6:22:54", "remaining_time": "0:40:28", "throughput": 4288.14, "total_tokens": 98518384} +{"current_steps": 81210, "total_steps": 89790, "loss": 0.4657, "lr": 1.3782034705891261e-06, "epoch": 9.044437019712662, "percentage": 90.44, "elapsed_time": "6:22:55", "remaining_time": "0:40:27", "throughput": 4288.17, "total_tokens": 98524624} +{"current_steps": 81215, "total_steps": 89790, "loss": 0.4516, "lr": 1.3766127285905955e-06, "epoch": 9.04499387459628, "percentage": 90.45, "elapsed_time": "6:22:57", "remaining_time": "0:40:26", "throughput": 4288.19, "total_tokens": 98530736} +{"current_steps": 81220, "total_steps": 89790, "loss": 0.4544, "lr": 1.3750228791593462e-06, "epoch": 9.045550729479897, "percentage": 90.46, "elapsed_time": "6:22:58", "remaining_time": "0:40:24", "throughput": 4288.22, "total_tokens": 98536912} +{"current_steps": 81225, "total_steps": 89790, "loss": 0.4768, "lr": 1.3734339223554382e-06, "epoch": 9.046107584363515, "percentage": 90.46, "elapsed_time": "6:22:59", "remaining_time": "0:40:23", "throughput": 4288.25, "total_tokens": 98543120} +{"current_steps": 81230, "total_steps": 89790, "loss": 0.4562, "lr": 1.3718458582389154e-06, "epoch": 9.046664439247133, "percentage": 90.47, "elapsed_time": "6:23:01", "remaining_time": "0:40:21", "throughput": 4288.28, "total_tokens": 98549424} +{"current_steps": 81235, "total_steps": 89790, "loss": 0.4483, "lr": 1.3702586868697714e-06, "epoch": 9.04722129413075, "percentage": 90.47, "elapsed_time": "6:23:02", "remaining_time": "0:40:20", "throughput": 4288.3, "total_tokens": 98555632} +{"current_steps": 81240, "total_steps": 89790, "loss": 0.4637, "lr": 1.368672408307986e-06, "epoch": 9.047778149014366, "percentage": 90.48, "elapsed_time": "6:23:03", "remaining_time": "0:40:18", "throughput": 4288.32, "total_tokens": 98561072} +{"current_steps": 81245, "total_steps": 89790, "loss": 0.4642, "lr": 1.3670870226134807e-06, "epoch": 9.048335003897984, "percentage": 90.48, "elapsed_time": "6:23:04", "remaining_time": "0:40:17", "throughput": 4288.35, "total_tokens": 98567024} +{"current_steps": 81250, "total_steps": 89790, "loss": 0.4685, "lr": 1.365502529846166e-06, "epoch": 9.048891858781602, "percentage": 90.49, "elapsed_time": "6:23:06", "remaining_time": "0:40:16", "throughput": 4288.36, "total_tokens": 98572752} +{"current_steps": 81255, "total_steps": 89790, "loss": 0.4751, "lr": 1.3639189300659077e-06, "epoch": 9.04944871366522, "percentage": 90.49, "elapsed_time": "6:23:07", "remaining_time": "0:40:14", "throughput": 4288.39, "total_tokens": 98578960} +{"current_steps": 81260, "total_steps": 89790, "loss": 0.46, "lr": 1.3623362233325331e-06, "epoch": 9.050005568548837, "percentage": 90.5, "elapsed_time": "6:23:08", "remaining_time": "0:40:13", "throughput": 4288.41, "total_tokens": 98584976} +{"current_steps": 81265, "total_steps": 89790, "loss": 0.458, "lr": 1.3607544097058527e-06, "epoch": 9.050562423432453, "percentage": 90.51, "elapsed_time": "6:23:10", "remaining_time": "0:40:11", "throughput": 4288.44, "total_tokens": 98591184} +{"current_steps": 81270, "total_steps": 89790, "loss": 0.4623, "lr": 1.3591734892456215e-06, "epoch": 9.05111927831607, "percentage": 90.51, "elapsed_time": "6:23:11", "remaining_time": "0:40:10", "throughput": 4288.46, "total_tokens": 98597104} +{"current_steps": 81275, "total_steps": 89790, "loss": 0.4468, "lr": 1.3575934620115804e-06, "epoch": 9.051676133199688, "percentage": 90.52, "elapsed_time": "6:23:12", "remaining_time": "0:40:08", "throughput": 4288.48, "total_tokens": 98602928} +{"current_steps": 81280, "total_steps": 89790, "loss": 0.4626, "lr": 1.3560143280634209e-06, "epoch": 9.052232988083306, "percentage": 90.52, "elapsed_time": "6:23:13", "remaining_time": "0:40:07", "throughput": 4288.51, "total_tokens": 98609200} +{"current_steps": 81285, "total_steps": 89790, "loss": 0.4586, "lr": 1.3544360874608114e-06, "epoch": 9.052789842966924, "percentage": 90.53, "elapsed_time": "6:23:15", "remaining_time": "0:40:06", "throughput": 4288.54, "total_tokens": 98615536} +{"current_steps": 81290, "total_steps": 89790, "loss": 0.4389, "lr": 1.3528587402633851e-06, "epoch": 9.05334669785054, "percentage": 90.53, "elapsed_time": "6:23:16", "remaining_time": "0:40:04", "throughput": 4288.56, "total_tokens": 98622064} +{"current_steps": 81295, "total_steps": 89790, "loss": 0.4572, "lr": 1.3512822865307335e-06, "epoch": 9.053903552734157, "percentage": 90.54, "elapsed_time": "6:23:17", "remaining_time": "0:40:03", "throughput": 4288.59, "total_tokens": 98628016} +{"current_steps": 81300, "total_steps": 89790, "loss": 0.4457, "lr": 1.349706726322425e-06, "epoch": 9.054460407617775, "percentage": 90.54, "elapsed_time": "6:23:19", "remaining_time": "0:40:01", "throughput": 4288.61, "total_tokens": 98634576} +{"current_steps": 81305, "total_steps": 89790, "loss": 0.459, "lr": 1.3481320596979873e-06, "epoch": 9.055017262501392, "percentage": 90.55, "elapsed_time": "6:23:20", "remaining_time": "0:40:00", "throughput": 4288.64, "total_tokens": 98640816} +{"current_steps": 81310, "total_steps": 89790, "loss": 0.46, "lr": 1.3465582867169175e-06, "epoch": 9.05557411738501, "percentage": 90.56, "elapsed_time": "6:23:21", "remaining_time": "0:39:58", "throughput": 4288.66, "total_tokens": 98646768} +{"current_steps": 81315, "total_steps": 89790, "loss": 0.4535, "lr": 1.344985407438673e-06, "epoch": 9.056130972268626, "percentage": 90.56, "elapsed_time": "6:23:23", "remaining_time": "0:39:57", "throughput": 4288.69, "total_tokens": 98652848} +{"current_steps": 81320, "total_steps": 89790, "loss": 0.4598, "lr": 1.3434134219226874e-06, "epoch": 9.056687827152244, "percentage": 90.57, "elapsed_time": "6:23:24", "remaining_time": "0:39:56", "throughput": 4288.71, "total_tokens": 98658352} +{"current_steps": 81325, "total_steps": 89790, "loss": 0.4589, "lr": 1.3418423302283572e-06, "epoch": 9.057244682035861, "percentage": 90.57, "elapsed_time": "6:23:25", "remaining_time": "0:39:54", "throughput": 4288.73, "total_tokens": 98664496} +{"current_steps": 81330, "total_steps": 89790, "loss": 0.467, "lr": 1.3402721324150352e-06, "epoch": 9.057801536919479, "percentage": 90.58, "elapsed_time": "6:23:26", "remaining_time": "0:39:53", "throughput": 4288.76, "total_tokens": 98670576} +{"current_steps": 81335, "total_steps": 89790, "loss": 0.4684, "lr": 1.3387028285420599e-06, "epoch": 9.058358391803097, "percentage": 90.58, "elapsed_time": "6:23:28", "remaining_time": "0:39:51", "throughput": 4288.78, "total_tokens": 98676560} +{"current_steps": 81340, "total_steps": 89790, "loss": 0.4594, "lr": 1.3371344186687118e-06, "epoch": 9.058915246686713, "percentage": 90.59, "elapsed_time": "6:23:29", "remaining_time": "0:39:50", "throughput": 4288.81, "total_tokens": 98682608} +{"current_steps": 81345, "total_steps": 89790, "loss": 0.4592, "lr": 1.3355669028542573e-06, "epoch": 9.05947210157033, "percentage": 90.59, "elapsed_time": "6:23:30", "remaining_time": "0:39:48", "throughput": 4288.82, "total_tokens": 98688176} +{"current_steps": 81350, "total_steps": 89790, "loss": 0.4505, "lr": 1.3340002811579267e-06, "epoch": 9.060028956453948, "percentage": 90.6, "elapsed_time": "6:23:31", "remaining_time": "0:39:47", "throughput": 4288.85, "total_tokens": 98694384} +{"current_steps": 81355, "total_steps": 89790, "loss": 0.4748, "lr": 1.3324345536389005e-06, "epoch": 9.060585811337566, "percentage": 90.61, "elapsed_time": "6:23:33", "remaining_time": "0:39:46", "throughput": 4288.87, "total_tokens": 98700624} +{"current_steps": 81360, "total_steps": 89790, "loss": 0.4558, "lr": 1.3308697203563509e-06, "epoch": 9.061142666221183, "percentage": 90.61, "elapsed_time": "6:23:34", "remaining_time": "0:39:44", "throughput": 4288.9, "total_tokens": 98706096} +{"current_steps": 81365, "total_steps": 89790, "loss": 0.4658, "lr": 1.3293057813693888e-06, "epoch": 9.0616995211048, "percentage": 90.62, "elapsed_time": "6:23:35", "remaining_time": "0:39:43", "throughput": 4288.92, "total_tokens": 98712240} +{"current_steps": 81370, "total_steps": 89790, "loss": 0.4533, "lr": 1.3277427367371141e-06, "epoch": 9.062256375988417, "percentage": 90.62, "elapsed_time": "6:23:36", "remaining_time": "0:39:41", "throughput": 4288.95, "total_tokens": 98718576} +{"current_steps": 81375, "total_steps": 89790, "loss": 0.471, "lr": 1.3261805865185745e-06, "epoch": 9.062813230872035, "percentage": 90.63, "elapsed_time": "6:23:38", "remaining_time": "0:39:40", "throughput": 4288.98, "total_tokens": 98724816} +{"current_steps": 81380, "total_steps": 89790, "loss": 0.4508, "lr": 1.3246193307728028e-06, "epoch": 9.063370085755652, "percentage": 90.63, "elapsed_time": "6:23:39", "remaining_time": "0:39:38", "throughput": 4289.0, "total_tokens": 98730992} +{"current_steps": 81385, "total_steps": 89790, "loss": 0.4578, "lr": 1.3230589695587853e-06, "epoch": 9.06392694063927, "percentage": 90.64, "elapsed_time": "6:23:40", "remaining_time": "0:39:37", "throughput": 4289.03, "total_tokens": 98737232} +{"current_steps": 81390, "total_steps": 89790, "loss": 0.4503, "lr": 1.321499502935475e-06, "epoch": 9.064483795522886, "percentage": 90.64, "elapsed_time": "6:23:42", "remaining_time": "0:39:36", "throughput": 4289.05, "total_tokens": 98743056} +{"current_steps": 81395, "total_steps": 89790, "loss": 0.4576, "lr": 1.3199409309617967e-06, "epoch": 9.065040650406504, "percentage": 90.65, "elapsed_time": "6:23:43", "remaining_time": "0:39:34", "throughput": 4289.07, "total_tokens": 98749296} +{"current_steps": 81400, "total_steps": 89790, "loss": 0.4579, "lr": 1.3183832536966339e-06, "epoch": 9.065597505290121, "percentage": 90.66, "elapsed_time": "6:23:44", "remaining_time": "0:39:33", "throughput": 4289.1, "total_tokens": 98755344} +{"current_steps": 81405, "total_steps": 89790, "loss": 0.4634, "lr": 1.3168264711988455e-06, "epoch": 9.066154360173739, "percentage": 90.66, "elapsed_time": "6:23:46", "remaining_time": "0:39:31", "throughput": 4289.13, "total_tokens": 98761680} +{"current_steps": 81410, "total_steps": 89790, "loss": 0.4691, "lr": 1.3152705835272478e-06, "epoch": 9.066711215057357, "percentage": 90.67, "elapsed_time": "6:23:47", "remaining_time": "0:39:30", "throughput": 4289.15, "total_tokens": 98767856} +{"current_steps": 81415, "total_steps": 89790, "loss": 0.4635, "lr": 1.3137155907406274e-06, "epoch": 9.067268069940974, "percentage": 90.67, "elapsed_time": "6:23:48", "remaining_time": "0:39:28", "throughput": 4289.18, "total_tokens": 98774128} +{"current_steps": 81420, "total_steps": 89790, "loss": 0.4686, "lr": 1.3121614928977427e-06, "epoch": 9.06782492482459, "percentage": 90.68, "elapsed_time": "6:23:49", "remaining_time": "0:39:27", "throughput": 4289.2, "total_tokens": 98779920} +{"current_steps": 81425, "total_steps": 89790, "loss": 0.4574, "lr": 1.3106082900573052e-06, "epoch": 9.068381779708208, "percentage": 90.68, "elapsed_time": "6:23:51", "remaining_time": "0:39:26", "throughput": 4289.22, "total_tokens": 98785968} +{"current_steps": 81430, "total_steps": 89790, "loss": 0.4628, "lr": 1.3090559822780041e-06, "epoch": 9.068938634591825, "percentage": 90.69, "elapsed_time": "6:23:52", "remaining_time": "0:39:24", "throughput": 4289.25, "total_tokens": 98792240} +{"current_steps": 81435, "total_steps": 89790, "loss": 0.4741, "lr": 1.3075045696184869e-06, "epoch": 9.069495489475443, "percentage": 90.69, "elapsed_time": "6:23:53", "remaining_time": "0:39:23", "throughput": 4289.27, "total_tokens": 98797968} +{"current_steps": 81440, "total_steps": 89790, "loss": 0.4598, "lr": 1.3059540521373759e-06, "epoch": 9.07005234435906, "percentage": 90.7, "elapsed_time": "6:23:55", "remaining_time": "0:39:21", "throughput": 4289.29, "total_tokens": 98804112} +{"current_steps": 81445, "total_steps": 89790, "loss": 0.4493, "lr": 1.3044044298932524e-06, "epoch": 9.070609199242677, "percentage": 90.71, "elapsed_time": "6:23:56", "remaining_time": "0:39:20", "throughput": 4289.31, "total_tokens": 98810192} +{"current_steps": 81450, "total_steps": 89790, "loss": 0.4539, "lr": 1.3028557029446635e-06, "epoch": 9.071166054126294, "percentage": 90.71, "elapsed_time": "6:23:57", "remaining_time": "0:39:18", "throughput": 4289.34, "total_tokens": 98815792} +{"current_steps": 81455, "total_steps": 89790, "loss": 0.4642, "lr": 1.3013078713501325e-06, "epoch": 9.071722909009912, "percentage": 90.72, "elapsed_time": "6:23:58", "remaining_time": "0:39:17", "throughput": 4289.36, "total_tokens": 98822096} +{"current_steps": 81460, "total_steps": 89790, "loss": 0.4748, "lr": 1.299760935168129e-06, "epoch": 9.07227976389353, "percentage": 90.72, "elapsed_time": "6:24:00", "remaining_time": "0:39:16", "throughput": 4289.38, "total_tokens": 98827984} +{"current_steps": 81465, "total_steps": 89790, "loss": 0.4696, "lr": 1.2982148944571144e-06, "epoch": 9.072836618777147, "percentage": 90.73, "elapsed_time": "6:24:01", "remaining_time": "0:39:14", "throughput": 4289.41, "total_tokens": 98834224} +{"current_steps": 81470, "total_steps": 89790, "loss": 0.4558, "lr": 1.2966697492754948e-06, "epoch": 9.073393473660763, "percentage": 90.73, "elapsed_time": "6:24:02", "remaining_time": "0:39:13", "throughput": 4289.43, "total_tokens": 98840368} +{"current_steps": 81475, "total_steps": 89790, "loss": 0.4546, "lr": 1.2951254996816514e-06, "epoch": 9.073950328544381, "percentage": 90.74, "elapsed_time": "6:24:04", "remaining_time": "0:39:11", "throughput": 4289.46, "total_tokens": 98846736} +{"current_steps": 81480, "total_steps": 89790, "loss": 0.4657, "lr": 1.2935821457339374e-06, "epoch": 9.074507183427999, "percentage": 90.75, "elapsed_time": "6:24:05", "remaining_time": "0:39:10", "throughput": 4289.48, "total_tokens": 98852752} +{"current_steps": 81485, "total_steps": 89790, "loss": 0.464, "lr": 1.2920396874906565e-06, "epoch": 9.075064038311616, "percentage": 90.75, "elapsed_time": "6:24:06", "remaining_time": "0:39:08", "throughput": 4289.51, "total_tokens": 98858992} +{"current_steps": 81490, "total_steps": 89790, "loss": 0.4557, "lr": 1.290498125010095e-06, "epoch": 9.075620893195234, "percentage": 90.76, "elapsed_time": "6:24:07", "remaining_time": "0:39:07", "throughput": 4289.53, "total_tokens": 98864976} +{"current_steps": 81495, "total_steps": 89790, "loss": 0.4456, "lr": 1.2889574583504926e-06, "epoch": 9.07617774807885, "percentage": 90.76, "elapsed_time": "6:24:09", "remaining_time": "0:39:06", "throughput": 4289.55, "total_tokens": 98870864} +{"current_steps": 81500, "total_steps": 89790, "loss": 0.4647, "lr": 1.2874176875700666e-06, "epoch": 9.076734602962468, "percentage": 90.77, "elapsed_time": "6:24:10", "remaining_time": "0:39:04", "throughput": 4289.58, "total_tokens": 98877008} +{"current_steps": 81505, "total_steps": 89790, "loss": 0.4544, "lr": 1.2858788127269873e-06, "epoch": 9.077291457846085, "percentage": 90.77, "elapsed_time": "6:24:11", "remaining_time": "0:39:03", "throughput": 4289.6, "total_tokens": 98883024} +{"current_steps": 81510, "total_steps": 89790, "loss": 0.4546, "lr": 1.2843408338794022e-06, "epoch": 9.077848312729703, "percentage": 90.78, "elapsed_time": "6:24:13", "remaining_time": "0:39:01", "throughput": 4289.63, "total_tokens": 98889552} +{"current_steps": 81515, "total_steps": 89790, "loss": 0.4495, "lr": 1.2828037510854235e-06, "epoch": 9.07840516761332, "percentage": 90.78, "elapsed_time": "6:24:14", "remaining_time": "0:39:00", "throughput": 4289.65, "total_tokens": 98895472} +{"current_steps": 81520, "total_steps": 89790, "loss": 0.4663, "lr": 1.2812675644031214e-06, "epoch": 9.078962022496937, "percentage": 90.79, "elapsed_time": "6:24:15", "remaining_time": "0:38:58", "throughput": 4289.68, "total_tokens": 98901936} +{"current_steps": 81525, "total_steps": 89790, "loss": 0.4633, "lr": 1.2797322738905466e-06, "epoch": 9.079518877380554, "percentage": 90.8, "elapsed_time": "6:24:16", "remaining_time": "0:38:57", "throughput": 4289.7, "total_tokens": 98907376} +{"current_steps": 81530, "total_steps": 89790, "loss": 0.4564, "lr": 1.2781978796056998e-06, "epoch": 9.080075732264172, "percentage": 90.8, "elapsed_time": "6:24:18", "remaining_time": "0:38:56", "throughput": 4289.73, "total_tokens": 98913424} +{"current_steps": 81535, "total_steps": 89790, "loss": 0.4624, "lr": 1.2766643816065544e-06, "epoch": 9.08063258714779, "percentage": 90.81, "elapsed_time": "6:24:19", "remaining_time": "0:38:54", "throughput": 4289.75, "total_tokens": 98919536} +{"current_steps": 81540, "total_steps": 89790, "loss": 0.463, "lr": 1.2751317799510582e-06, "epoch": 9.081189442031407, "percentage": 90.81, "elapsed_time": "6:24:20", "remaining_time": "0:38:53", "throughput": 4289.78, "total_tokens": 98925712} +{"current_steps": 81545, "total_steps": 89790, "loss": 0.4647, "lr": 1.2736000746971067e-06, "epoch": 9.081746296915023, "percentage": 90.82, "elapsed_time": "6:24:22", "remaining_time": "0:38:51", "throughput": 4289.8, "total_tokens": 98931920} +{"current_steps": 81550, "total_steps": 89790, "loss": 0.4441, "lr": 1.2720692659025867e-06, "epoch": 9.08230315179864, "percentage": 90.82, "elapsed_time": "6:24:23", "remaining_time": "0:38:50", "throughput": 4289.81, "total_tokens": 98937072} +{"current_steps": 81555, "total_steps": 89790, "loss": 0.47, "lr": 1.2705393536253247e-06, "epoch": 9.082860006682258, "percentage": 90.83, "elapsed_time": "6:24:24", "remaining_time": "0:38:48", "throughput": 4289.84, "total_tokens": 98943280} +{"current_steps": 81560, "total_steps": 89790, "loss": 0.4556, "lr": 1.2690103379231295e-06, "epoch": 9.083416861565876, "percentage": 90.83, "elapsed_time": "6:24:25", "remaining_time": "0:38:47", "throughput": 4289.86, "total_tokens": 98949392} +{"current_steps": 81565, "total_steps": 89790, "loss": 0.4489, "lr": 1.26748221885378e-06, "epoch": 9.083973716449494, "percentage": 90.84, "elapsed_time": "6:24:27", "remaining_time": "0:38:46", "throughput": 4289.89, "total_tokens": 98955312} +{"current_steps": 81570, "total_steps": 89790, "loss": 0.4651, "lr": 1.2659549964750024e-06, "epoch": 9.084530571333111, "percentage": 90.85, "elapsed_time": "6:24:28", "remaining_time": "0:38:44", "throughput": 4289.91, "total_tokens": 98961520} +{"current_steps": 81575, "total_steps": 89790, "loss": 0.4655, "lr": 1.2644286708445058e-06, "epoch": 9.085087426216727, "percentage": 90.85, "elapsed_time": "6:24:29", "remaining_time": "0:38:43", "throughput": 4289.94, "total_tokens": 98967792} +{"current_steps": 81580, "total_steps": 89790, "loss": 0.4744, "lr": 1.2629032420199554e-06, "epoch": 9.085644281100345, "percentage": 90.86, "elapsed_time": "6:24:31", "remaining_time": "0:38:41", "throughput": 4289.96, "total_tokens": 98973904} +{"current_steps": 81585, "total_steps": 89790, "loss": 0.4635, "lr": 1.2613787100589941e-06, "epoch": 9.086201135983963, "percentage": 90.86, "elapsed_time": "6:24:32", "remaining_time": "0:38:40", "throughput": 4289.99, "total_tokens": 98979824} +{"current_steps": 81590, "total_steps": 89790, "loss": 0.4534, "lr": 1.2598550750192173e-06, "epoch": 9.08675799086758, "percentage": 90.87, "elapsed_time": "6:24:33", "remaining_time": "0:38:38", "throughput": 4290.01, "total_tokens": 98985904} +{"current_steps": 81595, "total_steps": 89790, "loss": 0.4574, "lr": 1.2583323369581928e-06, "epoch": 9.087314845751198, "percentage": 90.87, "elapsed_time": "6:24:34", "remaining_time": "0:38:37", "throughput": 4290.04, "total_tokens": 98992048} +{"current_steps": 81600, "total_steps": 89790, "loss": 0.4622, "lr": 1.2568104959334608e-06, "epoch": 9.087871700634814, "percentage": 90.88, "elapsed_time": "6:24:36", "remaining_time": "0:38:36", "throughput": 4290.06, "total_tokens": 98998128} +{"current_steps": 81605, "total_steps": 89790, "loss": 0.4573, "lr": 1.2552895520025115e-06, "epoch": 9.088428555518432, "percentage": 90.88, "elapsed_time": "6:24:37", "remaining_time": "0:38:34", "throughput": 4290.08, "total_tokens": 99003984} +{"current_steps": 81610, "total_steps": 89790, "loss": 0.4553, "lr": 1.2537695052228239e-06, "epoch": 9.08898541040205, "percentage": 90.89, "elapsed_time": "6:24:38", "remaining_time": "0:38:33", "throughput": 4290.1, "total_tokens": 99010000} +{"current_steps": 81615, "total_steps": 89790, "loss": 0.4713, "lr": 1.2522503556518156e-06, "epoch": 9.089542265285667, "percentage": 90.9, "elapsed_time": "6:24:40", "remaining_time": "0:38:31", "throughput": 4290.13, "total_tokens": 99016304} +{"current_steps": 81620, "total_steps": 89790, "loss": 0.4575, "lr": 1.250732103346894e-06, "epoch": 9.090099120169285, "percentage": 90.9, "elapsed_time": "6:24:41", "remaining_time": "0:38:30", "throughput": 4290.16, "total_tokens": 99022384} +{"current_steps": 81625, "total_steps": 89790, "loss": 0.4661, "lr": 1.2492147483654265e-06, "epoch": 9.0906559750529, "percentage": 90.91, "elapsed_time": "6:24:42", "remaining_time": "0:38:28", "throughput": 4290.18, "total_tokens": 99028528} +{"current_steps": 81630, "total_steps": 89790, "loss": 0.4531, "lr": 1.2476982907647345e-06, "epoch": 9.091212829936518, "percentage": 90.91, "elapsed_time": "6:24:43", "remaining_time": "0:38:27", "throughput": 4290.2, "total_tokens": 99034320} +{"current_steps": 81635, "total_steps": 89790, "loss": 0.4598, "lr": 1.2461827306021217e-06, "epoch": 9.091769684820136, "percentage": 90.92, "elapsed_time": "6:24:45", "remaining_time": "0:38:26", "throughput": 4290.23, "total_tokens": 99040656} +{"current_steps": 81640, "total_steps": 89790, "loss": 0.4494, "lr": 1.2446680679348455e-06, "epoch": 9.092326539703754, "percentage": 90.92, "elapsed_time": "6:24:46", "remaining_time": "0:38:24", "throughput": 4290.26, "total_tokens": 99046480} +{"current_steps": 81645, "total_steps": 89790, "loss": 0.4567, "lr": 1.2431543028201403e-06, "epoch": 9.092883394587371, "percentage": 90.93, "elapsed_time": "6:24:47", "remaining_time": "0:38:23", "throughput": 4290.28, "total_tokens": 99052496} +{"current_steps": 81650, "total_steps": 89790, "loss": 0.4494, "lr": 1.2416414353151968e-06, "epoch": 9.093440249470987, "percentage": 90.93, "elapsed_time": "6:24:48", "remaining_time": "0:38:21", "throughput": 4290.3, "total_tokens": 99058512} +{"current_steps": 81655, "total_steps": 89790, "loss": 0.4673, "lr": 1.2401294654771744e-06, "epoch": 9.093997104354605, "percentage": 90.94, "elapsed_time": "6:24:50", "remaining_time": "0:38:20", "throughput": 4290.33, "total_tokens": 99064720} +{"current_steps": 81660, "total_steps": 89790, "loss": 0.4629, "lr": 1.2386183933632084e-06, "epoch": 9.094553959238223, "percentage": 90.95, "elapsed_time": "6:24:51", "remaining_time": "0:38:18", "throughput": 4290.35, "total_tokens": 99070736} +{"current_steps": 81665, "total_steps": 89790, "loss": 0.4616, "lr": 1.2371082190303806e-06, "epoch": 9.09511081412184, "percentage": 90.95, "elapsed_time": "6:24:52", "remaining_time": "0:38:17", "throughput": 4290.37, "total_tokens": 99076752} +{"current_steps": 81670, "total_steps": 89790, "loss": 0.4642, "lr": 1.2355989425357622e-06, "epoch": 9.095667669005458, "percentage": 90.96, "elapsed_time": "6:24:54", "remaining_time": "0:38:16", "throughput": 4290.39, "total_tokens": 99082608} +{"current_steps": 81675, "total_steps": 89790, "loss": 0.4664, "lr": 1.2340905639363686e-06, "epoch": 9.096224523889074, "percentage": 90.96, "elapsed_time": "6:24:55", "remaining_time": "0:38:14", "throughput": 4290.41, "total_tokens": 99087984} +{"current_steps": 81680, "total_steps": 89790, "loss": 0.4633, "lr": 1.2325830832891989e-06, "epoch": 9.096781378772691, "percentage": 90.97, "elapsed_time": "6:24:56", "remaining_time": "0:38:13", "throughput": 4290.43, "total_tokens": 99093808} +{"current_steps": 81685, "total_steps": 89790, "loss": 0.4527, "lr": 1.2310765006512015e-06, "epoch": 9.09733823365631, "percentage": 90.97, "elapsed_time": "6:24:57", "remaining_time": "0:38:11", "throughput": 4290.46, "total_tokens": 99100048} +{"current_steps": 81690, "total_steps": 89790, "loss": 0.4572, "lr": 1.2295708160793063e-06, "epoch": 9.097895088539927, "percentage": 90.98, "elapsed_time": "6:24:58", "remaining_time": "0:38:10", "throughput": 4290.48, "total_tokens": 99105392} +{"current_steps": 81695, "total_steps": 89790, "loss": 0.4543, "lr": 1.2280660296304064e-06, "epoch": 9.098451943423544, "percentage": 90.98, "elapsed_time": "6:25:00", "remaining_time": "0:38:08", "throughput": 4290.5, "total_tokens": 99111312} +{"current_steps": 81700, "total_steps": 89790, "loss": 0.4565, "lr": 1.226562141361348e-06, "epoch": 9.09900879830716, "percentage": 90.99, "elapsed_time": "6:25:01", "remaining_time": "0:38:07", "throughput": 4290.53, "total_tokens": 99117584} +{"current_steps": 81705, "total_steps": 89790, "loss": 0.4511, "lr": 1.225059151328961e-06, "epoch": 9.099565653190778, "percentage": 91.0, "elapsed_time": "6:25:02", "remaining_time": "0:38:06", "throughput": 4290.55, "total_tokens": 99123376} +{"current_steps": 81710, "total_steps": 89790, "loss": 0.4611, "lr": 1.2235570595900247e-06, "epoch": 9.100122508074396, "percentage": 91.0, "elapsed_time": "6:25:04", "remaining_time": "0:38:04", "throughput": 4290.58, "total_tokens": 99129520} +{"current_steps": 81715, "total_steps": 89790, "loss": 0.4578, "lr": 1.2220558662013022e-06, "epoch": 9.100679362958013, "percentage": 91.01, "elapsed_time": "6:25:05", "remaining_time": "0:38:03", "throughput": 4290.6, "total_tokens": 99135664} +{"current_steps": 81720, "total_steps": 89790, "loss": 0.4635, "lr": 1.220555571219509e-06, "epoch": 9.101236217841631, "percentage": 91.01, "elapsed_time": "6:25:06", "remaining_time": "0:38:01", "throughput": 4290.62, "total_tokens": 99141584} +{"current_steps": 81725, "total_steps": 89790, "loss": 0.4612, "lr": 1.21905617470133e-06, "epoch": 9.101793072725247, "percentage": 91.02, "elapsed_time": "6:25:07", "remaining_time": "0:38:00", "throughput": 4290.65, "total_tokens": 99147568} +{"current_steps": 81730, "total_steps": 89790, "loss": 0.4658, "lr": 1.2175576767034208e-06, "epoch": 9.102349927608865, "percentage": 91.02, "elapsed_time": "6:25:09", "remaining_time": "0:37:58", "throughput": 4290.68, "total_tokens": 99153872} +{"current_steps": 81735, "total_steps": 89790, "loss": 0.4639, "lr": 1.2160600772823938e-06, "epoch": 9.102906782492482, "percentage": 91.03, "elapsed_time": "6:25:10", "remaining_time": "0:37:57", "throughput": 4290.7, "total_tokens": 99160144} +{"current_steps": 81740, "total_steps": 89790, "loss": 0.4522, "lr": 1.21456337649484e-06, "epoch": 9.1034636373761, "percentage": 91.03, "elapsed_time": "6:25:11", "remaining_time": "0:37:56", "throughput": 4290.72, "total_tokens": 99166000} +{"current_steps": 81745, "total_steps": 89790, "loss": 0.4571, "lr": 1.213067574397303e-06, "epoch": 9.104020492259718, "percentage": 91.04, "elapsed_time": "6:25:13", "remaining_time": "0:37:54", "throughput": 4290.75, "total_tokens": 99172144} +{"current_steps": 81750, "total_steps": 89790, "loss": 0.4602, "lr": 1.2115726710463016e-06, "epoch": 9.104577347143334, "percentage": 91.05, "elapsed_time": "6:25:14", "remaining_time": "0:37:53", "throughput": 4290.77, "total_tokens": 99177712} +{"current_steps": 81755, "total_steps": 89790, "loss": 0.4725, "lr": 1.210078666498321e-06, "epoch": 9.105134202026951, "percentage": 91.05, "elapsed_time": "6:25:15", "remaining_time": "0:37:51", "throughput": 4290.79, "total_tokens": 99183760} +{"current_steps": 81760, "total_steps": 89790, "loss": 0.4547, "lr": 1.208585560809805e-06, "epoch": 9.105691056910569, "percentage": 91.06, "elapsed_time": "6:25:16", "remaining_time": "0:37:50", "throughput": 4290.81, "total_tokens": 99189616} +{"current_steps": 81765, "total_steps": 89790, "loss": 0.4526, "lr": 1.2070933540371726e-06, "epoch": 9.106247911794187, "percentage": 91.06, "elapsed_time": "6:25:18", "remaining_time": "0:37:48", "throughput": 4290.84, "total_tokens": 99195920} +{"current_steps": 81770, "total_steps": 89790, "loss": 0.4671, "lr": 1.2056020462367978e-06, "epoch": 9.106804766677804, "percentage": 91.07, "elapsed_time": "6:25:19", "remaining_time": "0:37:47", "throughput": 4290.86, "total_tokens": 99202192} +{"current_steps": 81775, "total_steps": 89790, "loss": 0.4608, "lr": 1.2041116374650357e-06, "epoch": 9.107361621561422, "percentage": 91.07, "elapsed_time": "6:25:20", "remaining_time": "0:37:46", "throughput": 4290.88, "total_tokens": 99207760} +{"current_steps": 81780, "total_steps": 89790, "loss": 0.4633, "lr": 1.2026221277781885e-06, "epoch": 9.107918476445038, "percentage": 91.08, "elapsed_time": "6:25:21", "remaining_time": "0:37:44", "throughput": 4290.9, "total_tokens": 99213072} +{"current_steps": 81785, "total_steps": 89790, "loss": 0.4684, "lr": 1.2011335172325389e-06, "epoch": 9.108475331328655, "percentage": 91.08, "elapsed_time": "6:25:23", "remaining_time": "0:37:43", "throughput": 4290.93, "total_tokens": 99219344} +{"current_steps": 81790, "total_steps": 89790, "loss": 0.458, "lr": 1.199645805884339e-06, "epoch": 9.109032186212273, "percentage": 91.09, "elapsed_time": "6:25:24", "remaining_time": "0:37:41", "throughput": 4290.95, "total_tokens": 99225776} +{"current_steps": 81795, "total_steps": 89790, "loss": 0.4595, "lr": 1.1981589937897858e-06, "epoch": 9.10958904109589, "percentage": 91.1, "elapsed_time": "6:25:25", "remaining_time": "0:37:40", "throughput": 4290.97, "total_tokens": 99231728} +{"current_steps": 81800, "total_steps": 89790, "loss": 0.4613, "lr": 1.1966730810050676e-06, "epoch": 9.110145895979509, "percentage": 91.1, "elapsed_time": "6:25:26", "remaining_time": "0:37:38", "throughput": 4291.0, "total_tokens": 99237808} +{"current_steps": 81805, "total_steps": 89790, "loss": 0.4669, "lr": 1.1951880675863169e-06, "epoch": 9.110702750863124, "percentage": 91.11, "elapsed_time": "6:25:28", "remaining_time": "0:37:37", "throughput": 4291.02, "total_tokens": 99244144} +{"current_steps": 81810, "total_steps": 89790, "loss": 0.46, "lr": 1.1937039535896532e-06, "epoch": 9.111259605746742, "percentage": 91.11, "elapsed_time": "6:25:29", "remaining_time": "0:37:36", "throughput": 4291.05, "total_tokens": 99250288} +{"current_steps": 81815, "total_steps": 89790, "loss": 0.4548, "lr": 1.19222073907114e-06, "epoch": 9.11181646063036, "percentage": 91.12, "elapsed_time": "6:25:30", "remaining_time": "0:37:34", "throughput": 4291.08, "total_tokens": 99256784} +{"current_steps": 81820, "total_steps": 89790, "loss": 0.467, "lr": 1.1907384240868236e-06, "epoch": 9.112373315513977, "percentage": 91.12, "elapsed_time": "6:25:32", "remaining_time": "0:37:33", "throughput": 4291.1, "total_tokens": 99262928} +{"current_steps": 81825, "total_steps": 89790, "loss": 0.4612, "lr": 1.1892570086927123e-06, "epoch": 9.112930170397595, "percentage": 91.13, "elapsed_time": "6:25:33", "remaining_time": "0:37:31", "throughput": 4291.12, "total_tokens": 99268304} +{"current_steps": 81830, "total_steps": 89790, "loss": 0.47, "lr": 1.1877764929447754e-06, "epoch": 9.113487025281211, "percentage": 91.13, "elapsed_time": "6:25:34", "remaining_time": "0:37:30", "throughput": 4291.14, "total_tokens": 99274512} +{"current_steps": 81835, "total_steps": 89790, "loss": 0.4602, "lr": 1.186296876898954e-06, "epoch": 9.114043880164829, "percentage": 91.14, "elapsed_time": "6:25:36", "remaining_time": "0:37:29", "throughput": 4291.17, "total_tokens": 99280528} +{"current_steps": 81840, "total_steps": 89790, "loss": 0.4684, "lr": 1.1848181606111481e-06, "epoch": 9.114600735048446, "percentage": 91.15, "elapsed_time": "6:25:37", "remaining_time": "0:37:27", "throughput": 4291.19, "total_tokens": 99286576} +{"current_steps": 81845, "total_steps": 89790, "loss": 0.4615, "lr": 1.183340344137232e-06, "epoch": 9.115157589932064, "percentage": 91.15, "elapsed_time": "6:25:38", "remaining_time": "0:37:26", "throughput": 4291.21, "total_tokens": 99292496} +{"current_steps": 81850, "total_steps": 89790, "loss": 0.4492, "lr": 1.1818634275330449e-06, "epoch": 9.115714444815682, "percentage": 91.16, "elapsed_time": "6:25:39", "remaining_time": "0:37:24", "throughput": 4291.24, "total_tokens": 99298608} +{"current_steps": 81855, "total_steps": 89790, "loss": 0.4764, "lr": 1.1803874108543833e-06, "epoch": 9.116271299699298, "percentage": 91.16, "elapsed_time": "6:25:41", "remaining_time": "0:37:23", "throughput": 4291.26, "total_tokens": 99304656} +{"current_steps": 81860, "total_steps": 89790, "loss": 0.449, "lr": 1.1789122941570253e-06, "epoch": 9.116828154582915, "percentage": 91.17, "elapsed_time": "6:25:42", "remaining_time": "0:37:21", "throughput": 4291.28, "total_tokens": 99310832} +{"current_steps": 81865, "total_steps": 89790, "loss": 0.4626, "lr": 1.1774380774966926e-06, "epoch": 9.117385009466533, "percentage": 91.17, "elapsed_time": "6:25:43", "remaining_time": "0:37:20", "throughput": 4291.31, "total_tokens": 99316784} +{"current_steps": 81870, "total_steps": 89790, "loss": 0.453, "lr": 1.1759647609290964e-06, "epoch": 9.11794186435015, "percentage": 91.18, "elapsed_time": "6:25:45", "remaining_time": "0:37:19", "throughput": 4291.33, "total_tokens": 99323152} +{"current_steps": 81875, "total_steps": 89790, "loss": 0.4572, "lr": 1.1744923445098949e-06, "epoch": 9.118498719233768, "percentage": 91.18, "elapsed_time": "6:25:46", "remaining_time": "0:37:17", "throughput": 4291.36, "total_tokens": 99329392} +{"current_steps": 81880, "total_steps": 89790, "loss": 0.4695, "lr": 1.173020828294727e-06, "epoch": 9.119055574117384, "percentage": 91.19, "elapsed_time": "6:25:47", "remaining_time": "0:37:16", "throughput": 4291.39, "total_tokens": 99335536} +{"current_steps": 81885, "total_steps": 89790, "loss": 0.4658, "lr": 1.1715502123391924e-06, "epoch": 9.119612429001002, "percentage": 91.2, "elapsed_time": "6:25:48", "remaining_time": "0:37:14", "throughput": 4291.41, "total_tokens": 99341552} +{"current_steps": 81890, "total_steps": 89790, "loss": 0.4629, "lr": 1.1700804966988498e-06, "epoch": 9.12016928388462, "percentage": 91.2, "elapsed_time": "6:25:50", "remaining_time": "0:37:13", "throughput": 4291.43, "total_tokens": 99347728} +{"current_steps": 81895, "total_steps": 89790, "loss": 0.4593, "lr": 1.1686116814292353e-06, "epoch": 9.120726138768237, "percentage": 91.21, "elapsed_time": "6:25:51", "remaining_time": "0:37:11", "throughput": 4291.46, "total_tokens": 99354032} +{"current_steps": 81900, "total_steps": 89790, "loss": 0.4598, "lr": 1.1671437665858403e-06, "epoch": 9.121282993651855, "percentage": 91.21, "elapsed_time": "6:25:52", "remaining_time": "0:37:10", "throughput": 4291.48, "total_tokens": 99360368} +{"current_steps": 81905, "total_steps": 89790, "loss": 0.4587, "lr": 1.1656767522241318e-06, "epoch": 9.12183984853547, "percentage": 91.22, "elapsed_time": "6:25:54", "remaining_time": "0:37:09", "throughput": 4291.51, "total_tokens": 99366608} +{"current_steps": 81910, "total_steps": 89790, "loss": 0.4563, "lr": 1.164210638399535e-06, "epoch": 9.122396703419088, "percentage": 91.22, "elapsed_time": "6:25:55", "remaining_time": "0:37:07", "throughput": 4291.54, "total_tokens": 99372848} +{"current_steps": 81915, "total_steps": 89790, "loss": 0.465, "lr": 1.162745425167444e-06, "epoch": 9.122953558302706, "percentage": 91.23, "elapsed_time": "6:25:56", "remaining_time": "0:37:06", "throughput": 4291.56, "total_tokens": 99378992} +{"current_steps": 81920, "total_steps": 89790, "loss": 0.4639, "lr": 1.1612811125832263e-06, "epoch": 9.123510413186324, "percentage": 91.24, "elapsed_time": "6:25:58", "remaining_time": "0:37:04", "throughput": 4291.58, "total_tokens": 99385008} +{"current_steps": 81925, "total_steps": 89790, "loss": 0.4629, "lr": 1.1598177007021983e-06, "epoch": 9.124067268069942, "percentage": 91.24, "elapsed_time": "6:25:59", "remaining_time": "0:37:03", "throughput": 4291.6, "total_tokens": 99390992} +{"current_steps": 81930, "total_steps": 89790, "loss": 0.4512, "lr": 1.158355189579663e-06, "epoch": 9.12462412295356, "percentage": 91.25, "elapsed_time": "6:26:00", "remaining_time": "0:37:01", "throughput": 4291.63, "total_tokens": 99396816} +{"current_steps": 81935, "total_steps": 89790, "loss": 0.4621, "lr": 1.156893579270868e-06, "epoch": 9.125180977837175, "percentage": 91.25, "elapsed_time": "6:26:01", "remaining_time": "0:37:00", "throughput": 4291.65, "total_tokens": 99402960} +{"current_steps": 81940, "total_steps": 89790, "loss": 0.4667, "lr": 1.1554328698310413e-06, "epoch": 9.125737832720793, "percentage": 91.26, "elapsed_time": "6:26:03", "remaining_time": "0:36:59", "throughput": 4291.67, "total_tokens": 99408944} +{"current_steps": 81945, "total_steps": 89790, "loss": 0.4492, "lr": 1.1539730613153803e-06, "epoch": 9.12629468760441, "percentage": 91.26, "elapsed_time": "6:26:04", "remaining_time": "0:36:57", "throughput": 4291.7, "total_tokens": 99415184} +{"current_steps": 81950, "total_steps": 89790, "loss": 0.4696, "lr": 1.152514153779033e-06, "epoch": 9.126851542488028, "percentage": 91.27, "elapsed_time": "6:26:05", "remaining_time": "0:36:56", "throughput": 4291.72, "total_tokens": 99421520} +{"current_steps": 81955, "total_steps": 89790, "loss": 0.4531, "lr": 1.1510561472771241e-06, "epoch": 9.127408397371646, "percentage": 91.27, "elapsed_time": "6:26:07", "remaining_time": "0:36:54", "throughput": 4291.75, "total_tokens": 99427696} +{"current_steps": 81960, "total_steps": 89790, "loss": 0.4509, "lr": 1.1495990418647378e-06, "epoch": 9.127965252255262, "percentage": 91.28, "elapsed_time": "6:26:08", "remaining_time": "0:36:53", "throughput": 4291.77, "total_tokens": 99433712} +{"current_steps": 81965, "total_steps": 89790, "loss": 0.4636, "lr": 1.1481428375969356e-06, "epoch": 9.12852210713888, "percentage": 91.29, "elapsed_time": "6:26:09", "remaining_time": "0:36:51", "throughput": 4291.8, "total_tokens": 99440208} +{"current_steps": 81970, "total_steps": 89790, "loss": 0.4444, "lr": 1.1466875345287343e-06, "epoch": 9.129078962022497, "percentage": 91.29, "elapsed_time": "6:26:11", "remaining_time": "0:36:50", "throughput": 4291.82, "total_tokens": 99446192} +{"current_steps": 81975, "total_steps": 89790, "loss": 0.4675, "lr": 1.1452331327151177e-06, "epoch": 9.129635816906115, "percentage": 91.3, "elapsed_time": "6:26:12", "remaining_time": "0:36:49", "throughput": 4291.85, "total_tokens": 99452624} +{"current_steps": 81980, "total_steps": 89790, "loss": 0.46, "lr": 1.1437796322110423e-06, "epoch": 9.130192671789732, "percentage": 91.3, "elapsed_time": "6:26:13", "remaining_time": "0:36:47", "throughput": 4291.87, "total_tokens": 99458480} +{"current_steps": 81985, "total_steps": 89790, "loss": 0.4595, "lr": 1.1423270330714192e-06, "epoch": 9.130749526673348, "percentage": 91.31, "elapsed_time": "6:26:14", "remaining_time": "0:36:46", "throughput": 4291.89, "total_tokens": 99464496} +{"current_steps": 81990, "total_steps": 89790, "loss": 0.4569, "lr": 1.1408753353511408e-06, "epoch": 9.131306381556966, "percentage": 91.31, "elapsed_time": "6:26:16", "remaining_time": "0:36:44", "throughput": 4291.92, "total_tokens": 99470480} +{"current_steps": 81995, "total_steps": 89790, "loss": 0.4741, "lr": 1.1394245391050495e-06, "epoch": 9.131863236440584, "percentage": 91.32, "elapsed_time": "6:26:17", "remaining_time": "0:36:43", "throughput": 4291.94, "total_tokens": 99476688} +{"current_steps": 82000, "total_steps": 89790, "loss": 0.4736, "lr": 1.1379746443879623e-06, "epoch": 9.132420091324201, "percentage": 91.32, "elapsed_time": "6:26:18", "remaining_time": "0:36:41", "throughput": 4291.96, "total_tokens": 99482576} +{"current_steps": 82005, "total_steps": 89790, "loss": 0.4633, "lr": 1.136525651254669e-06, "epoch": 9.132976946207819, "percentage": 91.33, "elapsed_time": "6:26:20", "remaining_time": "0:36:40", "throughput": 4291.98, "total_tokens": 99488208} +{"current_steps": 82010, "total_steps": 89790, "loss": 0.4436, "lr": 1.1350775597599062e-06, "epoch": 9.133533801091435, "percentage": 91.34, "elapsed_time": "6:26:21", "remaining_time": "0:36:39", "throughput": 4292.01, "total_tokens": 99494192} +{"current_steps": 82015, "total_steps": 89790, "loss": 0.4521, "lr": 1.1336303699583938e-06, "epoch": 9.134090655975053, "percentage": 91.34, "elapsed_time": "6:26:22", "remaining_time": "0:36:37", "throughput": 4292.03, "total_tokens": 99500048} +{"current_steps": 82020, "total_steps": 89790, "loss": 0.4427, "lr": 1.132184081904808e-06, "epoch": 9.13464751085867, "percentage": 91.35, "elapsed_time": "6:26:23", "remaining_time": "0:36:36", "throughput": 4292.06, "total_tokens": 99506320} +{"current_steps": 82025, "total_steps": 89790, "loss": 0.4528, "lr": 1.1307386956537963e-06, "epoch": 9.135204365742288, "percentage": 91.35, "elapsed_time": "6:26:25", "remaining_time": "0:36:34", "throughput": 4292.08, "total_tokens": 99512240} +{"current_steps": 82030, "total_steps": 89790, "loss": 0.4521, "lr": 1.1292942112599707e-06, "epoch": 9.135761220625906, "percentage": 91.36, "elapsed_time": "6:26:26", "remaining_time": "0:36:33", "throughput": 4292.11, "total_tokens": 99518672} +{"current_steps": 82035, "total_steps": 89790, "loss": 0.4637, "lr": 1.1278506287779073e-06, "epoch": 9.136318075509521, "percentage": 91.36, "elapsed_time": "6:26:27", "remaining_time": "0:36:32", "throughput": 4292.13, "total_tokens": 99524848} +{"current_steps": 82040, "total_steps": 89790, "loss": 0.4528, "lr": 1.1264079482621482e-06, "epoch": 9.13687493039314, "percentage": 91.37, "elapsed_time": "6:26:29", "remaining_time": "0:36:30", "throughput": 4292.15, "total_tokens": 99531024} +{"current_steps": 82045, "total_steps": 89790, "loss": 0.465, "lr": 1.1249661697672027e-06, "epoch": 9.137431785276757, "percentage": 91.37, "elapsed_time": "6:26:30", "remaining_time": "0:36:29", "throughput": 4292.18, "total_tokens": 99537296} +{"current_steps": 82050, "total_steps": 89790, "loss": 0.4689, "lr": 1.1235252933475493e-06, "epoch": 9.137988640160374, "percentage": 91.38, "elapsed_time": "6:26:31", "remaining_time": "0:36:27", "throughput": 4292.2, "total_tokens": 99543152} +{"current_steps": 82055, "total_steps": 89790, "loss": 0.4674, "lr": 1.1220853190576224e-06, "epoch": 9.138545495043992, "percentage": 91.39, "elapsed_time": "6:26:32", "remaining_time": "0:36:26", "throughput": 4292.22, "total_tokens": 99549392} +{"current_steps": 82060, "total_steps": 89790, "loss": 0.4559, "lr": 1.1206462469518342e-06, "epoch": 9.139102349927608, "percentage": 91.39, "elapsed_time": "6:26:34", "remaining_time": "0:36:24", "throughput": 4292.25, "total_tokens": 99555408} +{"current_steps": 82065, "total_steps": 89790, "loss": 0.4611, "lr": 1.1192080770845603e-06, "epoch": 9.139659204811226, "percentage": 91.4, "elapsed_time": "6:26:35", "remaining_time": "0:36:23", "throughput": 4292.27, "total_tokens": 99561808} +{"current_steps": 82070, "total_steps": 89790, "loss": 0.4642, "lr": 1.1177708095101296e-06, "epoch": 9.140216059694843, "percentage": 91.4, "elapsed_time": "6:26:36", "remaining_time": "0:36:22", "throughput": 4292.3, "total_tokens": 99568496} +{"current_steps": 82075, "total_steps": 89790, "loss": 0.4569, "lr": 1.1163344442828544e-06, "epoch": 9.140772914578461, "percentage": 91.41, "elapsed_time": "6:26:38", "remaining_time": "0:36:20", "throughput": 4292.32, "total_tokens": 99574448} +{"current_steps": 82080, "total_steps": 89790, "loss": 0.4553, "lr": 1.1148989814570021e-06, "epoch": 9.141329769462079, "percentage": 91.41, "elapsed_time": "6:26:39", "remaining_time": "0:36:19", "throughput": 4292.35, "total_tokens": 99580272} +{"current_steps": 82085, "total_steps": 89790, "loss": 0.4573, "lr": 1.11346442108681e-06, "epoch": 9.141886624345695, "percentage": 91.42, "elapsed_time": "6:26:40", "remaining_time": "0:36:17", "throughput": 4292.37, "total_tokens": 99586576} +{"current_steps": 82090, "total_steps": 89790, "loss": 0.473, "lr": 1.1120307632264792e-06, "epoch": 9.142443479229312, "percentage": 91.42, "elapsed_time": "6:26:42", "remaining_time": "0:36:16", "throughput": 4292.4, "total_tokens": 99592656} +{"current_steps": 82095, "total_steps": 89790, "loss": 0.4663, "lr": 1.1105980079301803e-06, "epoch": 9.14300033411293, "percentage": 91.43, "elapsed_time": "6:26:43", "remaining_time": "0:36:14", "throughput": 4292.42, "total_tokens": 99598704} +{"current_steps": 82100, "total_steps": 89790, "loss": 0.468, "lr": 1.1091661552520449e-06, "epoch": 9.143557188996548, "percentage": 91.44, "elapsed_time": "6:26:44", "remaining_time": "0:36:13", "throughput": 4292.44, "total_tokens": 99604784} +{"current_steps": 82105, "total_steps": 89790, "loss": 0.4538, "lr": 1.1077352052461742e-06, "epoch": 9.144114043880165, "percentage": 91.44, "elapsed_time": "6:26:45", "remaining_time": "0:36:12", "throughput": 4292.46, "total_tokens": 99610672} +{"current_steps": 82110, "total_steps": 89790, "loss": 0.451, "lr": 1.1063051579666362e-06, "epoch": 9.144670898763783, "percentage": 91.45, "elapsed_time": "6:26:47", "remaining_time": "0:36:10", "throughput": 4292.48, "total_tokens": 99616848} +{"current_steps": 82115, "total_steps": 89790, "loss": 0.4636, "lr": 1.1048760134674569e-06, "epoch": 9.145227753647399, "percentage": 91.45, "elapsed_time": "6:26:48", "remaining_time": "0:36:09", "throughput": 4292.51, "total_tokens": 99622608} +{"current_steps": 82120, "total_steps": 89790, "loss": 0.454, "lr": 1.1034477718026404e-06, "epoch": 9.145784608531017, "percentage": 91.46, "elapsed_time": "6:26:49", "remaining_time": "0:36:07", "throughput": 4292.53, "total_tokens": 99628784} +{"current_steps": 82125, "total_steps": 89790, "loss": 0.447, "lr": 1.1020204330261463e-06, "epoch": 9.146341463414634, "percentage": 91.46, "elapsed_time": "6:26:51", "remaining_time": "0:36:06", "throughput": 4292.55, "total_tokens": 99634960} +{"current_steps": 82130, "total_steps": 89790, "loss": 0.4634, "lr": 1.1005939971919038e-06, "epoch": 9.146898318298252, "percentage": 91.47, "elapsed_time": "6:26:52", "remaining_time": "0:36:04", "throughput": 4292.58, "total_tokens": 99641008} +{"current_steps": 82135, "total_steps": 89790, "loss": 0.4563, "lr": 1.099168464353814e-06, "epoch": 9.14745517318187, "percentage": 91.47, "elapsed_time": "6:26:53", "remaining_time": "0:36:03", "throughput": 4292.6, "total_tokens": 99646768} +{"current_steps": 82140, "total_steps": 89790, "loss": 0.4656, "lr": 1.0977438345657287e-06, "epoch": 9.148012028065486, "percentage": 91.48, "elapsed_time": "6:26:54", "remaining_time": "0:36:02", "throughput": 4292.62, "total_tokens": 99652944} +{"current_steps": 82145, "total_steps": 89790, "loss": 0.4607, "lr": 1.0963201078814822e-06, "epoch": 9.148568882949103, "percentage": 91.49, "elapsed_time": "6:26:56", "remaining_time": "0:36:00", "throughput": 4292.65, "total_tokens": 99658864} +{"current_steps": 82150, "total_steps": 89790, "loss": 0.4606, "lr": 1.0948972843548649e-06, "epoch": 9.14912573783272, "percentage": 91.49, "elapsed_time": "6:26:57", "remaining_time": "0:35:59", "throughput": 4292.68, "total_tokens": 99664912} +{"current_steps": 82155, "total_steps": 89790, "loss": 0.464, "lr": 1.093475364039634e-06, "epoch": 9.149682592716339, "percentage": 91.5, "elapsed_time": "6:26:58", "remaining_time": "0:35:57", "throughput": 4292.7, "total_tokens": 99671248} +{"current_steps": 82160, "total_steps": 89790, "loss": 0.4608, "lr": 1.0920543469895184e-06, "epoch": 9.150239447599956, "percentage": 91.5, "elapsed_time": "6:27:00", "remaining_time": "0:35:56", "throughput": 4292.73, "total_tokens": 99677456} +{"current_steps": 82165, "total_steps": 89790, "loss": 0.4643, "lr": 1.0906342332582031e-06, "epoch": 9.150796302483572, "percentage": 91.51, "elapsed_time": "6:27:01", "remaining_time": "0:35:54", "throughput": 4292.75, "total_tokens": 99683472} +{"current_steps": 82170, "total_steps": 89790, "loss": 0.4509, "lr": 1.0892150228993537e-06, "epoch": 9.15135315736719, "percentage": 91.51, "elapsed_time": "6:27:02", "remaining_time": "0:35:53", "throughput": 4292.78, "total_tokens": 99689776} +{"current_steps": 82175, "total_steps": 89790, "loss": 0.4585, "lr": 1.0877967159665826e-06, "epoch": 9.151910012250807, "percentage": 91.52, "elapsed_time": "6:27:03", "remaining_time": "0:35:52", "throughput": 4292.8, "total_tokens": 99695984} +{"current_steps": 82180, "total_steps": 89790, "loss": 0.4603, "lr": 1.086379312513483e-06, "epoch": 9.152466867134425, "percentage": 91.52, "elapsed_time": "6:27:05", "remaining_time": "0:35:50", "throughput": 4292.83, "total_tokens": 99702256} +{"current_steps": 82185, "total_steps": 89790, "loss": 0.4573, "lr": 1.0849628125936068e-06, "epoch": 9.153023722018043, "percentage": 91.53, "elapsed_time": "6:27:06", "remaining_time": "0:35:49", "throughput": 4292.86, "total_tokens": 99708464} +{"current_steps": 82190, "total_steps": 89790, "loss": 0.4683, "lr": 1.0835472162604748e-06, "epoch": 9.153580576901659, "percentage": 91.54, "elapsed_time": "6:27:07", "remaining_time": "0:35:47", "throughput": 4292.88, "total_tokens": 99714672} +{"current_steps": 82195, "total_steps": 89790, "loss": 0.4576, "lr": 1.082132523567575e-06, "epoch": 9.154137431785276, "percentage": 91.54, "elapsed_time": "6:27:09", "remaining_time": "0:35:46", "throughput": 4292.9, "total_tokens": 99720944} +{"current_steps": 82200, "total_steps": 89790, "loss": 0.4531, "lr": 1.0807187345683535e-06, "epoch": 9.154694286668894, "percentage": 91.55, "elapsed_time": "6:27:10", "remaining_time": "0:35:45", "throughput": 4292.93, "total_tokens": 99726800} +{"current_steps": 82205, "total_steps": 89790, "loss": 0.4574, "lr": 1.0793058493162367e-06, "epoch": 9.155251141552512, "percentage": 91.55, "elapsed_time": "6:27:11", "remaining_time": "0:35:43", "throughput": 4292.95, "total_tokens": 99732912} +{"current_steps": 82210, "total_steps": 89790, "loss": 0.4643, "lr": 1.077893867864599e-06, "epoch": 9.15580799643613, "percentage": 91.56, "elapsed_time": "6:27:13", "remaining_time": "0:35:42", "throughput": 4292.98, "total_tokens": 99739152} +{"current_steps": 82215, "total_steps": 89790, "loss": 0.4557, "lr": 1.0764827902667947e-06, "epoch": 9.156364851319745, "percentage": 91.56, "elapsed_time": "6:27:14", "remaining_time": "0:35:40", "throughput": 4293.0, "total_tokens": 99745008} +{"current_steps": 82220, "total_steps": 89790, "loss": 0.4555, "lr": 1.0750726165761339e-06, "epoch": 9.156921706203363, "percentage": 91.57, "elapsed_time": "6:27:15", "remaining_time": "0:35:39", "throughput": 4293.03, "total_tokens": 99751024} +{"current_steps": 82225, "total_steps": 89790, "loss": 0.4422, "lr": 1.0736633468459017e-06, "epoch": 9.15747856108698, "percentage": 91.57, "elapsed_time": "6:27:16", "remaining_time": "0:35:37", "throughput": 4293.05, "total_tokens": 99757104} +{"current_steps": 82230, "total_steps": 89790, "loss": 0.4469, "lr": 1.0722549811293476e-06, "epoch": 9.158035415970598, "percentage": 91.58, "elapsed_time": "6:27:18", "remaining_time": "0:35:36", "throughput": 4293.08, "total_tokens": 99763472} +{"current_steps": 82235, "total_steps": 89790, "loss": 0.4476, "lr": 1.0708475194796757e-06, "epoch": 9.158592270854216, "percentage": 91.59, "elapsed_time": "6:27:19", "remaining_time": "0:35:35", "throughput": 4293.1, "total_tokens": 99769168} +{"current_steps": 82240, "total_steps": 89790, "loss": 0.4578, "lr": 1.0694409619500744e-06, "epoch": 9.159149125737832, "percentage": 91.59, "elapsed_time": "6:27:20", "remaining_time": "0:35:33", "throughput": 4293.13, "total_tokens": 99775536} +{"current_steps": 82245, "total_steps": 89790, "loss": 0.4557, "lr": 1.068035308593679e-06, "epoch": 9.15970598062145, "percentage": 91.6, "elapsed_time": "6:27:22", "remaining_time": "0:35:32", "throughput": 4293.15, "total_tokens": 99781648} +{"current_steps": 82250, "total_steps": 89790, "loss": 0.4638, "lr": 1.066630559463605e-06, "epoch": 9.160262835505067, "percentage": 91.6, "elapsed_time": "6:27:23", "remaining_time": "0:35:30", "throughput": 4293.17, "total_tokens": 99787216} +{"current_steps": 82255, "total_steps": 89790, "loss": 0.4603, "lr": 1.065226714612927e-06, "epoch": 9.160819690388685, "percentage": 91.61, "elapsed_time": "6:27:24", "remaining_time": "0:35:29", "throughput": 4293.19, "total_tokens": 99793584} +{"current_steps": 82260, "total_steps": 89790, "loss": 0.4517, "lr": 1.0638237740946855e-06, "epoch": 9.161376545272303, "percentage": 91.61, "elapsed_time": "6:27:25", "remaining_time": "0:35:27", "throughput": 4293.21, "total_tokens": 99799440} +{"current_steps": 82265, "total_steps": 89790, "loss": 0.4625, "lr": 1.0624217379618912e-06, "epoch": 9.161933400155919, "percentage": 91.62, "elapsed_time": "6:27:27", "remaining_time": "0:35:26", "throughput": 4293.24, "total_tokens": 99805392} +{"current_steps": 82270, "total_steps": 89790, "loss": 0.4574, "lr": 1.0610206062675126e-06, "epoch": 9.162490255039536, "percentage": 91.62, "elapsed_time": "6:27:28", "remaining_time": "0:35:25", "throughput": 4293.26, "total_tokens": 99811920} +{"current_steps": 82275, "total_steps": 89790, "loss": 0.4564, "lr": 1.0596203790644938e-06, "epoch": 9.163047109923154, "percentage": 91.63, "elapsed_time": "6:27:29", "remaining_time": "0:35:23", "throughput": 4293.29, "total_tokens": 99817744} +{"current_steps": 82280, "total_steps": 89790, "loss": 0.4648, "lr": 1.0582210564057337e-06, "epoch": 9.163603964806772, "percentage": 91.64, "elapsed_time": "6:27:30", "remaining_time": "0:35:22", "throughput": 4293.31, "total_tokens": 99823568} +{"current_steps": 82285, "total_steps": 89790, "loss": 0.4557, "lr": 1.0568226383441098e-06, "epoch": 9.16416081969039, "percentage": 91.64, "elapsed_time": "6:27:32", "remaining_time": "0:35:20", "throughput": 4293.34, "total_tokens": 99830064} +{"current_steps": 82290, "total_steps": 89790, "loss": 0.4563, "lr": 1.0554251249324577e-06, "epoch": 9.164717674574007, "percentage": 91.65, "elapsed_time": "6:27:33", "remaining_time": "0:35:19", "throughput": 4293.36, "total_tokens": 99835952} +{"current_steps": 82295, "total_steps": 89790, "loss": 0.4766, "lr": 1.0540285162235763e-06, "epoch": 9.165274529457623, "percentage": 91.65, "elapsed_time": "6:27:34", "remaining_time": "0:35:17", "throughput": 4293.39, "total_tokens": 99842224} +{"current_steps": 82300, "total_steps": 89790, "loss": 0.4586, "lr": 1.0526328122702407e-06, "epoch": 9.16583138434124, "percentage": 91.66, "elapsed_time": "6:27:36", "remaining_time": "0:35:16", "throughput": 4293.41, "total_tokens": 99848112} +{"current_steps": 82305, "total_steps": 89790, "loss": 0.4612, "lr": 1.0512380131251749e-06, "epoch": 9.166388239224858, "percentage": 91.66, "elapsed_time": "6:27:37", "remaining_time": "0:35:15", "throughput": 4293.43, "total_tokens": 99854320} +{"current_steps": 82310, "total_steps": 89790, "loss": 0.4664, "lr": 1.0498441188410896e-06, "epoch": 9.166945094108476, "percentage": 91.67, "elapsed_time": "6:27:38", "remaining_time": "0:35:13", "throughput": 4293.45, "total_tokens": 99860304} +{"current_steps": 82315, "total_steps": 89790, "loss": 0.4659, "lr": 1.048451129470643e-06, "epoch": 9.167501948992093, "percentage": 91.68, "elapsed_time": "6:27:40", "remaining_time": "0:35:12", "throughput": 4293.48, "total_tokens": 99866288} +{"current_steps": 82320, "total_steps": 89790, "loss": 0.4515, "lr": 1.0470590450664674e-06, "epoch": 9.16805880387571, "percentage": 91.68, "elapsed_time": "6:27:41", "remaining_time": "0:35:10", "throughput": 4293.5, "total_tokens": 99872048} +{"current_steps": 82325, "total_steps": 89790, "loss": 0.4714, "lr": 1.045667865681166e-06, "epoch": 9.168615658759327, "percentage": 91.69, "elapsed_time": "6:27:42", "remaining_time": "0:35:09", "throughput": 4293.53, "total_tokens": 99878192} +{"current_steps": 82330, "total_steps": 89790, "loss": 0.4581, "lr": 1.044277591367293e-06, "epoch": 9.169172513642945, "percentage": 91.69, "elapsed_time": "6:27:43", "remaining_time": "0:35:07", "throughput": 4293.55, "total_tokens": 99884112} +{"current_steps": 82335, "total_steps": 89790, "loss": 0.4649, "lr": 1.0428882221773878e-06, "epoch": 9.169729368526562, "percentage": 91.7, "elapsed_time": "6:27:45", "remaining_time": "0:35:06", "throughput": 4293.57, "total_tokens": 99890224} +{"current_steps": 82340, "total_steps": 89790, "loss": 0.4547, "lr": 1.0414997581639357e-06, "epoch": 9.17028622341018, "percentage": 91.7, "elapsed_time": "6:27:46", "remaining_time": "0:35:05", "throughput": 4293.6, "total_tokens": 99896368} +{"current_steps": 82345, "total_steps": 89790, "loss": 0.4592, "lr": 1.0401121993794033e-06, "epoch": 9.170843078293796, "percentage": 91.71, "elapsed_time": "6:27:47", "remaining_time": "0:35:03", "throughput": 4293.62, "total_tokens": 99902448} +{"current_steps": 82350, "total_steps": 89790, "loss": 0.4614, "lr": 1.0387255458762153e-06, "epoch": 9.171399933177414, "percentage": 91.71, "elapsed_time": "6:27:48", "remaining_time": "0:35:02", "throughput": 4293.64, "total_tokens": 99908496} +{"current_steps": 82355, "total_steps": 89790, "loss": 0.4695, "lr": 1.0373397977067656e-06, "epoch": 9.171956788061031, "percentage": 91.72, "elapsed_time": "6:27:50", "remaining_time": "0:35:00", "throughput": 4293.67, "total_tokens": 99914576} +{"current_steps": 82360, "total_steps": 89790, "loss": 0.4501, "lr": 1.0359549549234099e-06, "epoch": 9.172513642944649, "percentage": 91.73, "elapsed_time": "6:27:51", "remaining_time": "0:34:59", "throughput": 4293.69, "total_tokens": 99920560} +{"current_steps": 82365, "total_steps": 89790, "loss": 0.4573, "lr": 1.0345710175784702e-06, "epoch": 9.173070497828267, "percentage": 91.73, "elapsed_time": "6:27:52", "remaining_time": "0:34:57", "throughput": 4293.71, "total_tokens": 99926576} +{"current_steps": 82370, "total_steps": 89790, "loss": 0.4517, "lr": 1.0331879857242405e-06, "epoch": 9.173627352711883, "percentage": 91.74, "elapsed_time": "6:27:54", "remaining_time": "0:34:56", "throughput": 4293.73, "total_tokens": 99932208} +{"current_steps": 82375, "total_steps": 89790, "loss": 0.4659, "lr": 1.0318058594129737e-06, "epoch": 9.1741842075955, "percentage": 91.74, "elapsed_time": "6:27:55", "remaining_time": "0:34:55", "throughput": 4293.75, "total_tokens": 99938000} +{"current_steps": 82380, "total_steps": 89790, "loss": 0.463, "lr": 1.030424638696889e-06, "epoch": 9.174741062479118, "percentage": 91.75, "elapsed_time": "6:27:56", "remaining_time": "0:34:53", "throughput": 4293.77, "total_tokens": 99944176} +{"current_steps": 82385, "total_steps": 89790, "loss": 0.4491, "lr": 1.029044323628181e-06, "epoch": 9.175297917362736, "percentage": 91.75, "elapsed_time": "6:27:57", "remaining_time": "0:34:52", "throughput": 4293.79, "total_tokens": 99949744} +{"current_steps": 82390, "total_steps": 89790, "loss": 0.4664, "lr": 1.0276649142589912e-06, "epoch": 9.175854772246353, "percentage": 91.76, "elapsed_time": "6:27:59", "remaining_time": "0:34:50", "throughput": 4293.81, "total_tokens": 99955792} +{"current_steps": 82395, "total_steps": 89790, "loss": 0.4528, "lr": 1.0262864106414444e-06, "epoch": 9.17641162712997, "percentage": 91.76, "elapsed_time": "6:28:00", "remaining_time": "0:34:49", "throughput": 4293.84, "total_tokens": 99962032} +{"current_steps": 82400, "total_steps": 89790, "loss": 0.475, "lr": 1.0249088128276297e-06, "epoch": 9.176968482013587, "percentage": 91.77, "elapsed_time": "6:28:01", "remaining_time": "0:34:47", "throughput": 4293.86, "total_tokens": 99968016} +{"current_steps": 82405, "total_steps": 89790, "loss": 0.4692, "lr": 1.0235321208695887e-06, "epoch": 9.177525336897205, "percentage": 91.78, "elapsed_time": "6:28:02", "remaining_time": "0:34:46", "throughput": 4293.89, "total_tokens": 99974000} +{"current_steps": 82410, "total_steps": 89790, "loss": 0.4667, "lr": 1.0221563348193408e-06, "epoch": 9.178082191780822, "percentage": 91.78, "elapsed_time": "6:28:04", "remaining_time": "0:34:45", "throughput": 4293.91, "total_tokens": 99979856} +{"current_steps": 82415, "total_steps": 89790, "loss": 0.4532, "lr": 1.0207814547288669e-06, "epoch": 9.17863904666444, "percentage": 91.79, "elapsed_time": "6:28:05", "remaining_time": "0:34:43", "throughput": 4293.93, "total_tokens": 99985840} +{"current_steps": 82420, "total_steps": 89790, "loss": 0.4679, "lr": 1.019407480650117e-06, "epoch": 9.179195901548056, "percentage": 91.79, "elapsed_time": "6:28:06", "remaining_time": "0:34:42", "throughput": 4293.95, "total_tokens": 99991792} +{"current_steps": 82425, "total_steps": 89790, "loss": 0.4564, "lr": 1.0180344126349994e-06, "epoch": 9.179752756431673, "percentage": 91.8, "elapsed_time": "6:28:07", "remaining_time": "0:34:40", "throughput": 4293.97, "total_tokens": 99997584} +{"current_steps": 82430, "total_steps": 89790, "loss": 0.4509, "lr": 1.016662250735395e-06, "epoch": 9.180309611315291, "percentage": 91.8, "elapsed_time": "6:28:09", "remaining_time": "0:34:39", "throughput": 4293.99, "total_tokens": 100003824} +{"current_steps": 82435, "total_steps": 89790, "loss": 0.4621, "lr": 1.0152909950031515e-06, "epoch": 9.180866466198909, "percentage": 91.81, "elapsed_time": "6:28:10", "remaining_time": "0:34:38", "throughput": 4294.01, "total_tokens": 100009936} +{"current_steps": 82440, "total_steps": 89790, "loss": 0.4597, "lr": 1.0139206454900767e-06, "epoch": 9.181423321082526, "percentage": 91.81, "elapsed_time": "6:28:11", "remaining_time": "0:34:36", "throughput": 4294.04, "total_tokens": 100015888} +{"current_steps": 82445, "total_steps": 89790, "loss": 0.46, "lr": 1.0125512022479467e-06, "epoch": 9.181980175966142, "percentage": 91.82, "elapsed_time": "6:28:13", "remaining_time": "0:34:35", "throughput": 4294.06, "total_tokens": 100022352} +{"current_steps": 82450, "total_steps": 89790, "loss": 0.4556, "lr": 1.0111826653285027e-06, "epoch": 9.18253703084976, "percentage": 91.83, "elapsed_time": "6:28:14", "remaining_time": "0:34:33", "throughput": 4294.08, "total_tokens": 100028464} +{"current_steps": 82455, "total_steps": 89790, "loss": 0.4608, "lr": 1.0098150347834567e-06, "epoch": 9.183093885733378, "percentage": 91.83, "elapsed_time": "6:28:15", "remaining_time": "0:34:32", "throughput": 4294.11, "total_tokens": 100034512} +{"current_steps": 82460, "total_steps": 89790, "loss": 0.4609, "lr": 1.0084483106644754e-06, "epoch": 9.183650740616995, "percentage": 91.84, "elapsed_time": "6:28:17", "remaining_time": "0:34:30", "throughput": 4294.13, "total_tokens": 100040400} +{"current_steps": 82465, "total_steps": 89790, "loss": 0.4583, "lr": 1.0070824930232036e-06, "epoch": 9.184207595500613, "percentage": 91.84, "elapsed_time": "6:28:18", "remaining_time": "0:34:29", "throughput": 4294.15, "total_tokens": 100046288} +{"current_steps": 82470, "total_steps": 89790, "loss": 0.4574, "lr": 1.0057175819112447e-06, "epoch": 9.18476445038423, "percentage": 91.85, "elapsed_time": "6:28:19", "remaining_time": "0:34:28", "throughput": 4294.16, "total_tokens": 100051568} +{"current_steps": 82475, "total_steps": 89790, "loss": 0.4602, "lr": 1.0043535773801655e-06, "epoch": 9.185321305267847, "percentage": 91.85, "elapsed_time": "6:28:20", "remaining_time": "0:34:26", "throughput": 4294.18, "total_tokens": 100057520} +{"current_steps": 82480, "total_steps": 89790, "loss": 0.4607, "lr": 1.002990479481511e-06, "epoch": 9.185878160151464, "percentage": 91.86, "elapsed_time": "6:28:21", "remaining_time": "0:34:25", "throughput": 4294.21, "total_tokens": 100063568} +{"current_steps": 82485, "total_steps": 89790, "loss": 0.4608, "lr": 1.001628288266776e-06, "epoch": 9.186435015035082, "percentage": 91.86, "elapsed_time": "6:28:23", "remaining_time": "0:34:23", "throughput": 4294.23, "total_tokens": 100069392} +{"current_steps": 82490, "total_steps": 89790, "loss": 0.4565, "lr": 1.0002670037874307e-06, "epoch": 9.1869918699187, "percentage": 91.87, "elapsed_time": "6:28:24", "remaining_time": "0:34:22", "throughput": 4294.25, "total_tokens": 100075280} +{"current_steps": 82495, "total_steps": 89790, "loss": 0.4554, "lr": 9.989066260949088e-07, "epoch": 9.187548724802317, "percentage": 91.88, "elapsed_time": "6:28:25", "remaining_time": "0:34:20", "throughput": 4294.28, "total_tokens": 100081904} +{"current_steps": 82500, "total_steps": 89790, "loss": 0.4669, "lr": 9.97547155240608e-07, "epoch": 9.188105579685933, "percentage": 91.88, "elapsed_time": "6:28:27", "remaining_time": "0:34:19", "throughput": 4294.3, "total_tokens": 100087984} +{"current_steps": 82505, "total_steps": 89790, "loss": 0.4693, "lr": 9.961885912759012e-07, "epoch": 9.188662434569551, "percentage": 91.89, "elapsed_time": "6:28:28", "remaining_time": "0:34:18", "throughput": 4294.32, "total_tokens": 100093776} +{"current_steps": 82510, "total_steps": 89790, "loss": 0.4693, "lr": 9.948309342521083e-07, "epoch": 9.189219289453169, "percentage": 91.89, "elapsed_time": "6:28:29", "remaining_time": "0:34:16", "throughput": 4294.35, "total_tokens": 100099760} +{"current_steps": 82515, "total_steps": 89790, "loss": 0.4641, "lr": 9.934741842205331e-07, "epoch": 9.189776144336786, "percentage": 91.9, "elapsed_time": "6:28:30", "remaining_time": "0:34:15", "throughput": 4294.37, "total_tokens": 100105712} +{"current_steps": 82520, "total_steps": 89790, "loss": 0.4599, "lr": 9.921183412324342e-07, "epoch": 9.190332999220404, "percentage": 91.9, "elapsed_time": "6:28:32", "remaining_time": "0:34:13", "throughput": 4294.39, "total_tokens": 100111792} +{"current_steps": 82525, "total_steps": 89790, "loss": 0.4536, "lr": 9.907634053390402e-07, "epoch": 9.19088985410402, "percentage": 91.91, "elapsed_time": "6:28:33", "remaining_time": "0:34:12", "throughput": 4294.42, "total_tokens": 100118096} +{"current_steps": 82530, "total_steps": 89790, "loss": 0.4622, "lr": 9.89409376591549e-07, "epoch": 9.191446708987637, "percentage": 91.91, "elapsed_time": "6:28:34", "remaining_time": "0:34:10", "throughput": 4294.44, "total_tokens": 100124144} +{"current_steps": 82535, "total_steps": 89790, "loss": 0.4623, "lr": 9.88056255041117e-07, "epoch": 9.192003563871255, "percentage": 91.92, "elapsed_time": "6:28:36", "remaining_time": "0:34:09", "throughput": 4294.46, "total_tokens": 100129968} +{"current_steps": 82540, "total_steps": 89790, "loss": 0.4554, "lr": 9.8670404073887e-07, "epoch": 9.192560418754873, "percentage": 91.93, "elapsed_time": "6:28:37", "remaining_time": "0:34:08", "throughput": 4294.49, "total_tokens": 100136528} +{"current_steps": 82545, "total_steps": 89790, "loss": 0.4613, "lr": 9.853527337358974e-07, "epoch": 9.19311727363849, "percentage": 91.93, "elapsed_time": "6:28:38", "remaining_time": "0:34:06", "throughput": 4294.51, "total_tokens": 100142640} +{"current_steps": 82550, "total_steps": 89790, "loss": 0.4447, "lr": 9.84002334083259e-07, "epoch": 9.193674128522106, "percentage": 91.94, "elapsed_time": "6:28:40", "remaining_time": "0:34:05", "throughput": 4294.54, "total_tokens": 100148848} +{"current_steps": 82555, "total_steps": 89790, "loss": 0.4594, "lr": 9.826528418319742e-07, "epoch": 9.194230983405724, "percentage": 91.94, "elapsed_time": "6:28:41", "remaining_time": "0:34:03", "throughput": 4294.56, "total_tokens": 100154928} +{"current_steps": 82560, "total_steps": 89790, "loss": 0.4722, "lr": 9.813042570330306e-07, "epoch": 9.194787838289342, "percentage": 91.95, "elapsed_time": "6:28:42", "remaining_time": "0:34:02", "throughput": 4294.57, "total_tokens": 100160752} +{"current_steps": 82565, "total_steps": 89790, "loss": 0.4622, "lr": 9.799565797373872e-07, "epoch": 9.19534469317296, "percentage": 91.95, "elapsed_time": "6:28:43", "remaining_time": "0:34:01", "throughput": 4294.6, "total_tokens": 100166928} +{"current_steps": 82570, "total_steps": 89790, "loss": 0.4813, "lr": 9.78609809995959e-07, "epoch": 9.195901548056577, "percentage": 91.96, "elapsed_time": "6:28:45", "remaining_time": "0:33:59", "throughput": 4294.62, "total_tokens": 100173296} +{"current_steps": 82575, "total_steps": 89790, "loss": 0.4516, "lr": 9.77263947859633e-07, "epoch": 9.196458402940193, "percentage": 91.96, "elapsed_time": "6:28:46", "remaining_time": "0:33:58", "throughput": 4294.65, "total_tokens": 100179344} +{"current_steps": 82580, "total_steps": 89790, "loss": 0.4704, "lr": 9.759189933792573e-07, "epoch": 9.19701525782381, "percentage": 91.97, "elapsed_time": "6:28:47", "remaining_time": "0:33:56", "throughput": 4294.67, "total_tokens": 100185360} +{"current_steps": 82585, "total_steps": 89790, "loss": 0.465, "lr": 9.745749466056554e-07, "epoch": 9.197572112707428, "percentage": 91.98, "elapsed_time": "6:28:48", "remaining_time": "0:33:55", "throughput": 4294.69, "total_tokens": 100190672} +{"current_steps": 82590, "total_steps": 89790, "loss": 0.4596, "lr": 9.732318075896003e-07, "epoch": 9.198128967591046, "percentage": 91.98, "elapsed_time": "6:28:50", "remaining_time": "0:33:53", "throughput": 4294.7, "total_tokens": 100195760} +{"current_steps": 82595, "total_steps": 89790, "loss": 0.469, "lr": 9.718895763818459e-07, "epoch": 9.198685822474664, "percentage": 91.99, "elapsed_time": "6:28:51", "remaining_time": "0:33:52", "throughput": 4294.73, "total_tokens": 100202032} +{"current_steps": 82600, "total_steps": 89790, "loss": 0.4644, "lr": 9.7054825303311e-07, "epoch": 9.19924267735828, "percentage": 91.99, "elapsed_time": "6:28:52", "remaining_time": "0:33:51", "throughput": 4294.75, "total_tokens": 100208144} +{"current_steps": 82605, "total_steps": 89790, "loss": 0.482, "lr": 9.692078375940605e-07, "epoch": 9.199799532241897, "percentage": 92.0, "elapsed_time": "6:28:53", "remaining_time": "0:33:49", "throughput": 4294.78, "total_tokens": 100214288} +{"current_steps": 82610, "total_steps": 89790, "loss": 0.4656, "lr": 9.678683301153568e-07, "epoch": 9.200356387125515, "percentage": 92.0, "elapsed_time": "6:28:55", "remaining_time": "0:33:48", "throughput": 4294.81, "total_tokens": 100220720} +{"current_steps": 82615, "total_steps": 89790, "loss": 0.4571, "lr": 9.665297306475946e-07, "epoch": 9.200913242009133, "percentage": 92.01, "elapsed_time": "6:28:56", "remaining_time": "0:33:46", "throughput": 4294.83, "total_tokens": 100226960} +{"current_steps": 82620, "total_steps": 89790, "loss": 0.459, "lr": 9.65192039241361e-07, "epoch": 9.20147009689275, "percentage": 92.01, "elapsed_time": "6:28:57", "remaining_time": "0:33:45", "throughput": 4294.85, "total_tokens": 100233136} +{"current_steps": 82625, "total_steps": 89790, "loss": 0.4579, "lr": 9.638552559471992e-07, "epoch": 9.202026951776368, "percentage": 92.02, "elapsed_time": "6:28:59", "remaining_time": "0:33:43", "throughput": 4294.88, "total_tokens": 100239600} +{"current_steps": 82630, "total_steps": 89790, "loss": 0.4648, "lr": 9.625193808156075e-07, "epoch": 9.202583806659984, "percentage": 92.03, "elapsed_time": "6:29:00", "remaining_time": "0:33:42", "throughput": 4294.91, "total_tokens": 100245904} +{"current_steps": 82635, "total_steps": 89790, "loss": 0.4641, "lr": 9.611844138970705e-07, "epoch": 9.203140661543602, "percentage": 92.03, "elapsed_time": "6:29:01", "remaining_time": "0:33:41", "throughput": 4294.93, "total_tokens": 100252144} +{"current_steps": 82640, "total_steps": 89790, "loss": 0.4695, "lr": 9.5985035524202e-07, "epoch": 9.20369751642722, "percentage": 92.04, "elapsed_time": "6:29:03", "remaining_time": "0:33:39", "throughput": 4294.96, "total_tokens": 100258608} +{"current_steps": 82645, "total_steps": 89790, "loss": 0.4712, "lr": 9.58517204900866e-07, "epoch": 9.204254371310837, "percentage": 92.04, "elapsed_time": "6:29:04", "remaining_time": "0:33:38", "throughput": 4294.98, "total_tokens": 100264624} +{"current_steps": 82650, "total_steps": 89790, "loss": 0.4689, "lr": 9.571849629239738e-07, "epoch": 9.204811226194455, "percentage": 92.05, "elapsed_time": "6:29:05", "remaining_time": "0:33:36", "throughput": 4295.01, "total_tokens": 100270672} +{"current_steps": 82655, "total_steps": 89790, "loss": 0.4576, "lr": 9.558536293616831e-07, "epoch": 9.20536808107807, "percentage": 92.05, "elapsed_time": "6:29:07", "remaining_time": "0:33:35", "throughput": 4295.02, "total_tokens": 100276560} +{"current_steps": 82660, "total_steps": 89790, "loss": 0.4578, "lr": 9.54523204264296e-07, "epoch": 9.205924935961688, "percentage": 92.06, "elapsed_time": "6:29:08", "remaining_time": "0:33:33", "throughput": 4295.05, "total_tokens": 100282864} +{"current_steps": 82665, "total_steps": 89790, "loss": 0.4612, "lr": 9.531936876820802e-07, "epoch": 9.206481790845306, "percentage": 92.06, "elapsed_time": "6:29:09", "remaining_time": "0:33:32", "throughput": 4295.08, "total_tokens": 100289200} +{"current_steps": 82670, "total_steps": 89790, "loss": 0.4484, "lr": 9.518650796652706e-07, "epoch": 9.207038645728923, "percentage": 92.07, "elapsed_time": "6:29:11", "remaining_time": "0:33:31", "throughput": 4295.11, "total_tokens": 100295568} +{"current_steps": 82675, "total_steps": 89790, "loss": 0.4526, "lr": 9.505373802640605e-07, "epoch": 9.207595500612541, "percentage": 92.08, "elapsed_time": "6:29:12", "remaining_time": "0:33:29", "throughput": 4295.13, "total_tokens": 100302032} +{"current_steps": 82680, "total_steps": 89790, "loss": 0.4663, "lr": 9.492105895286207e-07, "epoch": 9.208152355496157, "percentage": 92.08, "elapsed_time": "6:29:13", "remaining_time": "0:33:28", "throughput": 4295.16, "total_tokens": 100308208} +{"current_steps": 82685, "total_steps": 89790, "loss": 0.4546, "lr": 9.47884707509078e-07, "epoch": 9.208709210379775, "percentage": 92.09, "elapsed_time": "6:29:15", "remaining_time": "0:33:26", "throughput": 4295.18, "total_tokens": 100314096} +{"current_steps": 82690, "total_steps": 89790, "loss": 0.4558, "lr": 9.465597342555283e-07, "epoch": 9.209266065263392, "percentage": 92.09, "elapsed_time": "6:29:16", "remaining_time": "0:33:25", "throughput": 4295.2, "total_tokens": 100320368} +{"current_steps": 82695, "total_steps": 89790, "loss": 0.4537, "lr": 9.452356698180398e-07, "epoch": 9.20982292014701, "percentage": 92.1, "elapsed_time": "6:29:17", "remaining_time": "0:33:24", "throughput": 4295.22, "total_tokens": 100326352} +{"current_steps": 82700, "total_steps": 89790, "loss": 0.4582, "lr": 9.43912514246631e-07, "epoch": 9.210379775030628, "percentage": 92.1, "elapsed_time": "6:29:18", "remaining_time": "0:33:22", "throughput": 4295.25, "total_tokens": 100332432} +{"current_steps": 82705, "total_steps": 89790, "loss": 0.4567, "lr": 9.425902675913006e-07, "epoch": 9.210936629914244, "percentage": 92.11, "elapsed_time": "6:29:20", "remaining_time": "0:33:21", "throughput": 4295.27, "total_tokens": 100338704} +{"current_steps": 82710, "total_steps": 89790, "loss": 0.4578, "lr": 9.412689299020033e-07, "epoch": 9.211493484797861, "percentage": 92.11, "elapsed_time": "6:29:21", "remaining_time": "0:33:19", "throughput": 4295.29, "total_tokens": 100344656} +{"current_steps": 82715, "total_steps": 89790, "loss": 0.455, "lr": 9.399485012286713e-07, "epoch": 9.212050339681479, "percentage": 92.12, "elapsed_time": "6:29:22", "remaining_time": "0:33:18", "throughput": 4295.32, "total_tokens": 100350864} +{"current_steps": 82720, "total_steps": 89790, "loss": 0.4677, "lr": 9.386289816211841e-07, "epoch": 9.212607194565097, "percentage": 92.13, "elapsed_time": "6:29:24", "remaining_time": "0:33:16", "throughput": 4295.34, "total_tokens": 100356784} +{"current_steps": 82725, "total_steps": 89790, "loss": 0.4632, "lr": 9.373103711294018e-07, "epoch": 9.213164049448714, "percentage": 92.13, "elapsed_time": "6:29:25", "remaining_time": "0:33:15", "throughput": 4295.36, "total_tokens": 100362928} +{"current_steps": 82730, "total_steps": 89790, "loss": 0.4509, "lr": 9.359926698031512e-07, "epoch": 9.21372090433233, "percentage": 92.14, "elapsed_time": "6:29:26", "remaining_time": "0:33:14", "throughput": 4295.38, "total_tokens": 100368912} +{"current_steps": 82735, "total_steps": 89790, "loss": 0.4617, "lr": 9.346758776922093e-07, "epoch": 9.214277759215948, "percentage": 92.14, "elapsed_time": "6:29:28", "remaining_time": "0:33:12", "throughput": 4295.41, "total_tokens": 100375056} +{"current_steps": 82740, "total_steps": 89790, "loss": 0.4605, "lr": 9.33359994846339e-07, "epoch": 9.214834614099566, "percentage": 92.15, "elapsed_time": "6:29:29", "remaining_time": "0:33:11", "throughput": 4295.43, "total_tokens": 100381200} +{"current_steps": 82745, "total_steps": 89790, "loss": 0.4748, "lr": 9.320450213152476e-07, "epoch": 9.215391468983183, "percentage": 92.15, "elapsed_time": "6:29:30", "remaining_time": "0:33:09", "throughput": 4295.45, "total_tokens": 100387376} +{"current_steps": 82750, "total_steps": 89790, "loss": 0.4628, "lr": 9.307309571486289e-07, "epoch": 9.215948323866801, "percentage": 92.16, "elapsed_time": "6:29:31", "remaining_time": "0:33:08", "throughput": 4295.47, "total_tokens": 100392912} +{"current_steps": 82755, "total_steps": 89790, "loss": 0.4699, "lr": 9.294178023961292e-07, "epoch": 9.216505178750417, "percentage": 92.17, "elapsed_time": "6:29:33", "remaining_time": "0:33:06", "throughput": 4295.49, "total_tokens": 100398864} +{"current_steps": 82760, "total_steps": 89790, "loss": 0.4483, "lr": 9.281055571073588e-07, "epoch": 9.217062033634035, "percentage": 92.17, "elapsed_time": "6:29:34", "remaining_time": "0:33:05", "throughput": 4295.51, "total_tokens": 100404464} +{"current_steps": 82765, "total_steps": 89790, "loss": 0.468, "lr": 9.267942213319087e-07, "epoch": 9.217618888517652, "percentage": 92.18, "elapsed_time": "6:29:35", "remaining_time": "0:33:04", "throughput": 4295.54, "total_tokens": 100410960} +{"current_steps": 82770, "total_steps": 89790, "loss": 0.4637, "lr": 9.254837951193141e-07, "epoch": 9.21817574340127, "percentage": 92.18, "elapsed_time": "6:29:36", "remaining_time": "0:33:02", "throughput": 4295.56, "total_tokens": 100416944} +{"current_steps": 82775, "total_steps": 89790, "loss": 0.456, "lr": 9.241742785190938e-07, "epoch": 9.218732598284888, "percentage": 92.19, "elapsed_time": "6:29:38", "remaining_time": "0:33:01", "throughput": 4295.58, "total_tokens": 100423312} +{"current_steps": 82780, "total_steps": 89790, "loss": 0.4537, "lr": 9.228656715807249e-07, "epoch": 9.219289453168503, "percentage": 92.19, "elapsed_time": "6:29:39", "remaining_time": "0:32:59", "throughput": 4295.6, "total_tokens": 100429136} +{"current_steps": 82785, "total_steps": 89790, "loss": 0.4579, "lr": 9.215579743536484e-07, "epoch": 9.219846308052121, "percentage": 92.2, "elapsed_time": "6:29:40", "remaining_time": "0:32:58", "throughput": 4295.63, "total_tokens": 100435344} +{"current_steps": 82790, "total_steps": 89790, "loss": 0.4524, "lr": 9.202511868872777e-07, "epoch": 9.220403162935739, "percentage": 92.2, "elapsed_time": "6:29:42", "remaining_time": "0:32:56", "throughput": 4295.64, "total_tokens": 100441040} +{"current_steps": 82795, "total_steps": 89790, "loss": 0.4628, "lr": 9.189453092309785e-07, "epoch": 9.220960017819356, "percentage": 92.21, "elapsed_time": "6:29:43", "remaining_time": "0:32:55", "throughput": 4295.67, "total_tokens": 100447184} +{"current_steps": 82800, "total_steps": 89790, "loss": 0.4595, "lr": 9.176403414341006e-07, "epoch": 9.221516872702974, "percentage": 92.22, "elapsed_time": "6:29:44", "remaining_time": "0:32:54", "throughput": 4295.69, "total_tokens": 100453488} +{"current_steps": 82805, "total_steps": 89790, "loss": 0.4722, "lr": 9.163362835459488e-07, "epoch": 9.22207372758659, "percentage": 92.22, "elapsed_time": "6:29:45", "remaining_time": "0:32:52", "throughput": 4295.71, "total_tokens": 100459376} +{"current_steps": 82810, "total_steps": 89790, "loss": 0.4727, "lr": 9.150331356157865e-07, "epoch": 9.222630582470208, "percentage": 92.23, "elapsed_time": "6:29:47", "remaining_time": "0:32:51", "throughput": 4295.74, "total_tokens": 100465360} +{"current_steps": 82815, "total_steps": 89790, "loss": 0.4638, "lr": 9.137308976928632e-07, "epoch": 9.223187437353825, "percentage": 92.23, "elapsed_time": "6:29:48", "remaining_time": "0:32:49", "throughput": 4295.76, "total_tokens": 100471440} +{"current_steps": 82820, "total_steps": 89790, "loss": 0.4634, "lr": 9.124295698263702e-07, "epoch": 9.223744292237443, "percentage": 92.24, "elapsed_time": "6:29:49", "remaining_time": "0:32:48", "throughput": 4295.78, "total_tokens": 100477104} +{"current_steps": 82825, "total_steps": 89790, "loss": 0.4675, "lr": 9.111291520654819e-07, "epoch": 9.22430114712106, "percentage": 92.24, "elapsed_time": "6:29:51", "remaining_time": "0:32:47", "throughput": 4295.81, "total_tokens": 100483408} +{"current_steps": 82830, "total_steps": 89790, "loss": 0.4546, "lr": 9.098296444593285e-07, "epoch": 9.224858002004678, "percentage": 92.25, "elapsed_time": "6:29:52", "remaining_time": "0:32:45", "throughput": 4295.83, "total_tokens": 100489520} +{"current_steps": 82835, "total_steps": 89790, "loss": 0.4477, "lr": 9.085310470570124e-07, "epoch": 9.225414856888294, "percentage": 92.25, "elapsed_time": "6:29:53", "remaining_time": "0:32:44", "throughput": 4295.85, "total_tokens": 100495216} +{"current_steps": 82840, "total_steps": 89790, "loss": 0.4686, "lr": 9.072333599076028e-07, "epoch": 9.225971711771912, "percentage": 92.26, "elapsed_time": "6:29:54", "remaining_time": "0:32:42", "throughput": 4295.87, "total_tokens": 100501104} +{"current_steps": 82845, "total_steps": 89790, "loss": 0.4552, "lr": 9.059365830601213e-07, "epoch": 9.22652856665553, "percentage": 92.27, "elapsed_time": "6:29:56", "remaining_time": "0:32:41", "throughput": 4295.9, "total_tokens": 100507280} +{"current_steps": 82850, "total_steps": 89790, "loss": 0.4674, "lr": 9.046407165635706e-07, "epoch": 9.227085421539147, "percentage": 92.27, "elapsed_time": "6:29:57", "remaining_time": "0:32:39", "throughput": 4295.92, "total_tokens": 100513200} +{"current_steps": 82855, "total_steps": 89790, "loss": 0.4732, "lr": 9.033457604669115e-07, "epoch": 9.227642276422765, "percentage": 92.28, "elapsed_time": "6:29:58", "remaining_time": "0:32:38", "throughput": 4295.94, "total_tokens": 100519056} +{"current_steps": 82860, "total_steps": 89790, "loss": 0.457, "lr": 9.020517148190716e-07, "epoch": 9.228199131306381, "percentage": 92.28, "elapsed_time": "6:29:59", "remaining_time": "0:32:37", "throughput": 4295.96, "total_tokens": 100525008} +{"current_steps": 82865, "total_steps": 89790, "loss": 0.4606, "lr": 9.007585796689394e-07, "epoch": 9.228755986189999, "percentage": 92.29, "elapsed_time": "6:30:01", "remaining_time": "0:32:35", "throughput": 4295.99, "total_tokens": 100531216} +{"current_steps": 82870, "total_steps": 89790, "loss": 0.4684, "lr": 8.994663550653815e-07, "epoch": 9.229312841073616, "percentage": 92.29, "elapsed_time": "6:30:02", "remaining_time": "0:32:34", "throughput": 4296.01, "total_tokens": 100537136} +{"current_steps": 82875, "total_steps": 89790, "loss": 0.4678, "lr": 8.981750410572199e-07, "epoch": 9.229869695957234, "percentage": 92.3, "elapsed_time": "6:30:03", "remaining_time": "0:32:32", "throughput": 4296.03, "total_tokens": 100542768} +{"current_steps": 82880, "total_steps": 89790, "loss": 0.4613, "lr": 8.968846376932377e-07, "epoch": 9.230426550840852, "percentage": 92.3, "elapsed_time": "6:30:04", "remaining_time": "0:32:31", "throughput": 4296.06, "total_tokens": 100549104} +{"current_steps": 82885, "total_steps": 89790, "loss": 0.4666, "lr": 8.955951450222017e-07, "epoch": 9.230983405724468, "percentage": 92.31, "elapsed_time": "6:30:06", "remaining_time": "0:32:29", "throughput": 4296.07, "total_tokens": 100554480} +{"current_steps": 82890, "total_steps": 89790, "loss": 0.4614, "lr": 8.943065630928254e-07, "epoch": 9.231540260608085, "percentage": 92.32, "elapsed_time": "6:30:07", "remaining_time": "0:32:28", "throughput": 4296.09, "total_tokens": 100560496} +{"current_steps": 82895, "total_steps": 89790, "loss": 0.4576, "lr": 8.930188919537952e-07, "epoch": 9.232097115491703, "percentage": 92.32, "elapsed_time": "6:30:08", "remaining_time": "0:32:27", "throughput": 4296.12, "total_tokens": 100566736} +{"current_steps": 82900, "total_steps": 89790, "loss": 0.4455, "lr": 8.917321316537719e-07, "epoch": 9.23265397037532, "percentage": 92.33, "elapsed_time": "6:30:10", "remaining_time": "0:32:25", "throughput": 4296.14, "total_tokens": 100572976} +{"current_steps": 82905, "total_steps": 89790, "loss": 0.4543, "lr": 8.904462822413611e-07, "epoch": 9.233210825258938, "percentage": 92.33, "elapsed_time": "6:30:11", "remaining_time": "0:32:24", "throughput": 4296.17, "total_tokens": 100579024} +{"current_steps": 82910, "total_steps": 89790, "loss": 0.4447, "lr": 8.891613437651574e-07, "epoch": 9.233767680142554, "percentage": 92.34, "elapsed_time": "6:30:12", "remaining_time": "0:32:22", "throughput": 4296.19, "total_tokens": 100585136} +{"current_steps": 82915, "total_steps": 89790, "loss": 0.4609, "lr": 8.878773162737025e-07, "epoch": 9.234324535026172, "percentage": 92.34, "elapsed_time": "6:30:13", "remaining_time": "0:32:21", "throughput": 4296.21, "total_tokens": 100591024} +{"current_steps": 82920, "total_steps": 89790, "loss": 0.4546, "lr": 8.865941998155158e-07, "epoch": 9.23488138990979, "percentage": 92.35, "elapsed_time": "6:30:15", "remaining_time": "0:32:19", "throughput": 4296.24, "total_tokens": 100597392} +{"current_steps": 82925, "total_steps": 89790, "loss": 0.4636, "lr": 8.853119944390726e-07, "epoch": 9.235438244793407, "percentage": 92.35, "elapsed_time": "6:30:16", "remaining_time": "0:32:18", "throughput": 4296.26, "total_tokens": 100603376} +{"current_steps": 82930, "total_steps": 89790, "loss": 0.473, "lr": 8.840307001928227e-07, "epoch": 9.235995099677025, "percentage": 92.36, "elapsed_time": "6:30:17", "remaining_time": "0:32:17", "throughput": 4296.29, "total_tokens": 100609744} +{"current_steps": 82935, "total_steps": 89790, "loss": 0.4586, "lr": 8.827503171251777e-07, "epoch": 9.23655195456064, "percentage": 92.37, "elapsed_time": "6:30:19", "remaining_time": "0:32:15", "throughput": 4296.31, "total_tokens": 100616112} +{"current_steps": 82940, "total_steps": 89790, "loss": 0.4731, "lr": 8.8147084528451e-07, "epoch": 9.237108809444258, "percentage": 92.37, "elapsed_time": "6:30:20", "remaining_time": "0:32:14", "throughput": 4296.34, "total_tokens": 100622320} +{"current_steps": 82945, "total_steps": 89790, "loss": 0.4557, "lr": 8.801922847191696e-07, "epoch": 9.237665664327876, "percentage": 92.38, "elapsed_time": "6:30:21", "remaining_time": "0:32:12", "throughput": 4296.36, "total_tokens": 100628240} +{"current_steps": 82950, "total_steps": 89790, "loss": 0.4553, "lr": 8.789146354774569e-07, "epoch": 9.238222519211494, "percentage": 92.38, "elapsed_time": "6:30:22", "remaining_time": "0:32:11", "throughput": 4296.38, "total_tokens": 100633680} +{"current_steps": 82955, "total_steps": 89790, "loss": 0.4688, "lr": 8.776378976076527e-07, "epoch": 9.238779374095111, "percentage": 92.39, "elapsed_time": "6:30:24", "remaining_time": "0:32:10", "throughput": 4296.4, "total_tokens": 100639856} +{"current_steps": 82960, "total_steps": 89790, "loss": 0.4434, "lr": 8.763620711579906e-07, "epoch": 9.239336228978727, "percentage": 92.39, "elapsed_time": "6:30:25", "remaining_time": "0:32:08", "throughput": 4296.42, "total_tokens": 100646000} +{"current_steps": 82965, "total_steps": 89790, "loss": 0.4571, "lr": 8.750871561766766e-07, "epoch": 9.239893083862345, "percentage": 92.4, "elapsed_time": "6:30:26", "remaining_time": "0:32:07", "throughput": 4296.45, "total_tokens": 100652432} +{"current_steps": 82970, "total_steps": 89790, "loss": 0.4507, "lr": 8.738131527118831e-07, "epoch": 9.240449938745963, "percentage": 92.4, "elapsed_time": "6:30:28", "remaining_time": "0:32:05", "throughput": 4296.47, "total_tokens": 100658384} +{"current_steps": 82975, "total_steps": 89790, "loss": 0.459, "lr": 8.72540060811744e-07, "epoch": 9.24100679362958, "percentage": 92.41, "elapsed_time": "6:30:29", "remaining_time": "0:32:04", "throughput": 4296.49, "total_tokens": 100664432} +{"current_steps": 82980, "total_steps": 89790, "loss": 0.4583, "lr": 8.712678805243624e-07, "epoch": 9.241563648513198, "percentage": 92.42, "elapsed_time": "6:30:30", "remaining_time": "0:32:02", "throughput": 4296.52, "total_tokens": 100670576} +{"current_steps": 82985, "total_steps": 89790, "loss": 0.4521, "lr": 8.699966118978025e-07, "epoch": 9.242120503396816, "percentage": 92.42, "elapsed_time": "6:30:31", "remaining_time": "0:32:01", "throughput": 4296.54, "total_tokens": 100676528} +{"current_steps": 82990, "total_steps": 89790, "loss": 0.4623, "lr": 8.687262549801039e-07, "epoch": 9.242677358280432, "percentage": 92.43, "elapsed_time": "6:30:33", "remaining_time": "0:32:00", "throughput": 4296.57, "total_tokens": 100682736} +{"current_steps": 82995, "total_steps": 89790, "loss": 0.4665, "lr": 8.67456809819256e-07, "epoch": 9.24323421316405, "percentage": 92.43, "elapsed_time": "6:30:34", "remaining_time": "0:31:58", "throughput": 4296.59, "total_tokens": 100688304} +{"current_steps": 83000, "total_steps": 89790, "loss": 0.4673, "lr": 8.661882764632257e-07, "epoch": 9.243791068047667, "percentage": 92.44, "elapsed_time": "6:30:35", "remaining_time": "0:31:57", "throughput": 4296.61, "total_tokens": 100694416} +{"current_steps": 83005, "total_steps": 89790, "loss": 0.461, "lr": 8.649206549599443e-07, "epoch": 9.244347922931285, "percentage": 92.44, "elapsed_time": "6:30:37", "remaining_time": "0:31:55", "throughput": 4296.64, "total_tokens": 100700432} +{"current_steps": 83010, "total_steps": 89790, "loss": 0.4631, "lr": 8.636539453573039e-07, "epoch": 9.244904777814902, "percentage": 92.45, "elapsed_time": "6:30:38", "remaining_time": "0:31:54", "throughput": 4296.66, "total_tokens": 100706576} +{"current_steps": 83015, "total_steps": 89790, "loss": 0.4566, "lr": 8.623881477031693e-07, "epoch": 9.245461632698518, "percentage": 92.45, "elapsed_time": "6:30:39", "remaining_time": "0:31:52", "throughput": 4296.68, "total_tokens": 100712304} +{"current_steps": 83020, "total_steps": 89790, "loss": 0.4496, "lr": 8.611232620453602e-07, "epoch": 9.246018487582136, "percentage": 92.46, "elapsed_time": "6:30:40", "remaining_time": "0:31:51", "throughput": 4296.71, "total_tokens": 100718576} +{"current_steps": 83025, "total_steps": 89790, "loss": 0.4643, "lr": 8.59859288431672e-07, "epoch": 9.246575342465754, "percentage": 92.47, "elapsed_time": "6:30:42", "remaining_time": "0:31:50", "throughput": 4296.73, "total_tokens": 100724336} +{"current_steps": 83030, "total_steps": 89790, "loss": 0.4616, "lr": 8.585962269098608e-07, "epoch": 9.247132197349371, "percentage": 92.47, "elapsed_time": "6:30:43", "remaining_time": "0:31:48", "throughput": 4296.75, "total_tokens": 100730608} +{"current_steps": 83035, "total_steps": 89790, "loss": 0.4569, "lr": 8.573340775276495e-07, "epoch": 9.247689052232989, "percentage": 92.48, "elapsed_time": "6:30:44", "remaining_time": "0:31:47", "throughput": 4296.78, "total_tokens": 100736752} +{"current_steps": 83040, "total_steps": 89790, "loss": 0.4495, "lr": 8.560728403327279e-07, "epoch": 9.248245907116605, "percentage": 92.48, "elapsed_time": "6:30:45", "remaining_time": "0:31:45", "throughput": 4296.8, "total_tokens": 100742352} +{"current_steps": 83045, "total_steps": 89790, "loss": 0.4696, "lr": 8.548125153727438e-07, "epoch": 9.248802762000222, "percentage": 92.49, "elapsed_time": "6:30:47", "remaining_time": "0:31:44", "throughput": 4296.81, "total_tokens": 100748016} +{"current_steps": 83050, "total_steps": 89790, "loss": 0.4549, "lr": 8.535531026953231e-07, "epoch": 9.24935961688384, "percentage": 92.49, "elapsed_time": "6:30:48", "remaining_time": "0:31:42", "throughput": 4296.84, "total_tokens": 100753936} +{"current_steps": 83055, "total_steps": 89790, "loss": 0.4721, "lr": 8.522946023480416e-07, "epoch": 9.249916471767458, "percentage": 92.5, "elapsed_time": "6:30:49", "remaining_time": "0:31:41", "throughput": 4296.85, "total_tokens": 100759600} +{"current_steps": 83060, "total_steps": 89790, "loss": 0.4604, "lr": 8.510370143784586e-07, "epoch": 9.250473326651075, "percentage": 92.5, "elapsed_time": "6:30:50", "remaining_time": "0:31:40", "throughput": 4296.88, "total_tokens": 100765424} +{"current_steps": 83065, "total_steps": 89790, "loss": 0.4639, "lr": 8.497803388340886e-07, "epoch": 9.251030181534691, "percentage": 92.51, "elapsed_time": "6:30:52", "remaining_time": "0:31:38", "throughput": 4296.91, "total_tokens": 100771792} +{"current_steps": 83070, "total_steps": 89790, "loss": 0.4595, "lr": 8.485245757624077e-07, "epoch": 9.251587036418309, "percentage": 92.52, "elapsed_time": "6:30:53", "remaining_time": "0:31:37", "throughput": 4296.93, "total_tokens": 100778032} +{"current_steps": 83075, "total_steps": 89790, "loss": 0.4521, "lr": 8.472697252108669e-07, "epoch": 9.252143891301927, "percentage": 92.52, "elapsed_time": "6:30:54", "remaining_time": "0:31:35", "throughput": 4296.95, "total_tokens": 100783824} +{"current_steps": 83080, "total_steps": 89790, "loss": 0.4548, "lr": 8.460157872268754e-07, "epoch": 9.252700746185544, "percentage": 92.53, "elapsed_time": "6:30:56", "remaining_time": "0:31:34", "throughput": 4296.98, "total_tokens": 100790320} +{"current_steps": 83085, "total_steps": 89790, "loss": 0.4626, "lr": 8.447627618578174e-07, "epoch": 9.253257601069162, "percentage": 92.53, "elapsed_time": "6:30:57", "remaining_time": "0:31:33", "throughput": 4297.0, "total_tokens": 100796432} +{"current_steps": 83090, "total_steps": 89790, "loss": 0.4516, "lr": 8.435106491510247e-07, "epoch": 9.253814455952778, "percentage": 92.54, "elapsed_time": "6:30:58", "remaining_time": "0:31:31", "throughput": 4297.02, "total_tokens": 100802192} +{"current_steps": 83095, "total_steps": 89790, "loss": 0.4685, "lr": 8.42259449153815e-07, "epoch": 9.254371310836396, "percentage": 92.54, "elapsed_time": "6:30:59", "remaining_time": "0:31:30", "throughput": 4297.05, "total_tokens": 100808496} +{"current_steps": 83100, "total_steps": 89790, "loss": 0.4583, "lr": 8.410091619134641e-07, "epoch": 9.254928165720013, "percentage": 92.55, "elapsed_time": "6:31:01", "remaining_time": "0:31:28", "throughput": 4297.06, "total_tokens": 100813808} +{"current_steps": 83105, "total_steps": 89790, "loss": 0.4579, "lr": 8.397597874772067e-07, "epoch": 9.255485020603631, "percentage": 92.55, "elapsed_time": "6:31:02", "remaining_time": "0:31:27", "throughput": 4297.08, "total_tokens": 100819728} +{"current_steps": 83110, "total_steps": 89790, "loss": 0.4455, "lr": 8.385113258922495e-07, "epoch": 9.256041875487249, "percentage": 92.56, "elapsed_time": "6:31:03", "remaining_time": "0:31:25", "throughput": 4297.11, "total_tokens": 100825648} +{"current_steps": 83115, "total_steps": 89790, "loss": 0.459, "lr": 8.372637772057628e-07, "epoch": 9.256598730370865, "percentage": 92.57, "elapsed_time": "6:31:04", "remaining_time": "0:31:24", "throughput": 4297.13, "total_tokens": 100831760} +{"current_steps": 83120, "total_steps": 89790, "loss": 0.4704, "lr": 8.360171414648815e-07, "epoch": 9.257155585254482, "percentage": 92.57, "elapsed_time": "6:31:06", "remaining_time": "0:31:23", "throughput": 4297.15, "total_tokens": 100838128} +{"current_steps": 83125, "total_steps": 89790, "loss": 0.4678, "lr": 8.347714187167149e-07, "epoch": 9.2577124401381, "percentage": 92.58, "elapsed_time": "6:31:07", "remaining_time": "0:31:21", "throughput": 4297.18, "total_tokens": 100844112} +{"current_steps": 83130, "total_steps": 89790, "loss": 0.4583, "lr": 8.335266090083227e-07, "epoch": 9.258269295021718, "percentage": 92.58, "elapsed_time": "6:31:08", "remaining_time": "0:31:20", "throughput": 4297.2, "total_tokens": 100850288} +{"current_steps": 83135, "total_steps": 89790, "loss": 0.453, "lr": 8.322827123867421e-07, "epoch": 9.258826149905335, "percentage": 92.59, "elapsed_time": "6:31:10", "remaining_time": "0:31:18", "throughput": 4297.22, "total_tokens": 100856048} +{"current_steps": 83140, "total_steps": 89790, "loss": 0.4683, "lr": 8.310397288989691e-07, "epoch": 9.259383004788951, "percentage": 92.59, "elapsed_time": "6:31:11", "remaining_time": "0:31:17", "throughput": 4297.24, "total_tokens": 100862160} +{"current_steps": 83145, "total_steps": 89790, "loss": 0.46, "lr": 8.297976585919686e-07, "epoch": 9.259939859672569, "percentage": 92.6, "elapsed_time": "6:31:12", "remaining_time": "0:31:15", "throughput": 4297.27, "total_tokens": 100868464} +{"current_steps": 83150, "total_steps": 89790, "loss": 0.4572, "lr": 8.2855650151267e-07, "epoch": 9.260496714556187, "percentage": 92.6, "elapsed_time": "6:31:13", "remaining_time": "0:31:14", "throughput": 4297.29, "total_tokens": 100874384} +{"current_steps": 83155, "total_steps": 89790, "loss": 0.4588, "lr": 8.273162577079662e-07, "epoch": 9.261053569439804, "percentage": 92.61, "elapsed_time": "6:31:15", "remaining_time": "0:31:13", "throughput": 4297.32, "total_tokens": 100880592} +{"current_steps": 83160, "total_steps": 89790, "loss": 0.4651, "lr": 8.260769272247198e-07, "epoch": 9.261610424323422, "percentage": 92.62, "elapsed_time": "6:31:16", "remaining_time": "0:31:11", "throughput": 4297.34, "total_tokens": 100886672} +{"current_steps": 83165, "total_steps": 89790, "loss": 0.4649, "lr": 8.248385101097572e-07, "epoch": 9.262167279207038, "percentage": 92.62, "elapsed_time": "6:31:17", "remaining_time": "0:31:10", "throughput": 4297.36, "total_tokens": 100892688} +{"current_steps": 83170, "total_steps": 89790, "loss": 0.4604, "lr": 8.236010064098687e-07, "epoch": 9.262724134090655, "percentage": 92.63, "elapsed_time": "6:31:19", "remaining_time": "0:31:08", "throughput": 4297.39, "total_tokens": 100898992} +{"current_steps": 83175, "total_steps": 89790, "loss": 0.451, "lr": 8.223644161718141e-07, "epoch": 9.263280988974273, "percentage": 92.63, "elapsed_time": "6:31:20", "remaining_time": "0:31:07", "throughput": 4297.41, "total_tokens": 100904976} +{"current_steps": 83180, "total_steps": 89790, "loss": 0.4558, "lr": 8.21128739442309e-07, "epoch": 9.26383784385789, "percentage": 92.64, "elapsed_time": "6:31:21", "remaining_time": "0:31:06", "throughput": 4297.43, "total_tokens": 100910896} +{"current_steps": 83185, "total_steps": 89790, "loss": 0.4601, "lr": 8.198939762680463e-07, "epoch": 9.264394698741508, "percentage": 92.64, "elapsed_time": "6:31:23", "remaining_time": "0:31:04", "throughput": 4297.46, "total_tokens": 100917264} +{"current_steps": 83190, "total_steps": 89790, "loss": 0.4471, "lr": 8.186601266956778e-07, "epoch": 9.264951553625126, "percentage": 92.65, "elapsed_time": "6:31:24", "remaining_time": "0:31:03", "throughput": 4297.48, "total_tokens": 100922800} +{"current_steps": 83195, "total_steps": 89790, "loss": 0.4618, "lr": 8.174271907718245e-07, "epoch": 9.265508408508742, "percentage": 92.66, "elapsed_time": "6:31:25", "remaining_time": "0:31:01", "throughput": 4297.5, "total_tokens": 100928880} +{"current_steps": 83200, "total_steps": 89790, "loss": 0.4627, "lr": 8.161951685430658e-07, "epoch": 9.26606526339236, "percentage": 92.66, "elapsed_time": "6:31:26", "remaining_time": "0:31:00", "throughput": 4297.52, "total_tokens": 100935248} +{"current_steps": 83205, "total_steps": 89790, "loss": 0.4685, "lr": 8.149640600559533e-07, "epoch": 9.266622118275977, "percentage": 92.67, "elapsed_time": "6:31:28", "remaining_time": "0:30:58", "throughput": 4297.54, "total_tokens": 100941168} +{"current_steps": 83210, "total_steps": 89790, "loss": 0.4685, "lr": 8.137338653570081e-07, "epoch": 9.267178973159595, "percentage": 92.67, "elapsed_time": "6:31:29", "remaining_time": "0:30:57", "throughput": 4297.57, "total_tokens": 100947248} +{"current_steps": 83215, "total_steps": 89790, "loss": 0.457, "lr": 8.125045844927016e-07, "epoch": 9.267735828043213, "percentage": 92.68, "elapsed_time": "6:31:30", "remaining_time": "0:30:56", "throughput": 4297.59, "total_tokens": 100953520} +{"current_steps": 83220, "total_steps": 89790, "loss": 0.4561, "lr": 8.112762175094879e-07, "epoch": 9.268292682926829, "percentage": 92.68, "elapsed_time": "6:31:31", "remaining_time": "0:30:54", "throughput": 4297.62, "total_tokens": 100959408} +{"current_steps": 83225, "total_steps": 89790, "loss": 0.4605, "lr": 8.100487644537747e-07, "epoch": 9.268849537810446, "percentage": 92.69, "elapsed_time": "6:31:33", "remaining_time": "0:30:53", "throughput": 4297.64, "total_tokens": 100965456} +{"current_steps": 83230, "total_steps": 89790, "loss": 0.4481, "lr": 8.088222253719386e-07, "epoch": 9.269406392694064, "percentage": 92.69, "elapsed_time": "6:31:34", "remaining_time": "0:30:51", "throughput": 4297.65, "total_tokens": 100970224} +{"current_steps": 83235, "total_steps": 89790, "loss": 0.4555, "lr": 8.075966003103231e-07, "epoch": 9.269963247577682, "percentage": 92.7, "elapsed_time": "6:31:35", "remaining_time": "0:30:50", "throughput": 4297.68, "total_tokens": 100976592} +{"current_steps": 83240, "total_steps": 89790, "loss": 0.4681, "lr": 8.063718893152356e-07, "epoch": 9.2705201024613, "percentage": 92.71, "elapsed_time": "6:31:36", "remaining_time": "0:30:48", "throughput": 4297.7, "total_tokens": 100982352} +{"current_steps": 83245, "total_steps": 89790, "loss": 0.4561, "lr": 8.051480924329529e-07, "epoch": 9.271076957344915, "percentage": 92.71, "elapsed_time": "6:31:38", "remaining_time": "0:30:47", "throughput": 4297.72, "total_tokens": 100988144} +{"current_steps": 83250, "total_steps": 89790, "loss": 0.467, "lr": 8.039252097097105e-07, "epoch": 9.271633812228533, "percentage": 92.72, "elapsed_time": "6:31:39", "remaining_time": "0:30:46", "throughput": 4297.74, "total_tokens": 100993808} +{"current_steps": 83255, "total_steps": 89790, "loss": 0.451, "lr": 8.027032411917157e-07, "epoch": 9.27219066711215, "percentage": 92.72, "elapsed_time": "6:31:40", "remaining_time": "0:30:44", "throughput": 4297.75, "total_tokens": 100999472} +{"current_steps": 83260, "total_steps": 89790, "loss": 0.469, "lr": 8.014821869251315e-07, "epoch": 9.272747521995768, "percentage": 92.73, "elapsed_time": "6:31:41", "remaining_time": "0:30:43", "throughput": 4297.78, "total_tokens": 101005776} +{"current_steps": 83265, "total_steps": 89790, "loss": 0.4438, "lr": 8.002620469561045e-07, "epoch": 9.273304376879386, "percentage": 92.73, "elapsed_time": "6:31:43", "remaining_time": "0:30:41", "throughput": 4297.8, "total_tokens": 101011984} +{"current_steps": 83270, "total_steps": 89790, "loss": 0.4616, "lr": 7.990428213307227e-07, "epoch": 9.273861231763002, "percentage": 92.74, "elapsed_time": "6:31:44", "remaining_time": "0:30:40", "throughput": 4297.82, "total_tokens": 101017936} +{"current_steps": 83275, "total_steps": 89790, "loss": 0.4624, "lr": 7.978245100950632e-07, "epoch": 9.27441808664662, "percentage": 92.74, "elapsed_time": "6:31:45", "remaining_time": "0:30:38", "throughput": 4297.85, "total_tokens": 101024016} +{"current_steps": 83280, "total_steps": 89790, "loss": 0.4719, "lr": 7.966071132951531e-07, "epoch": 9.274974941530237, "percentage": 92.75, "elapsed_time": "6:31:47", "remaining_time": "0:30:37", "throughput": 4297.87, "total_tokens": 101030064} +{"current_steps": 83285, "total_steps": 89790, "loss": 0.4682, "lr": 7.953906309769887e-07, "epoch": 9.275531796413855, "percentage": 92.76, "elapsed_time": "6:31:48", "remaining_time": "0:30:36", "throughput": 4297.9, "total_tokens": 101036528} +{"current_steps": 83290, "total_steps": 89790, "loss": 0.46, "lr": 7.941750631865336e-07, "epoch": 9.276088651297473, "percentage": 92.76, "elapsed_time": "6:31:49", "remaining_time": "0:30:34", "throughput": 4297.92, "total_tokens": 101042288} +{"current_steps": 83295, "total_steps": 89790, "loss": 0.4643, "lr": 7.929604099697174e-07, "epoch": 9.276645506181088, "percentage": 92.77, "elapsed_time": "6:31:50", "remaining_time": "0:30:33", "throughput": 4297.94, "total_tokens": 101048400} +{"current_steps": 83300, "total_steps": 89790, "loss": 0.4689, "lr": 7.917466713724286e-07, "epoch": 9.277202361064706, "percentage": 92.77, "elapsed_time": "6:31:52", "remaining_time": "0:30:31", "throughput": 4297.96, "total_tokens": 101054320} +{"current_steps": 83305, "total_steps": 89790, "loss": 0.4643, "lr": 7.905338474405333e-07, "epoch": 9.277759215948324, "percentage": 92.78, "elapsed_time": "6:31:53", "remaining_time": "0:30:30", "throughput": 4297.98, "total_tokens": 101060560} +{"current_steps": 83310, "total_steps": 89790, "loss": 0.4625, "lr": 7.893219382198502e-07, "epoch": 9.278316070831941, "percentage": 92.78, "elapsed_time": "6:31:54", "remaining_time": "0:30:29", "throughput": 4298.0, "total_tokens": 101066192} +{"current_steps": 83315, "total_steps": 89790, "loss": 0.4546, "lr": 7.881109437561762e-07, "epoch": 9.278872925715559, "percentage": 92.79, "elapsed_time": "6:31:55", "remaining_time": "0:30:27", "throughput": 4298.02, "total_tokens": 101071792} +{"current_steps": 83320, "total_steps": 89790, "loss": 0.4639, "lr": 7.869008640952552e-07, "epoch": 9.279429780599175, "percentage": 92.79, "elapsed_time": "6:31:57", "remaining_time": "0:30:26", "throughput": 4298.04, "total_tokens": 101077904} +{"current_steps": 83325, "total_steps": 89790, "loss": 0.4575, "lr": 7.856916992828173e-07, "epoch": 9.279986635482793, "percentage": 92.8, "elapsed_time": "6:31:58", "remaining_time": "0:30:24", "throughput": 4298.07, "total_tokens": 101083952} +{"current_steps": 83330, "total_steps": 89790, "loss": 0.454, "lr": 7.844834493645454e-07, "epoch": 9.28054349036641, "percentage": 92.81, "elapsed_time": "6:31:59", "remaining_time": "0:30:23", "throughput": 4298.09, "total_tokens": 101089968} +{"current_steps": 83335, "total_steps": 89790, "loss": 0.4519, "lr": 7.83276114386089e-07, "epoch": 9.281100345250028, "percentage": 92.81, "elapsed_time": "6:32:01", "remaining_time": "0:30:21", "throughput": 4298.11, "total_tokens": 101095984} +{"current_steps": 83340, "total_steps": 89790, "loss": 0.4733, "lr": 7.820696943930699e-07, "epoch": 9.281657200133646, "percentage": 92.82, "elapsed_time": "6:32:02", "remaining_time": "0:30:20", "throughput": 4298.13, "total_tokens": 101102096} +{"current_steps": 83345, "total_steps": 89790, "loss": 0.4563, "lr": 7.808641894310659e-07, "epoch": 9.282214055017263, "percentage": 92.82, "elapsed_time": "6:32:03", "remaining_time": "0:30:19", "throughput": 4298.16, "total_tokens": 101108176} +{"current_steps": 83350, "total_steps": 89790, "loss": 0.4653, "lr": 7.796595995456318e-07, "epoch": 9.28277090990088, "percentage": 92.83, "elapsed_time": "6:32:04", "remaining_time": "0:30:17", "throughput": 4298.18, "total_tokens": 101113776} +{"current_steps": 83355, "total_steps": 89790, "loss": 0.4637, "lr": 7.784559247822703e-07, "epoch": 9.283327764784497, "percentage": 92.83, "elapsed_time": "6:32:06", "remaining_time": "0:30:16", "throughput": 4298.2, "total_tokens": 101119856} +{"current_steps": 83360, "total_steps": 89790, "loss": 0.4551, "lr": 7.772531651864673e-07, "epoch": 9.283884619668115, "percentage": 92.84, "elapsed_time": "6:32:07", "remaining_time": "0:30:14", "throughput": 4298.23, "total_tokens": 101126224} +{"current_steps": 83365, "total_steps": 89790, "loss": 0.4724, "lr": 7.760513208036669e-07, "epoch": 9.284441474551732, "percentage": 92.84, "elapsed_time": "6:32:08", "remaining_time": "0:30:13", "throughput": 4298.25, "total_tokens": 101132304} +{"current_steps": 83370, "total_steps": 89790, "loss": 0.4609, "lr": 7.748503916792743e-07, "epoch": 9.28499832943535, "percentage": 92.85, "elapsed_time": "6:32:10", "remaining_time": "0:30:11", "throughput": 4298.28, "total_tokens": 101138672} +{"current_steps": 83375, "total_steps": 89790, "loss": 0.4567, "lr": 7.736503778586701e-07, "epoch": 9.285555184318966, "percentage": 92.86, "elapsed_time": "6:32:11", "remaining_time": "0:30:10", "throughput": 4298.3, "total_tokens": 101144912} +{"current_steps": 83380, "total_steps": 89790, "loss": 0.4755, "lr": 7.724512793871874e-07, "epoch": 9.286112039202584, "percentage": 92.86, "elapsed_time": "6:32:12", "remaining_time": "0:30:09", "throughput": 4298.32, "total_tokens": 101150672} +{"current_steps": 83385, "total_steps": 89790, "loss": 0.4563, "lr": 7.712530963101427e-07, "epoch": 9.286668894086201, "percentage": 92.87, "elapsed_time": "6:32:13", "remaining_time": "0:30:07", "throughput": 4298.35, "total_tokens": 101156976} +{"current_steps": 83390, "total_steps": 89790, "loss": 0.4578, "lr": 7.700558286727944e-07, "epoch": 9.287225748969819, "percentage": 92.87, "elapsed_time": "6:32:15", "remaining_time": "0:30:06", "throughput": 4298.37, "total_tokens": 101162960} +{"current_steps": 83395, "total_steps": 89790, "loss": 0.4825, "lr": 7.688594765203893e-07, "epoch": 9.287782603853437, "percentage": 92.88, "elapsed_time": "6:32:16", "remaining_time": "0:30:04", "throughput": 4298.39, "total_tokens": 101168560} +{"current_steps": 83400, "total_steps": 89790, "loss": 0.4756, "lr": 7.67664039898125e-07, "epoch": 9.288339458737052, "percentage": 92.88, "elapsed_time": "6:32:17", "remaining_time": "0:30:03", "throughput": 4298.41, "total_tokens": 101174608} +{"current_steps": 83405, "total_steps": 89790, "loss": 0.467, "lr": 7.664695188511705e-07, "epoch": 9.28889631362067, "percentage": 92.89, "elapsed_time": "6:32:18", "remaining_time": "0:30:02", "throughput": 4298.44, "total_tokens": 101180784} +{"current_steps": 83410, "total_steps": 89790, "loss": 0.4567, "lr": 7.652759134246568e-07, "epoch": 9.289453168504288, "percentage": 92.89, "elapsed_time": "6:32:20", "remaining_time": "0:30:00", "throughput": 4298.46, "total_tokens": 101187024} +{"current_steps": 83415, "total_steps": 89790, "loss": 0.4488, "lr": 7.640832236636836e-07, "epoch": 9.290010023387905, "percentage": 92.9, "elapsed_time": "6:32:21", "remaining_time": "0:29:59", "throughput": 4298.49, "total_tokens": 101193104} +{"current_steps": 83420, "total_steps": 89790, "loss": 0.4699, "lr": 7.628914496133149e-07, "epoch": 9.290566878271523, "percentage": 92.91, "elapsed_time": "6:32:22", "remaining_time": "0:29:57", "throughput": 4298.51, "total_tokens": 101199152} +{"current_steps": 83425, "total_steps": 89790, "loss": 0.4629, "lr": 7.617005913185759e-07, "epoch": 9.291123733155139, "percentage": 92.91, "elapsed_time": "6:32:24", "remaining_time": "0:29:56", "throughput": 4298.53, "total_tokens": 101205008} +{"current_steps": 83430, "total_steps": 89790, "loss": 0.4718, "lr": 7.60510648824464e-07, "epoch": 9.291680588038757, "percentage": 92.92, "elapsed_time": "6:32:25", "remaining_time": "0:29:54", "throughput": 4298.56, "total_tokens": 101211248} +{"current_steps": 83435, "total_steps": 89790, "loss": 0.4672, "lr": 7.593216221759431e-07, "epoch": 9.292237442922374, "percentage": 92.92, "elapsed_time": "6:32:26", "remaining_time": "0:29:53", "throughput": 4298.58, "total_tokens": 101217392} +{"current_steps": 83440, "total_steps": 89790, "loss": 0.456, "lr": 7.5813351141793e-07, "epoch": 9.292794297805992, "percentage": 92.93, "elapsed_time": "6:32:27", "remaining_time": "0:29:52", "throughput": 4298.61, "total_tokens": 101223440} +{"current_steps": 83445, "total_steps": 89790, "loss": 0.463, "lr": 7.569463165953223e-07, "epoch": 9.29335115268961, "percentage": 92.93, "elapsed_time": "6:32:29", "remaining_time": "0:29:50", "throughput": 4298.63, "total_tokens": 101229296} +{"current_steps": 83450, "total_steps": 89790, "loss": 0.4552, "lr": 7.557600377529728e-07, "epoch": 9.293908007573226, "percentage": 92.94, "elapsed_time": "6:32:30", "remaining_time": "0:29:49", "throughput": 4298.65, "total_tokens": 101235312} +{"current_steps": 83455, "total_steps": 89790, "loss": 0.4504, "lr": 7.545746749357041e-07, "epoch": 9.294464862456843, "percentage": 92.94, "elapsed_time": "6:32:31", "remaining_time": "0:29:47", "throughput": 4298.67, "total_tokens": 101241584} +{"current_steps": 83460, "total_steps": 89790, "loss": 0.4629, "lr": 7.533902281882998e-07, "epoch": 9.295021717340461, "percentage": 92.95, "elapsed_time": "6:32:33", "remaining_time": "0:29:46", "throughput": 4298.69, "total_tokens": 101247344} +{"current_steps": 83465, "total_steps": 89790, "loss": 0.4647, "lr": 7.522066975555159e-07, "epoch": 9.295578572224079, "percentage": 92.96, "elapsed_time": "6:32:34", "remaining_time": "0:29:44", "throughput": 4298.72, "total_tokens": 101253488} +{"current_steps": 83470, "total_steps": 89790, "loss": 0.4425, "lr": 7.51024083082072e-07, "epoch": 9.296135427107696, "percentage": 92.96, "elapsed_time": "6:32:35", "remaining_time": "0:29:43", "throughput": 4298.74, "total_tokens": 101259600} +{"current_steps": 83475, "total_steps": 89790, "loss": 0.4562, "lr": 7.498423848126463e-07, "epoch": 9.296692281991312, "percentage": 92.97, "elapsed_time": "6:32:36", "remaining_time": "0:29:42", "throughput": 4298.77, "total_tokens": 101265744} +{"current_steps": 83480, "total_steps": 89790, "loss": 0.4591, "lr": 7.486616027918892e-07, "epoch": 9.29724913687493, "percentage": 92.97, "elapsed_time": "6:32:38", "remaining_time": "0:29:40", "throughput": 4298.79, "total_tokens": 101271664} +{"current_steps": 83485, "total_steps": 89790, "loss": 0.4676, "lr": 7.474817370644122e-07, "epoch": 9.297805991758548, "percentage": 92.98, "elapsed_time": "6:32:39", "remaining_time": "0:29:39", "throughput": 4298.81, "total_tokens": 101277680} +{"current_steps": 83490, "total_steps": 89790, "loss": 0.4528, "lr": 7.463027876747963e-07, "epoch": 9.298362846642165, "percentage": 92.98, "elapsed_time": "6:32:40", "remaining_time": "0:29:37", "throughput": 4298.84, "total_tokens": 101283952} +{"current_steps": 83495, "total_steps": 89790, "loss": 0.4747, "lr": 7.451247546675866e-07, "epoch": 9.298919701525783, "percentage": 92.99, "elapsed_time": "6:32:42", "remaining_time": "0:29:36", "throughput": 4298.86, "total_tokens": 101289872} +{"current_steps": 83500, "total_steps": 89790, "loss": 0.4571, "lr": 7.439476380872917e-07, "epoch": 9.299476556409399, "percentage": 92.99, "elapsed_time": "6:32:43", "remaining_time": "0:29:35", "throughput": 4298.88, "total_tokens": 101295952} +{"current_steps": 83505, "total_steps": 89790, "loss": 0.4688, "lr": 7.427714379783874e-07, "epoch": 9.300033411293017, "percentage": 93.0, "elapsed_time": "6:32:44", "remaining_time": "0:29:33", "throughput": 4298.9, "total_tokens": 101302224} +{"current_steps": 83510, "total_steps": 89790, "loss": 0.466, "lr": 7.415961543853155e-07, "epoch": 9.300590266176634, "percentage": 93.01, "elapsed_time": "6:32:45", "remaining_time": "0:29:32", "throughput": 4298.93, "total_tokens": 101308496} +{"current_steps": 83515, "total_steps": 89790, "loss": 0.4717, "lr": 7.404217873524799e-07, "epoch": 9.301147121060252, "percentage": 93.01, "elapsed_time": "6:32:47", "remaining_time": "0:29:30", "throughput": 4298.95, "total_tokens": 101314512} +{"current_steps": 83520, "total_steps": 89790, "loss": 0.4615, "lr": 7.392483369242531e-07, "epoch": 9.30170397594387, "percentage": 93.02, "elapsed_time": "6:32:48", "remaining_time": "0:29:29", "throughput": 4298.97, "total_tokens": 101320432} +{"current_steps": 83525, "total_steps": 89790, "loss": 0.4613, "lr": 7.380758031449691e-07, "epoch": 9.302260830827485, "percentage": 93.02, "elapsed_time": "6:32:49", "remaining_time": "0:29:27", "throughput": 4298.99, "total_tokens": 101326224} +{"current_steps": 83530, "total_steps": 89790, "loss": 0.4719, "lr": 7.369041860589371e-07, "epoch": 9.302817685711103, "percentage": 93.03, "elapsed_time": "6:32:51", "remaining_time": "0:29:26", "throughput": 4299.01, "total_tokens": 101332304} +{"current_steps": 83535, "total_steps": 89790, "loss": 0.4675, "lr": 7.357334857104159e-07, "epoch": 9.30337454059472, "percentage": 93.03, "elapsed_time": "6:32:52", "remaining_time": "0:29:25", "throughput": 4299.04, "total_tokens": 101338256} +{"current_steps": 83540, "total_steps": 89790, "loss": 0.4582, "lr": 7.345637021436452e-07, "epoch": 9.303931395478338, "percentage": 93.04, "elapsed_time": "6:32:53", "remaining_time": "0:29:23", "throughput": 4299.06, "total_tokens": 101344144} +{"current_steps": 83545, "total_steps": 89790, "loss": 0.477, "lr": 7.333948354028175e-07, "epoch": 9.304488250361956, "percentage": 93.04, "elapsed_time": "6:32:54", "remaining_time": "0:29:22", "throughput": 4299.08, "total_tokens": 101350320} +{"current_steps": 83550, "total_steps": 89790, "loss": 0.4612, "lr": 7.322268855321001e-07, "epoch": 9.305045105245574, "percentage": 93.05, "elapsed_time": "6:32:56", "remaining_time": "0:29:20", "throughput": 4299.11, "total_tokens": 101356752} +{"current_steps": 83555, "total_steps": 89790, "loss": 0.4659, "lr": 7.310598525756218e-07, "epoch": 9.30560196012919, "percentage": 93.06, "elapsed_time": "6:32:57", "remaining_time": "0:29:19", "throughput": 4299.13, "total_tokens": 101362992} +{"current_steps": 83560, "total_steps": 89790, "loss": 0.467, "lr": 7.298937365774722e-07, "epoch": 9.306158815012807, "percentage": 93.06, "elapsed_time": "6:32:58", "remaining_time": "0:29:17", "throughput": 4299.15, "total_tokens": 101369072} +{"current_steps": 83565, "total_steps": 89790, "loss": 0.4552, "lr": 7.287285375817188e-07, "epoch": 9.306715669896425, "percentage": 93.07, "elapsed_time": "6:33:00", "remaining_time": "0:29:16", "throughput": 4299.18, "total_tokens": 101375024} +{"current_steps": 83570, "total_steps": 89790, "loss": 0.4506, "lr": 7.27564255632382e-07, "epoch": 9.307272524780043, "percentage": 93.07, "elapsed_time": "6:33:01", "remaining_time": "0:29:15", "throughput": 4299.19, "total_tokens": 101380432} +{"current_steps": 83575, "total_steps": 89790, "loss": 0.4587, "lr": 7.264008907734515e-07, "epoch": 9.30782937966366, "percentage": 93.08, "elapsed_time": "6:33:02", "remaining_time": "0:29:13", "throughput": 4299.21, "total_tokens": 101386320} +{"current_steps": 83580, "total_steps": 89790, "loss": 0.4555, "lr": 7.25238443048884e-07, "epoch": 9.308386234547276, "percentage": 93.08, "elapsed_time": "6:33:03", "remaining_time": "0:29:12", "throughput": 4299.24, "total_tokens": 101392496} +{"current_steps": 83585, "total_steps": 89790, "loss": 0.4661, "lr": 7.240769125026025e-07, "epoch": 9.308943089430894, "percentage": 93.09, "elapsed_time": "6:33:05", "remaining_time": "0:29:10", "throughput": 4299.26, "total_tokens": 101398576} +{"current_steps": 83590, "total_steps": 89790, "loss": 0.4752, "lr": 7.229162991784888e-07, "epoch": 9.309499944314512, "percentage": 93.09, "elapsed_time": "6:33:06", "remaining_time": "0:29:09", "throughput": 4299.29, "total_tokens": 101405072} +{"current_steps": 83595, "total_steps": 89790, "loss": 0.4705, "lr": 7.217566031203965e-07, "epoch": 9.31005679919813, "percentage": 93.1, "elapsed_time": "6:33:07", "remaining_time": "0:29:08", "throughput": 4299.31, "total_tokens": 101411184} +{"current_steps": 83600, "total_steps": 89790, "loss": 0.4664, "lr": 7.205978243721462e-07, "epoch": 9.310613654081747, "percentage": 93.11, "elapsed_time": "6:33:09", "remaining_time": "0:29:06", "throughput": 4299.34, "total_tokens": 101417392} +{"current_steps": 83605, "total_steps": 89790, "loss": 0.4686, "lr": 7.194399629775139e-07, "epoch": 9.311170508965363, "percentage": 93.11, "elapsed_time": "6:33:10", "remaining_time": "0:29:05", "throughput": 4299.36, "total_tokens": 101423376} +{"current_steps": 83610, "total_steps": 89790, "loss": 0.4659, "lr": 7.182830189802509e-07, "epoch": 9.31172736384898, "percentage": 93.12, "elapsed_time": "6:33:11", "remaining_time": "0:29:03", "throughput": 4299.38, "total_tokens": 101429328} +{"current_steps": 83615, "total_steps": 89790, "loss": 0.4557, "lr": 7.17126992424072e-07, "epoch": 9.312284218732598, "percentage": 93.12, "elapsed_time": "6:33:12", "remaining_time": "0:29:02", "throughput": 4299.4, "total_tokens": 101435504} +{"current_steps": 83620, "total_steps": 89790, "loss": 0.4533, "lr": 7.159718833526536e-07, "epoch": 9.312841073616216, "percentage": 93.13, "elapsed_time": "6:33:14", "remaining_time": "0:29:00", "throughput": 4299.42, "total_tokens": 101441200} +{"current_steps": 83625, "total_steps": 89790, "loss": 0.4699, "lr": 7.148176918096383e-07, "epoch": 9.313397928499834, "percentage": 93.13, "elapsed_time": "6:33:15", "remaining_time": "0:28:59", "throughput": 4299.44, "total_tokens": 101447152} +{"current_steps": 83630, "total_steps": 89790, "loss": 0.4556, "lr": 7.136644178386359e-07, "epoch": 9.31395478338345, "percentage": 93.14, "elapsed_time": "6:33:16", "remaining_time": "0:28:58", "throughput": 4299.47, "total_tokens": 101453584} +{"current_steps": 83635, "total_steps": 89790, "loss": 0.4521, "lr": 7.125120614832225e-07, "epoch": 9.314511638267067, "percentage": 93.15, "elapsed_time": "6:33:18", "remaining_time": "0:28:56", "throughput": 4299.49, "total_tokens": 101459568} +{"current_steps": 83640, "total_steps": 89790, "loss": 0.4563, "lr": 7.113606227869357e-07, "epoch": 9.315068493150685, "percentage": 93.15, "elapsed_time": "6:33:19", "remaining_time": "0:28:55", "throughput": 4299.52, "total_tokens": 101465744} +{"current_steps": 83645, "total_steps": 89790, "loss": 0.4628, "lr": 7.102101017932794e-07, "epoch": 9.315625348034303, "percentage": 93.16, "elapsed_time": "6:33:20", "remaining_time": "0:28:53", "throughput": 4299.54, "total_tokens": 101471856} +{"current_steps": 83650, "total_steps": 89790, "loss": 0.4657, "lr": 7.0906049854573e-07, "epoch": 9.31618220291792, "percentage": 93.16, "elapsed_time": "6:33:21", "remaining_time": "0:28:52", "throughput": 4299.56, "total_tokens": 101477936} +{"current_steps": 83655, "total_steps": 89790, "loss": 0.4467, "lr": 7.079118130877166e-07, "epoch": 9.316739057801536, "percentage": 93.17, "elapsed_time": "6:33:23", "remaining_time": "0:28:50", "throughput": 4299.59, "total_tokens": 101484272} +{"current_steps": 83660, "total_steps": 89790, "loss": 0.4598, "lr": 7.067640454626434e-07, "epoch": 9.317295912685154, "percentage": 93.17, "elapsed_time": "6:33:24", "remaining_time": "0:28:49", "throughput": 4299.61, "total_tokens": 101490256} +{"current_steps": 83665, "total_steps": 89790, "loss": 0.4658, "lr": 7.056171957138757e-07, "epoch": 9.317852767568771, "percentage": 93.18, "elapsed_time": "6:33:25", "remaining_time": "0:28:48", "throughput": 4299.64, "total_tokens": 101496752} +{"current_steps": 83670, "total_steps": 89790, "loss": 0.4621, "lr": 7.044712638847428e-07, "epoch": 9.31840962245239, "percentage": 93.18, "elapsed_time": "6:33:27", "remaining_time": "0:28:46", "throughput": 4299.66, "total_tokens": 101502704} +{"current_steps": 83675, "total_steps": 89790, "loss": 0.4607, "lr": 7.033262500185489e-07, "epoch": 9.318966477336007, "percentage": 93.19, "elapsed_time": "6:33:28", "remaining_time": "0:28:45", "throughput": 4299.68, "total_tokens": 101508720} +{"current_steps": 83680, "total_steps": 89790, "loss": 0.4651, "lr": 7.02182154158551e-07, "epoch": 9.319523332219624, "percentage": 93.2, "elapsed_time": "6:33:29", "remaining_time": "0:28:43", "throughput": 4299.7, "total_tokens": 101514576} +{"current_steps": 83685, "total_steps": 89790, "loss": 0.4711, "lr": 7.010389763479786e-07, "epoch": 9.32008018710324, "percentage": 93.2, "elapsed_time": "6:33:30", "remaining_time": "0:28:42", "throughput": 4299.72, "total_tokens": 101520560} +{"current_steps": 83690, "total_steps": 89790, "loss": 0.4763, "lr": 6.998967166300191e-07, "epoch": 9.320637041986858, "percentage": 93.21, "elapsed_time": "6:33:32", "remaining_time": "0:28:41", "throughput": 4299.75, "total_tokens": 101526320} +{"current_steps": 83695, "total_steps": 89790, "loss": 0.4619, "lr": 6.987553750478382e-07, "epoch": 9.321193896870476, "percentage": 93.21, "elapsed_time": "6:33:33", "remaining_time": "0:28:39", "throughput": 4299.77, "total_tokens": 101532336} +{"current_steps": 83700, "total_steps": 89790, "loss": 0.4597, "lr": 6.976149516445541e-07, "epoch": 9.321750751754093, "percentage": 93.22, "elapsed_time": "6:33:34", "remaining_time": "0:28:38", "throughput": 4299.79, "total_tokens": 101538320} +{"current_steps": 83705, "total_steps": 89790, "loss": 0.457, "lr": 6.9647544646326e-07, "epoch": 9.322307606637711, "percentage": 93.22, "elapsed_time": "6:33:36", "remaining_time": "0:28:36", "throughput": 4299.82, "total_tokens": 101544560} +{"current_steps": 83710, "total_steps": 89790, "loss": 0.4713, "lr": 6.953368595470078e-07, "epoch": 9.322864461521327, "percentage": 93.23, "elapsed_time": "6:33:37", "remaining_time": "0:28:35", "throughput": 4299.84, "total_tokens": 101550800} +{"current_steps": 83715, "total_steps": 89790, "loss": 0.4659, "lr": 6.941991909388157e-07, "epoch": 9.323421316404945, "percentage": 93.23, "elapsed_time": "6:33:38", "remaining_time": "0:28:33", "throughput": 4299.86, "total_tokens": 101556912} +{"current_steps": 83720, "total_steps": 89790, "loss": 0.4552, "lr": 6.930624406816743e-07, "epoch": 9.323978171288562, "percentage": 93.24, "elapsed_time": "6:33:39", "remaining_time": "0:28:32", "throughput": 4299.89, "total_tokens": 101563248} +{"current_steps": 83725, "total_steps": 89790, "loss": 0.4652, "lr": 6.919266088185244e-07, "epoch": 9.32453502617218, "percentage": 93.25, "elapsed_time": "6:33:41", "remaining_time": "0:28:31", "throughput": 4299.91, "total_tokens": 101569392} +{"current_steps": 83730, "total_steps": 89790, "loss": 0.4515, "lr": 6.907916953922899e-07, "epoch": 9.325091881055798, "percentage": 93.25, "elapsed_time": "6:33:42", "remaining_time": "0:28:29", "throughput": 4299.94, "total_tokens": 101575856} +{"current_steps": 83735, "total_steps": 89790, "loss": 0.4627, "lr": 6.896577004458449e-07, "epoch": 9.325648735939414, "percentage": 93.26, "elapsed_time": "6:33:43", "remaining_time": "0:28:28", "throughput": 4299.96, "total_tokens": 101581200} +{"current_steps": 83740, "total_steps": 89790, "loss": 0.4679, "lr": 6.885246240220383e-07, "epoch": 9.326205590823031, "percentage": 93.26, "elapsed_time": "6:33:45", "remaining_time": "0:28:26", "throughput": 4299.98, "total_tokens": 101587312} +{"current_steps": 83745, "total_steps": 89790, "loss": 0.4556, "lr": 6.873924661636833e-07, "epoch": 9.326762445706649, "percentage": 93.27, "elapsed_time": "6:33:46", "remaining_time": "0:28:25", "throughput": 4300.01, "total_tokens": 101593392} +{"current_steps": 83750, "total_steps": 89790, "loss": 0.4614, "lr": 6.862612269135538e-07, "epoch": 9.327319300590267, "percentage": 93.27, "elapsed_time": "6:33:47", "remaining_time": "0:28:24", "throughput": 4300.02, "total_tokens": 101599024} +{"current_steps": 83755, "total_steps": 89790, "loss": 0.4662, "lr": 6.851309063143934e-07, "epoch": 9.327876155473884, "percentage": 93.28, "elapsed_time": "6:33:48", "remaining_time": "0:28:22", "throughput": 4300.04, "total_tokens": 101604656} +{"current_steps": 83760, "total_steps": 89790, "loss": 0.4553, "lr": 6.840015044089043e-07, "epoch": 9.3284330103575, "percentage": 93.28, "elapsed_time": "6:33:50", "remaining_time": "0:28:21", "throughput": 4300.07, "total_tokens": 101611024} +{"current_steps": 83765, "total_steps": 89790, "loss": 0.4679, "lr": 6.828730212397688e-07, "epoch": 9.328989865241118, "percentage": 93.29, "elapsed_time": "6:33:51", "remaining_time": "0:28:19", "throughput": 4300.09, "total_tokens": 101617168} +{"current_steps": 83770, "total_steps": 89790, "loss": 0.4511, "lr": 6.81745456849614e-07, "epoch": 9.329546720124736, "percentage": 93.3, "elapsed_time": "6:33:52", "remaining_time": "0:28:18", "throughput": 4300.11, "total_tokens": 101623312} +{"current_steps": 83775, "total_steps": 89790, "loss": 0.4552, "lr": 6.806188112810475e-07, "epoch": 9.330103575008353, "percentage": 93.3, "elapsed_time": "6:33:54", "remaining_time": "0:28:16", "throughput": 4300.13, "total_tokens": 101629392} +{"current_steps": 83780, "total_steps": 89790, "loss": 0.4714, "lr": 6.794930845766407e-07, "epoch": 9.33066042989197, "percentage": 93.31, "elapsed_time": "6:33:55", "remaining_time": "0:28:15", "throughput": 4300.16, "total_tokens": 101635888} +{"current_steps": 83785, "total_steps": 89790, "loss": 0.454, "lr": 6.783682767789206e-07, "epoch": 9.331217284775587, "percentage": 93.31, "elapsed_time": "6:33:56", "remaining_time": "0:28:14", "throughput": 4300.19, "total_tokens": 101642128} +{"current_steps": 83790, "total_steps": 89790, "loss": 0.4642, "lr": 6.772443879303925e-07, "epoch": 9.331774139659204, "percentage": 93.32, "elapsed_time": "6:33:57", "remaining_time": "0:28:12", "throughput": 4300.21, "total_tokens": 101648048} +{"current_steps": 83795, "total_steps": 89790, "loss": 0.4497, "lr": 6.761214180735137e-07, "epoch": 9.332330994542822, "percentage": 93.32, "elapsed_time": "6:33:59", "remaining_time": "0:28:11", "throughput": 4300.24, "total_tokens": 101654576} +{"current_steps": 83800, "total_steps": 89790, "loss": 0.4622, "lr": 6.749993672507199e-07, "epoch": 9.33288784942644, "percentage": 93.33, "elapsed_time": "6:34:00", "remaining_time": "0:28:09", "throughput": 4300.26, "total_tokens": 101660336} +{"current_steps": 83805, "total_steps": 89790, "loss": 0.4522, "lr": 6.738782355044049e-07, "epoch": 9.333444704310057, "percentage": 93.33, "elapsed_time": "6:34:01", "remaining_time": "0:28:08", "throughput": 4300.28, "total_tokens": 101666352} +{"current_steps": 83810, "total_steps": 89790, "loss": 0.4679, "lr": 6.727580228769237e-07, "epoch": 9.334001559193673, "percentage": 93.34, "elapsed_time": "6:34:02", "remaining_time": "0:28:06", "throughput": 4300.29, "total_tokens": 101671664} +{"current_steps": 83815, "total_steps": 89790, "loss": 0.4694, "lr": 6.716387294106091e-07, "epoch": 9.334558414077291, "percentage": 93.35, "elapsed_time": "6:34:04", "remaining_time": "0:28:05", "throughput": 4300.32, "total_tokens": 101678032} +{"current_steps": 83820, "total_steps": 89790, "loss": 0.4672, "lr": 6.705203551477441e-07, "epoch": 9.335115268960909, "percentage": 93.35, "elapsed_time": "6:34:05", "remaining_time": "0:28:04", "throughput": 4300.34, "total_tokens": 101684048} +{"current_steps": 83825, "total_steps": 89790, "loss": 0.4641, "lr": 6.69402900130589e-07, "epoch": 9.335672123844526, "percentage": 93.36, "elapsed_time": "6:34:06", "remaining_time": "0:28:02", "throughput": 4300.36, "total_tokens": 101689456} +{"current_steps": 83830, "total_steps": 89790, "loss": 0.4611, "lr": 6.682863644013632e-07, "epoch": 9.336228978728144, "percentage": 93.36, "elapsed_time": "6:34:08", "remaining_time": "0:28:01", "throughput": 4300.38, "total_tokens": 101695696} +{"current_steps": 83835, "total_steps": 89790, "loss": 0.4596, "lr": 6.671707480022521e-07, "epoch": 9.33678583361176, "percentage": 93.37, "elapsed_time": "6:34:09", "remaining_time": "0:27:59", "throughput": 4300.4, "total_tokens": 101701776} +{"current_steps": 83840, "total_steps": 89790, "loss": 0.4575, "lr": 6.66056050975411e-07, "epoch": 9.337342688495378, "percentage": 93.37, "elapsed_time": "6:34:10", "remaining_time": "0:27:58", "throughput": 4300.43, "total_tokens": 101708240} +{"current_steps": 83845, "total_steps": 89790, "loss": 0.4497, "lr": 6.649422733629507e-07, "epoch": 9.337899543378995, "percentage": 93.38, "elapsed_time": "6:34:12", "remaining_time": "0:27:57", "throughput": 4300.45, "total_tokens": 101714320} +{"current_steps": 83850, "total_steps": 89790, "loss": 0.4474, "lr": 6.638294152069597e-07, "epoch": 9.338456398262613, "percentage": 93.38, "elapsed_time": "6:34:13", "remaining_time": "0:27:55", "throughput": 4300.48, "total_tokens": 101720528} +{"current_steps": 83855, "total_steps": 89790, "loss": 0.462, "lr": 6.62717476549482e-07, "epoch": 9.33901325314623, "percentage": 93.39, "elapsed_time": "6:34:14", "remaining_time": "0:27:54", "throughput": 4300.5, "total_tokens": 101726576} +{"current_steps": 83860, "total_steps": 89790, "loss": 0.4622, "lr": 6.616064574325315e-07, "epoch": 9.339570108029847, "percentage": 93.4, "elapsed_time": "6:34:15", "remaining_time": "0:27:52", "throughput": 4300.52, "total_tokens": 101732400} +{"current_steps": 83865, "total_steps": 89790, "loss": 0.4675, "lr": 6.604963578980828e-07, "epoch": 9.340126962913464, "percentage": 93.4, "elapsed_time": "6:34:17", "remaining_time": "0:27:51", "throughput": 4300.54, "total_tokens": 101738672} +{"current_steps": 83870, "total_steps": 89790, "loss": 0.4537, "lr": 6.593871779880828e-07, "epoch": 9.340683817797082, "percentage": 93.41, "elapsed_time": "6:34:18", "remaining_time": "0:27:49", "throughput": 4300.57, "total_tokens": 101745232} +{"current_steps": 83875, "total_steps": 89790, "loss": 0.4746, "lr": 6.582789177444399e-07, "epoch": 9.3412406726807, "percentage": 93.41, "elapsed_time": "6:34:19", "remaining_time": "0:27:48", "throughput": 4300.6, "total_tokens": 101751216} +{"current_steps": 83880, "total_steps": 89790, "loss": 0.4633, "lr": 6.571715772090231e-07, "epoch": 9.341797527564317, "percentage": 93.42, "elapsed_time": "6:34:21", "remaining_time": "0:27:47", "throughput": 4300.62, "total_tokens": 101757200} +{"current_steps": 83885, "total_steps": 89790, "loss": 0.4753, "lr": 6.560651564236797e-07, "epoch": 9.342354382447935, "percentage": 93.42, "elapsed_time": "6:34:22", "remaining_time": "0:27:45", "throughput": 4300.64, "total_tokens": 101763312} +{"current_steps": 83890, "total_steps": 89790, "loss": 0.4625, "lr": 6.54959655430204e-07, "epoch": 9.34291123733155, "percentage": 93.43, "elapsed_time": "6:34:23", "remaining_time": "0:27:44", "throughput": 4300.66, "total_tokens": 101769456} +{"current_steps": 83895, "total_steps": 89790, "loss": 0.4688, "lr": 6.538550742703709e-07, "epoch": 9.343468092215168, "percentage": 93.43, "elapsed_time": "6:34:24", "remaining_time": "0:27:42", "throughput": 4300.69, "total_tokens": 101775568} +{"current_steps": 83900, "total_steps": 89790, "loss": 0.4664, "lr": 6.527514129859136e-07, "epoch": 9.344024947098786, "percentage": 93.44, "elapsed_time": "6:34:26", "remaining_time": "0:27:41", "throughput": 4300.71, "total_tokens": 101782000} +{"current_steps": 83905, "total_steps": 89790, "loss": 0.4552, "lr": 6.516486716185349e-07, "epoch": 9.344581801982404, "percentage": 93.45, "elapsed_time": "6:34:27", "remaining_time": "0:27:40", "throughput": 4300.74, "total_tokens": 101788272} +{"current_steps": 83910, "total_steps": 89790, "loss": 0.4564, "lr": 6.50546850209896e-07, "epoch": 9.345138656866022, "percentage": 93.45, "elapsed_time": "6:34:28", "remaining_time": "0:27:38", "throughput": 4300.76, "total_tokens": 101794256} +{"current_steps": 83915, "total_steps": 89790, "loss": 0.4521, "lr": 6.494459488016274e-07, "epoch": 9.345695511749637, "percentage": 93.46, "elapsed_time": "6:34:30", "remaining_time": "0:27:37", "throughput": 4300.78, "total_tokens": 101800464} +{"current_steps": 83920, "total_steps": 89790, "loss": 0.4702, "lr": 6.483459674353293e-07, "epoch": 9.346252366633255, "percentage": 93.46, "elapsed_time": "6:34:31", "remaining_time": "0:27:35", "throughput": 4300.81, "total_tokens": 101806160} +{"current_steps": 83925, "total_steps": 89790, "loss": 0.4564, "lr": 6.472469061525571e-07, "epoch": 9.346809221516873, "percentage": 93.47, "elapsed_time": "6:34:32", "remaining_time": "0:27:34", "throughput": 4300.83, "total_tokens": 101811760} +{"current_steps": 83930, "total_steps": 89790, "loss": 0.4531, "lr": 6.461487649948389e-07, "epoch": 9.34736607640049, "percentage": 93.47, "elapsed_time": "6:34:33", "remaining_time": "0:27:32", "throughput": 4300.85, "total_tokens": 101818000} +{"current_steps": 83935, "total_steps": 89790, "loss": 0.4475, "lr": 6.450515440036692e-07, "epoch": 9.347922931284108, "percentage": 93.48, "elapsed_time": "6:34:35", "remaining_time": "0:27:31", "throughput": 4300.88, "total_tokens": 101824368} +{"current_steps": 83940, "total_steps": 89790, "loss": 0.4572, "lr": 6.439552432204982e-07, "epoch": 9.348479786167724, "percentage": 93.48, "elapsed_time": "6:34:36", "remaining_time": "0:27:30", "throughput": 4300.9, "total_tokens": 101830416} +{"current_steps": 83945, "total_steps": 89790, "loss": 0.484, "lr": 6.42859862686751e-07, "epoch": 9.349036641051342, "percentage": 93.49, "elapsed_time": "6:34:37", "remaining_time": "0:27:28", "throughput": 4300.92, "total_tokens": 101836560} +{"current_steps": 83950, "total_steps": 89790, "loss": 0.4455, "lr": 6.417654024438141e-07, "epoch": 9.34959349593496, "percentage": 93.5, "elapsed_time": "6:34:39", "remaining_time": "0:27:27", "throughput": 4300.95, "total_tokens": 101842800} +{"current_steps": 83955, "total_steps": 89790, "loss": 0.4582, "lr": 6.406718625330432e-07, "epoch": 9.350150350818577, "percentage": 93.5, "elapsed_time": "6:34:40", "remaining_time": "0:27:25", "throughput": 4300.97, "total_tokens": 101848720} +{"current_steps": 83960, "total_steps": 89790, "loss": 0.4557, "lr": 6.395792429957498e-07, "epoch": 9.350707205702195, "percentage": 93.51, "elapsed_time": "6:34:41", "remaining_time": "0:27:24", "throughput": 4300.99, "total_tokens": 101854704} +{"current_steps": 83965, "total_steps": 89790, "loss": 0.4525, "lr": 6.384875438732202e-07, "epoch": 9.35126406058581, "percentage": 93.51, "elapsed_time": "6:34:43", "remaining_time": "0:27:22", "throughput": 4301.01, "total_tokens": 101860784} +{"current_steps": 83970, "total_steps": 89790, "loss": 0.4613, "lr": 6.37396765206702e-07, "epoch": 9.351820915469428, "percentage": 93.52, "elapsed_time": "6:34:44", "remaining_time": "0:27:21", "throughput": 4301.03, "total_tokens": 101866928} +{"current_steps": 83975, "total_steps": 89790, "loss": 0.4469, "lr": 6.363069070374067e-07, "epoch": 9.352377770353046, "percentage": 93.52, "elapsed_time": "6:34:45", "remaining_time": "0:27:20", "throughput": 4301.06, "total_tokens": 101873264} +{"current_steps": 83980, "total_steps": 89790, "loss": 0.4505, "lr": 6.352179694065152e-07, "epoch": 9.352934625236664, "percentage": 93.53, "elapsed_time": "6:34:46", "remaining_time": "0:27:18", "throughput": 4301.08, "total_tokens": 101879056} +{"current_steps": 83985, "total_steps": 89790, "loss": 0.4509, "lr": 6.34129952355167e-07, "epoch": 9.353491480120281, "percentage": 93.53, "elapsed_time": "6:34:48", "remaining_time": "0:27:17", "throughput": 4301.09, "total_tokens": 101884464} +{"current_steps": 83990, "total_steps": 89790, "loss": 0.471, "lr": 6.33042855924476e-07, "epoch": 9.354048335003897, "percentage": 93.54, "elapsed_time": "6:34:49", "remaining_time": "0:27:15", "throughput": 4301.11, "total_tokens": 101890512} +{"current_steps": 83995, "total_steps": 89790, "loss": 0.4686, "lr": 6.319566801555126e-07, "epoch": 9.354605189887515, "percentage": 93.55, "elapsed_time": "6:34:50", "remaining_time": "0:27:14", "throughput": 4301.13, "total_tokens": 101895824} +{"current_steps": 84000, "total_steps": 89790, "loss": 0.4563, "lr": 6.308714250893188e-07, "epoch": 9.355162044771133, "percentage": 93.55, "elapsed_time": "6:34:51", "remaining_time": "0:27:13", "throughput": 4301.15, "total_tokens": 101901680} +{"current_steps": 84005, "total_steps": 89790, "loss": 0.451, "lr": 6.297870907668979e-07, "epoch": 9.35571889965475, "percentage": 93.56, "elapsed_time": "6:34:52", "remaining_time": "0:27:11", "throughput": 4301.18, "total_tokens": 101907728} +{"current_steps": 84010, "total_steps": 89790, "loss": 0.4638, "lr": 6.287036772292143e-07, "epoch": 9.356275754538368, "percentage": 93.56, "elapsed_time": "6:34:54", "remaining_time": "0:27:10", "throughput": 4301.2, "total_tokens": 101913808} +{"current_steps": 84015, "total_steps": 89790, "loss": 0.4611, "lr": 6.276211845172103e-07, "epoch": 9.356832609421984, "percentage": 93.57, "elapsed_time": "6:34:55", "remaining_time": "0:27:08", "throughput": 4301.22, "total_tokens": 101920016} +{"current_steps": 84020, "total_steps": 89790, "loss": 0.469, "lr": 6.265396126717837e-07, "epoch": 9.357389464305601, "percentage": 93.57, "elapsed_time": "6:34:56", "remaining_time": "0:27:07", "throughput": 4301.24, "total_tokens": 101925008} +{"current_steps": 84025, "total_steps": 89790, "loss": 0.4542, "lr": 6.254589617337964e-07, "epoch": 9.35794631918922, "percentage": 93.58, "elapsed_time": "6:34:57", "remaining_time": "0:27:05", "throughput": 4301.26, "total_tokens": 101931152} +{"current_steps": 84030, "total_steps": 89790, "loss": 0.4603, "lr": 6.243792317440849e-07, "epoch": 9.358503174072837, "percentage": 93.59, "elapsed_time": "6:34:59", "remaining_time": "0:27:04", "throughput": 4301.28, "total_tokens": 101937392} +{"current_steps": 84035, "total_steps": 89790, "loss": 0.454, "lr": 6.233004227434391e-07, "epoch": 9.359060028956455, "percentage": 93.59, "elapsed_time": "6:35:00", "remaining_time": "0:27:03", "throughput": 4301.3, "total_tokens": 101943152} +{"current_steps": 84040, "total_steps": 89790, "loss": 0.4625, "lr": 6.222225347726235e-07, "epoch": 9.359616883840072, "percentage": 93.6, "elapsed_time": "6:35:01", "remaining_time": "0:27:01", "throughput": 4301.32, "total_tokens": 101948656} +{"current_steps": 84045, "total_steps": 89790, "loss": 0.4702, "lr": 6.21145567872361e-07, "epoch": 9.360173738723688, "percentage": 93.6, "elapsed_time": "6:35:02", "remaining_time": "0:27:00", "throughput": 4301.35, "total_tokens": 101954768} +{"current_steps": 84050, "total_steps": 89790, "loss": 0.4566, "lr": 6.200695220833469e-07, "epoch": 9.360730593607306, "percentage": 93.61, "elapsed_time": "6:35:04", "remaining_time": "0:26:58", "throughput": 4301.37, "total_tokens": 101960592} +{"current_steps": 84055, "total_steps": 89790, "loss": 0.4591, "lr": 6.189943974462348e-07, "epoch": 9.361287448490923, "percentage": 93.61, "elapsed_time": "6:35:05", "remaining_time": "0:26:57", "throughput": 4301.39, "total_tokens": 101966800} +{"current_steps": 84060, "total_steps": 89790, "loss": 0.4667, "lr": 6.179201940016477e-07, "epoch": 9.361844303374541, "percentage": 93.62, "elapsed_time": "6:35:06", "remaining_time": "0:26:55", "throughput": 4301.41, "total_tokens": 101972752} +{"current_steps": 84065, "total_steps": 89790, "loss": 0.4734, "lr": 6.168469117901727e-07, "epoch": 9.362401158258159, "percentage": 93.62, "elapsed_time": "6:35:08", "remaining_time": "0:26:54", "throughput": 4301.44, "total_tokens": 101978832} +{"current_steps": 84070, "total_steps": 89790, "loss": 0.461, "lr": 6.157745508523577e-07, "epoch": 9.362958013141775, "percentage": 93.63, "elapsed_time": "6:35:09", "remaining_time": "0:26:53", "throughput": 4301.46, "total_tokens": 101985168} +{"current_steps": 84075, "total_steps": 89790, "loss": 0.4645, "lr": 6.147031112287261e-07, "epoch": 9.363514868025392, "percentage": 93.64, "elapsed_time": "6:35:10", "remaining_time": "0:26:51", "throughput": 4301.49, "total_tokens": 101991504} +{"current_steps": 84080, "total_steps": 89790, "loss": 0.4571, "lr": 6.136325929597564e-07, "epoch": 9.36407172290901, "percentage": 93.64, "elapsed_time": "6:35:12", "remaining_time": "0:26:50", "throughput": 4301.51, "total_tokens": 101997424} +{"current_steps": 84085, "total_steps": 89790, "loss": 0.4723, "lr": 6.12562996085897e-07, "epoch": 9.364628577792628, "percentage": 93.65, "elapsed_time": "6:35:13", "remaining_time": "0:26:48", "throughput": 4301.53, "total_tokens": 102003440} +{"current_steps": 84090, "total_steps": 89790, "loss": 0.4656, "lr": 6.114943206475626e-07, "epoch": 9.365185432676245, "percentage": 93.65, "elapsed_time": "6:35:14", "remaining_time": "0:26:47", "throughput": 4301.55, "total_tokens": 102009616} +{"current_steps": 84095, "total_steps": 89790, "loss": 0.4621, "lr": 6.104265666851294e-07, "epoch": 9.365742287559861, "percentage": 93.66, "elapsed_time": "6:35:15", "remaining_time": "0:26:46", "throughput": 4301.58, "total_tokens": 102015600} +{"current_steps": 84100, "total_steps": 89790, "loss": 0.4631, "lr": 6.093597342389401e-07, "epoch": 9.366299142443479, "percentage": 93.66, "elapsed_time": "6:35:17", "remaining_time": "0:26:44", "throughput": 4301.6, "total_tokens": 102021680} +{"current_steps": 84105, "total_steps": 89790, "loss": 0.4743, "lr": 6.082938233493041e-07, "epoch": 9.366855997327097, "percentage": 93.67, "elapsed_time": "6:35:18", "remaining_time": "0:26:43", "throughput": 4301.62, "total_tokens": 102027504} +{"current_steps": 84110, "total_steps": 89790, "loss": 0.4724, "lr": 6.072288340564919e-07, "epoch": 9.367412852210714, "percentage": 93.67, "elapsed_time": "6:35:19", "remaining_time": "0:26:41", "throughput": 4301.64, "total_tokens": 102033520} +{"current_steps": 84115, "total_steps": 89790, "loss": 0.4625, "lr": 6.061647664007492e-07, "epoch": 9.367969707094332, "percentage": 93.68, "elapsed_time": "6:35:21", "remaining_time": "0:26:40", "throughput": 4301.66, "total_tokens": 102039792} +{"current_steps": 84120, "total_steps": 89790, "loss": 0.4552, "lr": 6.051016204222714e-07, "epoch": 9.368526561977948, "percentage": 93.69, "elapsed_time": "6:35:22", "remaining_time": "0:26:38", "throughput": 4301.69, "total_tokens": 102045904} +{"current_steps": 84125, "total_steps": 89790, "loss": 0.4612, "lr": 6.040393961612351e-07, "epoch": 9.369083416861566, "percentage": 93.69, "elapsed_time": "6:35:23", "remaining_time": "0:26:37", "throughput": 4301.71, "total_tokens": 102052048} +{"current_steps": 84130, "total_steps": 89790, "loss": 0.4652, "lr": 6.029780936577689e-07, "epoch": 9.369640271745183, "percentage": 93.7, "elapsed_time": "6:35:24", "remaining_time": "0:26:36", "throughput": 4301.73, "total_tokens": 102057936} +{"current_steps": 84135, "total_steps": 89790, "loss": 0.4585, "lr": 6.019177129519743e-07, "epoch": 9.3701971266288, "percentage": 93.7, "elapsed_time": "6:35:26", "remaining_time": "0:26:34", "throughput": 4301.75, "total_tokens": 102064016} +{"current_steps": 84140, "total_steps": 89790, "loss": 0.456, "lr": 6.008582540839164e-07, "epoch": 9.370753981512419, "percentage": 93.71, "elapsed_time": "6:35:27", "remaining_time": "0:26:33", "throughput": 4301.78, "total_tokens": 102070448} +{"current_steps": 84145, "total_steps": 89790, "loss": 0.4702, "lr": 5.997997170936242e-07, "epoch": 9.371310836396034, "percentage": 93.71, "elapsed_time": "6:35:28", "remaining_time": "0:26:31", "throughput": 4301.8, "total_tokens": 102076656} +{"current_steps": 84150, "total_steps": 89790, "loss": 0.4647, "lr": 5.987421020210937e-07, "epoch": 9.371867691279652, "percentage": 93.72, "elapsed_time": "6:35:30", "remaining_time": "0:26:30", "throughput": 4301.83, "total_tokens": 102082736} +{"current_steps": 84155, "total_steps": 89790, "loss": 0.4669, "lr": 5.976854089062844e-07, "epoch": 9.37242454616327, "percentage": 93.72, "elapsed_time": "6:35:31", "remaining_time": "0:26:29", "throughput": 4301.85, "total_tokens": 102089040} +{"current_steps": 84160, "total_steps": 89790, "loss": 0.4701, "lr": 5.966296377891229e-07, "epoch": 9.372981401046887, "percentage": 93.73, "elapsed_time": "6:35:32", "remaining_time": "0:26:27", "throughput": 4301.87, "total_tokens": 102095152} +{"current_steps": 84165, "total_steps": 89790, "loss": 0.4557, "lr": 5.955747887094937e-07, "epoch": 9.373538255930505, "percentage": 93.74, "elapsed_time": "6:35:33", "remaining_time": "0:26:26", "throughput": 4301.89, "total_tokens": 102101104} +{"current_steps": 84170, "total_steps": 89790, "loss": 0.4555, "lr": 5.945208617072623e-07, "epoch": 9.374095110814121, "percentage": 93.74, "elapsed_time": "6:35:35", "remaining_time": "0:26:24", "throughput": 4301.92, "total_tokens": 102107120} +{"current_steps": 84175, "total_steps": 89790, "loss": 0.4607, "lr": 5.934678568222385e-07, "epoch": 9.374651965697739, "percentage": 93.75, "elapsed_time": "6:35:36", "remaining_time": "0:26:23", "throughput": 4301.94, "total_tokens": 102113232} +{"current_steps": 84180, "total_steps": 89790, "loss": 0.4631, "lr": 5.924157740942155e-07, "epoch": 9.375208820581356, "percentage": 93.75, "elapsed_time": "6:35:37", "remaining_time": "0:26:21", "throughput": 4301.96, "total_tokens": 102119056} +{"current_steps": 84185, "total_steps": 89790, "loss": 0.4625, "lr": 5.913646135629447e-07, "epoch": 9.375765675464974, "percentage": 93.76, "elapsed_time": "6:35:39", "remaining_time": "0:26:20", "throughput": 4301.98, "total_tokens": 102125008} +{"current_steps": 84190, "total_steps": 89790, "loss": 0.453, "lr": 5.903143752681389e-07, "epoch": 9.376322530348592, "percentage": 93.76, "elapsed_time": "6:35:40", "remaining_time": "0:26:19", "throughput": 4302.0, "total_tokens": 102131216} +{"current_steps": 84195, "total_steps": 89790, "loss": 0.4576, "lr": 5.892650592494803e-07, "epoch": 9.376879385232208, "percentage": 93.77, "elapsed_time": "6:35:41", "remaining_time": "0:26:17", "throughput": 4302.02, "total_tokens": 102137456} +{"current_steps": 84200, "total_steps": 89790, "loss": 0.4441, "lr": 5.882166655466149e-07, "epoch": 9.377436240115825, "percentage": 93.77, "elapsed_time": "6:35:42", "remaining_time": "0:26:16", "throughput": 4302.04, "total_tokens": 102143088} +{"current_steps": 84205, "total_steps": 89790, "loss": 0.4492, "lr": 5.871691941991553e-07, "epoch": 9.377993094999443, "percentage": 93.78, "elapsed_time": "6:35:44", "remaining_time": "0:26:14", "throughput": 4302.06, "total_tokens": 102149008} +{"current_steps": 84210, "total_steps": 89790, "loss": 0.4647, "lr": 5.861226452466812e-07, "epoch": 9.37854994988306, "percentage": 93.79, "elapsed_time": "6:35:45", "remaining_time": "0:26:13", "throughput": 4302.09, "total_tokens": 102155088} +{"current_steps": 84215, "total_steps": 89790, "loss": 0.4654, "lr": 5.850770187287303e-07, "epoch": 9.379106804766678, "percentage": 93.79, "elapsed_time": "6:35:46", "remaining_time": "0:26:12", "throughput": 4302.11, "total_tokens": 102161264} +{"current_steps": 84220, "total_steps": 89790, "loss": 0.453, "lr": 5.840323146848098e-07, "epoch": 9.379663659650294, "percentage": 93.8, "elapsed_time": "6:35:48", "remaining_time": "0:26:10", "throughput": 4302.13, "total_tokens": 102167504} +{"current_steps": 84225, "total_steps": 89790, "loss": 0.4668, "lr": 5.829885331543939e-07, "epoch": 9.380220514533912, "percentage": 93.8, "elapsed_time": "6:35:49", "remaining_time": "0:26:09", "throughput": 4302.16, "total_tokens": 102173808} +{"current_steps": 84230, "total_steps": 89790, "loss": 0.4679, "lr": 5.819456741769203e-07, "epoch": 9.38077736941753, "percentage": 93.81, "elapsed_time": "6:35:50", "remaining_time": "0:26:07", "throughput": 4302.18, "total_tokens": 102179952} +{"current_steps": 84235, "total_steps": 89790, "loss": 0.4631, "lr": 5.809037377917909e-07, "epoch": 9.381334224301147, "percentage": 93.81, "elapsed_time": "6:35:51", "remaining_time": "0:26:06", "throughput": 4302.2, "total_tokens": 102185296} +{"current_steps": 84240, "total_steps": 89790, "loss": 0.4689, "lr": 5.798627240383686e-07, "epoch": 9.381891079184765, "percentage": 93.82, "elapsed_time": "6:35:53", "remaining_time": "0:26:04", "throughput": 4302.22, "total_tokens": 102191568} +{"current_steps": 84245, "total_steps": 89790, "loss": 0.4705, "lr": 5.788226329559971e-07, "epoch": 9.382447934068383, "percentage": 93.82, "elapsed_time": "6:35:54", "remaining_time": "0:26:03", "throughput": 4302.25, "total_tokens": 102197648} +{"current_steps": 84250, "total_steps": 89790, "loss": 0.4745, "lr": 5.777834645839641e-07, "epoch": 9.383004788951999, "percentage": 93.83, "elapsed_time": "6:35:55", "remaining_time": "0:26:02", "throughput": 4302.27, "total_tokens": 102203696} +{"current_steps": 84255, "total_steps": 89790, "loss": 0.4652, "lr": 5.767452189615385e-07, "epoch": 9.383561643835616, "percentage": 93.84, "elapsed_time": "6:35:57", "remaining_time": "0:26:00", "throughput": 4302.29, "total_tokens": 102209904} +{"current_steps": 84260, "total_steps": 89790, "loss": 0.4346, "lr": 5.757078961279444e-07, "epoch": 9.384118498719234, "percentage": 93.84, "elapsed_time": "6:35:58", "remaining_time": "0:25:59", "throughput": 4302.31, "total_tokens": 102216240} +{"current_steps": 84265, "total_steps": 89790, "loss": 0.4523, "lr": 5.746714961223809e-07, "epoch": 9.384675353602852, "percentage": 93.85, "elapsed_time": "6:35:59", "remaining_time": "0:25:57", "throughput": 4302.34, "total_tokens": 102222384} +{"current_steps": 84270, "total_steps": 89790, "loss": 0.4573, "lr": 5.736360189840001e-07, "epoch": 9.38523220848647, "percentage": 93.85, "elapsed_time": "6:36:01", "remaining_time": "0:25:56", "throughput": 4302.36, "total_tokens": 102228496} +{"current_steps": 84275, "total_steps": 89790, "loss": 0.4608, "lr": 5.72601464751929e-07, "epoch": 9.385789063370085, "percentage": 93.86, "elapsed_time": "6:36:02", "remaining_time": "0:25:55", "throughput": 4302.38, "total_tokens": 102234576} +{"current_steps": 84280, "total_steps": 89790, "loss": 0.4612, "lr": 5.715678334652585e-07, "epoch": 9.386345918253703, "percentage": 93.86, "elapsed_time": "6:36:03", "remaining_time": "0:25:53", "throughput": 4302.41, "total_tokens": 102240624} +{"current_steps": 84285, "total_steps": 89790, "loss": 0.4623, "lr": 5.705351251630381e-07, "epoch": 9.38690277313732, "percentage": 93.87, "elapsed_time": "6:36:04", "remaining_time": "0:25:52", "throughput": 4302.43, "total_tokens": 102246928} +{"current_steps": 84290, "total_steps": 89790, "loss": 0.4638, "lr": 5.695033398842892e-07, "epoch": 9.387459628020938, "percentage": 93.87, "elapsed_time": "6:36:06", "remaining_time": "0:25:50", "throughput": 4302.45, "total_tokens": 102253232} +{"current_steps": 84295, "total_steps": 89790, "loss": 0.4523, "lr": 5.684724776679945e-07, "epoch": 9.388016482904556, "percentage": 93.88, "elapsed_time": "6:36:07", "remaining_time": "0:25:49", "throughput": 4302.48, "total_tokens": 102259344} +{"current_steps": 84300, "total_steps": 89790, "loss": 0.4584, "lr": 5.674425385531035e-07, "epoch": 9.388573337788172, "percentage": 93.89, "elapsed_time": "6:36:08", "remaining_time": "0:25:47", "throughput": 4302.5, "total_tokens": 102265552} +{"current_steps": 84305, "total_steps": 89790, "loss": 0.462, "lr": 5.66413522578535e-07, "epoch": 9.38913019267179, "percentage": 93.89, "elapsed_time": "6:36:10", "remaining_time": "0:25:46", "throughput": 4302.53, "total_tokens": 102271728} +{"current_steps": 84310, "total_steps": 89790, "loss": 0.4561, "lr": 5.653854297831606e-07, "epoch": 9.389687047555407, "percentage": 93.9, "elapsed_time": "6:36:11", "remaining_time": "0:25:45", "throughput": 4302.55, "total_tokens": 102277744} +{"current_steps": 84315, "total_steps": 89790, "loss": 0.4765, "lr": 5.643582602058329e-07, "epoch": 9.390243902439025, "percentage": 93.9, "elapsed_time": "6:36:12", "remaining_time": "0:25:43", "throughput": 4302.58, "total_tokens": 102284112} +{"current_steps": 84320, "total_steps": 89790, "loss": 0.4604, "lr": 5.633320138853537e-07, "epoch": 9.390800757322642, "percentage": 93.91, "elapsed_time": "6:36:14", "remaining_time": "0:25:42", "throughput": 4302.6, "total_tokens": 102290320} +{"current_steps": 84325, "total_steps": 89790, "loss": 0.4693, "lr": 5.623066908605063e-07, "epoch": 9.391357612206258, "percentage": 93.91, "elapsed_time": "6:36:15", "remaining_time": "0:25:40", "throughput": 4302.62, "total_tokens": 102296112} +{"current_steps": 84330, "total_steps": 89790, "loss": 0.4444, "lr": 5.61282291170026e-07, "epoch": 9.391914467089876, "percentage": 93.92, "elapsed_time": "6:36:16", "remaining_time": "0:25:39", "throughput": 4302.64, "total_tokens": 102302384} +{"current_steps": 84335, "total_steps": 89790, "loss": 0.4568, "lr": 5.602588148526156e-07, "epoch": 9.392471321973494, "percentage": 93.92, "elapsed_time": "6:36:17", "remaining_time": "0:25:38", "throughput": 4302.67, "total_tokens": 102308432} +{"current_steps": 84340, "total_steps": 89790, "loss": 0.4558, "lr": 5.592362619469521e-07, "epoch": 9.393028176857111, "percentage": 93.93, "elapsed_time": "6:36:19", "remaining_time": "0:25:36", "throughput": 4302.69, "total_tokens": 102314480} +{"current_steps": 84345, "total_steps": 89790, "loss": 0.4575, "lr": 5.582146324916632e-07, "epoch": 9.393585031740729, "percentage": 93.94, "elapsed_time": "6:36:20", "remaining_time": "0:25:35", "throughput": 4302.71, "total_tokens": 102320304} +{"current_steps": 84350, "total_steps": 89790, "loss": 0.4564, "lr": 5.571939265253568e-07, "epoch": 9.394141886624345, "percentage": 93.94, "elapsed_time": "6:36:21", "remaining_time": "0:25:33", "throughput": 4302.73, "total_tokens": 102326384} +{"current_steps": 84355, "total_steps": 89790, "loss": 0.4662, "lr": 5.561741440865909e-07, "epoch": 9.394698741507963, "percentage": 93.95, "elapsed_time": "6:36:23", "remaining_time": "0:25:32", "throughput": 4302.76, "total_tokens": 102332464} +{"current_steps": 84360, "total_steps": 89790, "loss": 0.4556, "lr": 5.551552852139042e-07, "epoch": 9.39525559639158, "percentage": 93.95, "elapsed_time": "6:36:24", "remaining_time": "0:25:30", "throughput": 4302.78, "total_tokens": 102338832} +{"current_steps": 84365, "total_steps": 89790, "loss": 0.4554, "lr": 5.541373499457825e-07, "epoch": 9.395812451275198, "percentage": 93.96, "elapsed_time": "6:36:25", "remaining_time": "0:25:29", "throughput": 4302.81, "total_tokens": 102345200} +{"current_steps": 84370, "total_steps": 89790, "loss": 0.4515, "lr": 5.531203383206951e-07, "epoch": 9.396369306158816, "percentage": 93.96, "elapsed_time": "6:36:27", "remaining_time": "0:25:28", "throughput": 4302.83, "total_tokens": 102351504} +{"current_steps": 84375, "total_steps": 89790, "loss": 0.4618, "lr": 5.521042503770668e-07, "epoch": 9.396926161042432, "percentage": 93.97, "elapsed_time": "6:36:28", "remaining_time": "0:25:26", "throughput": 4302.86, "total_tokens": 102357712} +{"current_steps": 84380, "total_steps": 89790, "loss": 0.4538, "lr": 5.510890861532864e-07, "epoch": 9.39748301592605, "percentage": 93.97, "elapsed_time": "6:36:29", "remaining_time": "0:25:25", "throughput": 4302.88, "total_tokens": 102363600} +{"current_steps": 84385, "total_steps": 89790, "loss": 0.4556, "lr": 5.500748456877092e-07, "epoch": 9.398039870809667, "percentage": 93.98, "elapsed_time": "6:36:30", "remaining_time": "0:25:23", "throughput": 4302.9, "total_tokens": 102370096} +{"current_steps": 84390, "total_steps": 89790, "loss": 0.4578, "lr": 5.490615290186602e-07, "epoch": 9.398596725693285, "percentage": 93.99, "elapsed_time": "6:36:32", "remaining_time": "0:25:22", "throughput": 4302.93, "total_tokens": 102376432} +{"current_steps": 84395, "total_steps": 89790, "loss": 0.4587, "lr": 5.480491361844197e-07, "epoch": 9.399153580576902, "percentage": 93.99, "elapsed_time": "6:36:33", "remaining_time": "0:25:21", "throughput": 4302.95, "total_tokens": 102382480} +{"current_steps": 84400, "total_steps": 89790, "loss": 0.4577, "lr": 5.470376672232463e-07, "epoch": 9.39971043546052, "percentage": 94.0, "elapsed_time": "6:36:34", "remaining_time": "0:25:19", "throughput": 4302.97, "total_tokens": 102388528} +{"current_steps": 84405, "total_steps": 89790, "loss": 0.4698, "lr": 5.46027122173351e-07, "epoch": 9.400267290344136, "percentage": 94.0, "elapsed_time": "6:36:36", "remaining_time": "0:25:18", "throughput": 4302.99, "total_tokens": 102394288} +{"current_steps": 84410, "total_steps": 89790, "loss": 0.4591, "lr": 5.450175010729225e-07, "epoch": 9.400824145227753, "percentage": 94.01, "elapsed_time": "6:36:37", "remaining_time": "0:25:16", "throughput": 4303.02, "total_tokens": 102400400} +{"current_steps": 84415, "total_steps": 89790, "loss": 0.4602, "lr": 5.440088039600999e-07, "epoch": 9.401381000111371, "percentage": 94.01, "elapsed_time": "6:36:38", "remaining_time": "0:25:15", "throughput": 4303.04, "total_tokens": 102406640} +{"current_steps": 84420, "total_steps": 89790, "loss": 0.4607, "lr": 5.430010308729944e-07, "epoch": 9.401937854994989, "percentage": 94.02, "elapsed_time": "6:36:39", "remaining_time": "0:25:13", "throughput": 4303.06, "total_tokens": 102412432} +{"current_steps": 84425, "total_steps": 89790, "loss": 0.4758, "lr": 5.419941818496921e-07, "epoch": 9.402494709878606, "percentage": 94.02, "elapsed_time": "6:36:41", "remaining_time": "0:25:12", "throughput": 4303.08, "total_tokens": 102418512} +{"current_steps": 84430, "total_steps": 89790, "loss": 0.4664, "lr": 5.409882569282238e-07, "epoch": 9.403051564762222, "percentage": 94.03, "elapsed_time": "6:36:42", "remaining_time": "0:25:11", "throughput": 4303.1, "total_tokens": 102424624} +{"current_steps": 84435, "total_steps": 89790, "loss": 0.4557, "lr": 5.399832561466062e-07, "epoch": 9.40360841964584, "percentage": 94.04, "elapsed_time": "6:36:43", "remaining_time": "0:25:09", "throughput": 4303.12, "total_tokens": 102430608} +{"current_steps": 84440, "total_steps": 89790, "loss": 0.4543, "lr": 5.389791795428034e-07, "epoch": 9.404165274529458, "percentage": 94.04, "elapsed_time": "6:36:45", "remaining_time": "0:25:08", "throughput": 4303.15, "total_tokens": 102436560} +{"current_steps": 84445, "total_steps": 89790, "loss": 0.4549, "lr": 5.379760271547574e-07, "epoch": 9.404722129413075, "percentage": 94.05, "elapsed_time": "6:36:46", "remaining_time": "0:25:06", "throughput": 4303.17, "total_tokens": 102442768} +{"current_steps": 84450, "total_steps": 89790, "loss": 0.4524, "lr": 5.369737990203711e-07, "epoch": 9.405278984296693, "percentage": 94.05, "elapsed_time": "6:36:47", "remaining_time": "0:25:05", "throughput": 4303.2, "total_tokens": 102448848} +{"current_steps": 84455, "total_steps": 89790, "loss": 0.4537, "lr": 5.359724951775086e-07, "epoch": 9.405835839180309, "percentage": 94.06, "elapsed_time": "6:36:48", "remaining_time": "0:25:04", "throughput": 4303.22, "total_tokens": 102455184} +{"current_steps": 84460, "total_steps": 89790, "loss": 0.4585, "lr": 5.349721156640037e-07, "epoch": 9.406392694063927, "percentage": 94.06, "elapsed_time": "6:36:50", "remaining_time": "0:25:02", "throughput": 4303.24, "total_tokens": 102461360} +{"current_steps": 84465, "total_steps": 89790, "loss": 0.4649, "lr": 5.339726605176565e-07, "epoch": 9.406949548947544, "percentage": 94.07, "elapsed_time": "6:36:51", "remaining_time": "0:25:01", "throughput": 4303.27, "total_tokens": 102467792} +{"current_steps": 84470, "total_steps": 89790, "loss": 0.4626, "lr": 5.329741297762258e-07, "epoch": 9.407506403831162, "percentage": 94.08, "elapsed_time": "6:36:52", "remaining_time": "0:24:59", "throughput": 4303.29, "total_tokens": 102473968} +{"current_steps": 84475, "total_steps": 89790, "loss": 0.4615, "lr": 5.319765234774399e-07, "epoch": 9.40806325871478, "percentage": 94.08, "elapsed_time": "6:36:54", "remaining_time": "0:24:58", "throughput": 4303.31, "total_tokens": 102479888} +{"current_steps": 84480, "total_steps": 89790, "loss": 0.4658, "lr": 5.309798416589934e-07, "epoch": 9.408620113598396, "percentage": 94.09, "elapsed_time": "6:36:55", "remaining_time": "0:24:56", "throughput": 4303.34, "total_tokens": 102485712} +{"current_steps": 84485, "total_steps": 89790, "loss": 0.4504, "lr": 5.299840843585452e-07, "epoch": 9.409176968482013, "percentage": 94.09, "elapsed_time": "6:36:56", "remaining_time": "0:24:55", "throughput": 4303.36, "total_tokens": 102491280} +{"current_steps": 84490, "total_steps": 89790, "loss": 0.4648, "lr": 5.289892516137152e-07, "epoch": 9.409733823365631, "percentage": 94.1, "elapsed_time": "6:36:57", "remaining_time": "0:24:54", "throughput": 4303.38, "total_tokens": 102497456} +{"current_steps": 84495, "total_steps": 89790, "loss": 0.4673, "lr": 5.279953434620927e-07, "epoch": 9.410290678249249, "percentage": 94.1, "elapsed_time": "6:36:59", "remaining_time": "0:24:52", "throughput": 4303.41, "total_tokens": 102503760} +{"current_steps": 84500, "total_steps": 89790, "loss": 0.4652, "lr": 5.270023599412283e-07, "epoch": 9.410847533132866, "percentage": 94.11, "elapsed_time": "6:37:00", "remaining_time": "0:24:51", "throughput": 4303.44, "total_tokens": 102510064} +{"current_steps": 84505, "total_steps": 89790, "loss": 0.4594, "lr": 5.260103010886447e-07, "epoch": 9.411404388016482, "percentage": 94.11, "elapsed_time": "6:37:01", "remaining_time": "0:24:49", "throughput": 4303.46, "total_tokens": 102516368} +{"current_steps": 84510, "total_steps": 89790, "loss": 0.4594, "lr": 5.25019166941823e-07, "epoch": 9.4119612429001, "percentage": 94.12, "elapsed_time": "6:37:03", "remaining_time": "0:24:48", "throughput": 4303.48, "total_tokens": 102522576} +{"current_steps": 84515, "total_steps": 89790, "loss": 0.4751, "lr": 5.240289575382084e-07, "epoch": 9.412518097783718, "percentage": 94.13, "elapsed_time": "6:37:04", "remaining_time": "0:24:47", "throughput": 4303.51, "total_tokens": 102528848} +{"current_steps": 84520, "total_steps": 89790, "loss": 0.4687, "lr": 5.230396729152209e-07, "epoch": 9.413074952667335, "percentage": 94.13, "elapsed_time": "6:37:05", "remaining_time": "0:24:45", "throughput": 4303.53, "total_tokens": 102534416} +{"current_steps": 84525, "total_steps": 89790, "loss": 0.4809, "lr": 5.220513131102306e-07, "epoch": 9.413631807550953, "percentage": 94.14, "elapsed_time": "6:37:07", "remaining_time": "0:24:44", "throughput": 4303.55, "total_tokens": 102540848} +{"current_steps": 84530, "total_steps": 89790, "loss": 0.4596, "lr": 5.210638781605881e-07, "epoch": 9.414188662434569, "percentage": 94.14, "elapsed_time": "6:37:08", "remaining_time": "0:24:42", "throughput": 4303.58, "total_tokens": 102546992} +{"current_steps": 84535, "total_steps": 89790, "loss": 0.4623, "lr": 5.20077368103597e-07, "epoch": 9.414745517318186, "percentage": 94.15, "elapsed_time": "6:37:09", "remaining_time": "0:24:41", "throughput": 4303.6, "total_tokens": 102553008} +{"current_steps": 84540, "total_steps": 89790, "loss": 0.4545, "lr": 5.190917829765357e-07, "epoch": 9.415302372201804, "percentage": 94.15, "elapsed_time": "6:37:10", "remaining_time": "0:24:39", "throughput": 4303.63, "total_tokens": 102559312} +{"current_steps": 84545, "total_steps": 89790, "loss": 0.4651, "lr": 5.181071228166356e-07, "epoch": 9.415859227085422, "percentage": 94.16, "elapsed_time": "6:37:12", "remaining_time": "0:24:38", "throughput": 4303.65, "total_tokens": 102564816} +{"current_steps": 84550, "total_steps": 89790, "loss": 0.4492, "lr": 5.17123387661106e-07, "epoch": 9.41641608196904, "percentage": 94.16, "elapsed_time": "6:37:13", "remaining_time": "0:24:37", "throughput": 4303.67, "total_tokens": 102570928} +{"current_steps": 84555, "total_steps": 89790, "loss": 0.4675, "lr": 5.161405775471167e-07, "epoch": 9.416972936852655, "percentage": 94.17, "elapsed_time": "6:37:14", "remaining_time": "0:24:35", "throughput": 4303.69, "total_tokens": 102577456} +{"current_steps": 84560, "total_steps": 89790, "loss": 0.4646, "lr": 5.151586925117941e-07, "epoch": 9.417529791736273, "percentage": 94.18, "elapsed_time": "6:37:16", "remaining_time": "0:24:34", "throughput": 4303.71, "total_tokens": 102583568} +{"current_steps": 84565, "total_steps": 89790, "loss": 0.4583, "lr": 5.14177732592247e-07, "epoch": 9.41808664661989, "percentage": 94.18, "elapsed_time": "6:37:17", "remaining_time": "0:24:32", "throughput": 4303.74, "total_tokens": 102590160} +{"current_steps": 84570, "total_steps": 89790, "loss": 0.4558, "lr": 5.131976978255292e-07, "epoch": 9.418643501503508, "percentage": 94.19, "elapsed_time": "6:37:18", "remaining_time": "0:24:31", "throughput": 4303.77, "total_tokens": 102596304} +{"current_steps": 84575, "total_steps": 89790, "loss": 0.4636, "lr": 5.122185882486751e-07, "epoch": 9.419200356387126, "percentage": 94.19, "elapsed_time": "6:37:20", "remaining_time": "0:24:30", "throughput": 4303.79, "total_tokens": 102602544} +{"current_steps": 84580, "total_steps": 89790, "loss": 0.4567, "lr": 5.112404038986801e-07, "epoch": 9.419757211270742, "percentage": 94.2, "elapsed_time": "6:37:21", "remaining_time": "0:24:28", "throughput": 4303.82, "total_tokens": 102608944} +{"current_steps": 84585, "total_steps": 89790, "loss": 0.4584, "lr": 5.102631448124979e-07, "epoch": 9.42031406615436, "percentage": 94.2, "elapsed_time": "6:37:22", "remaining_time": "0:24:27", "throughput": 4303.84, "total_tokens": 102614832} +{"current_steps": 84590, "total_steps": 89790, "loss": 0.4548, "lr": 5.092868110270571e-07, "epoch": 9.420870921037977, "percentage": 94.21, "elapsed_time": "6:37:23", "remaining_time": "0:24:25", "throughput": 4303.86, "total_tokens": 102620976} +{"current_steps": 84595, "total_steps": 89790, "loss": 0.4698, "lr": 5.083114025792423e-07, "epoch": 9.421427775921595, "percentage": 94.21, "elapsed_time": "6:37:25", "remaining_time": "0:24:24", "throughput": 4303.88, "total_tokens": 102626896} +{"current_steps": 84600, "total_steps": 89790, "loss": 0.458, "lr": 5.073369195059158e-07, "epoch": 9.421984630805213, "percentage": 94.22, "elapsed_time": "6:37:26", "remaining_time": "0:24:22", "throughput": 4303.91, "total_tokens": 102633168} +{"current_steps": 84605, "total_steps": 89790, "loss": 0.4538, "lr": 5.063633618438868e-07, "epoch": 9.42254148568883, "percentage": 94.23, "elapsed_time": "6:37:27", "remaining_time": "0:24:21", "throughput": 4303.93, "total_tokens": 102638896} +{"current_steps": 84610, "total_steps": 89790, "loss": 0.4685, "lr": 5.053907296299426e-07, "epoch": 9.423098340572446, "percentage": 94.23, "elapsed_time": "6:37:29", "remaining_time": "0:24:20", "throughput": 4303.95, "total_tokens": 102645040} +{"current_steps": 84615, "total_steps": 89790, "loss": 0.4705, "lr": 5.044190229008372e-07, "epoch": 9.423655195456064, "percentage": 94.24, "elapsed_time": "6:37:30", "remaining_time": "0:24:18", "throughput": 4303.98, "total_tokens": 102650960} +{"current_steps": 84620, "total_steps": 89790, "loss": 0.4591, "lr": 5.034482416932773e-07, "epoch": 9.424212050339682, "percentage": 94.24, "elapsed_time": "6:37:31", "remaining_time": "0:24:17", "throughput": 4304.0, "total_tokens": 102656848} +{"current_steps": 84625, "total_steps": 89790, "loss": 0.4569, "lr": 5.024783860439475e-07, "epoch": 9.4247689052233, "percentage": 94.25, "elapsed_time": "6:37:32", "remaining_time": "0:24:15", "throughput": 4304.02, "total_tokens": 102663280} +{"current_steps": 84630, "total_steps": 89790, "loss": 0.4613, "lr": 5.015094559894906e-07, "epoch": 9.425325760106917, "percentage": 94.25, "elapsed_time": "6:37:34", "remaining_time": "0:24:14", "throughput": 4304.04, "total_tokens": 102669104} +{"current_steps": 84635, "total_steps": 89790, "loss": 0.4492, "lr": 5.005414515665163e-07, "epoch": 9.425882614990533, "percentage": 94.26, "elapsed_time": "6:37:35", "remaining_time": "0:24:12", "throughput": 4304.05, "total_tokens": 102674288} +{"current_steps": 84640, "total_steps": 89790, "loss": 0.458, "lr": 4.995743728115981e-07, "epoch": 9.42643946987415, "percentage": 94.26, "elapsed_time": "6:37:36", "remaining_time": "0:24:11", "throughput": 4304.07, "total_tokens": 102680400} +{"current_steps": 84645, "total_steps": 89790, "loss": 0.4663, "lr": 4.986082197612734e-07, "epoch": 9.426996324757768, "percentage": 94.27, "elapsed_time": "6:37:37", "remaining_time": "0:24:10", "throughput": 4304.09, "total_tokens": 102686320} +{"current_steps": 84650, "total_steps": 89790, "loss": 0.4576, "lr": 4.976429924520521e-07, "epoch": 9.427553179641386, "percentage": 94.28, "elapsed_time": "6:37:39", "remaining_time": "0:24:08", "throughput": 4304.12, "total_tokens": 102692560} +{"current_steps": 84655, "total_steps": 89790, "loss": 0.4472, "lr": 4.966786909203991e-07, "epoch": 9.428110034525004, "percentage": 94.28, "elapsed_time": "6:37:40", "remaining_time": "0:24:07", "throughput": 4304.14, "total_tokens": 102698800} +{"current_steps": 84660, "total_steps": 89790, "loss": 0.4612, "lr": 4.957153152027493e-07, "epoch": 9.42866688940862, "percentage": 94.29, "elapsed_time": "6:37:41", "remaining_time": "0:24:05", "throughput": 4304.16, "total_tokens": 102704720} +{"current_steps": 84665, "total_steps": 89790, "loss": 0.4633, "lr": 4.947528653355016e-07, "epoch": 9.429223744292237, "percentage": 94.29, "elapsed_time": "6:37:43", "remaining_time": "0:24:04", "throughput": 4304.18, "total_tokens": 102710864} +{"current_steps": 84670, "total_steps": 89790, "loss": 0.4677, "lr": 4.937913413550266e-07, "epoch": 9.429780599175855, "percentage": 94.3, "elapsed_time": "6:37:44", "remaining_time": "0:24:03", "throughput": 4304.21, "total_tokens": 102717136} +{"current_steps": 84675, "total_steps": 89790, "loss": 0.4588, "lr": 4.928307432976426e-07, "epoch": 9.430337454059472, "percentage": 94.3, "elapsed_time": "6:37:45", "remaining_time": "0:24:01", "throughput": 4304.22, "total_tokens": 102722672} +{"current_steps": 84680, "total_steps": 89790, "loss": 0.4595, "lr": 4.918710711996511e-07, "epoch": 9.43089430894309, "percentage": 94.31, "elapsed_time": "6:37:46", "remaining_time": "0:24:00", "throughput": 4304.25, "total_tokens": 102728944} +{"current_steps": 84685, "total_steps": 89790, "loss": 0.4686, "lr": 4.909123250973146e-07, "epoch": 9.431451163826706, "percentage": 94.31, "elapsed_time": "6:37:48", "remaining_time": "0:23:58", "throughput": 4304.27, "total_tokens": 102735152} +{"current_steps": 84690, "total_steps": 89790, "loss": 0.4639, "lr": 4.899545050268489e-07, "epoch": 9.432008018710324, "percentage": 94.32, "elapsed_time": "6:37:49", "remaining_time": "0:23:57", "throughput": 4304.3, "total_tokens": 102741808} +{"current_steps": 84695, "total_steps": 89790, "loss": 0.4573, "lr": 4.889976110244526e-07, "epoch": 9.432564873593941, "percentage": 94.33, "elapsed_time": "6:37:50", "remaining_time": "0:23:55", "throughput": 4304.32, "total_tokens": 102747888} +{"current_steps": 84700, "total_steps": 89790, "loss": 0.4533, "lr": 4.880416431262746e-07, "epoch": 9.433121728477559, "percentage": 94.33, "elapsed_time": "6:37:52", "remaining_time": "0:23:54", "throughput": 4304.34, "total_tokens": 102753840} +{"current_steps": 84705, "total_steps": 89790, "loss": 0.4581, "lr": 4.870866013684333e-07, "epoch": 9.433678583361177, "percentage": 94.34, "elapsed_time": "6:37:53", "remaining_time": "0:23:53", "throughput": 4304.37, "total_tokens": 102760240} +{"current_steps": 84710, "total_steps": 89790, "loss": 0.4561, "lr": 4.861324857870192e-07, "epoch": 9.434235438244793, "percentage": 94.34, "elapsed_time": "6:37:54", "remaining_time": "0:23:51", "throughput": 4304.39, "total_tokens": 102766448} +{"current_steps": 84715, "total_steps": 89790, "loss": 0.4556, "lr": 4.851792964180757e-07, "epoch": 9.43479229312841, "percentage": 94.35, "elapsed_time": "6:37:56", "remaining_time": "0:23:50", "throughput": 4304.42, "total_tokens": 102772336} +{"current_steps": 84720, "total_steps": 89790, "loss": 0.4606, "lr": 4.842270332976212e-07, "epoch": 9.435349148012028, "percentage": 94.35, "elapsed_time": "6:37:57", "remaining_time": "0:23:48", "throughput": 4304.44, "total_tokens": 102778640} +{"current_steps": 84725, "total_steps": 89790, "loss": 0.4568, "lr": 4.832756964616326e-07, "epoch": 9.435906002895646, "percentage": 94.36, "elapsed_time": "6:37:58", "remaining_time": "0:23:47", "throughput": 4304.46, "total_tokens": 102784560} +{"current_steps": 84730, "total_steps": 89790, "loss": 0.4577, "lr": 4.823252859460587e-07, "epoch": 9.436462857779263, "percentage": 94.36, "elapsed_time": "6:37:59", "remaining_time": "0:23:46", "throughput": 4304.48, "total_tokens": 102790544} +{"current_steps": 84735, "total_steps": 89790, "loss": 0.4549, "lr": 4.813758017868042e-07, "epoch": 9.43701971266288, "percentage": 94.37, "elapsed_time": "6:38:01", "remaining_time": "0:23:44", "throughput": 4304.5, "total_tokens": 102796112} +{"current_steps": 84740, "total_steps": 89790, "loss": 0.4577, "lr": 4.804272440197461e-07, "epoch": 9.437576567546497, "percentage": 94.38, "elapsed_time": "6:38:02", "remaining_time": "0:23:43", "throughput": 4304.53, "total_tokens": 102802256} +{"current_steps": 84745, "total_steps": 89790, "loss": 0.4633, "lr": 4.79479612680725e-07, "epoch": 9.438133422430115, "percentage": 94.38, "elapsed_time": "6:38:03", "remaining_time": "0:23:41", "throughput": 4304.55, "total_tokens": 102808176} +{"current_steps": 84750, "total_steps": 89790, "loss": 0.4575, "lr": 4.785329078055401e-07, "epoch": 9.438690277313732, "percentage": 94.39, "elapsed_time": "6:38:04", "remaining_time": "0:23:40", "throughput": 4304.57, "total_tokens": 102814416} +{"current_steps": 84755, "total_steps": 89790, "loss": 0.4625, "lr": 4.775871294299683e-07, "epoch": 9.43924713219735, "percentage": 94.39, "elapsed_time": "6:38:06", "remaining_time": "0:23:39", "throughput": 4304.6, "total_tokens": 102820784} +{"current_steps": 84760, "total_steps": 89790, "loss": 0.4679, "lr": 4.7664227758973945e-07, "epoch": 9.439803987080968, "percentage": 94.4, "elapsed_time": "6:38:07", "remaining_time": "0:23:37", "throughput": 4304.62, "total_tokens": 102826768} +{"current_steps": 84765, "total_steps": 89790, "loss": 0.4614, "lr": 4.756983523205555e-07, "epoch": 9.440360841964583, "percentage": 94.4, "elapsed_time": "6:38:08", "remaining_time": "0:23:36", "throughput": 4304.64, "total_tokens": 102832400} +{"current_steps": 84770, "total_steps": 89790, "loss": 0.4507, "lr": 4.7475535365807676e-07, "epoch": 9.440917696848201, "percentage": 94.41, "elapsed_time": "6:38:10", "remaining_time": "0:23:34", "throughput": 4304.66, "total_tokens": 102838416} +{"current_steps": 84775, "total_steps": 89790, "loss": 0.465, "lr": 4.738132816379387e-07, "epoch": 9.441474551731819, "percentage": 94.41, "elapsed_time": "6:38:11", "remaining_time": "0:23:33", "throughput": 4304.68, "total_tokens": 102844368} +{"current_steps": 84780, "total_steps": 89790, "loss": 0.451, "lr": 4.7287213629573223e-07, "epoch": 9.442031406615436, "percentage": 94.42, "elapsed_time": "6:38:12", "remaining_time": "0:23:31", "throughput": 4304.7, "total_tokens": 102850512} +{"current_steps": 84785, "total_steps": 89790, "loss": 0.4551, "lr": 4.7193191766701784e-07, "epoch": 9.442588261499054, "percentage": 94.43, "elapsed_time": "6:38:13", "remaining_time": "0:23:30", "throughput": 4304.72, "total_tokens": 102856464} +{"current_steps": 84790, "total_steps": 89790, "loss": 0.4855, "lr": 4.7099262578731983e-07, "epoch": 9.44314511638267, "percentage": 94.43, "elapsed_time": "6:38:15", "remaining_time": "0:23:29", "throughput": 4304.74, "total_tokens": 102861808} +{"current_steps": 84795, "total_steps": 89790, "loss": 0.4615, "lr": 4.7005426069212375e-07, "epoch": 9.443701971266288, "percentage": 94.44, "elapsed_time": "6:38:16", "remaining_time": "0:23:27", "throughput": 4304.77, "total_tokens": 102868016} +{"current_steps": 84800, "total_steps": 89790, "loss": 0.4627, "lr": 4.6911682241689016e-07, "epoch": 9.444258826149905, "percentage": 94.44, "elapsed_time": "6:38:17", "remaining_time": "0:23:26", "throughput": 4304.79, "total_tokens": 102874096} +{"current_steps": 84805, "total_steps": 89790, "loss": 0.4479, "lr": 4.6818031099703784e-07, "epoch": 9.444815681033523, "percentage": 94.45, "elapsed_time": "6:38:18", "remaining_time": "0:23:24", "throughput": 4304.81, "total_tokens": 102880304} +{"current_steps": 84810, "total_steps": 89790, "loss": 0.4605, "lr": 4.672447264679497e-07, "epoch": 9.44537253591714, "percentage": 94.45, "elapsed_time": "6:38:20", "remaining_time": "0:23:23", "throughput": 4304.84, "total_tokens": 102886320} +{"current_steps": 84815, "total_steps": 89790, "loss": 0.446, "lr": 4.663100688649724e-07, "epoch": 9.445929390800757, "percentage": 94.46, "elapsed_time": "6:38:21", "remaining_time": "0:23:21", "throughput": 4304.86, "total_tokens": 102892368} +{"current_steps": 84820, "total_steps": 89790, "loss": 0.4571, "lr": 4.6537633822342496e-07, "epoch": 9.446486245684374, "percentage": 94.46, "elapsed_time": "6:38:22", "remaining_time": "0:23:20", "throughput": 4304.89, "total_tokens": 102898672} +{"current_steps": 84825, "total_steps": 89790, "loss": 0.4549, "lr": 4.644435345785847e-07, "epoch": 9.447043100567992, "percentage": 94.47, "elapsed_time": "6:38:24", "remaining_time": "0:23:19", "throughput": 4304.91, "total_tokens": 102904656} +{"current_steps": 84830, "total_steps": 89790, "loss": 0.4573, "lr": 4.635116579656956e-07, "epoch": 9.44759995545161, "percentage": 94.48, "elapsed_time": "6:38:25", "remaining_time": "0:23:17", "throughput": 4304.94, "total_tokens": 102910832} +{"current_steps": 84835, "total_steps": 89790, "loss": 0.4561, "lr": 4.6258070841996294e-07, "epoch": 9.448156810335227, "percentage": 94.48, "elapsed_time": "6:38:26", "remaining_time": "0:23:16", "throughput": 4304.96, "total_tokens": 102916976} +{"current_steps": 84840, "total_steps": 89790, "loss": 0.4515, "lr": 4.616506859765696e-07, "epoch": 9.448713665218843, "percentage": 94.49, "elapsed_time": "6:38:27", "remaining_time": "0:23:14", "throughput": 4304.99, "total_tokens": 102923184} +{"current_steps": 84845, "total_steps": 89790, "loss": 0.4616, "lr": 4.6072159067064856e-07, "epoch": 9.449270520102461, "percentage": 94.49, "elapsed_time": "6:38:29", "remaining_time": "0:23:13", "throughput": 4305.01, "total_tokens": 102929072} +{"current_steps": 84850, "total_steps": 89790, "loss": 0.4581, "lr": 4.597934225373052e-07, "epoch": 9.449827374986079, "percentage": 94.5, "elapsed_time": "6:38:30", "remaining_time": "0:23:12", "throughput": 4305.03, "total_tokens": 102935056} +{"current_steps": 84855, "total_steps": 89790, "loss": 0.4567, "lr": 4.588661816116113e-07, "epoch": 9.450384229869696, "percentage": 94.5, "elapsed_time": "6:38:31", "remaining_time": "0:23:10", "throughput": 4305.05, "total_tokens": 102941328} +{"current_steps": 84860, "total_steps": 89790, "loss": 0.4569, "lr": 4.5793986792859733e-07, "epoch": 9.450941084753314, "percentage": 94.51, "elapsed_time": "6:38:33", "remaining_time": "0:23:09", "throughput": 4305.07, "total_tokens": 102947600} +{"current_steps": 84865, "total_steps": 89790, "loss": 0.4559, "lr": 4.5701448152326576e-07, "epoch": 9.45149793963693, "percentage": 94.51, "elapsed_time": "6:38:34", "remaining_time": "0:23:07", "throughput": 4305.09, "total_tokens": 102953904} +{"current_steps": 84870, "total_steps": 89790, "loss": 0.4612, "lr": 4.5609002243057753e-07, "epoch": 9.452054794520548, "percentage": 94.52, "elapsed_time": "6:38:35", "remaining_time": "0:23:06", "throughput": 4305.12, "total_tokens": 102960048} +{"current_steps": 84875, "total_steps": 89790, "loss": 0.4564, "lr": 4.5516649068546305e-07, "epoch": 9.452611649404165, "percentage": 94.53, "elapsed_time": "6:38:37", "remaining_time": "0:23:05", "throughput": 4305.14, "total_tokens": 102966032} +{"current_steps": 84880, "total_steps": 89790, "loss": 0.4696, "lr": 4.542438863228166e-07, "epoch": 9.453168504287783, "percentage": 94.53, "elapsed_time": "6:38:38", "remaining_time": "0:23:03", "throughput": 4305.16, "total_tokens": 102971536} +{"current_steps": 84885, "total_steps": 89790, "loss": 0.4685, "lr": 4.533222093774964e-07, "epoch": 9.4537253591714, "percentage": 94.54, "elapsed_time": "6:38:39", "remaining_time": "0:23:02", "throughput": 4305.18, "total_tokens": 102977648} +{"current_steps": 84890, "total_steps": 89790, "loss": 0.4574, "lr": 4.524014598843274e-07, "epoch": 9.454282214055016, "percentage": 94.54, "elapsed_time": "6:38:40", "remaining_time": "0:23:00", "throughput": 4305.2, "total_tokens": 102983696} +{"current_steps": 84895, "total_steps": 89790, "loss": 0.4528, "lr": 4.514816378780984e-07, "epoch": 9.454839068938634, "percentage": 94.55, "elapsed_time": "6:38:42", "remaining_time": "0:22:59", "throughput": 4305.22, "total_tokens": 102989680} +{"current_steps": 84900, "total_steps": 89790, "loss": 0.4649, "lr": 4.505627433935622e-07, "epoch": 9.455395923822252, "percentage": 94.55, "elapsed_time": "6:38:43", "remaining_time": "0:22:57", "throughput": 4305.25, "total_tokens": 102995696} +{"current_steps": 84905, "total_steps": 89790, "loss": 0.4724, "lr": 4.496447764654382e-07, "epoch": 9.45595277870587, "percentage": 94.56, "elapsed_time": "6:38:44", "remaining_time": "0:22:56", "throughput": 4305.27, "total_tokens": 103001744} +{"current_steps": 84910, "total_steps": 89790, "loss": 0.4595, "lr": 4.487277371284099e-07, "epoch": 9.456509633589487, "percentage": 94.57, "elapsed_time": "6:38:45", "remaining_time": "0:22:55", "throughput": 4305.29, "total_tokens": 103007760} +{"current_steps": 84915, "total_steps": 89790, "loss": 0.4691, "lr": 4.478116254171244e-07, "epoch": 9.457066488473103, "percentage": 94.57, "elapsed_time": "6:38:47", "remaining_time": "0:22:53", "throughput": 4305.31, "total_tokens": 103013840} +{"current_steps": 84920, "total_steps": 89790, "loss": 0.4526, "lr": 4.4689644136619857e-07, "epoch": 9.45762334335672, "percentage": 94.58, "elapsed_time": "6:38:48", "remaining_time": "0:22:52", "throughput": 4305.34, "total_tokens": 103020048} +{"current_steps": 84925, "total_steps": 89790, "loss": 0.4641, "lr": 4.4598218501021025e-07, "epoch": 9.458180198240338, "percentage": 94.58, "elapsed_time": "6:38:49", "remaining_time": "0:22:50", "throughput": 4305.36, "total_tokens": 103026096} +{"current_steps": 84930, "total_steps": 89790, "loss": 0.4575, "lr": 4.4506885638370135e-07, "epoch": 9.458737053123956, "percentage": 94.59, "elapsed_time": "6:38:50", "remaining_time": "0:22:49", "throughput": 4305.38, "total_tokens": 103031760} +{"current_steps": 84935, "total_steps": 89790, "loss": 0.454, "lr": 4.44156455521183e-07, "epoch": 9.459293908007574, "percentage": 94.59, "elapsed_time": "6:38:52", "remaining_time": "0:22:48", "throughput": 4305.4, "total_tokens": 103037968} +{"current_steps": 84940, "total_steps": 89790, "loss": 0.4498, "lr": 4.43244982457125e-07, "epoch": 9.45985076289119, "percentage": 94.6, "elapsed_time": "6:38:53", "remaining_time": "0:22:46", "throughput": 4305.43, "total_tokens": 103044336} +{"current_steps": 84945, "total_steps": 89790, "loss": 0.4599, "lr": 4.4233443722596914e-07, "epoch": 9.460407617774807, "percentage": 94.6, "elapsed_time": "6:38:54", "remaining_time": "0:22:45", "throughput": 4305.45, "total_tokens": 103050800} +{"current_steps": 84950, "total_steps": 89790, "loss": 0.4556, "lr": 4.4142481986211294e-07, "epoch": 9.460964472658425, "percentage": 94.61, "elapsed_time": "6:38:56", "remaining_time": "0:22:43", "throughput": 4305.47, "total_tokens": 103056944} +{"current_steps": 84955, "total_steps": 89790, "loss": 0.453, "lr": 4.4051613039993166e-07, "epoch": 9.461521327542043, "percentage": 94.62, "elapsed_time": "6:38:57", "remaining_time": "0:22:42", "throughput": 4305.49, "total_tokens": 103062800} +{"current_steps": 84960, "total_steps": 89790, "loss": 0.4594, "lr": 4.396083688737562e-07, "epoch": 9.46207818242566, "percentage": 94.62, "elapsed_time": "6:38:58", "remaining_time": "0:22:40", "throughput": 4305.51, "total_tokens": 103068272} +{"current_steps": 84965, "total_steps": 89790, "loss": 0.468, "lr": 4.3870153531788415e-07, "epoch": 9.462635037309278, "percentage": 94.63, "elapsed_time": "6:38:59", "remaining_time": "0:22:39", "throughput": 4305.53, "total_tokens": 103074224} +{"current_steps": 84970, "total_steps": 89790, "loss": 0.4555, "lr": 4.3779562976657974e-07, "epoch": 9.463191892192894, "percentage": 94.63, "elapsed_time": "6:39:01", "remaining_time": "0:22:38", "throughput": 4305.56, "total_tokens": 103080432} +{"current_steps": 84975, "total_steps": 89790, "loss": 0.4476, "lr": 4.3689065225406555e-07, "epoch": 9.463748747076512, "percentage": 94.64, "elapsed_time": "6:39:02", "remaining_time": "0:22:36", "throughput": 4305.58, "total_tokens": 103086768} +{"current_steps": 84980, "total_steps": 89790, "loss": 0.4575, "lr": 4.3598660281454207e-07, "epoch": 9.46430560196013, "percentage": 94.64, "elapsed_time": "6:39:03", "remaining_time": "0:22:35", "throughput": 4305.61, "total_tokens": 103093008} +{"current_steps": 84985, "total_steps": 89790, "loss": 0.45, "lr": 4.350834814821653e-07, "epoch": 9.464862456843747, "percentage": 94.65, "elapsed_time": "6:39:05", "remaining_time": "0:22:33", "throughput": 4305.63, "total_tokens": 103099088} +{"current_steps": 84990, "total_steps": 89790, "loss": 0.4635, "lr": 4.3418128829105233e-07, "epoch": 9.465419311727365, "percentage": 94.65, "elapsed_time": "6:39:06", "remaining_time": "0:22:32", "throughput": 4305.65, "total_tokens": 103105136} +{"current_steps": 84995, "total_steps": 89790, "loss": 0.4523, "lr": 4.332800232753009e-07, "epoch": 9.46597616661098, "percentage": 94.66, "elapsed_time": "6:39:07", "remaining_time": "0:22:31", "throughput": 4305.67, "total_tokens": 103110800} +{"current_steps": 85000, "total_steps": 89790, "loss": 0.463, "lr": 4.323796864689533e-07, "epoch": 9.466533021494598, "percentage": 94.67, "elapsed_time": "6:39:08", "remaining_time": "0:22:29", "throughput": 4305.7, "total_tokens": 103117040} +{"current_steps": 85005, "total_steps": 89790, "loss": 0.4528, "lr": 4.314802779060351e-07, "epoch": 9.467089876378216, "percentage": 94.67, "elapsed_time": "6:39:10", "remaining_time": "0:22:28", "throughput": 4305.73, "total_tokens": 103123440} +{"current_steps": 85010, "total_steps": 89790, "loss": 0.4571, "lr": 4.305817976205245e-07, "epoch": 9.467646731261834, "percentage": 94.68, "elapsed_time": "6:39:11", "remaining_time": "0:22:26", "throughput": 4305.75, "total_tokens": 103129552} +{"current_steps": 85015, "total_steps": 89790, "loss": 0.4563, "lr": 4.296842456463668e-07, "epoch": 9.468203586145451, "percentage": 94.68, "elapsed_time": "6:39:12", "remaining_time": "0:22:25", "throughput": 4305.78, "total_tokens": 103135824} +{"current_steps": 85020, "total_steps": 89790, "loss": 0.4791, "lr": 4.287876220174819e-07, "epoch": 9.468760441029067, "percentage": 94.69, "elapsed_time": "6:39:14", "remaining_time": "0:22:23", "throughput": 4305.8, "total_tokens": 103142032} +{"current_steps": 85025, "total_steps": 89790, "loss": 0.4658, "lr": 4.2789192676774283e-07, "epoch": 9.469317295912685, "percentage": 94.69, "elapsed_time": "6:39:15", "remaining_time": "0:22:22", "throughput": 4305.82, "total_tokens": 103148272} +{"current_steps": 85030, "total_steps": 89790, "loss": 0.4646, "lr": 4.269971599309919e-07, "epoch": 9.469874150796302, "percentage": 94.7, "elapsed_time": "6:39:16", "remaining_time": "0:22:21", "throughput": 4305.85, "total_tokens": 103154480} +{"current_steps": 85035, "total_steps": 89790, "loss": 0.4681, "lr": 4.261033215410354e-07, "epoch": 9.47043100567992, "percentage": 94.7, "elapsed_time": "6:39:17", "remaining_time": "0:22:19", "throughput": 4305.86, "total_tokens": 103159600} +{"current_steps": 85040, "total_steps": 89790, "loss": 0.4558, "lr": 4.2521041163164633e-07, "epoch": 9.470987860563538, "percentage": 94.71, "elapsed_time": "6:39:19", "remaining_time": "0:22:18", "throughput": 4305.88, "total_tokens": 103165520} +{"current_steps": 85045, "total_steps": 89790, "loss": 0.4627, "lr": 4.243184302365616e-07, "epoch": 9.471544715447154, "percentage": 94.72, "elapsed_time": "6:39:20", "remaining_time": "0:22:16", "throughput": 4305.9, "total_tokens": 103171056} +{"current_steps": 85050, "total_steps": 89790, "loss": 0.4567, "lr": 4.23427377389482e-07, "epoch": 9.472101570330771, "percentage": 94.72, "elapsed_time": "6:39:21", "remaining_time": "0:22:15", "throughput": 4305.92, "total_tokens": 103177072} +{"current_steps": 85055, "total_steps": 89790, "loss": 0.4528, "lr": 4.2253725312408065e-07, "epoch": 9.472658425214389, "percentage": 94.73, "elapsed_time": "6:39:22", "remaining_time": "0:22:14", "throughput": 4305.94, "total_tokens": 103182960} +{"current_steps": 85060, "total_steps": 89790, "loss": 0.4615, "lr": 4.2164805747397784e-07, "epoch": 9.473215280098007, "percentage": 94.73, "elapsed_time": "6:39:24", "remaining_time": "0:22:12", "throughput": 4305.96, "total_tokens": 103189200} +{"current_steps": 85065, "total_steps": 89790, "loss": 0.4556, "lr": 4.2075979047278e-07, "epoch": 9.473772134981624, "percentage": 94.74, "elapsed_time": "6:39:25", "remaining_time": "0:22:11", "throughput": 4305.98, "total_tokens": 103195088} +{"current_steps": 85070, "total_steps": 89790, "loss": 0.4645, "lr": 4.1987245215404646e-07, "epoch": 9.47432898986524, "percentage": 94.74, "elapsed_time": "6:39:26", "remaining_time": "0:22:09", "throughput": 4306.0, "total_tokens": 103201104} +{"current_steps": 85075, "total_steps": 89790, "loss": 0.4708, "lr": 4.189860425512976e-07, "epoch": 9.474885844748858, "percentage": 94.75, "elapsed_time": "6:39:28", "remaining_time": "0:22:08", "throughput": 4306.02, "total_tokens": 103206896} +{"current_steps": 85080, "total_steps": 89790, "loss": 0.4637, "lr": 4.1810056169803433e-07, "epoch": 9.475442699632476, "percentage": 94.75, "elapsed_time": "6:39:29", "remaining_time": "0:22:06", "throughput": 4306.04, "total_tokens": 103212528} +{"current_steps": 85085, "total_steps": 89790, "loss": 0.465, "lr": 4.172160096277078e-07, "epoch": 9.475999554516093, "percentage": 94.76, "elapsed_time": "6:39:30", "remaining_time": "0:22:05", "throughput": 4306.06, "total_tokens": 103218896} +{"current_steps": 85090, "total_steps": 89790, "loss": 0.4441, "lr": 4.163323863737384e-07, "epoch": 9.476556409399711, "percentage": 94.77, "elapsed_time": "6:39:31", "remaining_time": "0:22:04", "throughput": 4306.08, "total_tokens": 103225040} +{"current_steps": 85095, "total_steps": 89790, "loss": 0.4622, "lr": 4.154496919695161e-07, "epoch": 9.477113264283329, "percentage": 94.77, "elapsed_time": "6:39:33", "remaining_time": "0:22:02", "throughput": 4306.1, "total_tokens": 103230960} +{"current_steps": 85100, "total_steps": 89790, "loss": 0.4502, "lr": 4.145679264483865e-07, "epoch": 9.477670119166945, "percentage": 94.78, "elapsed_time": "6:39:34", "remaining_time": "0:22:01", "throughput": 4306.13, "total_tokens": 103237104} +{"current_steps": 85105, "total_steps": 89790, "loss": 0.4654, "lr": 4.136870898436701e-07, "epoch": 9.478226974050562, "percentage": 94.78, "elapsed_time": "6:39:35", "remaining_time": "0:21:59", "throughput": 4306.15, "total_tokens": 103243248} +{"current_steps": 85110, "total_steps": 89790, "loss": 0.4585, "lr": 4.128071821886459e-07, "epoch": 9.47878382893418, "percentage": 94.79, "elapsed_time": "6:39:37", "remaining_time": "0:21:58", "throughput": 4306.17, "total_tokens": 103249424} +{"current_steps": 85115, "total_steps": 89790, "loss": 0.4546, "lr": 4.119282035165595e-07, "epoch": 9.479340683817798, "percentage": 94.79, "elapsed_time": "6:39:38", "remaining_time": "0:21:57", "throughput": 4306.2, "total_tokens": 103255920} +{"current_steps": 85120, "total_steps": 89790, "loss": 0.4605, "lr": 4.1105015386062316e-07, "epoch": 9.479897538701415, "percentage": 94.8, "elapsed_time": "6:39:39", "remaining_time": "0:21:55", "throughput": 4306.22, "total_tokens": 103262064} +{"current_steps": 85125, "total_steps": 89790, "loss": 0.4602, "lr": 4.101730332540105e-07, "epoch": 9.480454393585031, "percentage": 94.8, "elapsed_time": "6:39:41", "remaining_time": "0:21:54", "throughput": 4306.25, "total_tokens": 103268112} +{"current_steps": 85130, "total_steps": 89790, "loss": 0.457, "lr": 4.0929684172986147e-07, "epoch": 9.481011248468649, "percentage": 94.81, "elapsed_time": "6:39:42", "remaining_time": "0:21:52", "throughput": 4306.27, "total_tokens": 103274256} +{"current_steps": 85135, "total_steps": 89790, "loss": 0.4626, "lr": 4.084215793212859e-07, "epoch": 9.481568103352267, "percentage": 94.82, "elapsed_time": "6:39:43", "remaining_time": "0:21:51", "throughput": 4306.29, "total_tokens": 103280400} +{"current_steps": 85140, "total_steps": 89790, "loss": 0.4612, "lr": 4.075472460613461e-07, "epoch": 9.482124958235884, "percentage": 94.82, "elapsed_time": "6:39:44", "remaining_time": "0:21:49", "throughput": 4306.32, "total_tokens": 103286832} +{"current_steps": 85145, "total_steps": 89790, "loss": 0.4647, "lr": 4.0667384198308236e-07, "epoch": 9.482681813119502, "percentage": 94.83, "elapsed_time": "6:39:46", "remaining_time": "0:21:48", "throughput": 4306.34, "total_tokens": 103292912} +{"current_steps": 85150, "total_steps": 89790, "loss": 0.4536, "lr": 4.05801367119496e-07, "epoch": 9.483238668003118, "percentage": 94.83, "elapsed_time": "6:39:47", "remaining_time": "0:21:47", "throughput": 4306.37, "total_tokens": 103299280} +{"current_steps": 85155, "total_steps": 89790, "loss": 0.4676, "lr": 4.0492982150354965e-07, "epoch": 9.483795522886735, "percentage": 94.84, "elapsed_time": "6:39:48", "remaining_time": "0:21:45", "throughput": 4306.39, "total_tokens": 103305200} +{"current_steps": 85160, "total_steps": 89790, "loss": 0.4523, "lr": 4.0405920516817517e-07, "epoch": 9.484352377770353, "percentage": 94.84, "elapsed_time": "6:39:50", "remaining_time": "0:21:44", "throughput": 4306.41, "total_tokens": 103311216} +{"current_steps": 85165, "total_steps": 89790, "loss": 0.4581, "lr": 4.0318951814626305e-07, "epoch": 9.48490923265397, "percentage": 94.85, "elapsed_time": "6:39:51", "remaining_time": "0:21:42", "throughput": 4306.43, "total_tokens": 103316688} +{"current_steps": 85170, "total_steps": 89790, "loss": 0.4635, "lr": 4.023207604706758e-07, "epoch": 9.485466087537588, "percentage": 94.85, "elapsed_time": "6:39:52", "remaining_time": "0:21:41", "throughput": 4306.45, "total_tokens": 103322736} +{"current_steps": 85175, "total_steps": 89790, "loss": 0.4652, "lr": 4.014529321742372e-07, "epoch": 9.486022942421204, "percentage": 94.86, "elapsed_time": "6:39:53", "remaining_time": "0:21:40", "throughput": 4306.47, "total_tokens": 103328944} +{"current_steps": 85180, "total_steps": 89790, "loss": 0.4512, "lr": 4.005860332897349e-07, "epoch": 9.486579797304822, "percentage": 94.87, "elapsed_time": "6:39:55", "remaining_time": "0:21:38", "throughput": 4306.5, "total_tokens": 103335056} +{"current_steps": 85185, "total_steps": 89790, "loss": 0.4708, "lr": 3.997200638499288e-07, "epoch": 9.48713665218844, "percentage": 94.87, "elapsed_time": "6:39:56", "remaining_time": "0:21:37", "throughput": 4306.53, "total_tokens": 103341424} +{"current_steps": 85190, "total_steps": 89790, "loss": 0.455, "lr": 3.988550238875316e-07, "epoch": 9.487693507072057, "percentage": 94.88, "elapsed_time": "6:39:57", "remaining_time": "0:21:35", "throughput": 4306.55, "total_tokens": 103347408} +{"current_steps": 85195, "total_steps": 89790, "loss": 0.4511, "lr": 3.979909134352311e-07, "epoch": 9.488250361955675, "percentage": 94.88, "elapsed_time": "6:39:59", "remaining_time": "0:21:34", "throughput": 4306.57, "total_tokens": 103353520} +{"current_steps": 85200, "total_steps": 89790, "loss": 0.4617, "lr": 3.9712773252567335e-07, "epoch": 9.488807216839291, "percentage": 94.89, "elapsed_time": "6:40:00", "remaining_time": "0:21:32", "throughput": 4306.59, "total_tokens": 103359408} +{"current_steps": 85205, "total_steps": 89790, "loss": 0.464, "lr": 3.96265481191474e-07, "epoch": 9.489364071722909, "percentage": 94.89, "elapsed_time": "6:40:01", "remaining_time": "0:21:31", "throughput": 4306.61, "total_tokens": 103365712} +{"current_steps": 85210, "total_steps": 89790, "loss": 0.4794, "lr": 3.9540415946521247e-07, "epoch": 9.489920926606526, "percentage": 94.9, "elapsed_time": "6:40:02", "remaining_time": "0:21:30", "throughput": 4306.64, "total_tokens": 103372048} +{"current_steps": 85215, "total_steps": 89790, "loss": 0.4453, "lr": 3.945437673794322e-07, "epoch": 9.490477781490144, "percentage": 94.9, "elapsed_time": "6:40:04", "remaining_time": "0:21:28", "throughput": 4306.66, "total_tokens": 103377872} +{"current_steps": 85220, "total_steps": 89790, "loss": 0.4523, "lr": 3.9368430496663777e-07, "epoch": 9.491034636373762, "percentage": 94.91, "elapsed_time": "6:40:05", "remaining_time": "0:21:27", "throughput": 4306.68, "total_tokens": 103383920} +{"current_steps": 85225, "total_steps": 89790, "loss": 0.4713, "lr": 3.928257722593059e-07, "epoch": 9.491591491257378, "percentage": 94.92, "elapsed_time": "6:40:06", "remaining_time": "0:21:25", "throughput": 4306.7, "total_tokens": 103389552} +{"current_steps": 85230, "total_steps": 89790, "loss": 0.4567, "lr": 3.919681692898747e-07, "epoch": 9.492148346140995, "percentage": 94.92, "elapsed_time": "6:40:07", "remaining_time": "0:21:24", "throughput": 4306.73, "total_tokens": 103395536} +{"current_steps": 85235, "total_steps": 89790, "loss": 0.4445, "lr": 3.911114960907486e-07, "epoch": 9.492705201024613, "percentage": 94.93, "elapsed_time": "6:40:09", "remaining_time": "0:21:23", "throughput": 4306.74, "total_tokens": 103401520} +{"current_steps": 85240, "total_steps": 89790, "loss": 0.4562, "lr": 3.902557526942879e-07, "epoch": 9.49326205590823, "percentage": 94.93, "elapsed_time": "6:40:10", "remaining_time": "0:21:21", "throughput": 4306.77, "total_tokens": 103407824} +{"current_steps": 85245, "total_steps": 89790, "loss": 0.4499, "lr": 3.8940093913283626e-07, "epoch": 9.493818910791848, "percentage": 94.94, "elapsed_time": "6:40:11", "remaining_time": "0:21:20", "throughput": 4306.79, "total_tokens": 103413808} +{"current_steps": 85250, "total_steps": 89790, "loss": 0.47, "lr": 3.885470554386816e-07, "epoch": 9.494375765675464, "percentage": 94.94, "elapsed_time": "6:40:13", "remaining_time": "0:21:18", "throughput": 4306.82, "total_tokens": 103420272} +{"current_steps": 85255, "total_steps": 89790, "loss": 0.4709, "lr": 3.8769410164408994e-07, "epoch": 9.494932620559082, "percentage": 94.95, "elapsed_time": "6:40:14", "remaining_time": "0:21:17", "throughput": 4306.84, "total_tokens": 103426224} +{"current_steps": 85260, "total_steps": 89790, "loss": 0.4679, "lr": 3.868420777812909e-07, "epoch": 9.4954894754427, "percentage": 94.95, "elapsed_time": "6:40:15", "remaining_time": "0:21:15", "throughput": 4306.86, "total_tokens": 103432304} +{"current_steps": 85265, "total_steps": 89790, "loss": 0.447, "lr": 3.8599098388247545e-07, "epoch": 9.496046330326317, "percentage": 94.96, "elapsed_time": "6:40:16", "remaining_time": "0:21:14", "throughput": 4306.88, "total_tokens": 103438384} +{"current_steps": 85270, "total_steps": 89790, "loss": 0.46, "lr": 3.851408199798012e-07, "epoch": 9.496603185209935, "percentage": 94.97, "elapsed_time": "6:40:18", "remaining_time": "0:21:13", "throughput": 4306.9, "total_tokens": 103444208} +{"current_steps": 85275, "total_steps": 89790, "loss": 0.4573, "lr": 3.842915861053842e-07, "epoch": 9.49716004009355, "percentage": 94.97, "elapsed_time": "6:40:19", "remaining_time": "0:21:11", "throughput": 4306.93, "total_tokens": 103450288} +{"current_steps": 85280, "total_steps": 89790, "loss": 0.4594, "lr": 3.834432822913209e-07, "epoch": 9.497716894977168, "percentage": 94.98, "elapsed_time": "6:40:20", "remaining_time": "0:21:10", "throughput": 4306.94, "total_tokens": 103455888} +{"current_steps": 85285, "total_steps": 89790, "loss": 0.4634, "lr": 3.825959085696551e-07, "epoch": 9.498273749860786, "percentage": 94.98, "elapsed_time": "6:40:22", "remaining_time": "0:21:08", "throughput": 4306.96, "total_tokens": 103462000} +{"current_steps": 85290, "total_steps": 89790, "loss": 0.4601, "lr": 3.8174946497240574e-07, "epoch": 9.498830604744404, "percentage": 94.99, "elapsed_time": "6:40:23", "remaining_time": "0:21:07", "throughput": 4306.98, "total_tokens": 103467856} +{"current_steps": 85295, "total_steps": 89790, "loss": 0.4713, "lr": 3.8090395153155824e-07, "epoch": 9.499387459628021, "percentage": 94.99, "elapsed_time": "6:40:24", "remaining_time": "0:21:06", "throughput": 4307.0, "total_tokens": 103473968} +{"current_steps": 85300, "total_steps": 89790, "loss": 0.4655, "lr": 3.80059368279051e-07, "epoch": 9.49994431451164, "percentage": 95.0, "elapsed_time": "6:40:25", "remaining_time": "0:21:04", "throughput": 4307.03, "total_tokens": 103479984} +{"current_steps": 85305, "total_steps": 89790, "loss": 0.4609, "lr": 3.792157152468029e-07, "epoch": 9.500501169395255, "percentage": 95.01, "elapsed_time": "6:40:27", "remaining_time": "0:21:03", "throughput": 4307.05, "total_tokens": 103486000} +{"current_steps": 85310, "total_steps": 89790, "loss": 0.466, "lr": 3.783729924666829e-07, "epoch": 9.501058024278873, "percentage": 95.01, "elapsed_time": "6:40:28", "remaining_time": "0:21:01", "throughput": 4307.07, "total_tokens": 103491728} +{"current_steps": 85310, "total_steps": 89790, "eval_loss": 0.46408841013908386, "epoch": 9.501058024278873, "percentage": 95.01, "elapsed_time": "6:42:21", "remaining_time": "0:21:07", "throughput": 4286.92, "total_tokens": 103491728} +{"current_steps": 85315, "total_steps": 89790, "loss": 0.4636, "lr": 3.7753119997054054e-07, "epoch": 9.50161487916249, "percentage": 95.02, "elapsed_time": "6:42:23", "remaining_time": "0:21:06", "throughput": 4286.68, "total_tokens": 103497232} +{"current_steps": 85320, "total_steps": 89790, "loss": 0.4589, "lr": 3.766903377901698e-07, "epoch": 9.502171734046108, "percentage": 95.02, "elapsed_time": "6:42:25", "remaining_time": "0:21:04", "throughput": 4286.7, "total_tokens": 103503152} +{"current_steps": 85325, "total_steps": 89790, "loss": 0.4676, "lr": 3.758504059573509e-07, "epoch": 9.502728588929726, "percentage": 95.03, "elapsed_time": "6:42:26", "remaining_time": "0:21:03", "throughput": 4286.73, "total_tokens": 103509264}