diff --git "a/trainer_log.jsonl" "b/trainer_log.jsonl" --- "a/trainer_log.jsonl" +++ "b/trainer_log.jsonl" @@ -14643,3 +14643,771 @@ {"current_steps": 73120, "total_steps": 76960, "loss": 0.0023, "lr": 3.7842909396733627e-07, "epoch": 19.002079002079004, "percentage": 95.01, "elapsed_time": "1:46:21", "remaining_time": "0:05:35", "throughput": 1031.73, "total_tokens": 6584112} {"current_steps": 73125, "total_steps": 76960, "loss": 0.0042, "lr": 3.774469844413792e-07, "epoch": 19.00337837837838, "percentage": 95.02, "elapsed_time": "1:46:22", "remaining_time": "0:05:34", "throughput": 1031.73, "total_tokens": 6584560} {"current_steps": 73130, "total_steps": 76960, "loss": 0.0029, "lr": 3.7646614127691546e-07, "epoch": 19.004677754677754, "percentage": 95.02, "elapsed_time": "1:46:22", "remaining_time": "0:05:34", "throughput": 1031.72, "total_tokens": 6584960} +{"current_steps": 73135, "total_steps": 76960, "loss": 0.0245, "lr": 3.7548656452438826e-07, "epoch": 19.00597713097713, "percentage": 95.03, "elapsed_time": "1:46:22", "remaining_time": "0:05:33", "throughput": 1031.72, "total_tokens": 6585392} +{"current_steps": 73140, "total_steps": 76960, "loss": 0.2734, "lr": 3.7450825423418767e-07, "epoch": 19.007276507276508, "percentage": 95.04, "elapsed_time": "1:46:23", "remaining_time": "0:05:33", "throughput": 1031.72, "total_tokens": 6585856} +{"current_steps": 73145, "total_steps": 76960, "loss": 0.144, "lr": 3.7353121045661797e-07, "epoch": 19.008575883575883, "percentage": 95.04, "elapsed_time": "1:46:23", "remaining_time": "0:05:32", "throughput": 1031.73, "total_tokens": 6586336} +{"current_steps": 73150, "total_steps": 76960, "loss": 0.0002, "lr": 3.725554332419362e-07, "epoch": 19.00987525987526, "percentage": 95.05, "elapsed_time": "1:46:24", "remaining_time": "0:05:32", "throughput": 1031.73, "total_tokens": 6586752} +{"current_steps": 73155, "total_steps": 76960, "loss": 0.0164, "lr": 3.715809226403244e-07, "epoch": 19.011174636174637, "percentage": 95.06, "elapsed_time": "1:46:24", "remaining_time": "0:05:32", "throughput": 1031.73, "total_tokens": 6587216} +{"current_steps": 73160, "total_steps": 76960, "loss": 0.0013, "lr": 3.706076787019036e-07, "epoch": 19.012474012474012, "percentage": 95.06, "elapsed_time": "1:46:25", "remaining_time": "0:05:31", "throughput": 1031.74, "total_tokens": 6587680} +{"current_steps": 73165, "total_steps": 76960, "loss": 0.0023, "lr": 3.6963570147672824e-07, "epoch": 19.013773388773387, "percentage": 95.07, "elapsed_time": "1:46:25", "remaining_time": "0:05:31", "throughput": 1031.75, "total_tokens": 6588176} +{"current_steps": 73170, "total_steps": 76960, "loss": 0.0202, "lr": 3.686649910147888e-07, "epoch": 19.015072765072766, "percentage": 95.08, "elapsed_time": "1:46:25", "remaining_time": "0:05:30", "throughput": 1031.75, "total_tokens": 6588624} +{"current_steps": 73175, "total_steps": 76960, "loss": 0.0429, "lr": 3.676955473660093e-07, "epoch": 19.01637214137214, "percentage": 95.08, "elapsed_time": "1:46:26", "remaining_time": "0:05:30", "throughput": 1031.75, "total_tokens": 6589040} +{"current_steps": 73180, "total_steps": 76960, "loss": 0.1748, "lr": 3.6672737058025266e-07, "epoch": 19.017671517671516, "percentage": 95.09, "elapsed_time": "1:46:26", "remaining_time": "0:05:29", "throughput": 1031.74, "total_tokens": 6589456} +{"current_steps": 73185, "total_steps": 76960, "loss": 0.0015, "lr": 3.6576046070730675e-07, "epoch": 19.018970893970895, "percentage": 95.09, "elapsed_time": "1:46:27", "remaining_time": "0:05:29", "throughput": 1031.74, "total_tokens": 6589872} +{"current_steps": 73190, "total_steps": 76960, "loss": 0.002, "lr": 3.6479481779690403e-07, "epoch": 19.02027027027027, "percentage": 95.1, "elapsed_time": "1:46:27", "remaining_time": "0:05:29", "throughput": 1031.74, "total_tokens": 6590304} +{"current_steps": 73195, "total_steps": 76960, "loss": 0.0088, "lr": 3.6383044189870763e-07, "epoch": 19.021569646569645, "percentage": 95.11, "elapsed_time": "1:46:27", "remaining_time": "0:05:28", "throughput": 1031.74, "total_tokens": 6590720} +{"current_steps": 73200, "total_steps": 76960, "loss": 0.0055, "lr": 3.628673330623139e-07, "epoch": 19.022869022869024, "percentage": 95.11, "elapsed_time": "1:46:28", "remaining_time": "0:05:28", "throughput": 1031.75, "total_tokens": 6591200} +{"current_steps": 73205, "total_steps": 76960, "loss": 0.0221, "lr": 3.619054913372638e-07, "epoch": 19.0241683991684, "percentage": 95.12, "elapsed_time": "1:46:28", "remaining_time": "0:05:27", "throughput": 1031.75, "total_tokens": 6591632} +{"current_steps": 73210, "total_steps": 76960, "loss": 0.0323, "lr": 3.609449167730206e-07, "epoch": 19.025467775467774, "percentage": 95.13, "elapsed_time": "1:46:29", "remaining_time": "0:05:27", "throughput": 1031.75, "total_tokens": 6592080} +{"current_steps": 73215, "total_steps": 76960, "loss": 0.0015, "lr": 3.5998560941898907e-07, "epoch": 19.026767151767153, "percentage": 95.13, "elapsed_time": "1:46:29", "remaining_time": "0:05:26", "throughput": 1031.76, "total_tokens": 6592560} +{"current_steps": 73220, "total_steps": 76960, "loss": 0.0006, "lr": 3.5902756932450486e-07, "epoch": 19.028066528066528, "percentage": 95.14, "elapsed_time": "1:46:30", "remaining_time": "0:05:26", "throughput": 1031.76, "total_tokens": 6593024} +{"current_steps": 73225, "total_steps": 76960, "loss": 0.0094, "lr": 3.5807079653884526e-07, "epoch": 19.029365904365903, "percentage": 95.15, "elapsed_time": "1:46:30", "remaining_time": "0:05:25", "throughput": 1031.77, "total_tokens": 6593472} +{"current_steps": 73230, "total_steps": 76960, "loss": 0.0335, "lr": 3.5711529111121244e-07, "epoch": 19.030665280665282, "percentage": 95.15, "elapsed_time": "1:46:30", "remaining_time": "0:05:25", "throughput": 1031.77, "total_tokens": 6593952} +{"current_steps": 73235, "total_steps": 76960, "loss": 0.2378, "lr": 3.561610530907505e-07, "epoch": 19.031964656964657, "percentage": 95.16, "elapsed_time": "1:46:31", "remaining_time": "0:05:25", "throughput": 1031.77, "total_tokens": 6594384} +{"current_steps": 73240, "total_steps": 76960, "loss": 0.1014, "lr": 3.552080825265397e-07, "epoch": 19.033264033264032, "percentage": 95.17, "elapsed_time": "1:46:31", "remaining_time": "0:05:24", "throughput": 1031.77, "total_tokens": 6594800} +{"current_steps": 73245, "total_steps": 76960, "loss": 0.0577, "lr": 3.5425637946759347e-07, "epoch": 19.03456340956341, "percentage": 95.17, "elapsed_time": "1:46:32", "remaining_time": "0:05:24", "throughput": 1031.78, "total_tokens": 6595264} +{"current_steps": 73250, "total_steps": 76960, "loss": 0.1905, "lr": 3.533059439628561e-07, "epoch": 19.035862785862786, "percentage": 95.18, "elapsed_time": "1:46:32", "remaining_time": "0:05:23", "throughput": 1031.78, "total_tokens": 6595712} +{"current_steps": 73255, "total_steps": 76960, "loss": 0.0002, "lr": 3.523567760612051e-07, "epoch": 19.03716216216216, "percentage": 95.19, "elapsed_time": "1:46:32", "remaining_time": "0:05:23", "throughput": 1031.78, "total_tokens": 6596176} +{"current_steps": 73260, "total_steps": 76960, "loss": 0.1467, "lr": 3.5140887581146534e-07, "epoch": 19.03846153846154, "percentage": 95.19, "elapsed_time": "1:46:33", "remaining_time": "0:05:22", "throughput": 1031.78, "total_tokens": 6596592} +{"current_steps": 73265, "total_steps": 76960, "loss": 0.1366, "lr": 3.5046224326238107e-07, "epoch": 19.039760914760915, "percentage": 95.2, "elapsed_time": "1:46:33", "remaining_time": "0:05:22", "throughput": 1031.78, "total_tokens": 6597040} +{"current_steps": 73270, "total_steps": 76960, "loss": 0.002, "lr": 3.49516878462644e-07, "epoch": 19.04106029106029, "percentage": 95.21, "elapsed_time": "1:46:34", "remaining_time": "0:05:22", "throughput": 1031.79, "total_tokens": 6597520} +{"current_steps": 73275, "total_steps": 76960, "loss": 0.1164, "lr": 3.485727814608708e-07, "epoch": 19.04235966735967, "percentage": 95.21, "elapsed_time": "1:46:34", "remaining_time": "0:05:21", "throughput": 1031.79, "total_tokens": 6597968} +{"current_steps": 73280, "total_steps": 76960, "loss": 0.0009, "lr": 3.476299523056198e-07, "epoch": 19.043659043659044, "percentage": 95.22, "elapsed_time": "1:46:35", "remaining_time": "0:05:21", "throughput": 1031.79, "total_tokens": 6598400} +{"current_steps": 73285, "total_steps": 76960, "loss": 0.0007, "lr": 3.4668839104538273e-07, "epoch": 19.04495841995842, "percentage": 95.22, "elapsed_time": "1:46:35", "remaining_time": "0:05:20", "throughput": 1031.8, "total_tokens": 6598848} +{"current_steps": 73290, "total_steps": 76960, "loss": 0.008, "lr": 3.457480977285821e-07, "epoch": 19.046257796257795, "percentage": 95.23, "elapsed_time": "1:46:35", "remaining_time": "0:05:20", "throughput": 1031.8, "total_tokens": 6599280} +{"current_steps": 73295, "total_steps": 76960, "loss": 0.0138, "lr": 3.4480907240357906e-07, "epoch": 19.047557172557173, "percentage": 95.24, "elapsed_time": "1:46:36", "remaining_time": "0:05:19", "throughput": 1031.8, "total_tokens": 6599728} +{"current_steps": 73300, "total_steps": 76960, "loss": 0.4383, "lr": 3.438713151186712e-07, "epoch": 19.04885654885655, "percentage": 95.24, "elapsed_time": "1:46:36", "remaining_time": "0:05:19", "throughput": 1031.8, "total_tokens": 6600176} +{"current_steps": 73305, "total_steps": 76960, "loss": 0.091, "lr": 3.429348259220838e-07, "epoch": 19.050155925155924, "percentage": 95.25, "elapsed_time": "1:46:37", "remaining_time": "0:05:18", "throughput": 1031.8, "total_tokens": 6600608} +{"current_steps": 73310, "total_steps": 76960, "loss": 0.0368, "lr": 3.419996048619839e-07, "epoch": 19.051455301455302, "percentage": 95.26, "elapsed_time": "1:46:37", "remaining_time": "0:05:18", "throughput": 1031.8, "total_tokens": 6601040} +{"current_steps": 73315, "total_steps": 76960, "loss": 0.245, "lr": 3.410656519864719e-07, "epoch": 19.052754677754677, "percentage": 95.26, "elapsed_time": "1:46:37", "remaining_time": "0:05:18", "throughput": 1031.8, "total_tokens": 6601472} +{"current_steps": 73320, "total_steps": 76960, "loss": 0.3608, "lr": 3.401329673435788e-07, "epoch": 19.054054054054053, "percentage": 95.27, "elapsed_time": "1:46:38", "remaining_time": "0:05:17", "throughput": 1031.81, "total_tokens": 6601952} +{"current_steps": 73325, "total_steps": 76960, "loss": 0.017, "lr": 3.3920155098127457e-07, "epoch": 19.05535343035343, "percentage": 95.28, "elapsed_time": "1:46:38", "remaining_time": "0:05:17", "throughput": 1031.82, "total_tokens": 6602416} +{"current_steps": 73330, "total_steps": 76960, "loss": 0.0056, "lr": 3.382714029474654e-07, "epoch": 19.056652806652806, "percentage": 95.28, "elapsed_time": "1:46:39", "remaining_time": "0:05:16", "throughput": 1031.82, "total_tokens": 6602864} +{"current_steps": 73335, "total_steps": 76960, "loss": 0.186, "lr": 3.3734252328998795e-07, "epoch": 19.05795218295218, "percentage": 95.29, "elapsed_time": "1:46:39", "remaining_time": "0:05:16", "throughput": 1031.82, "total_tokens": 6603296} +{"current_steps": 73340, "total_steps": 76960, "loss": 0.0641, "lr": 3.3641491205661236e-07, "epoch": 19.05925155925156, "percentage": 95.3, "elapsed_time": "1:46:40", "remaining_time": "0:05:15", "throughput": 1031.82, "total_tokens": 6603728} +{"current_steps": 73345, "total_steps": 76960, "loss": 0.0021, "lr": 3.3548856929505047e-07, "epoch": 19.060550935550935, "percentage": 95.3, "elapsed_time": "1:46:40", "remaining_time": "0:05:15", "throughput": 1031.82, "total_tokens": 6604176} +{"current_steps": 73350, "total_steps": 76960, "loss": 0.1468, "lr": 3.345634950529419e-07, "epoch": 19.06185031185031, "percentage": 95.31, "elapsed_time": "1:46:40", "remaining_time": "0:05:15", "throughput": 1031.83, "total_tokens": 6604624} +{"current_steps": 73355, "total_steps": 76960, "loss": 0.0018, "lr": 3.336396893778709e-07, "epoch": 19.06314968814969, "percentage": 95.32, "elapsed_time": "1:46:41", "remaining_time": "0:05:14", "throughput": 1031.84, "total_tokens": 6605120} +{"current_steps": 73360, "total_steps": 76960, "loss": 0.0011, "lr": 3.3271715231734113e-07, "epoch": 19.064449064449065, "percentage": 95.32, "elapsed_time": "1:46:41", "remaining_time": "0:05:14", "throughput": 1031.83, "total_tokens": 6605536} +{"current_steps": 73365, "total_steps": 76960, "loss": 0.0086, "lr": 3.317958839188062e-07, "epoch": 19.06574844074844, "percentage": 95.33, "elapsed_time": "1:46:42", "remaining_time": "0:05:13", "throughput": 1031.84, "total_tokens": 6606000} +{"current_steps": 73370, "total_steps": 76960, "loss": 0.1659, "lr": 3.3087588422964223e-07, "epoch": 19.06704781704782, "percentage": 95.34, "elapsed_time": "1:46:42", "remaining_time": "0:05:13", "throughput": 1031.85, "total_tokens": 6606480} +{"current_steps": 73375, "total_steps": 76960, "loss": 0.0435, "lr": 3.2995715329716957e-07, "epoch": 19.068347193347194, "percentage": 95.34, "elapsed_time": "1:46:42", "remaining_time": "0:05:12", "throughput": 1031.85, "total_tokens": 6606912} +{"current_steps": 73380, "total_steps": 76960, "loss": 0.002, "lr": 3.2903969116863667e-07, "epoch": 19.06964656964657, "percentage": 95.35, "elapsed_time": "1:46:43", "remaining_time": "0:05:12", "throughput": 1031.84, "total_tokens": 6607328} +{"current_steps": 73385, "total_steps": 76960, "loss": 0.1614, "lr": 3.2812349789123063e-07, "epoch": 19.070945945945947, "percentage": 95.35, "elapsed_time": "1:46:43", "remaining_time": "0:05:11", "throughput": 1031.84, "total_tokens": 6607760} +{"current_steps": 73390, "total_steps": 76960, "loss": 0.002, "lr": 3.272085735120778e-07, "epoch": 19.072245322245323, "percentage": 95.36, "elapsed_time": "1:46:44", "remaining_time": "0:05:11", "throughput": 1031.85, "total_tokens": 6608208} +{"current_steps": 73395, "total_steps": 76960, "loss": 0.0986, "lr": 3.2629491807822375e-07, "epoch": 19.073544698544698, "percentage": 95.37, "elapsed_time": "1:46:44", "remaining_time": "0:05:11", "throughput": 1031.85, "total_tokens": 6608656} +{"current_steps": 73400, "total_steps": 76960, "loss": 0.0027, "lr": 3.253825316366643e-07, "epoch": 19.074844074844076, "percentage": 95.37, "elapsed_time": "1:46:45", "remaining_time": "0:05:10", "throughput": 1031.85, "total_tokens": 6609088} +{"current_steps": 73405, "total_steps": 76960, "loss": 0.0001, "lr": 3.24471414234323e-07, "epoch": 19.07614345114345, "percentage": 95.38, "elapsed_time": "1:46:45", "remaining_time": "0:05:10", "throughput": 1031.86, "total_tokens": 6609568} +{"current_steps": 73410, "total_steps": 76960, "loss": 0.0001, "lr": 3.2356156591805966e-07, "epoch": 19.077442827442827, "percentage": 95.39, "elapsed_time": "1:46:45", "remaining_time": "0:05:09", "throughput": 1031.86, "total_tokens": 6610000} +{"current_steps": 73415, "total_steps": 76960, "loss": 0.0014, "lr": 3.226529867346673e-07, "epoch": 19.078742203742205, "percentage": 95.39, "elapsed_time": "1:46:46", "remaining_time": "0:05:09", "throughput": 1031.86, "total_tokens": 6610448} +{"current_steps": 73420, "total_steps": 76960, "loss": 0.0002, "lr": 3.2174567673088077e-07, "epoch": 19.08004158004158, "percentage": 95.4, "elapsed_time": "1:46:46", "remaining_time": "0:05:08", "throughput": 1031.87, "total_tokens": 6610928} +{"current_steps": 73425, "total_steps": 76960, "loss": 0.1347, "lr": 3.208396359533572e-07, "epoch": 19.081340956340956, "percentage": 95.41, "elapsed_time": "1:46:47", "remaining_time": "0:05:08", "throughput": 1031.87, "total_tokens": 6611376} +{"current_steps": 73430, "total_steps": 76960, "loss": 0.0173, "lr": 3.1993486444869823e-07, "epoch": 19.08264033264033, "percentage": 95.41, "elapsed_time": "1:46:47", "remaining_time": "0:05:08", "throughput": 1031.87, "total_tokens": 6611824} +{"current_steps": 73435, "total_steps": 76960, "loss": 0.0116, "lr": 3.190313622634333e-07, "epoch": 19.08393970893971, "percentage": 95.42, "elapsed_time": "1:46:48", "remaining_time": "0:05:07", "throughput": 1031.87, "total_tokens": 6612256} +{"current_steps": 73440, "total_steps": 76960, "loss": 0.1345, "lr": 3.1812912944403915e-07, "epoch": 19.085239085239085, "percentage": 95.43, "elapsed_time": "1:46:48", "remaining_time": "0:05:07", "throughput": 1031.88, "total_tokens": 6612704} +{"current_steps": 73445, "total_steps": 76960, "loss": 0.0006, "lr": 3.172281660369092e-07, "epoch": 19.08653846153846, "percentage": 95.43, "elapsed_time": "1:46:48", "remaining_time": "0:05:06", "throughput": 1031.88, "total_tokens": 6613152} +{"current_steps": 73450, "total_steps": 76960, "loss": 0.3105, "lr": 3.163284720883841e-07, "epoch": 19.08783783783784, "percentage": 95.44, "elapsed_time": "1:46:49", "remaining_time": "0:05:06", "throughput": 1031.89, "total_tokens": 6613616} +{"current_steps": 73455, "total_steps": 76960, "loss": 0.0005, "lr": 3.1543004764473805e-07, "epoch": 19.089137214137214, "percentage": 95.45, "elapsed_time": "1:46:49", "remaining_time": "0:05:05", "throughput": 1031.89, "total_tokens": 6614080} +{"current_steps": 73460, "total_steps": 76960, "loss": 0.0759, "lr": 3.145328927521757e-07, "epoch": 19.09043659043659, "percentage": 95.45, "elapsed_time": "1:46:50", "remaining_time": "0:05:05", "throughput": 1031.9, "total_tokens": 6614560} +{"current_steps": 73465, "total_steps": 76960, "loss": 0.1129, "lr": 3.1363700745684065e-07, "epoch": 19.091735966735968, "percentage": 95.46, "elapsed_time": "1:46:50", "remaining_time": "0:05:04", "throughput": 1031.9, "total_tokens": 6615008} +{"current_steps": 73470, "total_steps": 76960, "loss": 0.2572, "lr": 3.1274239180480446e-07, "epoch": 19.093035343035343, "percentage": 95.47, "elapsed_time": "1:46:50", "remaining_time": "0:05:04", "throughput": 1031.9, "total_tokens": 6615440} +{"current_steps": 73475, "total_steps": 76960, "loss": 0.3657, "lr": 3.1184904584208586e-07, "epoch": 19.094334719334718, "percentage": 95.47, "elapsed_time": "1:46:51", "remaining_time": "0:05:04", "throughput": 1031.91, "total_tokens": 6615888} +{"current_steps": 73480, "total_steps": 76960, "loss": 0.2061, "lr": 3.109569696146231e-07, "epoch": 19.095634095634097, "percentage": 95.48, "elapsed_time": "1:46:51", "remaining_time": "0:05:03", "throughput": 1031.91, "total_tokens": 6616352} +{"current_steps": 73485, "total_steps": 76960, "loss": 0.0186, "lr": 3.1006616316829886e-07, "epoch": 19.096933471933472, "percentage": 95.48, "elapsed_time": "1:46:52", "remaining_time": "0:05:03", "throughput": 1031.91, "total_tokens": 6616784} +{"current_steps": 73490, "total_steps": 76960, "loss": 0.1593, "lr": 3.0917662654892654e-07, "epoch": 19.098232848232847, "percentage": 95.49, "elapsed_time": "1:46:52", "remaining_time": "0:05:02", "throughput": 1031.92, "total_tokens": 6617248} +{"current_steps": 73495, "total_steps": 76960, "loss": 0.0017, "lr": 3.082883598022612e-07, "epoch": 19.099532224532226, "percentage": 95.5, "elapsed_time": "1:46:52", "remaining_time": "0:05:02", "throughput": 1031.93, "total_tokens": 6617728} +{"current_steps": 73500, "total_steps": 76960, "loss": 0.0014, "lr": 3.0740136297398305e-07, "epoch": 19.1008316008316, "percentage": 95.5, "elapsed_time": "1:46:53", "remaining_time": "0:05:01", "throughput": 1031.93, "total_tokens": 6618192} +{"current_steps": 73505, "total_steps": 76960, "loss": 0.0014, "lr": 3.065156361097138e-07, "epoch": 19.102130977130976, "percentage": 95.51, "elapsed_time": "1:46:53", "remaining_time": "0:05:01", "throughput": 1031.93, "total_tokens": 6618624} +{"current_steps": 73510, "total_steps": 76960, "loss": 0.2685, "lr": 3.0563117925500595e-07, "epoch": 19.103430353430355, "percentage": 95.52, "elapsed_time": "1:46:54", "remaining_time": "0:05:01", "throughput": 1031.93, "total_tokens": 6619056} +{"current_steps": 73515, "total_steps": 76960, "loss": 0.0198, "lr": 3.0474799245534537e-07, "epoch": 19.10472972972973, "percentage": 95.52, "elapsed_time": "1:46:54", "remaining_time": "0:05:00", "throughput": 1031.93, "total_tokens": 6619488} +{"current_steps": 73520, "total_steps": 76960, "loss": 0.0005, "lr": 3.038660757561568e-07, "epoch": 19.106029106029105, "percentage": 95.53, "elapsed_time": "1:46:55", "remaining_time": "0:05:00", "throughput": 1031.94, "total_tokens": 6619968} +{"current_steps": 73525, "total_steps": 76960, "loss": 0.0239, "lr": 3.0298542920279835e-07, "epoch": 19.107328482328484, "percentage": 95.54, "elapsed_time": "1:46:55", "remaining_time": "0:04:59", "throughput": 1031.94, "total_tokens": 6620400} +{"current_steps": 73530, "total_steps": 76960, "loss": 0.0039, "lr": 3.021060528405645e-07, "epoch": 19.10862785862786, "percentage": 95.54, "elapsed_time": "1:46:55", "remaining_time": "0:04:59", "throughput": 1031.94, "total_tokens": 6620848} +{"current_steps": 73535, "total_steps": 76960, "loss": 0.1192, "lr": 3.0122794671468004e-07, "epoch": 19.109927234927234, "percentage": 95.55, "elapsed_time": "1:46:56", "remaining_time": "0:04:58", "throughput": 1031.94, "total_tokens": 6621280} +{"current_steps": 73540, "total_steps": 76960, "loss": 0.0001, "lr": 3.0035111087030885e-07, "epoch": 19.111226611226613, "percentage": 95.56, "elapsed_time": "1:46:56", "remaining_time": "0:04:58", "throughput": 1031.95, "total_tokens": 6621760} +{"current_steps": 73545, "total_steps": 76960, "loss": 0.0063, "lr": 2.9947554535254275e-07, "epoch": 19.112525987525988, "percentage": 95.56, "elapsed_time": "1:46:57", "remaining_time": "0:04:57", "throughput": 1031.95, "total_tokens": 6622192} +{"current_steps": 73550, "total_steps": 76960, "loss": 0.0938, "lr": 2.9860125020642063e-07, "epoch": 19.113825363825363, "percentage": 95.57, "elapsed_time": "1:46:57", "remaining_time": "0:04:57", "throughput": 1031.95, "total_tokens": 6622624} +{"current_steps": 73555, "total_steps": 76960, "loss": 0.0062, "lr": 2.977282254769009e-07, "epoch": 19.11512474012474, "percentage": 95.58, "elapsed_time": "1:46:57", "remaining_time": "0:04:57", "throughput": 1031.95, "total_tokens": 6623072} +{"current_steps": 73560, "total_steps": 76960, "loss": 0.2992, "lr": 2.968564712088867e-07, "epoch": 19.116424116424117, "percentage": 95.58, "elapsed_time": "1:46:58", "remaining_time": "0:04:56", "throughput": 1031.95, "total_tokens": 6623488} +{"current_steps": 73565, "total_steps": 76960, "loss": 0.3634, "lr": 2.959859874472143e-07, "epoch": 19.117723492723492, "percentage": 95.59, "elapsed_time": "1:46:58", "remaining_time": "0:04:56", "throughput": 1031.96, "total_tokens": 6623952} +{"current_steps": 73570, "total_steps": 76960, "loss": 0.0005, "lr": 2.951167742366534e-07, "epoch": 19.11902286902287, "percentage": 95.6, "elapsed_time": "1:46:59", "remaining_time": "0:04:55", "throughput": 1031.96, "total_tokens": 6624416} +{"current_steps": 73575, "total_steps": 76960, "loss": 0.0006, "lr": 2.9424883162191e-07, "epoch": 19.120322245322246, "percentage": 95.6, "elapsed_time": "1:46:59", "remaining_time": "0:04:55", "throughput": 1031.96, "total_tokens": 6624848} +{"current_steps": 73580, "total_steps": 76960, "loss": 0.0194, "lr": 2.933821596476177e-07, "epoch": 19.12162162162162, "percentage": 95.61, "elapsed_time": "1:47:00", "remaining_time": "0:04:54", "throughput": 1031.96, "total_tokens": 6625280} +{"current_steps": 73585, "total_steps": 76960, "loss": 0.0308, "lr": 2.925167583583577e-07, "epoch": 19.122920997920996, "percentage": 95.61, "elapsed_time": "1:47:00", "remaining_time": "0:04:54", "throughput": 1031.96, "total_tokens": 6625696} +{"current_steps": 73590, "total_steps": 76960, "loss": 0.1281, "lr": 2.9165262779863036e-07, "epoch": 19.124220374220375, "percentage": 95.62, "elapsed_time": "1:47:00", "remaining_time": "0:04:54", "throughput": 1031.96, "total_tokens": 6626112} +{"current_steps": 73595, "total_steps": 76960, "loss": 0.0815, "lr": 2.907897680128835e-07, "epoch": 19.12551975051975, "percentage": 95.63, "elapsed_time": "1:47:01", "remaining_time": "0:04:53", "throughput": 1031.96, "total_tokens": 6626528} +{"current_steps": 73600, "total_steps": 76960, "loss": 0.1224, "lr": 2.899281790454927e-07, "epoch": 19.126819126819125, "percentage": 95.63, "elapsed_time": "1:47:01", "remaining_time": "0:04:53", "throughput": 1031.96, "total_tokens": 6626976} +{"current_steps": 73605, "total_steps": 76960, "loss": 0.0003, "lr": 2.890678609407754e-07, "epoch": 19.128118503118504, "percentage": 95.64, "elapsed_time": "1:47:02", "remaining_time": "0:04:52", "throughput": 1031.97, "total_tokens": 6627440} +{"current_steps": 73610, "total_steps": 76960, "loss": 0.0971, "lr": 2.8820881374297113e-07, "epoch": 19.12941787941788, "percentage": 95.65, "elapsed_time": "1:47:02", "remaining_time": "0:04:52", "throughput": 1031.97, "total_tokens": 6627872} +{"current_steps": 73615, "total_steps": 76960, "loss": 0.0007, "lr": 2.8735103749626955e-07, "epoch": 19.130717255717254, "percentage": 95.65, "elapsed_time": "1:47:02", "remaining_time": "0:04:51", "throughput": 1031.98, "total_tokens": 6628368} +{"current_steps": 73620, "total_steps": 76960, "loss": 0.0004, "lr": 2.8649453224477986e-07, "epoch": 19.132016632016633, "percentage": 95.66, "elapsed_time": "1:47:03", "remaining_time": "0:04:51", "throughput": 1031.98, "total_tokens": 6628848} +{"current_steps": 73625, "total_steps": 76960, "loss": 0.5107, "lr": 2.856392980325556e-07, "epoch": 19.133316008316008, "percentage": 95.67, "elapsed_time": "1:47:03", "remaining_time": "0:04:50", "throughput": 1031.98, "total_tokens": 6629280} +{"current_steps": 73630, "total_steps": 76960, "loss": 0.0039, "lr": 2.8478533490358395e-07, "epoch": 19.134615384615383, "percentage": 95.67, "elapsed_time": "1:47:04", "remaining_time": "0:04:50", "throughput": 1032.0, "total_tokens": 6629792} +{"current_steps": 73635, "total_steps": 76960, "loss": 0.0057, "lr": 2.8393264290178243e-07, "epoch": 19.135914760914762, "percentage": 95.68, "elapsed_time": "1:47:04", "remaining_time": "0:04:50", "throughput": 1032.0, "total_tokens": 6630240} +{"current_steps": 73640, "total_steps": 76960, "loss": 0.0065, "lr": 2.8308122207100773e-07, "epoch": 19.137214137214137, "percentage": 95.69, "elapsed_time": "1:47:05", "remaining_time": "0:04:49", "throughput": 1032.0, "total_tokens": 6630688} +{"current_steps": 73645, "total_steps": 76960, "loss": 0.1871, "lr": 2.82231072455047e-07, "epoch": 19.138513513513512, "percentage": 95.69, "elapsed_time": "1:47:05", "remaining_time": "0:04:49", "throughput": 1032.01, "total_tokens": 6631136} +{"current_steps": 73650, "total_steps": 76960, "loss": 0.1032, "lr": 2.8138219409762633e-07, "epoch": 19.13981288981289, "percentage": 95.7, "elapsed_time": "1:47:05", "remaining_time": "0:04:48", "throughput": 1032.0, "total_tokens": 6631552} +{"current_steps": 73655, "total_steps": 76960, "loss": 0.0162, "lr": 2.805345870424025e-07, "epoch": 19.141112266112266, "percentage": 95.71, "elapsed_time": "1:47:06", "remaining_time": "0:04:48", "throughput": 1032.0, "total_tokens": 6631984} +{"current_steps": 73660, "total_steps": 76960, "loss": 0.0685, "lr": 2.796882513329713e-07, "epoch": 19.14241164241164, "percentage": 95.71, "elapsed_time": "1:47:06", "remaining_time": "0:04:47", "throughput": 1032.01, "total_tokens": 6632432} +{"current_steps": 73665, "total_steps": 76960, "loss": 0.0066, "lr": 2.7884318701285885e-07, "epoch": 19.14371101871102, "percentage": 95.72, "elapsed_time": "1:47:07", "remaining_time": "0:04:47", "throughput": 1032.01, "total_tokens": 6632864} +{"current_steps": 73670, "total_steps": 76960, "loss": 0.2459, "lr": 2.779993941255277e-07, "epoch": 19.145010395010395, "percentage": 95.73, "elapsed_time": "1:47:07", "remaining_time": "0:04:47", "throughput": 1032.01, "total_tokens": 6633296} +{"current_steps": 73675, "total_steps": 76960, "loss": 0.0173, "lr": 2.771568727143736e-07, "epoch": 19.14630977130977, "percentage": 95.73, "elapsed_time": "1:47:07", "remaining_time": "0:04:46", "throughput": 1032.01, "total_tokens": 6633760} +{"current_steps": 73680, "total_steps": 76960, "loss": 0.0003, "lr": 2.7631562282273425e-07, "epoch": 19.14760914760915, "percentage": 95.74, "elapsed_time": "1:47:08", "remaining_time": "0:04:46", "throughput": 1032.03, "total_tokens": 6634272} +{"current_steps": 73685, "total_steps": 76960, "loss": 0.2333, "lr": 2.7547564449386664e-07, "epoch": 19.148908523908524, "percentage": 95.74, "elapsed_time": "1:47:08", "remaining_time": "0:04:45", "throughput": 1032.03, "total_tokens": 6634704} +{"current_steps": 73690, "total_steps": 76960, "loss": 0.0026, "lr": 2.7463693777098065e-07, "epoch": 19.1502079002079, "percentage": 95.75, "elapsed_time": "1:47:09", "remaining_time": "0:04:45", "throughput": 1032.04, "total_tokens": 6635232} +{"current_steps": 73695, "total_steps": 76960, "loss": 0.0221, "lr": 2.7379950269720565e-07, "epoch": 19.151507276507278, "percentage": 95.76, "elapsed_time": "1:47:09", "remaining_time": "0:04:44", "throughput": 1032.04, "total_tokens": 6635648} +{"current_steps": 73700, "total_steps": 76960, "loss": 0.0022, "lr": 2.729633393156128e-07, "epoch": 19.152806652806653, "percentage": 95.76, "elapsed_time": "1:47:10", "remaining_time": "0:04:44", "throughput": 1032.04, "total_tokens": 6636096} +{"current_steps": 73705, "total_steps": 76960, "loss": 0.0086, "lr": 2.721284476692093e-07, "epoch": 19.15410602910603, "percentage": 95.77, "elapsed_time": "1:47:10", "remaining_time": "0:04:43", "throughput": 1032.05, "total_tokens": 6636576} +{"current_steps": 73710, "total_steps": 76960, "loss": 0.0395, "lr": 2.7129482780093305e-07, "epoch": 19.155405405405407, "percentage": 95.78, "elapsed_time": "1:47:10", "remaining_time": "0:04:43", "throughput": 1032.05, "total_tokens": 6637024} +{"current_steps": 73715, "total_steps": 76960, "loss": 0.022, "lr": 2.7046247975365815e-07, "epoch": 19.156704781704782, "percentage": 95.78, "elapsed_time": "1:47:11", "remaining_time": "0:04:43", "throughput": 1032.06, "total_tokens": 6637472} +{"current_steps": 73720, "total_steps": 76960, "loss": 0.1497, "lr": 2.6963140357018914e-07, "epoch": 19.158004158004157, "percentage": 95.79, "elapsed_time": "1:47:11", "remaining_time": "0:04:42", "throughput": 1032.06, "total_tokens": 6637904} +{"current_steps": 73725, "total_steps": 76960, "loss": 0.2852, "lr": 2.6880159929327796e-07, "epoch": 19.159303534303536, "percentage": 95.8, "elapsed_time": "1:47:12", "remaining_time": "0:04:42", "throughput": 1032.06, "total_tokens": 6638384} +{"current_steps": 73730, "total_steps": 76960, "loss": 0.094, "lr": 2.679730669655933e-07, "epoch": 19.16060291060291, "percentage": 95.8, "elapsed_time": "1:47:12", "remaining_time": "0:04:41", "throughput": 1032.07, "total_tokens": 6638848} +{"current_steps": 73735, "total_steps": 76960, "loss": 0.0205, "lr": 2.671458066297511e-07, "epoch": 19.161902286902286, "percentage": 95.81, "elapsed_time": "1:47:12", "remaining_time": "0:04:41", "throughput": 1032.07, "total_tokens": 6639296} +{"current_steps": 73740, "total_steps": 76960, "loss": 0.0113, "lr": 2.66319818328295e-07, "epoch": 19.16320166320166, "percentage": 95.82, "elapsed_time": "1:47:13", "remaining_time": "0:04:40", "throughput": 1032.08, "total_tokens": 6639760} +{"current_steps": 73745, "total_steps": 76960, "loss": 0.0069, "lr": 2.6549510210371607e-07, "epoch": 19.16450103950104, "percentage": 95.82, "elapsed_time": "1:47:13", "remaining_time": "0:04:40", "throughput": 1032.08, "total_tokens": 6640192} +{"current_steps": 73750, "total_steps": 76960, "loss": 0.0141, "lr": 2.646716579984193e-07, "epoch": 19.165800415800415, "percentage": 95.83, "elapsed_time": "1:47:14", "remaining_time": "0:04:40", "throughput": 1032.08, "total_tokens": 6640656} +{"current_steps": 73755, "total_steps": 76960, "loss": 0.004, "lr": 2.638494860547597e-07, "epoch": 19.16709979209979, "percentage": 95.84, "elapsed_time": "1:47:14", "remaining_time": "0:04:39", "throughput": 1032.09, "total_tokens": 6641104} +{"current_steps": 73760, "total_steps": 76960, "loss": 0.0015, "lr": 2.6302858631502283e-07, "epoch": 19.16839916839917, "percentage": 95.84, "elapsed_time": "1:47:15", "remaining_time": "0:04:39", "throughput": 1032.09, "total_tokens": 6641536} +{"current_steps": 73765, "total_steps": 76960, "loss": 0.0195, "lr": 2.622089588214277e-07, "epoch": 19.169698544698544, "percentage": 95.85, "elapsed_time": "1:47:15", "remaining_time": "0:04:38", "throughput": 1032.09, "total_tokens": 6642000} +{"current_steps": 73770, "total_steps": 76960, "loss": 0.1285, "lr": 2.613906036161268e-07, "epoch": 19.17099792099792, "percentage": 95.85, "elapsed_time": "1:47:15", "remaining_time": "0:04:38", "throughput": 1032.1, "total_tokens": 6642480} +{"current_steps": 73775, "total_steps": 76960, "loss": 0.1825, "lr": 2.6057352074121134e-07, "epoch": 19.1722972972973, "percentage": 95.86, "elapsed_time": "1:47:16", "remaining_time": "0:04:37", "throughput": 1032.1, "total_tokens": 6642912} +{"current_steps": 73780, "total_steps": 76960, "loss": 0.055, "lr": 2.597577102387061e-07, "epoch": 19.173596673596673, "percentage": 95.87, "elapsed_time": "1:47:16", "remaining_time": "0:04:37", "throughput": 1032.1, "total_tokens": 6643344} +{"current_steps": 73785, "total_steps": 76960, "loss": 0.0002, "lr": 2.5894317215056363e-07, "epoch": 19.17489604989605, "percentage": 95.87, "elapsed_time": "1:47:17", "remaining_time": "0:04:36", "throughput": 1032.1, "total_tokens": 6643776} +{"current_steps": 73790, "total_steps": 76960, "loss": 0.3333, "lr": 2.5812990651868097e-07, "epoch": 19.176195426195427, "percentage": 95.88, "elapsed_time": "1:47:17", "remaining_time": "0:04:36", "throughput": 1032.1, "total_tokens": 6644208} +{"current_steps": 73795, "total_steps": 76960, "loss": 0.2218, "lr": 2.5731791338488296e-07, "epoch": 19.177494802494802, "percentage": 95.89, "elapsed_time": "1:47:17", "remaining_time": "0:04:36", "throughput": 1032.1, "total_tokens": 6644640} +{"current_steps": 73800, "total_steps": 76960, "loss": 0.0042, "lr": 2.5650719279093347e-07, "epoch": 19.178794178794178, "percentage": 95.89, "elapsed_time": "1:47:18", "remaining_time": "0:04:35", "throughput": 1032.1, "total_tokens": 6645056} +{"current_steps": 73805, "total_steps": 76960, "loss": 0.2077, "lr": 2.5569774477852695e-07, "epoch": 19.180093555093556, "percentage": 95.9, "elapsed_time": "1:47:18", "remaining_time": "0:04:35", "throughput": 1032.1, "total_tokens": 6645504} +{"current_steps": 73810, "total_steps": 76960, "loss": 0.1037, "lr": 2.548895693892911e-07, "epoch": 19.18139293139293, "percentage": 95.91, "elapsed_time": "1:47:19", "remaining_time": "0:04:34", "throughput": 1032.1, "total_tokens": 6645952} +{"current_steps": 73815, "total_steps": 76960, "loss": 0.012, "lr": 2.540826666647955e-07, "epoch": 19.182692307692307, "percentage": 95.91, "elapsed_time": "1:47:19", "remaining_time": "0:04:34", "throughput": 1032.11, "total_tokens": 6646400} +{"current_steps": 73820, "total_steps": 76960, "loss": 0.3664, "lr": 2.532770366465431e-07, "epoch": 19.183991683991685, "percentage": 95.92, "elapsed_time": "1:47:20", "remaining_time": "0:04:33", "throughput": 1032.11, "total_tokens": 6646864} +{"current_steps": 73825, "total_steps": 76960, "loss": 0.3938, "lr": 2.524726793759591e-07, "epoch": 19.18529106029106, "percentage": 95.93, "elapsed_time": "1:47:20", "remaining_time": "0:04:33", "throughput": 1032.11, "total_tokens": 6647296} +{"current_steps": 73830, "total_steps": 76960, "loss": 0.0023, "lr": 2.5166959489441866e-07, "epoch": 19.186590436590436, "percentage": 95.93, "elapsed_time": "1:47:20", "remaining_time": "0:04:33", "throughput": 1032.11, "total_tokens": 6647696} +{"current_steps": 73835, "total_steps": 76960, "loss": 0.0016, "lr": 2.508677832432249e-07, "epoch": 19.187889812889814, "percentage": 95.94, "elapsed_time": "1:47:21", "remaining_time": "0:04:32", "throughput": 1032.11, "total_tokens": 6648144} +{"current_steps": 73840, "total_steps": 76960, "loss": 0.0002, "lr": 2.500672444636143e-07, "epoch": 19.18918918918919, "percentage": 95.95, "elapsed_time": "1:47:21", "remaining_time": "0:04:32", "throughput": 1032.11, "total_tokens": 6648576} +{"current_steps": 73845, "total_steps": 76960, "loss": 0.2185, "lr": 2.4926797859675666e-07, "epoch": 19.190488565488565, "percentage": 95.95, "elapsed_time": "1:47:22", "remaining_time": "0:04:31", "throughput": 1032.11, "total_tokens": 6648992} +{"current_steps": 73850, "total_steps": 76960, "loss": 0.025, "lr": 2.484699856837636e-07, "epoch": 19.191787941787943, "percentage": 95.96, "elapsed_time": "1:47:22", "remaining_time": "0:04:31", "throughput": 1032.11, "total_tokens": 6649408} +{"current_steps": 73855, "total_steps": 76960, "loss": 0.0157, "lr": 2.4767326576567716e-07, "epoch": 19.19308731808732, "percentage": 95.97, "elapsed_time": "1:47:22", "remaining_time": "0:04:30", "throughput": 1032.11, "total_tokens": 6649856} +{"current_steps": 73860, "total_steps": 76960, "loss": 0.0006, "lr": 2.468778188834675e-07, "epoch": 19.194386694386694, "percentage": 95.97, "elapsed_time": "1:47:23", "remaining_time": "0:04:30", "throughput": 1032.12, "total_tokens": 6650352} +{"current_steps": 73865, "total_steps": 76960, "loss": 0.0015, "lr": 2.4608364507805184e-07, "epoch": 19.195686070686072, "percentage": 95.98, "elapsed_time": "1:47:23", "remaining_time": "0:04:30", "throughput": 1032.12, "total_tokens": 6650800} +{"current_steps": 73870, "total_steps": 76960, "loss": 0.0181, "lr": 2.4529074439027244e-07, "epoch": 19.196985446985448, "percentage": 95.98, "elapsed_time": "1:47:24", "remaining_time": "0:04:29", "throughput": 1032.12, "total_tokens": 6651232} +{"current_steps": 73875, "total_steps": 76960, "loss": 0.0019, "lr": 2.444991168609079e-07, "epoch": 19.198284823284823, "percentage": 95.99, "elapsed_time": "1:47:24", "remaining_time": "0:04:29", "throughput": 1032.13, "total_tokens": 6651728} +{"current_steps": 73880, "total_steps": 76960, "loss": 0.042, "lr": 2.4370876253067277e-07, "epoch": 19.1995841995842, "percentage": 96.0, "elapsed_time": "1:47:25", "remaining_time": "0:04:28", "throughput": 1032.14, "total_tokens": 6652176} +{"current_steps": 73885, "total_steps": 76960, "loss": 0.0008, "lr": 2.4291968144021516e-07, "epoch": 19.200883575883577, "percentage": 96.0, "elapsed_time": "1:47:25", "remaining_time": "0:04:28", "throughput": 1032.15, "total_tokens": 6652704} +{"current_steps": 73890, "total_steps": 76960, "loss": 0.0331, "lr": 2.421318736301192e-07, "epoch": 19.20218295218295, "percentage": 96.01, "elapsed_time": "1:47:25", "remaining_time": "0:04:27", "throughput": 1032.15, "total_tokens": 6653136} +{"current_steps": 73895, "total_steps": 76960, "loss": 0.0144, "lr": 2.4134533914090817e-07, "epoch": 19.203482328482327, "percentage": 96.02, "elapsed_time": "1:47:26", "remaining_time": "0:04:27", "throughput": 1032.15, "total_tokens": 6653552} +{"current_steps": 73900, "total_steps": 76960, "loss": 0.0006, "lr": 2.405600780130246e-07, "epoch": 19.204781704781706, "percentage": 96.02, "elapsed_time": "1:47:26", "remaining_time": "0:04:26", "throughput": 1032.15, "total_tokens": 6654000} +{"current_steps": 73905, "total_steps": 76960, "loss": 0.0837, "lr": 2.397760902868612e-07, "epoch": 19.20608108108108, "percentage": 96.03, "elapsed_time": "1:47:27", "remaining_time": "0:04:26", "throughput": 1032.15, "total_tokens": 6654416} +{"current_steps": 73910, "total_steps": 76960, "loss": 0.0014, "lr": 2.3899337600273577e-07, "epoch": 19.207380457380456, "percentage": 96.04, "elapsed_time": "1:47:27", "remaining_time": "0:04:26", "throughput": 1032.15, "total_tokens": 6654864} +{"current_steps": 73915, "total_steps": 76960, "loss": 0.0012, "lr": 2.382119352009049e-07, "epoch": 19.208679833679835, "percentage": 96.04, "elapsed_time": "1:47:27", "remaining_time": "0:04:25", "throughput": 1032.16, "total_tokens": 6655312} +{"current_steps": 73920, "total_steps": 76960, "loss": 0.0303, "lr": 2.374317679215643e-07, "epoch": 19.20997920997921, "percentage": 96.05, "elapsed_time": "1:47:28", "remaining_time": "0:04:25", "throughput": 1032.16, "total_tokens": 6655744} +{"current_steps": 73925, "total_steps": 76960, "loss": 0.0006, "lr": 2.3665287420482907e-07, "epoch": 19.211278586278585, "percentage": 96.06, "elapsed_time": "1:47:28", "remaining_time": "0:04:24", "throughput": 1032.16, "total_tokens": 6656208} +{"current_steps": 73930, "total_steps": 76960, "loss": 0.0093, "lr": 2.3587525409076716e-07, "epoch": 19.212577962577964, "percentage": 96.06, "elapsed_time": "1:47:29", "remaining_time": "0:04:24", "throughput": 1032.17, "total_tokens": 6656672} +{"current_steps": 73935, "total_steps": 76960, "loss": 0.0003, "lr": 2.3509890761936882e-07, "epoch": 19.21387733887734, "percentage": 96.07, "elapsed_time": "1:47:29", "remaining_time": "0:04:23", "throughput": 1032.17, "total_tokens": 6657104} +{"current_steps": 73940, "total_steps": 76960, "loss": 0.0003, "lr": 2.3432383483056041e-07, "epoch": 19.215176715176714, "percentage": 96.08, "elapsed_time": "1:47:30", "remaining_time": "0:04:23", "throughput": 1032.17, "total_tokens": 6657552} +{"current_steps": 73945, "total_steps": 76960, "loss": 0.0941, "lr": 2.335500357642073e-07, "epoch": 19.216476091476093, "percentage": 96.08, "elapsed_time": "1:47:30", "remaining_time": "0:04:23", "throughput": 1032.18, "total_tokens": 6658016} +{"current_steps": 73950, "total_steps": 76960, "loss": 0.0949, "lr": 2.3277751046010543e-07, "epoch": 19.217775467775468, "percentage": 96.09, "elapsed_time": "1:47:30", "remaining_time": "0:04:22", "throughput": 1032.18, "total_tokens": 6658464} +{"current_steps": 73955, "total_steps": 76960, "loss": 0.3579, "lr": 2.3200625895798688e-07, "epoch": 19.219074844074843, "percentage": 96.1, "elapsed_time": "1:47:31", "remaining_time": "0:04:22", "throughput": 1032.18, "total_tokens": 6658912} +{"current_steps": 73960, "total_steps": 76960, "loss": 0.0003, "lr": 2.3123628129751996e-07, "epoch": 19.22037422037422, "percentage": 96.1, "elapsed_time": "1:47:31", "remaining_time": "0:04:21", "throughput": 1032.19, "total_tokens": 6659392} +{"current_steps": 73965, "total_steps": 76960, "loss": 0.3203, "lr": 2.3046757751830073e-07, "epoch": 19.221673596673597, "percentage": 96.11, "elapsed_time": "1:47:32", "remaining_time": "0:04:21", "throughput": 1032.19, "total_tokens": 6659840} +{"current_steps": 73970, "total_steps": 76960, "loss": 0.0054, "lr": 2.297001476598698e-07, "epoch": 19.222972972972972, "percentage": 96.11, "elapsed_time": "1:47:32", "remaining_time": "0:04:20", "throughput": 1032.19, "total_tokens": 6660256} +{"current_steps": 73975, "total_steps": 76960, "loss": 0.1865, "lr": 2.2893399176169284e-07, "epoch": 19.22427234927235, "percentage": 96.12, "elapsed_time": "1:47:32", "remaining_time": "0:04:20", "throughput": 1032.19, "total_tokens": 6660688} +{"current_steps": 73980, "total_steps": 76960, "loss": 0.0002, "lr": 2.281691098631744e-07, "epoch": 19.225571725571726, "percentage": 96.13, "elapsed_time": "1:47:33", "remaining_time": "0:04:19", "throughput": 1032.19, "total_tokens": 6661136} +{"current_steps": 73985, "total_steps": 76960, "loss": 0.0458, "lr": 2.274055020036553e-07, "epoch": 19.2268711018711, "percentage": 96.13, "elapsed_time": "1:47:33", "remaining_time": "0:04:19", "throughput": 1032.2, "total_tokens": 6661584} +{"current_steps": 73990, "total_steps": 76960, "loss": 0.461, "lr": 2.2664316822240407e-07, "epoch": 19.22817047817048, "percentage": 96.14, "elapsed_time": "1:47:34", "remaining_time": "0:04:19", "throughput": 1032.2, "total_tokens": 6662032} +{"current_steps": 73995, "total_steps": 76960, "loss": 0.4063, "lr": 2.258821085586338e-07, "epoch": 19.229469854469855, "percentage": 96.15, "elapsed_time": "1:47:34", "remaining_time": "0:04:18", "throughput": 1032.21, "total_tokens": 6662528} +{"current_steps": 74000, "total_steps": 76960, "loss": 0.0015, "lr": 2.251223230514854e-07, "epoch": 19.23076923076923, "percentage": 96.15, "elapsed_time": "1:47:35", "remaining_time": "0:04:18", "throughput": 1032.22, "total_tokens": 6663024} +{"current_steps": 74005, "total_steps": 76960, "loss": 0.0553, "lr": 2.243638117400332e-07, "epoch": 19.23206860706861, "percentage": 96.16, "elapsed_time": "1:47:35", "remaining_time": "0:04:17", "throughput": 1032.22, "total_tokens": 6663456} +{"current_steps": 74010, "total_steps": 76960, "loss": 0.2757, "lr": 2.2360657466328761e-07, "epoch": 19.233367983367984, "percentage": 96.17, "elapsed_time": "1:47:35", "remaining_time": "0:04:17", "throughput": 1032.22, "total_tokens": 6663904} +{"current_steps": 74015, "total_steps": 76960, "loss": 0.1017, "lr": 2.228506118601953e-07, "epoch": 19.23466735966736, "percentage": 96.17, "elapsed_time": "1:47:36", "remaining_time": "0:04:16", "throughput": 1032.22, "total_tokens": 6664320} +{"current_steps": 74020, "total_steps": 76960, "loss": 0.0003, "lr": 2.2209592336963625e-07, "epoch": 19.235966735966738, "percentage": 96.18, "elapsed_time": "1:47:36", "remaining_time": "0:04:16", "throughput": 1032.22, "total_tokens": 6664736} +{"current_steps": 74025, "total_steps": 76960, "loss": 0.0556, "lr": 2.2134250923042665e-07, "epoch": 19.237266112266113, "percentage": 96.19, "elapsed_time": "1:47:37", "remaining_time": "0:04:16", "throughput": 1032.21, "total_tokens": 6665152} +{"current_steps": 74030, "total_steps": 76960, "loss": 0.0003, "lr": 2.205903694813133e-07, "epoch": 19.238565488565488, "percentage": 96.19, "elapsed_time": "1:47:37", "remaining_time": "0:04:15", "throughput": 1032.23, "total_tokens": 6665648} +{"current_steps": 74035, "total_steps": 76960, "loss": 0.5437, "lr": 2.198395041609791e-07, "epoch": 19.239864864864863, "percentage": 96.2, "elapsed_time": "1:47:37", "remaining_time": "0:04:15", "throughput": 1032.23, "total_tokens": 6666096} +{"current_steps": 74040, "total_steps": 76960, "loss": 0.0809, "lr": 2.1908991330804319e-07, "epoch": 19.241164241164242, "percentage": 96.21, "elapsed_time": "1:47:38", "remaining_time": "0:04:14", "throughput": 1032.23, "total_tokens": 6666512} +{"current_steps": 74045, "total_steps": 76960, "loss": 0.1067, "lr": 2.1834159696105528e-07, "epoch": 19.242463617463617, "percentage": 96.21, "elapsed_time": "1:47:38", "remaining_time": "0:04:14", "throughput": 1032.23, "total_tokens": 6666992} +{"current_steps": 74050, "total_steps": 76960, "loss": 0.0866, "lr": 2.175945551585068e-07, "epoch": 19.243762993762992, "percentage": 96.22, "elapsed_time": "1:47:39", "remaining_time": "0:04:13", "throughput": 1032.23, "total_tokens": 6667424} +{"current_steps": 74055, "total_steps": 76960, "loss": 0.2138, "lr": 2.1684878793881146e-07, "epoch": 19.24506237006237, "percentage": 96.23, "elapsed_time": "1:47:39", "remaining_time": "0:04:13", "throughput": 1032.25, "total_tokens": 6667936} +{"current_steps": 74060, "total_steps": 76960, "loss": 0.1322, "lr": 2.1610429534033027e-07, "epoch": 19.246361746361746, "percentage": 96.23, "elapsed_time": "1:47:40", "remaining_time": "0:04:12", "throughput": 1032.25, "total_tokens": 6668384} +{"current_steps": 74065, "total_steps": 76960, "loss": 0.1325, "lr": 2.1536107740135482e-07, "epoch": 19.24766112266112, "percentage": 96.24, "elapsed_time": "1:47:40", "remaining_time": "0:04:12", "throughput": 1032.26, "total_tokens": 6668864} +{"current_steps": 74070, "total_steps": 76960, "loss": 0.334, "lr": 2.1461913416010448e-07, "epoch": 19.2489604989605, "percentage": 96.24, "elapsed_time": "1:47:40", "remaining_time": "0:04:12", "throughput": 1032.26, "total_tokens": 6669328} +{"current_steps": 74075, "total_steps": 76960, "loss": 0.3307, "lr": 2.1387846565474045e-07, "epoch": 19.250259875259875, "percentage": 96.25, "elapsed_time": "1:47:41", "remaining_time": "0:04:11", "throughput": 1032.27, "total_tokens": 6669776} +{"current_steps": 74080, "total_steps": 76960, "loss": 0.2115, "lr": 2.1313907192335724e-07, "epoch": 19.25155925155925, "percentage": 96.26, "elapsed_time": "1:47:41", "remaining_time": "0:04:11", "throughput": 1032.27, "total_tokens": 6670256} +{"current_steps": 74085, "total_steps": 76960, "loss": 0.0194, "lr": 2.1240095300397723e-07, "epoch": 19.25285862785863, "percentage": 96.26, "elapsed_time": "1:47:42", "remaining_time": "0:04:10", "throughput": 1032.28, "total_tokens": 6670704} +{"current_steps": 74090, "total_steps": 76960, "loss": 0.0012, "lr": 2.1166410893457e-07, "epoch": 19.254158004158004, "percentage": 96.27, "elapsed_time": "1:47:42", "remaining_time": "0:04:10", "throughput": 1032.28, "total_tokens": 6671184} +{"current_steps": 74095, "total_steps": 76960, "loss": 0.0327, "lr": 2.109285397530275e-07, "epoch": 19.25545738045738, "percentage": 96.28, "elapsed_time": "1:47:42", "remaining_time": "0:04:09", "throughput": 1032.28, "total_tokens": 6671584} +{"current_steps": 74100, "total_steps": 76960, "loss": 0.4546, "lr": 2.1019424549718335e-07, "epoch": 19.256756756756758, "percentage": 96.28, "elapsed_time": "1:47:43", "remaining_time": "0:04:09", "throughput": 1032.28, "total_tokens": 6672016} +{"current_steps": 74105, "total_steps": 76960, "loss": 0.0009, "lr": 2.09461226204799e-07, "epoch": 19.258056133056133, "percentage": 96.29, "elapsed_time": "1:47:43", "remaining_time": "0:04:09", "throughput": 1032.28, "total_tokens": 6672448} +{"current_steps": 74110, "total_steps": 76960, "loss": 0.0022, "lr": 2.0872948191358045e-07, "epoch": 19.259355509355508, "percentage": 96.3, "elapsed_time": "1:47:44", "remaining_time": "0:04:08", "throughput": 1032.27, "total_tokens": 6672848} +{"current_steps": 74115, "total_steps": 76960, "loss": 0.0004, "lr": 2.0799901266115585e-07, "epoch": 19.260654885654887, "percentage": 96.3, "elapsed_time": "1:47:44", "remaining_time": "0:04:08", "throughput": 1032.28, "total_tokens": 6673296} +{"current_steps": 74120, "total_steps": 76960, "loss": 0.0009, "lr": 2.0726981848509797e-07, "epoch": 19.261954261954262, "percentage": 96.31, "elapsed_time": "1:47:45", "remaining_time": "0:04:07", "throughput": 1032.27, "total_tokens": 6673712} +{"current_steps": 74125, "total_steps": 76960, "loss": 0.0146, "lr": 2.0654189942290735e-07, "epoch": 19.263253638253637, "percentage": 96.32, "elapsed_time": "1:47:45", "remaining_time": "0:04:07", "throughput": 1032.28, "total_tokens": 6674160} +{"current_steps": 74130, "total_steps": 76960, "loss": 0.0035, "lr": 2.0581525551202352e-07, "epoch": 19.264553014553016, "percentage": 96.32, "elapsed_time": "1:47:45", "remaining_time": "0:04:06", "throughput": 1032.28, "total_tokens": 6674592} +{"current_steps": 74135, "total_steps": 76960, "loss": 0.001, "lr": 2.0508988678981656e-07, "epoch": 19.26585239085239, "percentage": 96.33, "elapsed_time": "1:47:46", "remaining_time": "0:04:06", "throughput": 1032.28, "total_tokens": 6675008} +{"current_steps": 74140, "total_steps": 76960, "loss": 0.0118, "lr": 2.043657932935955e-07, "epoch": 19.267151767151766, "percentage": 96.34, "elapsed_time": "1:47:46", "remaining_time": "0:04:05", "throughput": 1032.28, "total_tokens": 6675440} +{"current_steps": 74145, "total_steps": 76960, "loss": 0.1041, "lr": 2.0364297506060003e-07, "epoch": 19.268451143451145, "percentage": 96.34, "elapsed_time": "1:47:47", "remaining_time": "0:04:05", "throughput": 1032.28, "total_tokens": 6675888} +{"current_steps": 74150, "total_steps": 76960, "loss": 0.1016, "lr": 2.029214321280032e-07, "epoch": 19.26975051975052, "percentage": 96.35, "elapsed_time": "1:47:47", "remaining_time": "0:04:05", "throughput": 1032.28, "total_tokens": 6676320} +{"current_steps": 74155, "total_steps": 76960, "loss": 0.0476, "lr": 2.0220116453291693e-07, "epoch": 19.271049896049895, "percentage": 96.36, "elapsed_time": "1:47:47", "remaining_time": "0:04:04", "throughput": 1032.28, "total_tokens": 6676752} +{"current_steps": 74160, "total_steps": 76960, "loss": 0.005, "lr": 2.0148217231238664e-07, "epoch": 19.272349272349274, "percentage": 96.36, "elapsed_time": "1:47:48", "remaining_time": "0:04:04", "throughput": 1032.28, "total_tokens": 6677168} +{"current_steps": 74165, "total_steps": 76960, "loss": 0.002, "lr": 2.007644555033855e-07, "epoch": 19.27364864864865, "percentage": 96.37, "elapsed_time": "1:47:48", "remaining_time": "0:04:03", "throughput": 1032.28, "total_tokens": 6677632} +{"current_steps": 74170, "total_steps": 76960, "loss": 0.0021, "lr": 2.0004801414283402e-07, "epoch": 19.274948024948024, "percentage": 96.37, "elapsed_time": "1:47:49", "remaining_time": "0:04:03", "throughput": 1032.29, "total_tokens": 6678128} +{"current_steps": 74175, "total_steps": 76960, "loss": 0.0198, "lr": 1.9933284826757216e-07, "epoch": 19.276247401247403, "percentage": 96.38, "elapsed_time": "1:47:49", "remaining_time": "0:04:02", "throughput": 1032.29, "total_tokens": 6678544} +{"current_steps": 74180, "total_steps": 76960, "loss": 0.1247, "lr": 1.9861895791438712e-07, "epoch": 19.277546777546778, "percentage": 96.39, "elapsed_time": "1:47:50", "remaining_time": "0:04:02", "throughput": 1032.3, "total_tokens": 6679024} +{"current_steps": 74185, "total_steps": 76960, "loss": 0.1756, "lr": 1.9790634311999124e-07, "epoch": 19.278846153846153, "percentage": 96.39, "elapsed_time": "1:47:50", "remaining_time": "0:04:02", "throughput": 1032.31, "total_tokens": 6679504} +{"current_steps": 74190, "total_steps": 76960, "loss": 0.0008, "lr": 1.971950039210385e-07, "epoch": 19.28014553014553, "percentage": 96.4, "elapsed_time": "1:47:50", "remaining_time": "0:04:01", "throughput": 1032.31, "total_tokens": 6679936} +{"current_steps": 74195, "total_steps": 76960, "loss": 0.0058, "lr": 1.964849403541108e-07, "epoch": 19.281444906444907, "percentage": 96.41, "elapsed_time": "1:47:51", "remaining_time": "0:04:01", "throughput": 1032.31, "total_tokens": 6680368} +{"current_steps": 74200, "total_steps": 76960, "loss": 0.0004, "lr": 1.957761524557261e-07, "epoch": 19.282744282744282, "percentage": 96.41, "elapsed_time": "1:47:51", "remaining_time": "0:04:00", "throughput": 1032.31, "total_tokens": 6680800} +{"current_steps": 74205, "total_steps": 76960, "loss": 0.0111, "lr": 1.950686402623414e-07, "epoch": 19.284043659043657, "percentage": 96.42, "elapsed_time": "1:47:52", "remaining_time": "0:04:00", "throughput": 1032.31, "total_tokens": 6681264} +{"current_steps": 74210, "total_steps": 76960, "loss": 0.0569, "lr": 1.943624038103442e-07, "epoch": 19.285343035343036, "percentage": 96.43, "elapsed_time": "1:47:52", "remaining_time": "0:03:59", "throughput": 1032.31, "total_tokens": 6681696} +{"current_steps": 74215, "total_steps": 76960, "loss": 0.3067, "lr": 1.936574431360555e-07, "epoch": 19.28664241164241, "percentage": 96.43, "elapsed_time": "1:47:52", "remaining_time": "0:03:59", "throughput": 1032.32, "total_tokens": 6682160} +{"current_steps": 74220, "total_steps": 76960, "loss": 0.0071, "lr": 1.9295375827573238e-07, "epoch": 19.287941787941786, "percentage": 96.44, "elapsed_time": "1:47:53", "remaining_time": "0:03:58", "throughput": 1032.32, "total_tokens": 6682624} +{"current_steps": 74225, "total_steps": 76960, "loss": 0.0448, "lr": 1.922513492655653e-07, "epoch": 19.289241164241165, "percentage": 96.45, "elapsed_time": "1:47:53", "remaining_time": "0:03:58", "throughput": 1032.33, "total_tokens": 6683088} +{"current_steps": 74230, "total_steps": 76960, "loss": 0.1007, "lr": 1.915502161416838e-07, "epoch": 19.29054054054054, "percentage": 96.45, "elapsed_time": "1:47:54", "remaining_time": "0:03:58", "throughput": 1032.33, "total_tokens": 6683536} +{"current_steps": 74235, "total_steps": 76960, "loss": 0.0237, "lr": 1.9085035894014224e-07, "epoch": 19.291839916839916, "percentage": 96.46, "elapsed_time": "1:47:54", "remaining_time": "0:03:57", "throughput": 1032.34, "total_tokens": 6684000} +{"current_steps": 74240, "total_steps": 76960, "loss": 0.0399, "lr": 1.901517776969397e-07, "epoch": 19.293139293139294, "percentage": 96.47, "elapsed_time": "1:47:55", "remaining_time": "0:03:57", "throughput": 1032.34, "total_tokens": 6684432} +{"current_steps": 74245, "total_steps": 76960, "loss": 0.0003, "lr": 1.8945447244800297e-07, "epoch": 19.29443866943867, "percentage": 96.47, "elapsed_time": "1:47:55", "remaining_time": "0:03:56", "throughput": 1032.33, "total_tokens": 6684848} +{"current_steps": 74250, "total_steps": 76960, "loss": 0.2293, "lr": 1.88758443229195e-07, "epoch": 19.295738045738045, "percentage": 96.48, "elapsed_time": "1:47:55", "remaining_time": "0:03:56", "throughput": 1032.33, "total_tokens": 6685264} +{"current_steps": 74255, "total_steps": 76960, "loss": 0.0084, "lr": 1.8806369007631219e-07, "epoch": 19.297037422037423, "percentage": 96.49, "elapsed_time": "1:47:56", "remaining_time": "0:03:55", "throughput": 1032.33, "total_tokens": 6685696} +{"current_steps": 74260, "total_steps": 76960, "loss": 0.0008, "lr": 1.8737021302508707e-07, "epoch": 19.2983367983368, "percentage": 96.49, "elapsed_time": "1:47:56", "remaining_time": "0:03:55", "throughput": 1032.33, "total_tokens": 6686144} +{"current_steps": 74265, "total_steps": 76960, "loss": 0.1665, "lr": 1.8667801211118828e-07, "epoch": 19.299636174636174, "percentage": 96.5, "elapsed_time": "1:47:57", "remaining_time": "0:03:55", "throughput": 1032.34, "total_tokens": 6686592} +{"current_steps": 74270, "total_steps": 76960, "loss": 0.0186, "lr": 1.8598708737021243e-07, "epoch": 19.300935550935552, "percentage": 96.5, "elapsed_time": "1:47:57", "remaining_time": "0:03:54", "throughput": 1032.34, "total_tokens": 6687040} +{"current_steps": 74275, "total_steps": 76960, "loss": 0.0271, "lr": 1.852974388376977e-07, "epoch": 19.302234927234927, "percentage": 96.51, "elapsed_time": "1:47:57", "remaining_time": "0:03:54", "throughput": 1032.34, "total_tokens": 6687472} +{"current_steps": 74280, "total_steps": 76960, "loss": 0.0012, "lr": 1.8460906654911014e-07, "epoch": 19.303534303534303, "percentage": 96.52, "elapsed_time": "1:47:58", "remaining_time": "0:03:53", "throughput": 1032.35, "total_tokens": 6687936} +{"current_steps": 74285, "total_steps": 76960, "loss": 0.1129, "lr": 1.839219705398576e-07, "epoch": 19.30483367983368, "percentage": 96.52, "elapsed_time": "1:47:58", "remaining_time": "0:03:53", "throughput": 1032.35, "total_tokens": 6688368} +{"current_steps": 74290, "total_steps": 76960, "loss": 0.0132, "lr": 1.832361508452729e-07, "epoch": 19.306133056133056, "percentage": 96.53, "elapsed_time": "1:47:59", "remaining_time": "0:03:52", "throughput": 1032.35, "total_tokens": 6688816} +{"current_steps": 74295, "total_steps": 76960, "loss": 0.0019, "lr": 1.8255160750063338e-07, "epoch": 19.30743243243243, "percentage": 96.54, "elapsed_time": "1:47:59", "remaining_time": "0:03:52", "throughput": 1032.35, "total_tokens": 6689264} +{"current_steps": 74300, "total_steps": 76960, "loss": 0.0002, "lr": 1.8186834054114422e-07, "epoch": 19.30873180873181, "percentage": 96.54, "elapsed_time": "1:48:00", "remaining_time": "0:03:51", "throughput": 1032.35, "total_tokens": 6689696} +{"current_steps": 74305, "total_steps": 76960, "loss": 0.1327, "lr": 1.8118635000194396e-07, "epoch": 19.310031185031185, "percentage": 96.55, "elapsed_time": "1:48:00", "remaining_time": "0:03:51", "throughput": 1032.35, "total_tokens": 6690128} +{"current_steps": 74310, "total_steps": 76960, "loss": 0.0009, "lr": 1.805056359181101e-07, "epoch": 19.31133056133056, "percentage": 96.56, "elapsed_time": "1:48:00", "remaining_time": "0:03:51", "throughput": 1032.36, "total_tokens": 6690624} +{"current_steps": 74315, "total_steps": 76960, "loss": 0.0003, "lr": 1.7982619832465353e-07, "epoch": 19.31262993762994, "percentage": 96.56, "elapsed_time": "1:48:01", "remaining_time": "0:03:50", "throughput": 1032.37, "total_tokens": 6691072} +{"current_steps": 74320, "total_steps": 76960, "loss": 0.022, "lr": 1.7914803725651573e-07, "epoch": 19.313929313929314, "percentage": 96.57, "elapsed_time": "1:48:01", "remaining_time": "0:03:50", "throughput": 1032.38, "total_tokens": 6691568} +{"current_steps": 74325, "total_steps": 76960, "loss": 0.1351, "lr": 1.7847115274857718e-07, "epoch": 19.31522869022869, "percentage": 96.58, "elapsed_time": "1:48:02", "remaining_time": "0:03:49", "throughput": 1032.38, "total_tokens": 6692016} +{"current_steps": 74330, "total_steps": 76960, "loss": 0.0868, "lr": 1.7779554483565163e-07, "epoch": 19.316528066528065, "percentage": 96.58, "elapsed_time": "1:48:02", "remaining_time": "0:03:49", "throughput": 1032.38, "total_tokens": 6692448} +{"current_steps": 74335, "total_steps": 76960, "loss": 0.1206, "lr": 1.7712121355248356e-07, "epoch": 19.317827442827443, "percentage": 96.59, "elapsed_time": "1:48:02", "remaining_time": "0:03:48", "throughput": 1032.38, "total_tokens": 6692896} +{"current_steps": 74340, "total_steps": 76960, "loss": 0.2277, "lr": 1.7644815893375632e-07, "epoch": 19.31912681912682, "percentage": 96.6, "elapsed_time": "1:48:03", "remaining_time": "0:03:48", "throughput": 1032.38, "total_tokens": 6693328} +{"current_steps": 74345, "total_steps": 76960, "loss": 0.2095, "lr": 1.7577638101408389e-07, "epoch": 19.320426195426194, "percentage": 96.6, "elapsed_time": "1:48:03", "remaining_time": "0:03:48", "throughput": 1032.39, "total_tokens": 6693792} +{"current_steps": 74350, "total_steps": 76960, "loss": 0.23, "lr": 1.7510587982801641e-07, "epoch": 19.321725571725572, "percentage": 96.61, "elapsed_time": "1:48:04", "remaining_time": "0:03:47", "throughput": 1032.4, "total_tokens": 6694304} +{"current_steps": 74355, "total_steps": 76960, "loss": 0.0002, "lr": 1.7443665541004016e-07, "epoch": 19.323024948024948, "percentage": 96.62, "elapsed_time": "1:48:04", "remaining_time": "0:03:47", "throughput": 1032.4, "total_tokens": 6694752} +{"current_steps": 74360, "total_steps": 76960, "loss": 0.0021, "lr": 1.7376870779457487e-07, "epoch": 19.324324324324323, "percentage": 96.62, "elapsed_time": "1:48:05", "remaining_time": "0:03:46", "throughput": 1032.41, "total_tokens": 6695216} +{"current_steps": 74365, "total_steps": 76960, "loss": 0.0093, "lr": 1.731020370159736e-07, "epoch": 19.3256237006237, "percentage": 96.63, "elapsed_time": "1:48:05", "remaining_time": "0:03:46", "throughput": 1032.41, "total_tokens": 6695664} +{"current_steps": 74370, "total_steps": 76960, "loss": 0.0036, "lr": 1.7243664310852003e-07, "epoch": 19.326923076923077, "percentage": 96.63, "elapsed_time": "1:48:05", "remaining_time": "0:03:45", "throughput": 1032.41, "total_tokens": 6696112} +{"current_steps": 74375, "total_steps": 76960, "loss": 0.0003, "lr": 1.7177252610643958e-07, "epoch": 19.328222453222452, "percentage": 96.64, "elapsed_time": "1:48:06", "remaining_time": "0:03:45", "throughput": 1032.42, "total_tokens": 6696576} +{"current_steps": 74380, "total_steps": 76960, "loss": 0.0328, "lr": 1.7110968604388544e-07, "epoch": 19.32952182952183, "percentage": 96.65, "elapsed_time": "1:48:06", "remaining_time": "0:03:45", "throughput": 1032.42, "total_tokens": 6697024} +{"current_steps": 74385, "total_steps": 76960, "loss": 0.1391, "lr": 1.704481229549526e-07, "epoch": 19.330821205821206, "percentage": 96.65, "elapsed_time": "1:48:07", "remaining_time": "0:03:44", "throughput": 1032.43, "total_tokens": 6697504} +{"current_steps": 74390, "total_steps": 76960, "loss": 0.1668, "lr": 1.6978783687366107e-07, "epoch": 19.33212058212058, "percentage": 96.66, "elapsed_time": "1:48:07", "remaining_time": "0:03:44", "throughput": 1032.44, "total_tokens": 6698000} +{"current_steps": 74395, "total_steps": 76960, "loss": 0.0037, "lr": 1.691288278339753e-07, "epoch": 19.33341995841996, "percentage": 96.67, "elapsed_time": "1:48:07", "remaining_time": "0:03:43", "throughput": 1032.44, "total_tokens": 6698432} +{"current_steps": 74400, "total_steps": 76960, "loss": 0.0018, "lr": 1.6847109586978216e-07, "epoch": 19.334719334719335, "percentage": 96.67, "elapsed_time": "1:48:08", "remaining_time": "0:03:43", "throughput": 1032.45, "total_tokens": 6698896} +{"current_steps": 74405, "total_steps": 76960, "loss": 0.0211, "lr": 1.678146410149156e-07, "epoch": 19.33601871101871, "percentage": 96.68, "elapsed_time": "1:48:08", "remaining_time": "0:03:42", "throughput": 1032.45, "total_tokens": 6699360} +{"current_steps": 74410, "total_steps": 76960, "loss": 0.0525, "lr": 1.671594633031348e-07, "epoch": 19.33731808731809, "percentage": 96.69, "elapsed_time": "1:48:09", "remaining_time": "0:03:42", "throughput": 1032.45, "total_tokens": 6699808} +{"current_steps": 74415, "total_steps": 76960, "loss": 0.0083, "lr": 1.66505562768135e-07, "epoch": 19.338617463617464, "percentage": 96.69, "elapsed_time": "1:48:09", "remaining_time": "0:03:41", "throughput": 1032.46, "total_tokens": 6700240} +{"current_steps": 74420, "total_steps": 76960, "loss": 0.0005, "lr": 1.6585293944354762e-07, "epoch": 19.33991683991684, "percentage": 96.7, "elapsed_time": "1:48:10", "remaining_time": "0:03:41", "throughput": 1032.46, "total_tokens": 6700720} +{"current_steps": 74425, "total_steps": 76960, "loss": 0.0007, "lr": 1.6520159336294306e-07, "epoch": 19.341216216216218, "percentage": 96.71, "elapsed_time": "1:48:10", "remaining_time": "0:03:41", "throughput": 1032.46, "total_tokens": 6701120} +{"current_steps": 74430, "total_steps": 76960, "loss": 0.0014, "lr": 1.6455152455981392e-07, "epoch": 19.342515592515593, "percentage": 96.71, "elapsed_time": "1:48:10", "remaining_time": "0:03:40", "throughput": 1032.46, "total_tokens": 6701584} +{"current_steps": 74435, "total_steps": 76960, "loss": 0.0038, "lr": 1.6390273306759463e-07, "epoch": 19.343814968814968, "percentage": 96.72, "elapsed_time": "1:48:11", "remaining_time": "0:03:40", "throughput": 1032.47, "total_tokens": 6702032} +{"current_steps": 74440, "total_steps": 76960, "loss": 0.0569, "lr": 1.6325521891965568e-07, "epoch": 19.345114345114347, "percentage": 96.73, "elapsed_time": "1:48:11", "remaining_time": "0:03:39", "throughput": 1032.47, "total_tokens": 6702480} +{"current_steps": 74445, "total_steps": 76960, "loss": 0.0012, "lr": 1.6260898214929542e-07, "epoch": 19.34641372141372, "percentage": 96.73, "elapsed_time": "1:48:12", "remaining_time": "0:03:39", "throughput": 1032.48, "total_tokens": 6702944} +{"current_steps": 74450, "total_steps": 76960, "loss": 0.0059, "lr": 1.6196402278975675e-07, "epoch": 19.347713097713097, "percentage": 96.74, "elapsed_time": "1:48:12", "remaining_time": "0:03:38", "throughput": 1032.48, "total_tokens": 6703376} +{"current_steps": 74455, "total_steps": 76960, "loss": 0.1383, "lr": 1.6132034087420477e-07, "epoch": 19.349012474012476, "percentage": 96.75, "elapsed_time": "1:48:12", "remaining_time": "0:03:38", "throughput": 1032.47, "total_tokens": 6703792} +{"current_steps": 74460, "total_steps": 76960, "loss": 0.0002, "lr": 1.6067793643574912e-07, "epoch": 19.35031185031185, "percentage": 96.75, "elapsed_time": "1:48:13", "remaining_time": "0:03:38", "throughput": 1032.48, "total_tokens": 6704256} +{"current_steps": 74465, "total_steps": 76960, "loss": 0.0004, "lr": 1.6003680950742728e-07, "epoch": 19.351611226611226, "percentage": 96.76, "elapsed_time": "1:48:13", "remaining_time": "0:03:37", "throughput": 1032.48, "total_tokens": 6704720} +{"current_steps": 74470, "total_steps": 76960, "loss": 0.011, "lr": 1.5939696012221007e-07, "epoch": 19.352910602910605, "percentage": 96.76, "elapsed_time": "1:48:14", "remaining_time": "0:03:37", "throughput": 1032.48, "total_tokens": 6705136} +{"current_steps": 74475, "total_steps": 76960, "loss": 0.0025, "lr": 1.5875838831301004e-07, "epoch": 19.35420997920998, "percentage": 96.77, "elapsed_time": "1:48:14", "remaining_time": "0:03:36", "throughput": 1032.49, "total_tokens": 6705600} +{"current_steps": 74480, "total_steps": 76960, "loss": 0.0011, "lr": 1.5812109411266762e-07, "epoch": 19.355509355509355, "percentage": 96.78, "elapsed_time": "1:48:15", "remaining_time": "0:03:36", "throughput": 1032.49, "total_tokens": 6706048} +{"current_steps": 74485, "total_steps": 76960, "loss": 0.0671, "lr": 1.5748507755395936e-07, "epoch": 19.35680873180873, "percentage": 96.78, "elapsed_time": "1:48:15", "remaining_time": "0:03:35", "throughput": 1032.49, "total_tokens": 6706480} +{"current_steps": 74490, "total_steps": 76960, "loss": 0.0207, "lr": 1.5685033866959798e-07, "epoch": 19.35810810810811, "percentage": 96.79, "elapsed_time": "1:48:15", "remaining_time": "0:03:35", "throughput": 1032.49, "total_tokens": 6706928} +{"current_steps": 74495, "total_steps": 76960, "loss": 0.0015, "lr": 1.5621687749222679e-07, "epoch": 19.359407484407484, "percentage": 96.8, "elapsed_time": "1:48:16", "remaining_time": "0:03:34", "throughput": 1032.5, "total_tokens": 6707392} +{"current_steps": 74500, "total_steps": 76960, "loss": 0.0182, "lr": 1.5558469405442534e-07, "epoch": 19.36070686070686, "percentage": 96.8, "elapsed_time": "1:48:16", "remaining_time": "0:03:34", "throughput": 1032.5, "total_tokens": 6707872} +{"current_steps": 74505, "total_steps": 76960, "loss": 0.0328, "lr": 1.5495378838870643e-07, "epoch": 19.362006237006238, "percentage": 96.81, "elapsed_time": "1:48:17", "remaining_time": "0:03:34", "throughput": 1032.5, "total_tokens": 6708288} +{"current_steps": 74510, "total_steps": 76960, "loss": 0.0005, "lr": 1.5432416052752198e-07, "epoch": 19.363305613305613, "percentage": 96.82, "elapsed_time": "1:48:17", "remaining_time": "0:03:33", "throughput": 1032.51, "total_tokens": 6708752} +{"current_steps": 74515, "total_steps": 76960, "loss": 0.1366, "lr": 1.5369581050325155e-07, "epoch": 19.364604989604988, "percentage": 96.82, "elapsed_time": "1:48:17", "remaining_time": "0:03:33", "throughput": 1032.51, "total_tokens": 6709216} +{"current_steps": 74520, "total_steps": 76960, "loss": 0.0001, "lr": 1.5306873834821102e-07, "epoch": 19.365904365904367, "percentage": 96.83, "elapsed_time": "1:48:18", "remaining_time": "0:03:32", "throughput": 1032.51, "total_tokens": 6709664} +{"current_steps": 74525, "total_steps": 76960, "loss": 0.1629, "lr": 1.5244294409465232e-07, "epoch": 19.367203742203742, "percentage": 96.84, "elapsed_time": "1:48:18", "remaining_time": "0:03:32", "throughput": 1032.52, "total_tokens": 6710112} +{"current_steps": 74530, "total_steps": 76960, "loss": 0.0286, "lr": 1.5181842777476084e-07, "epoch": 19.368503118503117, "percentage": 96.84, "elapsed_time": "1:48:19", "remaining_time": "0:03:31", "throughput": 1032.52, "total_tokens": 6710544} +{"current_steps": 74535, "total_steps": 76960, "loss": 0.0149, "lr": 1.5119518942065535e-07, "epoch": 19.369802494802496, "percentage": 96.85, "elapsed_time": "1:48:19", "remaining_time": "0:03:31", "throughput": 1032.52, "total_tokens": 6710992} +{"current_steps": 74540, "total_steps": 76960, "loss": 0.0871, "lr": 1.5057322906439075e-07, "epoch": 19.37110187110187, "percentage": 96.86, "elapsed_time": "1:48:20", "remaining_time": "0:03:31", "throughput": 1032.52, "total_tokens": 6711440} +{"current_steps": 74545, "total_steps": 76960, "loss": 0.0001, "lr": 1.4995254673795812e-07, "epoch": 19.372401247401246, "percentage": 96.86, "elapsed_time": "1:48:20", "remaining_time": "0:03:30", "throughput": 1032.53, "total_tokens": 6711904} +{"current_steps": 74550, "total_steps": 76960, "loss": 0.0022, "lr": 1.4933314247327078e-07, "epoch": 19.373700623700625, "percentage": 96.87, "elapsed_time": "1:48:20", "remaining_time": "0:03:30", "throughput": 1032.54, "total_tokens": 6712384} +{"current_steps": 74555, "total_steps": 76960, "loss": 0.0576, "lr": 1.48715016302195e-07, "epoch": 19.375, "percentage": 96.88, "elapsed_time": "1:48:21", "remaining_time": "0:03:29", "throughput": 1032.54, "total_tokens": 6712832} +{"current_steps": 74560, "total_steps": 76960, "loss": 0.0022, "lr": 1.4809816825651356e-07, "epoch": 19.376299376299375, "percentage": 96.88, "elapsed_time": "1:48:21", "remaining_time": "0:03:29", "throughput": 1032.54, "total_tokens": 6713264} +{"current_steps": 74565, "total_steps": 76960, "loss": 0.0003, "lr": 1.4748259836795675e-07, "epoch": 19.377598752598754, "percentage": 96.89, "elapsed_time": "1:48:22", "remaining_time": "0:03:28", "throughput": 1032.55, "total_tokens": 6713760} +{"current_steps": 74570, "total_steps": 76960, "loss": 0.4416, "lr": 1.468683066681853e-07, "epoch": 19.37889812889813, "percentage": 96.89, "elapsed_time": "1:48:22", "remaining_time": "0:03:28", "throughput": 1032.55, "total_tokens": 6714224} +{"current_steps": 74575, "total_steps": 76960, "loss": 0.0156, "lr": 1.4625529318878505e-07, "epoch": 19.380197505197504, "percentage": 96.9, "elapsed_time": "1:48:22", "remaining_time": "0:03:27", "throughput": 1032.56, "total_tokens": 6714656} +{"current_steps": 74580, "total_steps": 76960, "loss": 0.2713, "lr": 1.4564355796129193e-07, "epoch": 19.381496881496883, "percentage": 96.91, "elapsed_time": "1:48:23", "remaining_time": "0:03:27", "throughput": 1032.56, "total_tokens": 6715136} +{"current_steps": 74585, "total_steps": 76960, "loss": 0.0099, "lr": 1.4503310101716406e-07, "epoch": 19.382796257796258, "percentage": 96.91, "elapsed_time": "1:48:23", "remaining_time": "0:03:27", "throughput": 1032.57, "total_tokens": 6715584} +{"current_steps": 74590, "total_steps": 76960, "loss": 0.0011, "lr": 1.4442392238779856e-07, "epoch": 19.384095634095633, "percentage": 96.92, "elapsed_time": "1:48:24", "remaining_time": "0:03:26", "throughput": 1032.57, "total_tokens": 6716032} +{"current_steps": 74595, "total_steps": 76960, "loss": 0.0026, "lr": 1.4381602210452593e-07, "epoch": 19.385395010395012, "percentage": 96.93, "elapsed_time": "1:48:24", "remaining_time": "0:03:26", "throughput": 1032.57, "total_tokens": 6716464} +{"current_steps": 74600, "total_steps": 76960, "loss": 0.0476, "lr": 1.4320940019861283e-07, "epoch": 19.386694386694387, "percentage": 96.93, "elapsed_time": "1:48:25", "remaining_time": "0:03:25", "throughput": 1032.57, "total_tokens": 6716896} +{"current_steps": 74605, "total_steps": 76960, "loss": 0.0507, "lr": 1.4260405670125378e-07, "epoch": 19.387993762993762, "percentage": 96.94, "elapsed_time": "1:48:25", "remaining_time": "0:03:25", "throughput": 1032.58, "total_tokens": 6717360} +{"current_steps": 74610, "total_steps": 76960, "loss": 0.0004, "lr": 1.4199999164359045e-07, "epoch": 19.38929313929314, "percentage": 96.95, "elapsed_time": "1:48:25", "remaining_time": "0:03:24", "throughput": 1032.58, "total_tokens": 6717792} +{"current_steps": 74615, "total_steps": 76960, "loss": 0.0027, "lr": 1.4139720505668141e-07, "epoch": 19.390592515592516, "percentage": 96.95, "elapsed_time": "1:48:26", "remaining_time": "0:03:24", "throughput": 1032.58, "total_tokens": 6718256} +{"current_steps": 74620, "total_steps": 76960, "loss": 0.0186, "lr": 1.4079569697153239e-07, "epoch": 19.39189189189189, "percentage": 96.96, "elapsed_time": "1:48:26", "remaining_time": "0:03:24", "throughput": 1032.59, "total_tokens": 6718736} +{"current_steps": 74625, "total_steps": 76960, "loss": 0.053, "lr": 1.4019546741908251e-07, "epoch": 19.39319126819127, "percentage": 96.97, "elapsed_time": "1:48:27", "remaining_time": "0:03:23", "throughput": 1032.59, "total_tokens": 6719200} +{"current_steps": 74630, "total_steps": 76960, "loss": 0.0234, "lr": 1.39596516430196e-07, "epoch": 19.394490644490645, "percentage": 96.97, "elapsed_time": "1:48:27", "remaining_time": "0:03:23", "throughput": 1032.6, "total_tokens": 6719632} +{"current_steps": 74635, "total_steps": 76960, "loss": 0.1017, "lr": 1.3899884403568153e-07, "epoch": 19.39579002079002, "percentage": 96.98, "elapsed_time": "1:48:27", "remaining_time": "0:03:22", "throughput": 1032.6, "total_tokens": 6720112} +{"current_steps": 74640, "total_steps": 76960, "loss": 0.1185, "lr": 1.384024502662784e-07, "epoch": 19.397089397089395, "percentage": 96.99, "elapsed_time": "1:48:28", "remaining_time": "0:03:22", "throughput": 1032.61, "total_tokens": 6720592} +{"current_steps": 74645, "total_steps": 76960, "loss": 0.2012, "lr": 1.378073351526593e-07, "epoch": 19.398388773388774, "percentage": 96.99, "elapsed_time": "1:48:28", "remaining_time": "0:03:21", "throughput": 1032.61, "total_tokens": 6721040} +{"current_steps": 74650, "total_steps": 76960, "loss": 0.0714, "lr": 1.3721349872542756e-07, "epoch": 19.39968814968815, "percentage": 97.0, "elapsed_time": "1:48:29", "remaining_time": "0:03:21", "throughput": 1032.62, "total_tokens": 6721504} +{"current_steps": 74655, "total_steps": 76960, "loss": 0.0764, "lr": 1.366209410151309e-07, "epoch": 19.400987525987524, "percentage": 97.0, "elapsed_time": "1:48:29", "remaining_time": "0:03:20", "throughput": 1032.62, "total_tokens": 6721968} +{"current_steps": 74660, "total_steps": 76960, "loss": 0.0098, "lr": 1.3602966205223943e-07, "epoch": 19.402286902286903, "percentage": 97.01, "elapsed_time": "1:48:30", "remaining_time": "0:03:20", "throughput": 1032.63, "total_tokens": 6722432} +{"current_steps": 74665, "total_steps": 76960, "loss": 0.0032, "lr": 1.3543966186716773e-07, "epoch": 19.40358627858628, "percentage": 97.02, "elapsed_time": "1:48:30", "remaining_time": "0:03:20", "throughput": 1032.64, "total_tokens": 6722944} +{"current_steps": 74670, "total_steps": 76960, "loss": 0.0018, "lr": 1.3485094049025816e-07, "epoch": 19.404885654885653, "percentage": 97.02, "elapsed_time": "1:48:30", "remaining_time": "0:03:19", "throughput": 1032.64, "total_tokens": 6723376} +{"current_steps": 74675, "total_steps": 76960, "loss": 0.0067, "lr": 1.3426349795178926e-07, "epoch": 19.406185031185032, "percentage": 97.03, "elapsed_time": "1:48:31", "remaining_time": "0:03:19", "throughput": 1032.64, "total_tokens": 6723808} +{"current_steps": 74680, "total_steps": 76960, "loss": 0.0042, "lr": 1.3367733428197304e-07, "epoch": 19.407484407484407, "percentage": 97.04, "elapsed_time": "1:48:31", "remaining_time": "0:03:18", "throughput": 1032.65, "total_tokens": 6724256} +{"current_steps": 74685, "total_steps": 76960, "loss": 0.0074, "lr": 1.3309244951095756e-07, "epoch": 19.408783783783782, "percentage": 97.04, "elapsed_time": "1:48:32", "remaining_time": "0:03:18", "throughput": 1032.65, "total_tokens": 6724720} +{"current_steps": 74690, "total_steps": 76960, "loss": 0.0716, "lr": 1.325088436688271e-07, "epoch": 19.41008316008316, "percentage": 97.05, "elapsed_time": "1:48:32", "remaining_time": "0:03:17", "throughput": 1032.66, "total_tokens": 6725216} +{"current_steps": 74695, "total_steps": 76960, "loss": 0.0001, "lr": 1.319265167855882e-07, "epoch": 19.411382536382536, "percentage": 97.06, "elapsed_time": "1:48:32", "remaining_time": "0:03:17", "throughput": 1032.67, "total_tokens": 6725664} +{"current_steps": 74700, "total_steps": 76960, "loss": 0.0028, "lr": 1.3134546889120026e-07, "epoch": 19.41268191268191, "percentage": 97.06, "elapsed_time": "1:48:33", "remaining_time": "0:03:17", "throughput": 1032.68, "total_tokens": 6726160} +{"current_steps": 74705, "total_steps": 76960, "loss": 0.0982, "lr": 1.3076570001553934e-07, "epoch": 19.41398128898129, "percentage": 97.07, "elapsed_time": "1:48:33", "remaining_time": "0:03:16", "throughput": 1032.68, "total_tokens": 6726608} +{"current_steps": 74710, "total_steps": 76960, "loss": 0.0072, "lr": 1.3018721018842883e-07, "epoch": 19.415280665280665, "percentage": 97.08, "elapsed_time": "1:48:34", "remaining_time": "0:03:16", "throughput": 1032.68, "total_tokens": 6727072} +{"current_steps": 74715, "total_steps": 76960, "loss": 0.0094, "lr": 1.2960999943961992e-07, "epoch": 19.41658004158004, "percentage": 97.08, "elapsed_time": "1:48:34", "remaining_time": "0:03:15", "throughput": 1032.69, "total_tokens": 6727536} +{"current_steps": 74720, "total_steps": 76960, "loss": 0.0281, "lr": 1.2903406779879722e-07, "epoch": 19.41787941787942, "percentage": 97.09, "elapsed_time": "1:48:34", "remaining_time": "0:03:15", "throughput": 1032.7, "total_tokens": 6728016} +{"current_steps": 74725, "total_steps": 76960, "loss": 0.4705, "lr": 1.2845941529558424e-07, "epoch": 19.419178794178794, "percentage": 97.1, "elapsed_time": "1:48:35", "remaining_time": "0:03:14", "throughput": 1032.69, "total_tokens": 6728432} +{"current_steps": 74730, "total_steps": 76960, "loss": 0.0003, "lr": 1.2788604195953234e-07, "epoch": 19.42047817047817, "percentage": 97.1, "elapsed_time": "1:48:35", "remaining_time": "0:03:14", "throughput": 1032.7, "total_tokens": 6728880} +{"current_steps": 74735, "total_steps": 76960, "loss": 0.2007, "lr": 1.273139478201346e-07, "epoch": 19.421777546777548, "percentage": 97.11, "elapsed_time": "1:48:36", "remaining_time": "0:03:14", "throughput": 1032.7, "total_tokens": 6729296} +{"current_steps": 74740, "total_steps": 76960, "loss": 0.0246, "lr": 1.2674313290680916e-07, "epoch": 19.423076923076923, "percentage": 97.12, "elapsed_time": "1:48:36", "remaining_time": "0:03:13", "throughput": 1032.7, "total_tokens": 6729728} +{"current_steps": 74745, "total_steps": 76960, "loss": 0.0007, "lr": 1.2617359724891863e-07, "epoch": 19.4243762993763, "percentage": 97.12, "elapsed_time": "1:48:37", "remaining_time": "0:03:13", "throughput": 1032.7, "total_tokens": 6730176} +{"current_steps": 74750, "total_steps": 76960, "loss": 0.1564, "lr": 1.2560534087575349e-07, "epoch": 19.425675675675677, "percentage": 97.13, "elapsed_time": "1:48:37", "remaining_time": "0:03:12", "throughput": 1032.7, "total_tokens": 6730624} +{"current_steps": 74755, "total_steps": 76960, "loss": 0.1978, "lr": 1.2503836381654032e-07, "epoch": 19.426975051975052, "percentage": 97.13, "elapsed_time": "1:48:37", "remaining_time": "0:03:12", "throughput": 1032.71, "total_tokens": 6731088} +{"current_steps": 74760, "total_steps": 76960, "loss": 0.0062, "lr": 1.244726661004364e-07, "epoch": 19.428274428274428, "percentage": 97.14, "elapsed_time": "1:48:38", "remaining_time": "0:03:11", "throughput": 1032.71, "total_tokens": 6731552} +{"current_steps": 74765, "total_steps": 76960, "loss": 0.0072, "lr": 1.2390824775653788e-07, "epoch": 19.429573804573806, "percentage": 97.15, "elapsed_time": "1:48:38", "remaining_time": "0:03:11", "throughput": 1032.71, "total_tokens": 6731968} +{"current_steps": 74770, "total_steps": 76960, "loss": 0.1766, "lr": 1.233451088138743e-07, "epoch": 19.43087318087318, "percentage": 97.15, "elapsed_time": "1:48:39", "remaining_time": "0:03:10", "throughput": 1032.71, "total_tokens": 6732400} +{"current_steps": 74775, "total_steps": 76960, "loss": 0.071, "lr": 1.2278324930140585e-07, "epoch": 19.432172557172557, "percentage": 97.16, "elapsed_time": "1:48:39", "remaining_time": "0:03:10", "throughput": 1032.71, "total_tokens": 6732816} +{"current_steps": 74780, "total_steps": 76960, "loss": 0.1949, "lr": 1.2222266924803161e-07, "epoch": 19.433471933471935, "percentage": 97.17, "elapsed_time": "1:48:39", "remaining_time": "0:03:10", "throughput": 1032.71, "total_tokens": 6733264} +{"current_steps": 74785, "total_steps": 76960, "loss": 0.0954, "lr": 1.216633686825841e-07, "epoch": 19.43477130977131, "percentage": 97.17, "elapsed_time": "1:48:40", "remaining_time": "0:03:09", "throughput": 1032.71, "total_tokens": 6733696} +{"current_steps": 74790, "total_steps": 76960, "loss": 0.0085, "lr": 1.2110534763382365e-07, "epoch": 19.436070686070686, "percentage": 97.18, "elapsed_time": "1:48:40", "remaining_time": "0:03:09", "throughput": 1032.71, "total_tokens": 6734144} +{"current_steps": 74795, "total_steps": 76960, "loss": 0.5306, "lr": 1.2054860613045504e-07, "epoch": 19.43737006237006, "percentage": 97.19, "elapsed_time": "1:48:41", "remaining_time": "0:03:08", "throughput": 1032.72, "total_tokens": 6734624} +{"current_steps": 74800, "total_steps": 76960, "loss": 0.0254, "lr": 1.1999314420111095e-07, "epoch": 19.43866943866944, "percentage": 97.19, "elapsed_time": "1:48:41", "remaining_time": "0:03:08", "throughput": 1032.73, "total_tokens": 6735088} +{"current_steps": 74805, "total_steps": 76960, "loss": 0.3679, "lr": 1.1943896187435744e-07, "epoch": 19.439968814968815, "percentage": 97.2, "elapsed_time": "1:48:42", "remaining_time": "0:03:07", "throughput": 1032.73, "total_tokens": 6735552} +{"current_steps": 74810, "total_steps": 76960, "loss": 0.0334, "lr": 1.1888605917869666e-07, "epoch": 19.44126819126819, "percentage": 97.21, "elapsed_time": "1:48:42", "remaining_time": "0:03:07", "throughput": 1032.73, "total_tokens": 6735984} +{"current_steps": 74815, "total_steps": 76960, "loss": 0.0527, "lr": 1.1833443614256423e-07, "epoch": 19.44256756756757, "percentage": 97.21, "elapsed_time": "1:48:42", "remaining_time": "0:03:07", "throughput": 1032.75, "total_tokens": 6736496} +{"current_steps": 74820, "total_steps": 76960, "loss": 0.0004, "lr": 1.1778409279433467e-07, "epoch": 19.443866943866944, "percentage": 97.22, "elapsed_time": "1:48:43", "remaining_time": "0:03:06", "throughput": 1032.75, "total_tokens": 6736976} +{"current_steps": 74825, "total_steps": 76960, "loss": 0.001, "lr": 1.1723502916231032e-07, "epoch": 19.44516632016632, "percentage": 97.23, "elapsed_time": "1:48:43", "remaining_time": "0:03:06", "throughput": 1032.76, "total_tokens": 6737424} +{"current_steps": 74830, "total_steps": 76960, "loss": 0.3934, "lr": 1.1668724527472974e-07, "epoch": 19.446465696465697, "percentage": 97.23, "elapsed_time": "1:48:44", "remaining_time": "0:03:05", "throughput": 1032.76, "total_tokens": 6737872} +{"current_steps": 74835, "total_steps": 76960, "loss": 0.0004, "lr": 1.1614074115976481e-07, "epoch": 19.447765072765073, "percentage": 97.24, "elapsed_time": "1:48:44", "remaining_time": "0:03:05", "throughput": 1032.77, "total_tokens": 6738352} +{"current_steps": 74840, "total_steps": 76960, "loss": 0.2381, "lr": 1.1559551684552638e-07, "epoch": 19.449064449064448, "percentage": 97.25, "elapsed_time": "1:48:44", "remaining_time": "0:03:04", "throughput": 1032.77, "total_tokens": 6738800} +{"current_steps": 74845, "total_steps": 76960, "loss": 0.4484, "lr": 1.1505157236005037e-07, "epoch": 19.450363825363826, "percentage": 97.25, "elapsed_time": "1:48:45", "remaining_time": "0:03:04", "throughput": 1032.77, "total_tokens": 6739248} +{"current_steps": 74850, "total_steps": 76960, "loss": 0.2536, "lr": 1.1450890773131717e-07, "epoch": 19.4516632016632, "percentage": 97.26, "elapsed_time": "1:48:45", "remaining_time": "0:03:03", "throughput": 1032.78, "total_tokens": 6739712} +{"current_steps": 74855, "total_steps": 76960, "loss": 0.0864, "lr": 1.1396752298723501e-07, "epoch": 19.452962577962577, "percentage": 97.26, "elapsed_time": "1:48:46", "remaining_time": "0:03:03", "throughput": 1032.77, "total_tokens": 6740128} +{"current_steps": 74860, "total_steps": 76960, "loss": 0.0566, "lr": 1.1342741815564828e-07, "epoch": 19.454261954261955, "percentage": 97.27, "elapsed_time": "1:48:46", "remaining_time": "0:03:03", "throughput": 1032.77, "total_tokens": 6740560} +{"current_steps": 74865, "total_steps": 76960, "loss": 0.0494, "lr": 1.1288859326433477e-07, "epoch": 19.45556133056133, "percentage": 97.28, "elapsed_time": "1:48:47", "remaining_time": "0:03:02", "throughput": 1032.78, "total_tokens": 6740992} +{"current_steps": 74870, "total_steps": 76960, "loss": 0.0105, "lr": 1.1235104834100563e-07, "epoch": 19.456860706860706, "percentage": 97.28, "elapsed_time": "1:48:47", "remaining_time": "0:03:02", "throughput": 1032.78, "total_tokens": 6741440} +{"current_steps": 74875, "total_steps": 76960, "loss": 0.01, "lr": 1.118147834133082e-07, "epoch": 19.458160083160084, "percentage": 97.29, "elapsed_time": "1:48:47", "remaining_time": "0:03:01", "throughput": 1032.78, "total_tokens": 6741856} +{"current_steps": 74880, "total_steps": 76960, "loss": 0.0005, "lr": 1.1127979850882598e-07, "epoch": 19.45945945945946, "percentage": 97.3, "elapsed_time": "1:48:48", "remaining_time": "0:03:01", "throughput": 1032.78, "total_tokens": 6742288} +{"current_steps": 74885, "total_steps": 76960, "loss": 0.171, "lr": 1.107460936550675e-07, "epoch": 19.460758835758835, "percentage": 97.3, "elapsed_time": "1:48:48", "remaining_time": "0:03:00", "throughput": 1032.78, "total_tokens": 6742768} +{"current_steps": 74890, "total_steps": 76960, "loss": 0.3031, "lr": 1.1021366887948581e-07, "epoch": 19.462058212058214, "percentage": 97.31, "elapsed_time": "1:48:49", "remaining_time": "0:03:00", "throughput": 1032.79, "total_tokens": 6743232} +{"current_steps": 74895, "total_steps": 76960, "loss": 0.121, "lr": 1.0968252420946456e-07, "epoch": 19.46335758835759, "percentage": 97.32, "elapsed_time": "1:48:49", "remaining_time": "0:03:00", "throughput": 1032.79, "total_tokens": 6743664} +{"current_steps": 74900, "total_steps": 76960, "loss": 0.2179, "lr": 1.0915265967231802e-07, "epoch": 19.464656964656964, "percentage": 97.32, "elapsed_time": "1:48:49", "remaining_time": "0:02:59", "throughput": 1032.79, "total_tokens": 6744080} +{"current_steps": 74905, "total_steps": 76960, "loss": 0.0397, "lr": 1.0862407529530217e-07, "epoch": 19.465956340956343, "percentage": 97.33, "elapsed_time": "1:48:50", "remaining_time": "0:02:59", "throughput": 1032.79, "total_tokens": 6744528} +{"current_steps": 74910, "total_steps": 76960, "loss": 0.1178, "lr": 1.0809677110559802e-07, "epoch": 19.467255717255718, "percentage": 97.34, "elapsed_time": "1:48:50", "remaining_time": "0:02:58", "throughput": 1032.79, "total_tokens": 6744976} +{"current_steps": 74915, "total_steps": 76960, "loss": 0.0093, "lr": 1.0757074713032556e-07, "epoch": 19.468555093555093, "percentage": 97.34, "elapsed_time": "1:48:51", "remaining_time": "0:02:58", "throughput": 1032.8, "total_tokens": 6745424} +{"current_steps": 74920, "total_steps": 76960, "loss": 0.0009, "lr": 1.0704600339654369e-07, "epoch": 19.46985446985447, "percentage": 97.35, "elapsed_time": "1:48:51", "remaining_time": "0:02:57", "throughput": 1032.81, "total_tokens": 6745904} +{"current_steps": 74925, "total_steps": 76960, "loss": 0.0004, "lr": 1.065225399312364e-07, "epoch": 19.471153846153847, "percentage": 97.36, "elapsed_time": "1:48:52", "remaining_time": "0:02:57", "throughput": 1032.81, "total_tokens": 6746336} +{"current_steps": 74930, "total_steps": 76960, "loss": 0.285, "lr": 1.060003567613238e-07, "epoch": 19.472453222453222, "percentage": 97.36, "elapsed_time": "1:48:52", "remaining_time": "0:02:56", "throughput": 1032.81, "total_tokens": 6746768} +{"current_steps": 74935, "total_steps": 76960, "loss": 0.0289, "lr": 1.0547945391366776e-07, "epoch": 19.473752598752597, "percentage": 97.37, "elapsed_time": "1:48:52", "remaining_time": "0:02:56", "throughput": 1032.81, "total_tokens": 6747216} +{"current_steps": 74940, "total_steps": 76960, "loss": 0.0001, "lr": 1.0495983141505794e-07, "epoch": 19.475051975051976, "percentage": 97.38, "elapsed_time": "1:48:53", "remaining_time": "0:02:56", "throughput": 1032.81, "total_tokens": 6747648} +{"current_steps": 74945, "total_steps": 76960, "loss": 0.1152, "lr": 1.0444148929221464e-07, "epoch": 19.47635135135135, "percentage": 97.38, "elapsed_time": "1:48:53", "remaining_time": "0:02:55", "throughput": 1032.81, "total_tokens": 6748096} +{"current_steps": 74950, "total_steps": 76960, "loss": 0.0081, "lr": 1.0392442757179987e-07, "epoch": 19.477650727650726, "percentage": 97.39, "elapsed_time": "1:48:54", "remaining_time": "0:02:55", "throughput": 1032.81, "total_tokens": 6748496} +{"current_steps": 74955, "total_steps": 76960, "loss": 0.4189, "lr": 1.0340864628040626e-07, "epoch": 19.478950103950105, "percentage": 97.39, "elapsed_time": "1:48:54", "remaining_time": "0:02:54", "throughput": 1032.81, "total_tokens": 6748928} +{"current_steps": 74960, "total_steps": 76960, "loss": 0.4371, "lr": 1.0289414544455978e-07, "epoch": 19.48024948024948, "percentage": 97.4, "elapsed_time": "1:48:54", "remaining_time": "0:02:54", "throughput": 1032.81, "total_tokens": 6749344} +{"current_steps": 74965, "total_steps": 76960, "loss": 0.001, "lr": 1.0238092509072262e-07, "epoch": 19.481548856548855, "percentage": 97.41, "elapsed_time": "1:48:55", "remaining_time": "0:02:53", "throughput": 1032.81, "total_tokens": 6749792} +{"current_steps": 74970, "total_steps": 76960, "loss": 0.0074, "lr": 1.0186898524529309e-07, "epoch": 19.482848232848234, "percentage": 97.41, "elapsed_time": "1:48:55", "remaining_time": "0:02:53", "throughput": 1032.82, "total_tokens": 6750272} +{"current_steps": 74975, "total_steps": 76960, "loss": 0.1604, "lr": 1.013583259345946e-07, "epoch": 19.48414760914761, "percentage": 97.42, "elapsed_time": "1:48:56", "remaining_time": "0:02:53", "throughput": 1032.82, "total_tokens": 6750736} +{"current_steps": 74980, "total_steps": 76960, "loss": 0.191, "lr": 1.0084894718489501e-07, "epoch": 19.485446985446984, "percentage": 97.43, "elapsed_time": "1:48:56", "remaining_time": "0:02:52", "throughput": 1032.82, "total_tokens": 6751168} +{"current_steps": 74985, "total_steps": 76960, "loss": 0.0003, "lr": 1.0034084902239282e-07, "epoch": 19.486746361746363, "percentage": 97.43, "elapsed_time": "1:48:57", "remaining_time": "0:02:52", "throughput": 1032.83, "total_tokens": 6751616} +{"current_steps": 74990, "total_steps": 76960, "loss": 0.0038, "lr": 9.983403147321712e-08, "epoch": 19.488045738045738, "percentage": 97.44, "elapsed_time": "1:48:57", "remaining_time": "0:02:51", "throughput": 1032.82, "total_tokens": 6752032} +{"current_steps": 74995, "total_steps": 76960, "loss": 0.0001, "lr": 9.932849456343318e-08, "epoch": 19.489345114345113, "percentage": 97.45, "elapsed_time": "1:48:57", "remaining_time": "0:02:51", "throughput": 1032.83, "total_tokens": 6752480} +{"current_steps": 75000, "total_steps": 76960, "loss": 0.5291, "lr": 9.882423831904797e-08, "epoch": 19.490644490644492, "percentage": 97.45, "elapsed_time": "1:48:58", "remaining_time": "0:02:50", "throughput": 1032.83, "total_tokens": 6752960} +{"current_steps": 75005, "total_steps": 76960, "loss": 0.2203, "lr": 9.832126276598797e-08, "epoch": 19.491943866943867, "percentage": 97.46, "elapsed_time": "1:48:58", "remaining_time": "0:02:50", "throughput": 1032.84, "total_tokens": 6753392} +{"current_steps": 75010, "total_steps": 76960, "loss": 0.0528, "lr": 9.781956793012692e-08, "epoch": 19.493243243243242, "percentage": 97.47, "elapsed_time": "1:48:59", "remaining_time": "0:02:49", "throughput": 1032.84, "total_tokens": 6753824} +{"current_steps": 75015, "total_steps": 76960, "loss": 0.0226, "lr": 9.731915383726364e-08, "epoch": 19.49454261954262, "percentage": 97.47, "elapsed_time": "1:48:59", "remaining_time": "0:02:49", "throughput": 1032.84, "total_tokens": 6754304} +{"current_steps": 75020, "total_steps": 76960, "loss": 0.102, "lr": 9.682002051313866e-08, "epoch": 19.495841995841996, "percentage": 97.48, "elapsed_time": "1:48:59", "remaining_time": "0:02:49", "throughput": 1032.85, "total_tokens": 6754800} +{"current_steps": 75025, "total_steps": 76960, "loss": 0.1213, "lr": 9.63221679834203e-08, "epoch": 19.49714137214137, "percentage": 97.49, "elapsed_time": "1:49:00", "remaining_time": "0:02:48", "throughput": 1032.86, "total_tokens": 6755280} +{"current_steps": 75030, "total_steps": 76960, "loss": 0.2315, "lr": 9.582559627371313e-08, "epoch": 19.49844074844075, "percentage": 97.49, "elapsed_time": "1:49:00", "remaining_time": "0:02:48", "throughput": 1032.87, "total_tokens": 6755744} +{"current_steps": 75035, "total_steps": 76960, "loss": 0.078, "lr": 9.533030540956056e-08, "epoch": 19.499740124740125, "percentage": 97.5, "elapsed_time": "1:49:01", "remaining_time": "0:02:47", "throughput": 1032.87, "total_tokens": 6756192} +{"current_steps": 75040, "total_steps": 76960, "loss": 0.0009, "lr": 9.483629541643114e-08, "epoch": 19.5010395010395, "percentage": 97.51, "elapsed_time": "1:49:01", "remaining_time": "0:02:47", "throughput": 1032.88, "total_tokens": 6756656} +{"current_steps": 75045, "total_steps": 76960, "loss": 0.009, "lr": 9.434356631973506e-08, "epoch": 19.50233887733888, "percentage": 97.51, "elapsed_time": "1:49:02", "remaining_time": "0:02:46", "throughput": 1032.88, "total_tokens": 6757136} +{"current_steps": 75050, "total_steps": 76960, "loss": 0.0002, "lr": 9.38521181448132e-08, "epoch": 19.503638253638254, "percentage": 97.52, "elapsed_time": "1:49:02", "remaining_time": "0:02:46", "throughput": 1032.89, "total_tokens": 6757584} +{"current_steps": 75055, "total_steps": 76960, "loss": 0.0017, "lr": 9.336195091693978e-08, "epoch": 19.50493762993763, "percentage": 97.52, "elapsed_time": "1:49:02", "remaining_time": "0:02:46", "throughput": 1032.89, "total_tokens": 6758016} +{"current_steps": 75060, "total_steps": 76960, "loss": 0.0959, "lr": 9.287306466132518e-08, "epoch": 19.506237006237008, "percentage": 97.53, "elapsed_time": "1:49:03", "remaining_time": "0:02:45", "throughput": 1032.89, "total_tokens": 6758480} +{"current_steps": 75065, "total_steps": 76960, "loss": 0.0563, "lr": 9.238545940311316e-08, "epoch": 19.507536382536383, "percentage": 97.54, "elapsed_time": "1:49:03", "remaining_time": "0:02:45", "throughput": 1032.9, "total_tokens": 6758944} +{"current_steps": 75070, "total_steps": 76960, "loss": 0.0161, "lr": 9.189913516738368e-08, "epoch": 19.508835758835758, "percentage": 97.54, "elapsed_time": "1:49:04", "remaining_time": "0:02:44", "throughput": 1032.9, "total_tokens": 6759376} +{"current_steps": 75075, "total_steps": 76960, "loss": 0.0002, "lr": 9.14140919791473e-08, "epoch": 19.510135135135137, "percentage": 97.55, "elapsed_time": "1:49:04", "remaining_time": "0:02:44", "throughput": 1032.91, "total_tokens": 6759856} +{"current_steps": 75080, "total_steps": 76960, "loss": 0.0003, "lr": 9.09303298633507e-08, "epoch": 19.511434511434512, "percentage": 97.56, "elapsed_time": "1:49:04", "remaining_time": "0:02:43", "throughput": 1032.91, "total_tokens": 6760336} +{"current_steps": 75085, "total_steps": 76960, "loss": 0.0003, "lr": 9.044784884487123e-08, "epoch": 19.512733887733887, "percentage": 97.56, "elapsed_time": "1:49:05", "remaining_time": "0:02:43", "throughput": 1032.92, "total_tokens": 6760784} +{"current_steps": 75090, "total_steps": 76960, "loss": 0.2153, "lr": 8.996664894853069e-08, "epoch": 19.514033264033262, "percentage": 97.57, "elapsed_time": "1:49:05", "remaining_time": "0:02:43", "throughput": 1032.92, "total_tokens": 6761232} +{"current_steps": 75095, "total_steps": 76960, "loss": 0.0022, "lr": 8.948673019906762e-08, "epoch": 19.51533264033264, "percentage": 97.58, "elapsed_time": "1:49:06", "remaining_time": "0:02:42", "throughput": 1032.92, "total_tokens": 6761680} +{"current_steps": 75100, "total_steps": 76960, "loss": 0.1041, "lr": 8.900809262117337e-08, "epoch": 19.516632016632016, "percentage": 97.58, "elapsed_time": "1:49:06", "remaining_time": "0:02:42", "throughput": 1032.93, "total_tokens": 6762128} +{"current_steps": 75105, "total_steps": 76960, "loss": 0.0015, "lr": 8.853073623946162e-08, "epoch": 19.51793139293139, "percentage": 97.59, "elapsed_time": "1:49:06", "remaining_time": "0:02:41", "throughput": 1032.93, "total_tokens": 6762592} +{"current_steps": 75110, "total_steps": 76960, "loss": 0.002, "lr": 8.805466107848215e-08, "epoch": 19.51923076923077, "percentage": 97.6, "elapsed_time": "1:49:07", "remaining_time": "0:02:41", "throughput": 1032.94, "total_tokens": 6763072} +{"current_steps": 75115, "total_steps": 76960, "loss": 0.0412, "lr": 8.757986716272093e-08, "epoch": 19.520530145530145, "percentage": 97.6, "elapsed_time": "1:49:07", "remaining_time": "0:02:40", "throughput": 1032.95, "total_tokens": 6763584} +{"current_steps": 75120, "total_steps": 76960, "loss": 0.0001, "lr": 8.71063545166001e-08, "epoch": 19.52182952182952, "percentage": 97.61, "elapsed_time": "1:49:08", "remaining_time": "0:02:40", "throughput": 1032.96, "total_tokens": 6764032} +{"current_steps": 75125, "total_steps": 76960, "loss": 0.0283, "lr": 8.663412316446684e-08, "epoch": 19.5231288981289, "percentage": 97.62, "elapsed_time": "1:49:08", "remaining_time": "0:02:39", "throughput": 1032.96, "total_tokens": 6764464} +{"current_steps": 75130, "total_steps": 76960, "loss": 0.007, "lr": 8.616317313061285e-08, "epoch": 19.524428274428274, "percentage": 97.62, "elapsed_time": "1:49:09", "remaining_time": "0:02:39", "throughput": 1032.96, "total_tokens": 6764896} +{"current_steps": 75135, "total_steps": 76960, "loss": 0.0102, "lr": 8.569350443925484e-08, "epoch": 19.52572765072765, "percentage": 97.63, "elapsed_time": "1:49:09", "remaining_time": "0:02:39", "throughput": 1032.96, "total_tokens": 6765360} +{"current_steps": 75140, "total_steps": 76960, "loss": 0.0681, "lr": 8.522511711455406e-08, "epoch": 19.527027027027028, "percentage": 97.64, "elapsed_time": "1:49:09", "remaining_time": "0:02:38", "throughput": 1032.96, "total_tokens": 6765776} +{"current_steps": 75145, "total_steps": 76960, "loss": 0.0005, "lr": 8.475801118059956e-08, "epoch": 19.528326403326403, "percentage": 97.64, "elapsed_time": "1:49:10", "remaining_time": "0:02:38", "throughput": 1032.97, "total_tokens": 6766240} +{"current_steps": 75150, "total_steps": 76960, "loss": 0.0013, "lr": 8.429218666141103e-08, "epoch": 19.52962577962578, "percentage": 97.65, "elapsed_time": "1:49:10", "remaining_time": "0:02:37", "throughput": 1032.97, "total_tokens": 6766688} +{"current_steps": 75155, "total_steps": 76960, "loss": 0.0373, "lr": 8.382764358094708e-08, "epoch": 19.530925155925157, "percentage": 97.65, "elapsed_time": "1:49:11", "remaining_time": "0:02:37", "throughput": 1032.97, "total_tokens": 6767136} +{"current_steps": 75160, "total_steps": 76960, "loss": 0.067, "lr": 8.336438196310248e-08, "epoch": 19.532224532224532, "percentage": 97.66, "elapsed_time": "1:49:11", "remaining_time": "0:02:36", "throughput": 1032.98, "total_tokens": 6767584} +{"current_steps": 75165, "total_steps": 76960, "loss": 0.0823, "lr": 8.290240183170261e-08, "epoch": 19.533523908523907, "percentage": 97.67, "elapsed_time": "1:49:11", "remaining_time": "0:02:36", "throughput": 1032.98, "total_tokens": 6768016} +{"current_steps": 75170, "total_steps": 76960, "loss": 0.0758, "lr": 8.244170321050626e-08, "epoch": 19.534823284823286, "percentage": 97.67, "elapsed_time": "1:49:12", "remaining_time": "0:02:36", "throughput": 1032.98, "total_tokens": 6768448} +{"current_steps": 75175, "total_steps": 76960, "loss": 0.0603, "lr": 8.198228612320558e-08, "epoch": 19.53612266112266, "percentage": 97.68, "elapsed_time": "1:49:12", "remaining_time": "0:02:35", "throughput": 1032.98, "total_tokens": 6768912} +{"current_steps": 75180, "total_steps": 76960, "loss": 0.0131, "lr": 8.152415059343443e-08, "epoch": 19.537422037422036, "percentage": 97.69, "elapsed_time": "1:49:13", "remaining_time": "0:02:35", "throughput": 1032.98, "total_tokens": 6769344} +{"current_steps": 75185, "total_steps": 76960, "loss": 0.0003, "lr": 8.106729664475176e-08, "epoch": 19.538721413721415, "percentage": 97.69, "elapsed_time": "1:49:13", "remaining_time": "0:02:34", "throughput": 1032.98, "total_tokens": 6769760} +{"current_steps": 75190, "total_steps": 76960, "loss": 0.0006, "lr": 8.061172430065266e-08, "epoch": 19.54002079002079, "percentage": 97.7, "elapsed_time": "1:49:14", "remaining_time": "0:02:34", "throughput": 1032.99, "total_tokens": 6770224} +{"current_steps": 75195, "total_steps": 76960, "loss": 0.0735, "lr": 8.01574335845684e-08, "epoch": 19.541320166320165, "percentage": 97.71, "elapsed_time": "1:49:14", "remaining_time": "0:02:33", "throughput": 1032.99, "total_tokens": 6770656} +{"current_steps": 75200, "total_steps": 76960, "loss": 0.0867, "lr": 7.970442451986638e-08, "epoch": 19.542619542619544, "percentage": 97.71, "elapsed_time": "1:49:14", "remaining_time": "0:02:33", "throughput": 1032.99, "total_tokens": 6771104} +{"current_steps": 75205, "total_steps": 76960, "loss": 0.0004, "lr": 7.925269712984184e-08, "epoch": 19.54391891891892, "percentage": 97.72, "elapsed_time": "1:49:15", "remaining_time": "0:02:32", "throughput": 1032.99, "total_tokens": 6771552} +{"current_steps": 75210, "total_steps": 76960, "loss": 0.1321, "lr": 7.880225143772902e-08, "epoch": 19.545218295218294, "percentage": 97.73, "elapsed_time": "1:49:15", "remaining_time": "0:02:32", "throughput": 1033.0, "total_tokens": 6772000} +{"current_steps": 75215, "total_steps": 76960, "loss": 0.0032, "lr": 7.835308746669545e-08, "epoch": 19.546517671517673, "percentage": 97.73, "elapsed_time": "1:49:16", "remaining_time": "0:02:32", "throughput": 1033.0, "total_tokens": 6772432} +{"current_steps": 75220, "total_steps": 76960, "loss": 0.6433, "lr": 7.790520523984213e-08, "epoch": 19.54781704781705, "percentage": 97.74, "elapsed_time": "1:49:16", "remaining_time": "0:02:31", "throughput": 1032.99, "total_tokens": 6772848} +{"current_steps": 75225, "total_steps": 76960, "loss": 0.0678, "lr": 7.74586047802034e-08, "epoch": 19.549116424116423, "percentage": 97.75, "elapsed_time": "1:49:16", "remaining_time": "0:02:31", "throughput": 1033.0, "total_tokens": 6773296} +{"current_steps": 75230, "total_steps": 76960, "loss": 0.09, "lr": 7.701328611074698e-08, "epoch": 19.5504158004158, "percentage": 97.75, "elapsed_time": "1:49:17", "remaining_time": "0:02:30", "throughput": 1032.99, "total_tokens": 6773712} +{"current_steps": 75235, "total_steps": 76960, "loss": 0.0925, "lr": 7.656924925437681e-08, "epoch": 19.551715176715177, "percentage": 97.76, "elapsed_time": "1:49:17", "remaining_time": "0:02:30", "throughput": 1033.0, "total_tokens": 6774176} +{"current_steps": 75240, "total_steps": 76960, "loss": 0.3901, "lr": 7.612649423393014e-08, "epoch": 19.553014553014552, "percentage": 97.77, "elapsed_time": "1:49:18", "remaining_time": "0:02:29", "throughput": 1033.0, "total_tokens": 6774592} +{"current_steps": 75245, "total_steps": 76960, "loss": 0.2096, "lr": 7.568502107218044e-08, "epoch": 19.554313929313928, "percentage": 97.77, "elapsed_time": "1:49:18", "remaining_time": "0:02:29", "throughput": 1033.01, "total_tokens": 6775072} +{"current_steps": 75250, "total_steps": 76960, "loss": 0.1357, "lr": 7.524482979183178e-08, "epoch": 19.555613305613306, "percentage": 97.78, "elapsed_time": "1:49:19", "remaining_time": "0:02:29", "throughput": 1033.01, "total_tokens": 6775536} +{"current_steps": 75255, "total_steps": 76960, "loss": 0.0035, "lr": 7.48059204155216e-08, "epoch": 19.55691268191268, "percentage": 97.78, "elapsed_time": "1:49:19", "remaining_time": "0:02:28", "throughput": 1033.02, "total_tokens": 6775984} +{"current_steps": 75260, "total_steps": 76960, "loss": 0.0013, "lr": 7.436829296582626e-08, "epoch": 19.558212058212057, "percentage": 97.79, "elapsed_time": "1:49:19", "remaining_time": "0:02:28", "throughput": 1033.02, "total_tokens": 6776432} +{"current_steps": 75265, "total_steps": 76960, "loss": 0.3756, "lr": 7.393194746525279e-08, "epoch": 19.559511434511435, "percentage": 97.8, "elapsed_time": "1:49:20", "remaining_time": "0:02:27", "throughput": 1033.03, "total_tokens": 6776912} +{"current_steps": 75270, "total_steps": 76960, "loss": 0.0116, "lr": 7.349688393624154e-08, "epoch": 19.56081081081081, "percentage": 97.8, "elapsed_time": "1:49:20", "remaining_time": "0:02:27", "throughput": 1033.03, "total_tokens": 6777360} +{"current_steps": 75275, "total_steps": 76960, "loss": 0.016, "lr": 7.30631024011691e-08, "epoch": 19.562110187110186, "percentage": 97.81, "elapsed_time": "1:49:21", "remaining_time": "0:02:26", "throughput": 1033.03, "total_tokens": 6777808} +{"current_steps": 75280, "total_steps": 76960, "loss": 0.0627, "lr": 7.263060288234535e-08, "epoch": 19.563409563409564, "percentage": 97.82, "elapsed_time": "1:49:21", "remaining_time": "0:02:26", "throughput": 1033.03, "total_tokens": 6778224} +{"current_steps": 75285, "total_steps": 76960, "loss": 0.0051, "lr": 7.219938540201366e-08, "epoch": 19.56470893970894, "percentage": 97.82, "elapsed_time": "1:49:21", "remaining_time": "0:02:25", "throughput": 1033.03, "total_tokens": 6778672} +{"current_steps": 75290, "total_steps": 76960, "loss": 0.1542, "lr": 7.17694499823507e-08, "epoch": 19.566008316008315, "percentage": 97.83, "elapsed_time": "1:49:22", "remaining_time": "0:02:25", "throughput": 1033.04, "total_tokens": 6779136} +{"current_steps": 75295, "total_steps": 76960, "loss": 0.0002, "lr": 7.13407966454721e-08, "epoch": 19.567307692307693, "percentage": 97.84, "elapsed_time": "1:49:22", "remaining_time": "0:02:25", "throughput": 1033.04, "total_tokens": 6779568} +{"current_steps": 75300, "total_steps": 76960, "loss": 0.0031, "lr": 7.091342541342139e-08, "epoch": 19.56860706860707, "percentage": 97.84, "elapsed_time": "1:49:23", "remaining_time": "0:02:24", "throughput": 1033.04, "total_tokens": 6780000} +{"current_steps": 75305, "total_steps": 76960, "loss": 0.0118, "lr": 7.048733630817817e-08, "epoch": 19.569906444906444, "percentage": 97.85, "elapsed_time": "1:49:23", "remaining_time": "0:02:24", "throughput": 1033.04, "total_tokens": 6780432} +{"current_steps": 75310, "total_steps": 76960, "loss": 0.2386, "lr": 7.006252935165824e-08, "epoch": 19.571205821205822, "percentage": 97.86, "elapsed_time": "1:49:23", "remaining_time": "0:02:23", "throughput": 1033.04, "total_tokens": 6780880} +{"current_steps": 75315, "total_steps": 76960, "loss": 0.0008, "lr": 6.963900456571081e-08, "epoch": 19.572505197505198, "percentage": 97.86, "elapsed_time": "1:49:24", "remaining_time": "0:02:23", "throughput": 1033.05, "total_tokens": 6781344} +{"current_steps": 75320, "total_steps": 76960, "loss": 0.1828, "lr": 6.921676197211291e-08, "epoch": 19.573804573804573, "percentage": 97.87, "elapsed_time": "1:49:24", "remaining_time": "0:02:22", "throughput": 1033.05, "total_tokens": 6781776} +{"current_steps": 75325, "total_steps": 76960, "loss": 0.0005, "lr": 6.87958015925888e-08, "epoch": 19.57510395010395, "percentage": 97.88, "elapsed_time": "1:49:25", "remaining_time": "0:02:22", "throughput": 1033.06, "total_tokens": 6782240} +{"current_steps": 75330, "total_steps": 76960, "loss": 0.1866, "lr": 6.837612344877952e-08, "epoch": 19.576403326403327, "percentage": 97.88, "elapsed_time": "1:49:25", "remaining_time": "0:02:22", "throughput": 1033.06, "total_tokens": 6782688} +{"current_steps": 75335, "total_steps": 76960, "loss": 0.0041, "lr": 6.795772756227891e-08, "epoch": 19.5777027027027, "percentage": 97.89, "elapsed_time": "1:49:26", "remaining_time": "0:02:21", "throughput": 1033.06, "total_tokens": 6783136} +{"current_steps": 75340, "total_steps": 76960, "loss": 0.0881, "lr": 6.754061395460032e-08, "epoch": 19.57900207900208, "percentage": 97.9, "elapsed_time": "1:49:26", "remaining_time": "0:02:21", "throughput": 1033.06, "total_tokens": 6783568} +{"current_steps": 75345, "total_steps": 76960, "loss": 0.0133, "lr": 6.712478264719601e-08, "epoch": 19.580301455301456, "percentage": 97.9, "elapsed_time": "1:49:26", "remaining_time": "0:02:20", "throughput": 1033.06, "total_tokens": 6784000} +{"current_steps": 75350, "total_steps": 76960, "loss": 0.0004, "lr": 6.671023366145169e-08, "epoch": 19.58160083160083, "percentage": 97.91, "elapsed_time": "1:49:27", "remaining_time": "0:02:20", "throughput": 1033.07, "total_tokens": 6784448} +{"current_steps": 75355, "total_steps": 76960, "loss": 0.1137, "lr": 6.629696701869193e-08, "epoch": 19.58290020790021, "percentage": 97.91, "elapsed_time": "1:49:27", "remaining_time": "0:02:19", "throughput": 1033.07, "total_tokens": 6784896} +{"current_steps": 75360, "total_steps": 76960, "loss": 0.0079, "lr": 6.588498274017196e-08, "epoch": 19.584199584199585, "percentage": 97.92, "elapsed_time": "1:49:28", "remaining_time": "0:02:19", "throughput": 1033.08, "total_tokens": 6785376} +{"current_steps": 75365, "total_steps": 76960, "loss": 0.0008, "lr": 6.547428084707485e-08, "epoch": 19.58549896049896, "percentage": 97.93, "elapsed_time": "1:49:28", "remaining_time": "0:02:19", "throughput": 1033.08, "total_tokens": 6785808} +{"current_steps": 75370, "total_steps": 76960, "loss": 0.0495, "lr": 6.506486136052814e-08, "epoch": 19.58679833679834, "percentage": 97.93, "elapsed_time": "1:49:28", "remaining_time": "0:02:18", "throughput": 1033.09, "total_tokens": 6786304} +{"current_steps": 75375, "total_steps": 76960, "loss": 0.0165, "lr": 6.465672430158443e-08, "epoch": 19.588097713097714, "percentage": 97.94, "elapsed_time": "1:49:29", "remaining_time": "0:02:18", "throughput": 1033.09, "total_tokens": 6786736} +{"current_steps": 75380, "total_steps": 76960, "loss": 0.0218, "lr": 6.424986969124081e-08, "epoch": 19.58939708939709, "percentage": 97.95, "elapsed_time": "1:49:29", "remaining_time": "0:02:17", "throughput": 1033.09, "total_tokens": 6787200} +{"current_steps": 75385, "total_steps": 76960, "loss": 0.0071, "lr": 6.384429755041665e-08, "epoch": 19.590696465696467, "percentage": 97.95, "elapsed_time": "1:49:30", "remaining_time": "0:02:17", "throughput": 1033.09, "total_tokens": 6787632} +{"current_steps": 75390, "total_steps": 76960, "loss": 0.0014, "lr": 6.344000789997307e-08, "epoch": 19.591995841995843, "percentage": 97.96, "elapsed_time": "1:49:30", "remaining_time": "0:02:16", "throughput": 1033.1, "total_tokens": 6788096} +{"current_steps": 75395, "total_steps": 76960, "loss": 0.0002, "lr": 6.303700076070173e-08, "epoch": 19.593295218295218, "percentage": 97.97, "elapsed_time": "1:49:31", "remaining_time": "0:02:16", "throughput": 1033.1, "total_tokens": 6788544} +{"current_steps": 75400, "total_steps": 76960, "loss": 0.086, "lr": 6.26352761533333e-08, "epoch": 19.594594594594593, "percentage": 97.97, "elapsed_time": "1:49:31", "remaining_time": "0:02:15", "throughput": 1033.11, "total_tokens": 6789024} +{"current_steps": 75405, "total_steps": 76960, "loss": 0.1483, "lr": 6.223483409852626e-08, "epoch": 19.59589397089397, "percentage": 97.98, "elapsed_time": "1:49:31", "remaining_time": "0:02:15", "throughput": 1033.11, "total_tokens": 6789440} +{"current_steps": 75410, "total_steps": 76960, "loss": 0.2518, "lr": 6.183567461687523e-08, "epoch": 19.597193347193347, "percentage": 97.99, "elapsed_time": "1:49:32", "remaining_time": "0:02:15", "throughput": 1033.12, "total_tokens": 6789952} +{"current_steps": 75415, "total_steps": 76960, "loss": 0.0756, "lr": 6.1437797728911e-08, "epoch": 19.598492723492722, "percentage": 97.99, "elapsed_time": "1:49:32", "remaining_time": "0:02:14", "throughput": 1033.13, "total_tokens": 6790416} +{"current_steps": 75420, "total_steps": 76960, "loss": 0.1465, "lr": 6.1041203455095e-08, "epoch": 19.5997920997921, "percentage": 98.0, "elapsed_time": "1:49:33", "remaining_time": "0:02:14", "throughput": 1033.14, "total_tokens": 6790912} +{"current_steps": 75425, "total_steps": 76960, "loss": 0.0605, "lr": 6.064589181582481e-08, "epoch": 19.601091476091476, "percentage": 98.01, "elapsed_time": "1:49:33", "remaining_time": "0:02:13", "throughput": 1033.14, "total_tokens": 6791360} +{"current_steps": 75430, "total_steps": 76960, "loss": 0.2378, "lr": 6.025186283143136e-08, "epoch": 19.60239085239085, "percentage": 98.01, "elapsed_time": "1:49:33", "remaining_time": "0:02:13", "throughput": 1033.14, "total_tokens": 6791792} +{"current_steps": 75435, "total_steps": 76960, "loss": 0.182, "lr": 5.985911652218179e-08, "epoch": 19.60369022869023, "percentage": 98.02, "elapsed_time": "1:49:34", "remaining_time": "0:02:12", "throughput": 1033.15, "total_tokens": 6792256} +{"current_steps": 75440, "total_steps": 76960, "loss": 0.0131, "lr": 5.946765290827383e-08, "epoch": 19.604989604989605, "percentage": 98.02, "elapsed_time": "1:49:34", "remaining_time": "0:02:12", "throughput": 1033.15, "total_tokens": 6792704} +{"current_steps": 75445, "total_steps": 76960, "loss": 0.001, "lr": 5.907747200984415e-08, "epoch": 19.60628898128898, "percentage": 98.03, "elapsed_time": "1:49:35", "remaining_time": "0:02:12", "throughput": 1033.15, "total_tokens": 6793136} +{"current_steps": 75450, "total_steps": 76960, "loss": 0.001, "lr": 5.8688573846954474e-08, "epoch": 19.60758835758836, "percentage": 98.04, "elapsed_time": "1:49:35", "remaining_time": "0:02:11", "throughput": 1033.15, "total_tokens": 6793552} +{"current_steps": 75455, "total_steps": 76960, "loss": 0.0011, "lr": 5.8300958439608254e-08, "epoch": 19.608887733887734, "percentage": 98.04, "elapsed_time": "1:49:35", "remaining_time": "0:02:11", "throughput": 1033.15, "total_tokens": 6794016} +{"current_steps": 75460, "total_steps": 76960, "loss": 0.1093, "lr": 5.791462580774232e-08, "epoch": 19.61018711018711, "percentage": 98.05, "elapsed_time": "1:49:36", "remaining_time": "0:02:10", "throughput": 1033.16, "total_tokens": 6794464} +{"current_steps": 75465, "total_steps": 76960, "loss": 0.0077, "lr": 5.7529575971226877e-08, "epoch": 19.611486486486488, "percentage": 98.06, "elapsed_time": "1:49:36", "remaining_time": "0:02:10", "throughput": 1033.17, "total_tokens": 6794944} +{"current_steps": 75470, "total_steps": 76960, "loss": 0.1612, "lr": 5.7145808949865546e-08, "epoch": 19.612785862785863, "percentage": 98.06, "elapsed_time": "1:49:37", "remaining_time": "0:02:09", "throughput": 1033.17, "total_tokens": 6795392} +{"current_steps": 75475, "total_steps": 76960, "loss": 0.5882, "lr": 5.676332476339252e-08, "epoch": 19.614085239085238, "percentage": 98.07, "elapsed_time": "1:49:37", "remaining_time": "0:02:09", "throughput": 1033.17, "total_tokens": 6795824} +{"current_steps": 75480, "total_steps": 76960, "loss": 0.0006, "lr": 5.638212343148097e-08, "epoch": 19.615384615384617, "percentage": 98.08, "elapsed_time": "1:49:38", "remaining_time": "0:02:08", "throughput": 1033.18, "total_tokens": 6796288} +{"current_steps": 75485, "total_steps": 76960, "loss": 0.1714, "lr": 5.600220497373465e-08, "epoch": 19.616683991683992, "percentage": 98.08, "elapsed_time": "1:49:38", "remaining_time": "0:02:08", "throughput": 1033.18, "total_tokens": 6796720} +{"current_steps": 75490, "total_steps": 76960, "loss": 0.0352, "lr": 5.562356940969904e-08, "epoch": 19.617983367983367, "percentage": 98.09, "elapsed_time": "1:49:38", "remaining_time": "0:02:08", "throughput": 1033.19, "total_tokens": 6797216} +{"current_steps": 75495, "total_steps": 76960, "loss": 0.1328, "lr": 5.5246216758841895e-08, "epoch": 19.619282744282746, "percentage": 98.1, "elapsed_time": "1:49:39", "remaining_time": "0:02:07", "throughput": 1033.19, "total_tokens": 6797664} +{"current_steps": 75500, "total_steps": 76960, "loss": 0.2572, "lr": 5.48701470405727e-08, "epoch": 19.62058212058212, "percentage": 98.1, "elapsed_time": "1:49:39", "remaining_time": "0:02:07", "throughput": 1033.19, "total_tokens": 6798112} +{"current_steps": 75505, "total_steps": 76960, "loss": 0.0026, "lr": 5.4495360274231524e-08, "epoch": 19.621881496881496, "percentage": 98.11, "elapsed_time": "1:49:40", "remaining_time": "0:02:06", "throughput": 1033.19, "total_tokens": 6798544} +{"current_steps": 75510, "total_steps": 76960, "loss": 0.035, "lr": 5.41218564790974e-08, "epoch": 19.623180873180875, "percentage": 98.12, "elapsed_time": "1:49:40", "remaining_time": "0:02:06", "throughput": 1033.2, "total_tokens": 6799008} +{"current_steps": 75515, "total_steps": 76960, "loss": 0.0008, "lr": 5.374963567437719e-08, "epoch": 19.62448024948025, "percentage": 98.12, "elapsed_time": "1:49:40", "remaining_time": "0:02:05", "throughput": 1033.2, "total_tokens": 6799456} +{"current_steps": 75520, "total_steps": 76960, "loss": 0.0046, "lr": 5.3378697879216676e-08, "epoch": 19.625779625779625, "percentage": 98.13, "elapsed_time": "1:49:41", "remaining_time": "0:02:05", "throughput": 1033.2, "total_tokens": 6799904} +{"current_steps": 75525, "total_steps": 76960, "loss": 0.0103, "lr": 5.300904311269228e-08, "epoch": 19.627079002079, "percentage": 98.14, "elapsed_time": "1:49:41", "remaining_time": "0:02:05", "throughput": 1033.2, "total_tokens": 6800336} +{"current_steps": 75530, "total_steps": 76960, "loss": 0.1673, "lr": 5.2640671393816566e-08, "epoch": 19.62837837837838, "percentage": 98.14, "elapsed_time": "1:49:42", "remaining_time": "0:02:04", "throughput": 1033.21, "total_tokens": 6800816} +{"current_steps": 75535, "total_steps": 76960, "loss": 0.2626, "lr": 5.227358274153271e-08, "epoch": 19.629677754677754, "percentage": 98.15, "elapsed_time": "1:49:42", "remaining_time": "0:02:04", "throughput": 1033.21, "total_tokens": 6801248} +{"current_steps": 75540, "total_steps": 76960, "loss": 0.0003, "lr": 5.1907777174722835e-08, "epoch": 19.63097713097713, "percentage": 98.15, "elapsed_time": "1:49:43", "remaining_time": "0:02:03", "throughput": 1033.22, "total_tokens": 6801728} +{"current_steps": 75545, "total_steps": 76960, "loss": 0.0016, "lr": 5.154325471220245e-08, "epoch": 19.632276507276508, "percentage": 98.16, "elapsed_time": "1:49:43", "remaining_time": "0:02:03", "throughput": 1033.22, "total_tokens": 6802176} +{"current_steps": 75550, "total_steps": 76960, "loss": 0.283, "lr": 5.1180015372714886e-08, "epoch": 19.633575883575883, "percentage": 98.17, "elapsed_time": "1:49:43", "remaining_time": "0:02:02", "throughput": 1033.22, "total_tokens": 6802608} +{"current_steps": 75555, "total_steps": 76960, "loss": 0.0003, "lr": 5.081805917494242e-08, "epoch": 19.63487525987526, "percentage": 98.17, "elapsed_time": "1:49:44", "remaining_time": "0:02:02", "throughput": 1033.23, "total_tokens": 6803072} +{"current_steps": 75560, "total_steps": 76960, "loss": 0.2331, "lr": 5.045738613750628e-08, "epoch": 19.636174636174637, "percentage": 98.18, "elapsed_time": "1:49:44", "remaining_time": "0:02:02", "throughput": 1033.23, "total_tokens": 6803504} +{"current_steps": 75565, "total_steps": 76960, "loss": 0.1971, "lr": 5.009799627894718e-08, "epoch": 19.637474012474012, "percentage": 98.19, "elapsed_time": "1:49:45", "remaining_time": "0:02:01", "throughput": 1033.23, "total_tokens": 6803936} +{"current_steps": 75570, "total_steps": 76960, "loss": 0.0465, "lr": 4.973988961775866e-08, "epoch": 19.638773388773387, "percentage": 98.19, "elapsed_time": "1:49:45", "remaining_time": "0:02:01", "throughput": 1033.23, "total_tokens": 6804368} +{"current_steps": 75575, "total_steps": 76960, "loss": 0.0292, "lr": 4.9383066172351e-08, "epoch": 19.640072765072766, "percentage": 98.2, "elapsed_time": "1:49:45", "remaining_time": "0:02:00", "throughput": 1033.24, "total_tokens": 6804832} +{"current_steps": 75580, "total_steps": 76960, "loss": 0.0761, "lr": 4.902752596107896e-08, "epoch": 19.64137214137214, "percentage": 98.21, "elapsed_time": "1:49:46", "remaining_time": "0:02:00", "throughput": 1033.24, "total_tokens": 6805280} +{"current_steps": 75585, "total_steps": 76960, "loss": 0.0009, "lr": 4.867326900223068e-08, "epoch": 19.642671517671516, "percentage": 98.21, "elapsed_time": "1:49:46", "remaining_time": "0:01:59", "throughput": 1033.25, "total_tokens": 6805776} +{"current_steps": 75590, "total_steps": 76960, "loss": 0.2865, "lr": 4.832029531401938e-08, "epoch": 19.643970893970895, "percentage": 98.22, "elapsed_time": "1:49:47", "remaining_time": "0:01:59", "throughput": 1033.25, "total_tokens": 6806224} +{"current_steps": 75595, "total_steps": 76960, "loss": 0.2045, "lr": 4.7968604914605534e-08, "epoch": 19.64527027027027, "percentage": 98.23, "elapsed_time": "1:49:47", "remaining_time": "0:01:58", "throughput": 1033.26, "total_tokens": 6806688} +{"current_steps": 75600, "total_steps": 76960, "loss": 0.4816, "lr": 4.761819782207466e-08, "epoch": 19.646569646569645, "percentage": 98.23, "elapsed_time": "1:49:48", "remaining_time": "0:01:58", "throughput": 1033.26, "total_tokens": 6807136} +{"current_steps": 75605, "total_steps": 76960, "loss": 0.0026, "lr": 4.726907405444569e-08, "epoch": 19.647869022869024, "percentage": 98.24, "elapsed_time": "1:49:48", "remaining_time": "0:01:58", "throughput": 1033.26, "total_tokens": 6807584} +{"current_steps": 75610, "total_steps": 76960, "loss": 0.3166, "lr": 4.692123362967926e-08, "epoch": 19.6491683991684, "percentage": 98.25, "elapsed_time": "1:49:48", "remaining_time": "0:01:57", "throughput": 1033.27, "total_tokens": 6808048} +{"current_steps": 75615, "total_steps": 76960, "loss": 0.1089, "lr": 4.657467656566106e-08, "epoch": 19.650467775467774, "percentage": 98.25, "elapsed_time": "1:49:49", "remaining_time": "0:01:57", "throughput": 1033.27, "total_tokens": 6808480} +{"current_steps": 75620, "total_steps": 76960, "loss": 0.119, "lr": 4.6229402880215713e-08, "epoch": 19.651767151767153, "percentage": 98.26, "elapsed_time": "1:49:49", "remaining_time": "0:01:56", "throughput": 1033.27, "total_tokens": 6808896} +{"current_steps": 75625, "total_steps": 76960, "loss": 0.0025, "lr": 4.5885412591104016e-08, "epoch": 19.653066528066528, "percentage": 98.27, "elapsed_time": "1:49:50", "remaining_time": "0:01:56", "throughput": 1033.27, "total_tokens": 6809344} +{"current_steps": 75630, "total_steps": 76960, "loss": 0.0943, "lr": 4.55427057160146e-08, "epoch": 19.654365904365903, "percentage": 98.27, "elapsed_time": "1:49:50", "remaining_time": "0:01:55", "throughput": 1033.28, "total_tokens": 6809808} +{"current_steps": 75635, "total_steps": 76960, "loss": 0.1022, "lr": 4.520128227257226e-08, "epoch": 19.655665280665282, "percentage": 98.28, "elapsed_time": "1:49:50", "remaining_time": "0:01:55", "throughput": 1033.28, "total_tokens": 6810256} +{"current_steps": 75640, "total_steps": 76960, "loss": 0.0413, "lr": 4.4861142278340704e-08, "epoch": 19.656964656964657, "percentage": 98.28, "elapsed_time": "1:49:51", "remaining_time": "0:01:55", "throughput": 1033.28, "total_tokens": 6810688} +{"current_steps": 75645, "total_steps": 76960, "loss": 0.0015, "lr": 4.452228575081152e-08, "epoch": 19.658264033264032, "percentage": 98.29, "elapsed_time": "1:49:51", "remaining_time": "0:01:54", "throughput": 1033.29, "total_tokens": 6811152} +{"current_steps": 75650, "total_steps": 76960, "loss": 0.0008, "lr": 4.4184712707412426e-08, "epoch": 19.65956340956341, "percentage": 98.3, "elapsed_time": "1:49:52", "remaining_time": "0:01:54", "throughput": 1033.29, "total_tokens": 6811600} +{"current_steps": 75655, "total_steps": 76960, "loss": 0.001, "lr": 4.384842316550453e-08, "epoch": 19.660862785862786, "percentage": 98.3, "elapsed_time": "1:49:52", "remaining_time": "0:01:53", "throughput": 1033.29, "total_tokens": 6812016} +{"current_steps": 75660, "total_steps": 76960, "loss": 0.0009, "lr": 4.351341714238233e-08, "epoch": 19.66216216216216, "percentage": 98.31, "elapsed_time": "1:49:52", "remaining_time": "0:01:53", "throughput": 1033.29, "total_tokens": 6812464} +{"current_steps": 75665, "total_steps": 76960, "loss": 0.3542, "lr": 4.317969465527927e-08, "epoch": 19.66346153846154, "percentage": 98.32, "elapsed_time": "1:49:53", "remaining_time": "0:01:52", "throughput": 1033.3, "total_tokens": 6812928} +{"current_steps": 75670, "total_steps": 76960, "loss": 0.308, "lr": 4.2847255721356616e-08, "epoch": 19.664760914760915, "percentage": 98.32, "elapsed_time": "1:49:53", "remaining_time": "0:01:52", "throughput": 1033.3, "total_tokens": 6813392} +{"current_steps": 75675, "total_steps": 76960, "loss": 0.0014, "lr": 4.251610035771181e-08, "epoch": 19.66606029106029, "percentage": 98.33, "elapsed_time": "1:49:54", "remaining_time": "0:01:51", "throughput": 1033.3, "total_tokens": 6813840} +{"current_steps": 75680, "total_steps": 76960, "loss": 0.136, "lr": 4.218622858137844e-08, "epoch": 19.66735966735967, "percentage": 98.34, "elapsed_time": "1:49:54", "remaining_time": "0:01:51", "throughput": 1033.31, "total_tokens": 6814320} +{"current_steps": 75685, "total_steps": 76960, "loss": 0.1466, "lr": 4.1857640409317946e-08, "epoch": 19.668659043659044, "percentage": 98.34, "elapsed_time": "1:49:55", "remaining_time": "0:01:51", "throughput": 1033.32, "total_tokens": 6814816} +{"current_steps": 75690, "total_steps": 76960, "loss": 0.2458, "lr": 4.153033585843624e-08, "epoch": 19.66995841995842, "percentage": 98.35, "elapsed_time": "1:49:55", "remaining_time": "0:01:50", "throughput": 1033.33, "total_tokens": 6815264} +{"current_steps": 75695, "total_steps": 76960, "loss": 0.0044, "lr": 4.120431494556154e-08, "epoch": 19.671257796257795, "percentage": 98.36, "elapsed_time": "1:49:55", "remaining_time": "0:01:50", "throughput": 1033.33, "total_tokens": 6815728} +{"current_steps": 75700, "total_steps": 76960, "loss": 0.0549, "lr": 4.087957768746375e-08, "epoch": 19.672557172557173, "percentage": 98.36, "elapsed_time": "1:49:56", "remaining_time": "0:01:49", "throughput": 1033.33, "total_tokens": 6816176} +{"current_steps": 75705, "total_steps": 76960, "loss": 0.0057, "lr": 4.055612410084342e-08, "epoch": 19.67385654885655, "percentage": 98.37, "elapsed_time": "1:49:56", "remaining_time": "0:01:49", "throughput": 1033.34, "total_tokens": 6816624} +{"current_steps": 75710, "total_steps": 76960, "loss": 0.0007, "lr": 4.023395420233722e-08, "epoch": 19.675155925155924, "percentage": 98.38, "elapsed_time": "1:49:57", "remaining_time": "0:01:48", "throughput": 1033.34, "total_tokens": 6817056} +{"current_steps": 75715, "total_steps": 76960, "loss": 0.0073, "lr": 3.9913068008512466e-08, "epoch": 19.676455301455302, "percentage": 98.38, "elapsed_time": "1:49:57", "remaining_time": "0:01:48", "throughput": 1033.34, "total_tokens": 6817488} +{"current_steps": 75720, "total_steps": 76960, "loss": 0.0003, "lr": 3.9593465535875396e-08, "epoch": 19.677754677754677, "percentage": 98.39, "elapsed_time": "1:49:57", "remaining_time": "0:01:48", "throughput": 1033.35, "total_tokens": 6817968} +{"current_steps": 75725, "total_steps": 76960, "loss": 0.0019, "lr": 3.927514680086286e-08, "epoch": 19.679054054054053, "percentage": 98.4, "elapsed_time": "1:49:58", "remaining_time": "0:01:47", "throughput": 1033.35, "total_tokens": 6818416} +{"current_steps": 75730, "total_steps": 76960, "loss": 0.0029, "lr": 3.89581118198451e-08, "epoch": 19.68035343035343, "percentage": 98.4, "elapsed_time": "1:49:58", "remaining_time": "0:01:47", "throughput": 1033.35, "total_tokens": 6818864} +{"current_steps": 75735, "total_steps": 76960, "loss": 0.0011, "lr": 3.8642360609128516e-08, "epoch": 19.681652806652806, "percentage": 98.41, "elapsed_time": "1:49:59", "remaining_time": "0:01:46", "throughput": 1033.36, "total_tokens": 6819328} +{"current_steps": 75740, "total_steps": 76960, "loss": 0.0006, "lr": 3.832789318495289e-08, "epoch": 19.68295218295218, "percentage": 98.41, "elapsed_time": "1:49:59", "remaining_time": "0:01:46", "throughput": 1033.36, "total_tokens": 6819792} +{"current_steps": 75745, "total_steps": 76960, "loss": 0.4826, "lr": 3.8014709563488625e-08, "epoch": 19.68425155925156, "percentage": 98.42, "elapsed_time": "1:50:00", "remaining_time": "0:01:45", "throughput": 1033.37, "total_tokens": 6820256} +{"current_steps": 75750, "total_steps": 76960, "loss": 0.2011, "lr": 3.7702809760847833e-08, "epoch": 19.685550935550935, "percentage": 98.43, "elapsed_time": "1:50:00", "remaining_time": "0:01:45", "throughput": 1033.37, "total_tokens": 6820688} +{"current_steps": 75755, "total_steps": 76960, "loss": 0.0188, "lr": 3.7392193793067684e-08, "epoch": 19.68685031185031, "percentage": 98.43, "elapsed_time": "1:50:00", "remaining_time": "0:01:44", "throughput": 1033.36, "total_tokens": 6821088} +{"current_steps": 75760, "total_steps": 76960, "loss": 0.039, "lr": 3.708286167612707e-08, "epoch": 19.68814968814969, "percentage": 98.44, "elapsed_time": "1:50:01", "remaining_time": "0:01:44", "throughput": 1033.37, "total_tokens": 6821552} +{"current_steps": 75765, "total_steps": 76960, "loss": 0.0093, "lr": 3.677481342592992e-08, "epoch": 19.689449064449065, "percentage": 98.45, "elapsed_time": "1:50:01", "remaining_time": "0:01:44", "throughput": 1033.38, "total_tokens": 6822016} +{"current_steps": 75770, "total_steps": 76960, "loss": 0.195, "lr": 3.646804905832468e-08, "epoch": 19.69074844074844, "percentage": 98.45, "elapsed_time": "1:50:02", "remaining_time": "0:01:43", "throughput": 1033.38, "total_tokens": 6822464} +{"current_steps": 75775, "total_steps": 76960, "loss": 0.5548, "lr": 3.6162568589084845e-08, "epoch": 19.69204781704782, "percentage": 98.46, "elapsed_time": "1:50:02", "remaining_time": "0:01:43", "throughput": 1033.38, "total_tokens": 6822912} +{"current_steps": 75780, "total_steps": 76960, "loss": 0.2642, "lr": 3.585837203392561e-08, "epoch": 19.693347193347194, "percentage": 98.47, "elapsed_time": "1:50:02", "remaining_time": "0:01:42", "throughput": 1033.38, "total_tokens": 6823344} +{"current_steps": 75785, "total_steps": 76960, "loss": 0.0004, "lr": 3.555545940848726e-08, "epoch": 19.69464656964657, "percentage": 98.47, "elapsed_time": "1:50:03", "remaining_time": "0:01:42", "throughput": 1033.38, "total_tokens": 6823792} +{"current_steps": 75790, "total_steps": 76960, "loss": 0.0105, "lr": 3.525383072835453e-08, "epoch": 19.695945945945947, "percentage": 98.48, "elapsed_time": "1:50:03", "remaining_time": "0:01:41", "throughput": 1033.39, "total_tokens": 6824224} +{"current_steps": 75795, "total_steps": 76960, "loss": 0.0004, "lr": 3.495348600903448e-08, "epoch": 19.697245322245323, "percentage": 98.49, "elapsed_time": "1:50:04", "remaining_time": "0:01:41", "throughput": 1033.39, "total_tokens": 6824656} +{"current_steps": 75800, "total_steps": 76960, "loss": 0.0059, "lr": 3.4654425265978616e-08, "epoch": 19.698544698544698, "percentage": 98.49, "elapsed_time": "1:50:04", "remaining_time": "0:01:41", "throughput": 1033.4, "total_tokens": 6825152} +{"current_steps": 75805, "total_steps": 76960, "loss": 0.1261, "lr": 3.435664851456632e-08, "epoch": 19.699844074844076, "percentage": 98.5, "elapsed_time": "1:50:04", "remaining_time": "0:01:40", "throughput": 1033.4, "total_tokens": 6825600} +{"current_steps": 75810, "total_steps": 76960, "loss": 0.2064, "lr": 3.406015577011312e-08, "epoch": 19.70114345114345, "percentage": 98.51, "elapsed_time": "1:50:05", "remaining_time": "0:01:40", "throughput": 1033.4, "total_tokens": 6826048} +{"current_steps": 75815, "total_steps": 76960, "loss": 0.0035, "lr": 3.376494704786515e-08, "epoch": 19.702442827442827, "percentage": 98.51, "elapsed_time": "1:50:05", "remaining_time": "0:01:39", "throughput": 1033.4, "total_tokens": 6826464} +{"current_steps": 75820, "total_steps": 76960, "loss": 0.0056, "lr": 3.347102236301025e-08, "epoch": 19.703742203742205, "percentage": 98.52, "elapsed_time": "1:50:06", "remaining_time": "0:01:39", "throughput": 1033.4, "total_tokens": 6826880} +{"current_steps": 75825, "total_steps": 76960, "loss": 0.2354, "lr": 3.317838173066135e-08, "epoch": 19.70504158004158, "percentage": 98.53, "elapsed_time": "1:50:06", "remaining_time": "0:01:38", "throughput": 1033.41, "total_tokens": 6827344} +{"current_steps": 75830, "total_steps": 76960, "loss": 0.1935, "lr": 3.28870251658675e-08, "epoch": 19.706340956340956, "percentage": 98.53, "elapsed_time": "1:50:07", "remaining_time": "0:01:38", "throughput": 1033.41, "total_tokens": 6827776} +{"current_steps": 75835, "total_steps": 76960, "loss": 0.0107, "lr": 3.259695268361951e-08, "epoch": 19.70764033264033, "percentage": 98.54, "elapsed_time": "1:50:07", "remaining_time": "0:01:38", "throughput": 1033.41, "total_tokens": 6828224} +{"current_steps": 75840, "total_steps": 76960, "loss": 0.0024, "lr": 3.230816429883321e-08, "epoch": 19.70893970893971, "percentage": 98.54, "elapsed_time": "1:50:07", "remaining_time": "0:01:37", "throughput": 1033.41, "total_tokens": 6828656} +{"current_steps": 75845, "total_steps": 76960, "loss": 0.0162, "lr": 3.2020660026360615e-08, "epoch": 19.710239085239085, "percentage": 98.55, "elapsed_time": "1:50:08", "remaining_time": "0:01:37", "throughput": 1033.41, "total_tokens": 6829104} +{"current_steps": 75850, "total_steps": 76960, "loss": 0.3247, "lr": 3.173443988098712e-08, "epoch": 19.71153846153846, "percentage": 98.56, "elapsed_time": "1:50:08", "remaining_time": "0:01:36", "throughput": 1033.42, "total_tokens": 6829552} +{"current_steps": 75855, "total_steps": 76960, "loss": 0.0046, "lr": 3.144950387743428e-08, "epoch": 19.71283783783784, "percentage": 98.56, "elapsed_time": "1:50:09", "remaining_time": "0:01:36", "throughput": 1033.42, "total_tokens": 6830016} +{"current_steps": 75860, "total_steps": 76960, "loss": 0.0574, "lr": 3.116585203035705e-08, "epoch": 19.714137214137214, "percentage": 98.57, "elapsed_time": "1:50:09", "remaining_time": "0:01:35", "throughput": 1033.42, "total_tokens": 6830448} +{"current_steps": 75865, "total_steps": 76960, "loss": 0.1859, "lr": 3.0883484354346514e-08, "epoch": 19.71543659043659, "percentage": 98.58, "elapsed_time": "1:50:09", "remaining_time": "0:01:35", "throughput": 1033.43, "total_tokens": 6830912} +{"current_steps": 75870, "total_steps": 76960, "loss": 0.0023, "lr": 3.060240086392163e-08, "epoch": 19.716735966735968, "percentage": 98.58, "elapsed_time": "1:50:10", "remaining_time": "0:01:34", "throughput": 1033.44, "total_tokens": 6831440} +{"current_steps": 75875, "total_steps": 76960, "loss": 0.0068, "lr": 3.032260157354028e-08, "epoch": 19.718035343035343, "percentage": 98.59, "elapsed_time": "1:50:10", "remaining_time": "0:01:34", "throughput": 1033.45, "total_tokens": 6831920} +{"current_steps": 75880, "total_steps": 76960, "loss": 0.0112, "lr": 3.004408649759094e-08, "epoch": 19.719334719334718, "percentage": 98.6, "elapsed_time": "1:50:11", "remaining_time": "0:01:34", "throughput": 1033.45, "total_tokens": 6832320} +{"current_steps": 75885, "total_steps": 76960, "loss": 0.0656, "lr": 2.9766855650398273e-08, "epoch": 19.720634095634097, "percentage": 98.6, "elapsed_time": "1:50:11", "remaining_time": "0:01:33", "throughput": 1033.45, "total_tokens": 6832768} +{"current_steps": 75890, "total_steps": 76960, "loss": 0.0072, "lr": 2.9490909046225867e-08, "epoch": 19.721933471933472, "percentage": 98.61, "elapsed_time": "1:50:12", "remaining_time": "0:01:33", "throughput": 1033.44, "total_tokens": 6833168} +{"current_steps": 75895, "total_steps": 76960, "loss": 0.0004, "lr": 2.921624669925682e-08, "epoch": 19.723232848232847, "percentage": 98.62, "elapsed_time": "1:50:12", "remaining_time": "0:01:32", "throughput": 1033.45, "total_tokens": 6833600} +{"current_steps": 75900, "total_steps": 76960, "loss": 0.0002, "lr": 2.8942868623624276e-08, "epoch": 19.724532224532226, "percentage": 98.62, "elapsed_time": "1:50:12", "remaining_time": "0:01:32", "throughput": 1033.45, "total_tokens": 6834048} +{"current_steps": 75905, "total_steps": 76960, "loss": 0.053, "lr": 2.8670774833386426e-08, "epoch": 19.7258316008316, "percentage": 98.63, "elapsed_time": "1:50:13", "remaining_time": "0:01:31", "throughput": 1033.45, "total_tokens": 6834496} +{"current_steps": 75910, "total_steps": 76960, "loss": 0.0009, "lr": 2.8399965342537637e-08, "epoch": 19.727130977130976, "percentage": 98.64, "elapsed_time": "1:50:13", "remaining_time": "0:01:31", "throughput": 1033.45, "total_tokens": 6834944} +{"current_steps": 75915, "total_steps": 76960, "loss": 0.0032, "lr": 2.813044016500288e-08, "epoch": 19.728430353430355, "percentage": 98.64, "elapsed_time": "1:50:14", "remaining_time": "0:01:31", "throughput": 1033.45, "total_tokens": 6835360} +{"current_steps": 75920, "total_steps": 76960, "loss": 0.0808, "lr": 2.786219931464884e-08, "epoch": 19.72972972972973, "percentage": 98.65, "elapsed_time": "1:50:14", "remaining_time": "0:01:30", "throughput": 1033.46, "total_tokens": 6835824} +{"current_steps": 75925, "total_steps": 76960, "loss": 0.0466, "lr": 2.7595242805267262e-08, "epoch": 19.731029106029105, "percentage": 98.66, "elapsed_time": "1:50:14", "remaining_time": "0:01:30", "throughput": 1033.46, "total_tokens": 6836288} +{"current_steps": 75930, "total_steps": 76960, "loss": 0.1236, "lr": 2.7329570650591606e-08, "epoch": 19.732328482328484, "percentage": 98.66, "elapsed_time": "1:50:15", "remaining_time": "0:01:29", "throughput": 1033.47, "total_tokens": 6836768} +{"current_steps": 75935, "total_steps": 76960, "loss": 0.0459, "lr": 2.7065182864283167e-08, "epoch": 19.73362785862786, "percentage": 98.67, "elapsed_time": "1:50:15", "remaining_time": "0:01:29", "throughput": 1033.47, "total_tokens": 6837216} +{"current_steps": 75940, "total_steps": 76960, "loss": 0.0004, "lr": 2.68020794599394e-08, "epoch": 19.734927234927234, "percentage": 98.67, "elapsed_time": "1:50:16", "remaining_time": "0:01:28", "throughput": 1033.48, "total_tokens": 6837696} +{"current_steps": 75945, "total_steps": 76960, "loss": 0.085, "lr": 2.6540260451093922e-08, "epoch": 19.736226611226613, "percentage": 98.68, "elapsed_time": "1:50:16", "remaining_time": "0:01:28", "throughput": 1033.49, "total_tokens": 6838176} +{"current_steps": 75950, "total_steps": 76960, "loss": 0.004, "lr": 2.6279725851208194e-08, "epoch": 19.737525987525988, "percentage": 98.69, "elapsed_time": "1:50:17", "remaining_time": "0:01:27", "throughput": 1033.49, "total_tokens": 6838592} +{"current_steps": 75955, "total_steps": 76960, "loss": 0.0005, "lr": 2.602047567368815e-08, "epoch": 19.738825363825363, "percentage": 98.69, "elapsed_time": "1:50:17", "remaining_time": "0:01:27", "throughput": 1033.5, "total_tokens": 6839072} +{"current_steps": 75960, "total_steps": 76960, "loss": 0.0017, "lr": 2.5762509931862023e-08, "epoch": 19.74012474012474, "percentage": 98.7, "elapsed_time": "1:50:17", "remaining_time": "0:01:27", "throughput": 1033.5, "total_tokens": 6839536} +{"current_steps": 75965, "total_steps": 76960, "loss": 0.1345, "lr": 2.5505828639002527e-08, "epoch": 19.741424116424117, "percentage": 98.71, "elapsed_time": "1:50:18", "remaining_time": "0:01:26", "throughput": 1033.5, "total_tokens": 6839968} +{"current_steps": 75970, "total_steps": 76960, "loss": 0.0043, "lr": 2.5250431808304665e-08, "epoch": 19.742723492723492, "percentage": 98.71, "elapsed_time": "1:50:18", "remaining_time": "0:01:26", "throughput": 1033.5, "total_tokens": 6840384} +{"current_steps": 75975, "total_steps": 76960, "loss": 0.0031, "lr": 2.4996319452907925e-08, "epoch": 19.74402286902287, "percentage": 98.72, "elapsed_time": "1:50:19", "remaining_time": "0:01:25", "throughput": 1033.5, "total_tokens": 6840832} +{"current_steps": 75980, "total_steps": 76960, "loss": 0.0558, "lr": 2.474349158587963e-08, "epoch": 19.745322245322246, "percentage": 98.73, "elapsed_time": "1:50:19", "remaining_time": "0:01:25", "throughput": 1033.51, "total_tokens": 6841296} +{"current_steps": 75985, "total_steps": 76960, "loss": 0.1946, "lr": 2.449194822022327e-08, "epoch": 19.74662162162162, "percentage": 98.73, "elapsed_time": "1:50:19", "remaining_time": "0:01:24", "throughput": 1033.51, "total_tokens": 6841760} +{"current_steps": 75990, "total_steps": 76960, "loss": 0.0609, "lr": 2.4241689368878494e-08, "epoch": 19.747920997921, "percentage": 98.74, "elapsed_time": "1:50:20", "remaining_time": "0:01:24", "throughput": 1033.52, "total_tokens": 6842240} +{"current_steps": 75995, "total_steps": 76960, "loss": 0.1413, "lr": 2.3992715044710012e-08, "epoch": 19.749220374220375, "percentage": 98.75, "elapsed_time": "1:50:20", "remaining_time": "0:01:24", "throughput": 1033.53, "total_tokens": 6842704} +{"current_steps": 76000, "total_steps": 76960, "loss": 0.0078, "lr": 2.374502526053257e-08, "epoch": 19.75051975051975, "percentage": 98.75, "elapsed_time": "1:50:21", "remaining_time": "0:01:23", "throughput": 1033.52, "total_tokens": 6843120} +{"current_steps": 76005, "total_steps": 76960, "loss": 0.171, "lr": 2.349862002907488e-08, "epoch": 19.751819126819125, "percentage": 98.76, "elapsed_time": "1:50:21", "remaining_time": "0:01:23", "throughput": 1033.53, "total_tokens": 6843584} +{"current_steps": 76010, "total_steps": 76960, "loss": 0.0009, "lr": 2.325349936301846e-08, "epoch": 19.753118503118504, "percentage": 98.77, "elapsed_time": "1:50:21", "remaining_time": "0:01:22", "throughput": 1033.53, "total_tokens": 6844032} +{"current_steps": 76015, "total_steps": 76960, "loss": 0.4221, "lr": 2.300966327496157e-08, "epoch": 19.75441787941788, "percentage": 98.77, "elapsed_time": "1:50:22", "remaining_time": "0:01:22", "throughput": 1033.54, "total_tokens": 6844512} +{"current_steps": 76020, "total_steps": 76960, "loss": 0.0592, "lr": 2.27671117774525e-08, "epoch": 19.755717255717254, "percentage": 98.78, "elapsed_time": "1:50:22", "remaining_time": "0:01:21", "throughput": 1033.54, "total_tokens": 6844928} +{"current_steps": 76025, "total_steps": 76960, "loss": 0.0016, "lr": 2.2525844882964607e-08, "epoch": 19.757016632016633, "percentage": 98.79, "elapsed_time": "1:50:23", "remaining_time": "0:01:21", "throughput": 1033.54, "total_tokens": 6845376} +{"current_steps": 76030, "total_steps": 76960, "loss": 0.0011, "lr": 2.2285862603901865e-08, "epoch": 19.758316008316008, "percentage": 98.79, "elapsed_time": "1:50:23", "remaining_time": "0:01:21", "throughput": 1033.55, "total_tokens": 6845856} +{"current_steps": 76035, "total_steps": 76960, "loss": 0.0067, "lr": 2.2047164952609944e-08, "epoch": 19.759615384615383, "percentage": 98.8, "elapsed_time": "1:50:24", "remaining_time": "0:01:20", "throughput": 1033.56, "total_tokens": 6846320} +{"current_steps": 76040, "total_steps": 76960, "loss": 0.0047, "lr": 2.1809751941365142e-08, "epoch": 19.760914760914762, "percentage": 98.8, "elapsed_time": "1:50:24", "remaining_time": "0:01:20", "throughput": 1033.56, "total_tokens": 6846752} +{"current_steps": 76045, "total_steps": 76960, "loss": 0.0018, "lr": 2.1573623582377133e-08, "epoch": 19.762214137214137, "percentage": 98.81, "elapsed_time": "1:50:24", "remaining_time": "0:01:19", "throughput": 1033.56, "total_tokens": 6847232} +{"current_steps": 76050, "total_steps": 76960, "loss": 0.0017, "lr": 2.1338779887794534e-08, "epoch": 19.763513513513512, "percentage": 98.82, "elapsed_time": "1:50:25", "remaining_time": "0:01:19", "throughput": 1033.57, "total_tokens": 6847664} +{"current_steps": 76055, "total_steps": 76960, "loss": 0.0627, "lr": 2.1105220869688246e-08, "epoch": 19.76481288981289, "percentage": 98.82, "elapsed_time": "1:50:25", "remaining_time": "0:01:18", "throughput": 1033.56, "total_tokens": 6848080} +{"current_steps": 76060, "total_steps": 76960, "loss": 0.0167, "lr": 2.0872946540076433e-08, "epoch": 19.766112266112266, "percentage": 98.83, "elapsed_time": "1:50:26", "remaining_time": "0:01:18", "throughput": 1033.57, "total_tokens": 6848576} +{"current_steps": 76065, "total_steps": 76960, "loss": 0.1462, "lr": 2.064195691089954e-08, "epoch": 19.76741164241164, "percentage": 98.84, "elapsed_time": "1:50:26", "remaining_time": "0:01:17", "throughput": 1033.57, "total_tokens": 6849008} +{"current_steps": 76070, "total_steps": 76960, "loss": 0.0903, "lr": 2.0412251994042508e-08, "epoch": 19.76871101871102, "percentage": 98.84, "elapsed_time": "1:50:26", "remaining_time": "0:01:17", "throughput": 1033.58, "total_tokens": 6849488} +{"current_steps": 76075, "total_steps": 76960, "loss": 0.001, "lr": 2.018383180131811e-08, "epoch": 19.770010395010395, "percentage": 98.85, "elapsed_time": "1:50:27", "remaining_time": "0:01:17", "throughput": 1033.58, "total_tokens": 6849920} +{"current_steps": 76080, "total_steps": 76960, "loss": 0.044, "lr": 1.995669634447528e-08, "epoch": 19.77130977130977, "percentage": 98.86, "elapsed_time": "1:50:27", "remaining_time": "0:01:16", "throughput": 1033.59, "total_tokens": 6850368} +{"current_steps": 76085, "total_steps": 76960, "loss": 0.0139, "lr": 1.9730845635190788e-08, "epoch": 19.77260914760915, "percentage": 98.86, "elapsed_time": "1:50:28", "remaining_time": "0:01:16", "throughput": 1033.59, "total_tokens": 6850800} +{"current_steps": 76090, "total_steps": 76960, "loss": 0.0009, "lr": 1.950627968508589e-08, "epoch": 19.773908523908524, "percentage": 98.87, "elapsed_time": "1:50:28", "remaining_time": "0:01:15", "throughput": 1033.59, "total_tokens": 6851280} +{"current_steps": 76095, "total_steps": 76960, "loss": 0.1665, "lr": 1.9282998505709693e-08, "epoch": 19.7752079002079, "percentage": 98.88, "elapsed_time": "1:50:29", "remaining_time": "0:01:15", "throughput": 1033.59, "total_tokens": 6851696} +{"current_steps": 76100, "total_steps": 76960, "loss": 0.0001, "lr": 1.906100210854189e-08, "epoch": 19.776507276507278, "percentage": 98.88, "elapsed_time": "1:50:29", "remaining_time": "0:01:14", "throughput": 1033.59, "total_tokens": 6852128} +{"current_steps": 76105, "total_steps": 76960, "loss": 0.117, "lr": 1.8840290505001134e-08, "epoch": 19.777806652806653, "percentage": 98.89, "elapsed_time": "1:50:29", "remaining_time": "0:01:14", "throughput": 1033.6, "total_tokens": 6852608} +{"current_steps": 76110, "total_steps": 76960, "loss": 0.0005, "lr": 1.8620863706442228e-08, "epoch": 19.77910602910603, "percentage": 98.9, "elapsed_time": "1:50:30", "remaining_time": "0:01:14", "throughput": 1033.6, "total_tokens": 6853040} +{"current_steps": 76115, "total_steps": 76960, "loss": 0.0001, "lr": 1.840272172414781e-08, "epoch": 19.780405405405407, "percentage": 98.9, "elapsed_time": "1:50:30", "remaining_time": "0:01:13", "throughput": 1033.6, "total_tokens": 6853472} +{"current_steps": 76120, "total_steps": 76960, "loss": 0.2944, "lr": 1.8185864569336687e-08, "epoch": 19.781704781704782, "percentage": 98.91, "elapsed_time": "1:50:31", "remaining_time": "0:01:13", "throughput": 1033.6, "total_tokens": 6853904} +{"current_steps": 76125, "total_steps": 76960, "loss": 0.1953, "lr": 1.79702922531666e-08, "epoch": 19.783004158004157, "percentage": 98.92, "elapsed_time": "1:50:31", "remaining_time": "0:01:12", "throughput": 1033.61, "total_tokens": 6854384} +{"current_steps": 76130, "total_steps": 76960, "loss": 0.1222, "lr": 1.7756004786717572e-08, "epoch": 19.784303534303533, "percentage": 98.92, "elapsed_time": "1:50:31", "remaining_time": "0:01:12", "throughput": 1033.61, "total_tokens": 6854816} +{"current_steps": 76135, "total_steps": 76960, "loss": 0.039, "lr": 1.7543002181014125e-08, "epoch": 19.78560291060291, "percentage": 98.93, "elapsed_time": "1:50:32", "remaining_time": "0:01:11", "throughput": 1033.61, "total_tokens": 6855264} +{"current_steps": 76140, "total_steps": 76960, "loss": 0.0031, "lr": 1.7331284447011377e-08, "epoch": 19.786902286902286, "percentage": 98.93, "elapsed_time": "1:50:32", "remaining_time": "0:01:11", "throughput": 1033.61, "total_tokens": 6855696} +{"current_steps": 76145, "total_steps": 76960, "loss": 0.128, "lr": 1.712085159559784e-08, "epoch": 19.78820166320166, "percentage": 98.94, "elapsed_time": "1:50:33", "remaining_time": "0:01:10", "throughput": 1033.62, "total_tokens": 6856144} +{"current_steps": 76150, "total_steps": 76960, "loss": 0.5711, "lr": 1.69117036375982e-08, "epoch": 19.78950103950104, "percentage": 98.95, "elapsed_time": "1:50:33", "remaining_time": "0:01:10", "throughput": 1033.62, "total_tokens": 6856592} +{"current_steps": 76155, "total_steps": 76960, "loss": 0.0028, "lr": 1.670384058376495e-08, "epoch": 19.790800415800415, "percentage": 98.95, "elapsed_time": "1:50:33", "remaining_time": "0:01:10", "throughput": 1033.63, "total_tokens": 6857056} +{"current_steps": 76160, "total_steps": 76960, "loss": 0.0715, "lr": 1.6497262444792326e-08, "epoch": 19.79209979209979, "percentage": 98.96, "elapsed_time": "1:50:34", "remaining_time": "0:01:09", "throughput": 1033.63, "total_tokens": 6857488} +{"current_steps": 76165, "total_steps": 76960, "loss": 0.1582, "lr": 1.629196923130516e-08, "epoch": 19.79339916839917, "percentage": 98.97, "elapsed_time": "1:50:34", "remaining_time": "0:01:09", "throughput": 1033.63, "total_tokens": 6857936} +{"current_steps": 76170, "total_steps": 76960, "loss": 0.0332, "lr": 1.608796095385612e-08, "epoch": 19.794698544698544, "percentage": 98.97, "elapsed_time": "1:50:35", "remaining_time": "0:01:08", "throughput": 1033.63, "total_tokens": 6858384} +{"current_steps": 76175, "total_steps": 76960, "loss": 0.0243, "lr": 1.5885237622945136e-08, "epoch": 19.79599792099792, "percentage": 98.98, "elapsed_time": "1:50:35", "remaining_time": "0:01:08", "throughput": 1033.63, "total_tokens": 6858816} +{"current_steps": 76180, "total_steps": 76960, "loss": 0.0034, "lr": 1.5683799248994436e-08, "epoch": 19.7972972972973, "percentage": 98.99, "elapsed_time": "1:50:36", "remaining_time": "0:01:07", "throughput": 1033.63, "total_tokens": 6859248} +{"current_steps": 76185, "total_steps": 76960, "loss": 0.0144, "lr": 1.5483645842362392e-08, "epoch": 19.798596673596673, "percentage": 98.99, "elapsed_time": "1:50:36", "remaining_time": "0:01:07", "throughput": 1033.63, "total_tokens": 6859664} +{"current_steps": 76190, "total_steps": 76960, "loss": 0.0049, "lr": 1.5284777413349106e-08, "epoch": 19.79989604989605, "percentage": 99.0, "elapsed_time": "1:50:36", "remaining_time": "0:01:07", "throughput": 1033.64, "total_tokens": 6860128} +{"current_steps": 76195, "total_steps": 76960, "loss": 0.1375, "lr": 1.508719397217695e-08, "epoch": 19.801195426195427, "percentage": 99.01, "elapsed_time": "1:50:37", "remaining_time": "0:01:06", "throughput": 1033.65, "total_tokens": 6860624} +{"current_steps": 76200, "total_steps": 76960, "loss": 0.0974, "lr": 1.4890895529010019e-08, "epoch": 19.802494802494802, "percentage": 99.01, "elapsed_time": "1:50:37", "remaining_time": "0:01:06", "throughput": 1033.65, "total_tokens": 6861088} +{"current_steps": 76205, "total_steps": 76960, "loss": 0.0001, "lr": 1.4695882093943015e-08, "epoch": 19.803794178794178, "percentage": 99.02, "elapsed_time": "1:50:38", "remaining_time": "0:01:05", "throughput": 1033.66, "total_tokens": 6861536} +{"current_steps": 76210, "total_steps": 76960, "loss": 0.1276, "lr": 1.4502153677006802e-08, "epoch": 19.805093555093556, "percentage": 99.03, "elapsed_time": "1:50:38", "remaining_time": "0:01:05", "throughput": 1033.66, "total_tokens": 6861968} +{"current_steps": 76215, "total_steps": 76960, "loss": 0.0076, "lr": 1.4309710288165634e-08, "epoch": 19.80639293139293, "percentage": 99.03, "elapsed_time": "1:50:38", "remaining_time": "0:01:04", "throughput": 1033.66, "total_tokens": 6862400} +{"current_steps": 76220, "total_steps": 76960, "loss": 0.0028, "lr": 1.4118551937314372e-08, "epoch": 19.807692307692307, "percentage": 99.04, "elapsed_time": "1:50:39", "remaining_time": "0:01:04", "throughput": 1033.66, "total_tokens": 6862848} +{"current_steps": 76225, "total_steps": 76960, "loss": 0.0002, "lr": 1.3928678634289593e-08, "epoch": 19.808991683991685, "percentage": 99.04, "elapsed_time": "1:50:39", "remaining_time": "0:01:04", "throughput": 1033.66, "total_tokens": 6863296} +{"current_steps": 76230, "total_steps": 76960, "loss": 0.0014, "lr": 1.3740090388850158e-08, "epoch": 19.81029106029106, "percentage": 99.05, "elapsed_time": "1:50:40", "remaining_time": "0:01:03", "throughput": 1033.66, "total_tokens": 6863712} +{"current_steps": 76235, "total_steps": 76960, "loss": 0.0011, "lr": 1.3552787210699413e-08, "epoch": 19.811590436590436, "percentage": 99.06, "elapsed_time": "1:50:40", "remaining_time": "0:01:03", "throughput": 1033.66, "total_tokens": 6864144} +{"current_steps": 76240, "total_steps": 76960, "loss": 0.0002, "lr": 1.3366769109471321e-08, "epoch": 19.812889812889814, "percentage": 99.06, "elapsed_time": "1:50:41", "remaining_time": "0:01:02", "throughput": 1033.66, "total_tokens": 6864576} +{"current_steps": 76245, "total_steps": 76960, "loss": 0.3562, "lr": 1.3182036094730454e-08, "epoch": 19.81418918918919, "percentage": 99.07, "elapsed_time": "1:50:41", "remaining_time": "0:01:02", "throughput": 1033.67, "total_tokens": 6865024} +{"current_steps": 76250, "total_steps": 76960, "loss": 0.0005, "lr": 1.2998588175977544e-08, "epoch": 19.815488565488565, "percentage": 99.08, "elapsed_time": "1:50:41", "remaining_time": "0:01:01", "throughput": 1033.67, "total_tokens": 6865504} +{"current_steps": 76255, "total_steps": 76960, "loss": 0.0002, "lr": 1.2816425362649487e-08, "epoch": 19.816787941787943, "percentage": 99.08, "elapsed_time": "1:50:42", "remaining_time": "0:01:01", "throughput": 1033.68, "total_tokens": 6865968} +{"current_steps": 76260, "total_steps": 76960, "loss": 0.0618, "lr": 1.263554766411379e-08, "epoch": 19.81808731808732, "percentage": 99.09, "elapsed_time": "1:50:42", "remaining_time": "0:01:00", "throughput": 1033.68, "total_tokens": 6866432} +{"current_steps": 76265, "total_steps": 76960, "loss": 0.0001, "lr": 1.245595508967412e-08, "epoch": 19.819386694386694, "percentage": 99.1, "elapsed_time": "1:50:43", "remaining_time": "0:01:00", "throughput": 1033.69, "total_tokens": 6866896} +{"current_steps": 76270, "total_steps": 76960, "loss": 0.0001, "lr": 1.2277647648567537e-08, "epoch": 19.820686070686072, "percentage": 99.1, "elapsed_time": "1:50:43", "remaining_time": "0:01:00", "throughput": 1033.7, "total_tokens": 6867376} +{"current_steps": 76275, "total_steps": 76960, "loss": 0.2063, "lr": 1.2100625349961702e-08, "epoch": 19.821985446985448, "percentage": 99.11, "elapsed_time": "1:50:43", "remaining_time": "0:00:59", "throughput": 1033.7, "total_tokens": 6867808} +{"current_steps": 76280, "total_steps": 76960, "loss": 0.0066, "lr": 1.1924888202963224e-08, "epoch": 19.823284823284823, "percentage": 99.12, "elapsed_time": "1:50:44", "remaining_time": "0:00:59", "throughput": 1033.7, "total_tokens": 6868272} +{"current_steps": 76285, "total_steps": 76960, "loss": 0.0853, "lr": 1.1750436216612092e-08, "epoch": 19.8245841995842, "percentage": 99.12, "elapsed_time": "1:50:44", "remaining_time": "0:00:58", "throughput": 1033.71, "total_tokens": 6868752} +{"current_steps": 76290, "total_steps": 76960, "loss": 0.0533, "lr": 1.1577269399876135e-08, "epoch": 19.825883575883577, "percentage": 99.13, "elapsed_time": "1:50:45", "remaining_time": "0:00:58", "throughput": 1033.71, "total_tokens": 6869184} +{"current_steps": 76295, "total_steps": 76960, "loss": 0.0023, "lr": 1.1405387761664887e-08, "epoch": 19.82718295218295, "percentage": 99.14, "elapsed_time": "1:50:45", "remaining_time": "0:00:57", "throughput": 1033.72, "total_tokens": 6869648} +{"current_steps": 76300, "total_steps": 76960, "loss": 0.0003, "lr": 1.1234791310818504e-08, "epoch": 19.828482328482327, "percentage": 99.14, "elapsed_time": "1:50:45", "remaining_time": "0:00:57", "throughput": 1033.72, "total_tokens": 6870080} +{"current_steps": 76305, "total_steps": 76960, "loss": 0.0026, "lr": 1.1065480056110522e-08, "epoch": 19.829781704781706, "percentage": 99.15, "elapsed_time": "1:50:46", "remaining_time": "0:00:57", "throughput": 1033.72, "total_tokens": 6870528} +{"current_steps": 76310, "total_steps": 76960, "loss": 0.0223, "lr": 1.0897454006245089e-08, "epoch": 19.83108108108108, "percentage": 99.16, "elapsed_time": "1:50:46", "remaining_time": "0:00:56", "throughput": 1033.72, "total_tokens": 6870944} +{"current_steps": 76315, "total_steps": 76960, "loss": 0.0105, "lr": 1.0730713169868067e-08, "epoch": 19.832380457380456, "percentage": 99.16, "elapsed_time": "1:50:47", "remaining_time": "0:00:56", "throughput": 1033.72, "total_tokens": 6871392} +{"current_steps": 76320, "total_steps": 76960, "loss": 0.0081, "lr": 1.056525755555593e-08, "epoch": 19.833679833679835, "percentage": 99.17, "elapsed_time": "1:50:47", "remaining_time": "0:00:55", "throughput": 1033.72, "total_tokens": 6871840} +{"current_steps": 76325, "total_steps": 76960, "loss": 0.0007, "lr": 1.040108717181576e-08, "epoch": 19.83497920997921, "percentage": 99.17, "elapsed_time": "1:50:48", "remaining_time": "0:00:55", "throughput": 1033.73, "total_tokens": 6872304} +{"current_steps": 76330, "total_steps": 76960, "loss": 0.0081, "lr": 1.0238202027090804e-08, "epoch": 19.836278586278585, "percentage": 99.18, "elapsed_time": "1:50:48", "remaining_time": "0:00:54", "throughput": 1033.73, "total_tokens": 6872736} +{"current_steps": 76335, "total_steps": 76960, "loss": 0.0765, "lr": 1.0076602129757696e-08, "epoch": 19.837577962577964, "percentage": 99.19, "elapsed_time": "1:50:48", "remaining_time": "0:00:54", "throughput": 1033.73, "total_tokens": 6873184} +{"current_steps": 76340, "total_steps": 76960, "loss": 0.0005, "lr": 9.916287488132003e-09, "epoch": 19.83887733887734, "percentage": 99.19, "elapsed_time": "1:50:49", "remaining_time": "0:00:54", "throughput": 1033.73, "total_tokens": 6873616} +{"current_steps": 76345, "total_steps": 76960, "loss": 0.0001, "lr": 9.757258110454359e-09, "epoch": 19.840176715176714, "percentage": 99.2, "elapsed_time": "1:50:49", "remaining_time": "0:00:53", "throughput": 1033.74, "total_tokens": 6874080} +{"current_steps": 76350, "total_steps": 76960, "loss": 0.0367, "lr": 9.599514004904331e-09, "epoch": 19.841476091476093, "percentage": 99.21, "elapsed_time": "1:50:50", "remaining_time": "0:00:53", "throughput": 1033.74, "total_tokens": 6874528} +{"current_steps": 76355, "total_steps": 76960, "loss": 0.0984, "lr": 9.443055179597648e-09, "epoch": 19.842775467775468, "percentage": 99.21, "elapsed_time": "1:50:50", "remaining_time": "0:00:52", "throughput": 1033.74, "total_tokens": 6874944} +{"current_steps": 76360, "total_steps": 76960, "loss": 0.0713, "lr": 9.287881642577878e-09, "epoch": 19.844074844074843, "percentage": 99.22, "elapsed_time": "1:50:50", "remaining_time": "0:00:52", "throughput": 1033.75, "total_tokens": 6875424} +{"current_steps": 76365, "total_steps": 76960, "loss": 0.0129, "lr": 9.133993401830298e-09, "epoch": 19.84537422037422, "percentage": 99.23, "elapsed_time": "1:50:51", "remaining_time": "0:00:51", "throughput": 1033.75, "total_tokens": 6875856} +{"current_steps": 76370, "total_steps": 76960, "loss": 0.0001, "lr": 8.981390465262474e-09, "epoch": 19.846673596673597, "percentage": 99.23, "elapsed_time": "1:50:51", "remaining_time": "0:00:51", "throughput": 1033.75, "total_tokens": 6876304} +{"current_steps": 76375, "total_steps": 76960, "loss": 0.3114, "lr": 8.83007284072923e-09, "epoch": 19.847972972972972, "percentage": 99.24, "elapsed_time": "1:50:52", "remaining_time": "0:00:50", "throughput": 1033.75, "total_tokens": 6876736} +{"current_steps": 76380, "total_steps": 76960, "loss": 0.0009, "lr": 8.680040536010458e-09, "epoch": 19.84927234927235, "percentage": 99.25, "elapsed_time": "1:50:52", "remaining_time": "0:00:50", "throughput": 1033.75, "total_tokens": 6877168} +{"current_steps": 76385, "total_steps": 76960, "loss": 0.0008, "lr": 8.531293558824982e-09, "epoch": 19.850571725571726, "percentage": 99.25, "elapsed_time": "1:50:53", "remaining_time": "0:00:50", "throughput": 1033.76, "total_tokens": 6877616} +{"current_steps": 76390, "total_steps": 76960, "loss": 0.0193, "lr": 8.383831916816686e-09, "epoch": 19.8518711018711, "percentage": 99.26, "elapsed_time": "1:50:53", "remaining_time": "0:00:49", "throughput": 1033.76, "total_tokens": 6878080} +{"current_steps": 76395, "total_steps": 76960, "loss": 0.0249, "lr": 8.237655617576723e-09, "epoch": 19.85317047817048, "percentage": 99.27, "elapsed_time": "1:50:53", "remaining_time": "0:00:49", "throughput": 1033.77, "total_tokens": 6878544} +{"current_steps": 76400, "total_steps": 76960, "loss": 0.0025, "lr": 8.092764668618524e-09, "epoch": 19.854469854469855, "percentage": 99.27, "elapsed_time": "1:50:54", "remaining_time": "0:00:48", "throughput": 1033.77, "total_tokens": 6878976} +{"current_steps": 76405, "total_steps": 76960, "loss": 0.0219, "lr": 7.949159077397238e-09, "epoch": 19.85576923076923, "percentage": 99.28, "elapsed_time": "1:50:54", "remaining_time": "0:00:48", "throughput": 1033.78, "total_tokens": 6879456} +{"current_steps": 76410, "total_steps": 76960, "loss": 0.0785, "lr": 7.80683885129585e-09, "epoch": 19.85706860706861, "percentage": 99.29, "elapsed_time": "1:50:55", "remaining_time": "0:00:47", "throughput": 1033.78, "total_tokens": 6879888} +{"current_steps": 76415, "total_steps": 76960, "loss": 0.0053, "lr": 7.665803997633503e-09, "epoch": 19.858367983367984, "percentage": 99.29, "elapsed_time": "1:50:55", "remaining_time": "0:00:47", "throughput": 1033.78, "total_tokens": 6880352} +{"current_steps": 76420, "total_steps": 76960, "loss": 0.0046, "lr": 7.52605452366828e-09, "epoch": 19.85966735966736, "percentage": 99.3, "elapsed_time": "1:50:55", "remaining_time": "0:00:47", "throughput": 1033.78, "total_tokens": 6880768} +{"current_steps": 76425, "total_steps": 76960, "loss": 0.0644, "lr": 7.387590436583325e-09, "epoch": 19.860966735966738, "percentage": 99.3, "elapsed_time": "1:50:56", "remaining_time": "0:00:46", "throughput": 1033.78, "total_tokens": 6881168} +{"current_steps": 76430, "total_steps": 76960, "loss": 0.0005, "lr": 7.250411743500718e-09, "epoch": 19.862266112266113, "percentage": 99.31, "elapsed_time": "1:50:56", "remaining_time": "0:00:46", "throughput": 1033.78, "total_tokens": 6881632} +{"current_steps": 76435, "total_steps": 76960, "loss": 0.0013, "lr": 7.114518451478702e-09, "epoch": 19.863565488565488, "percentage": 99.32, "elapsed_time": "1:50:57", "remaining_time": "0:00:45", "throughput": 1033.79, "total_tokens": 6882096} +{"current_steps": 76440, "total_steps": 76960, "loss": 0.0841, "lr": 6.979910567500581e-09, "epoch": 19.864864864864863, "percentage": 99.32, "elapsed_time": "1:50:57", "remaining_time": "0:00:45", "throughput": 1033.79, "total_tokens": 6882544} +{"current_steps": 76445, "total_steps": 76960, "loss": 0.1963, "lr": 6.8465880984941444e-09, "epoch": 19.866164241164242, "percentage": 99.33, "elapsed_time": "1:50:57", "remaining_time": "0:00:44", "throughput": 1033.8, "total_tokens": 6883008} +{"current_steps": 76450, "total_steps": 76960, "loss": 0.0197, "lr": 6.714551051317796e-09, "epoch": 19.867463617463617, "percentage": 99.34, "elapsed_time": "1:50:58", "remaining_time": "0:00:44", "throughput": 1033.8, "total_tokens": 6883456} +{"current_steps": 76455, "total_steps": 76960, "loss": 0.0011, "lr": 6.583799432755e-09, "epoch": 19.868762993762992, "percentage": 99.34, "elapsed_time": "1:50:58", "remaining_time": "0:00:43", "throughput": 1033.81, "total_tokens": 6883936} +{"current_steps": 76460, "total_steps": 76960, "loss": 0.0995, "lr": 6.454333249536482e-09, "epoch": 19.87006237006237, "percentage": 99.35, "elapsed_time": "1:50:59", "remaining_time": "0:00:43", "throughput": 1033.82, "total_tokens": 6884448} +{"current_steps": 76465, "total_steps": 76960, "loss": 0.0009, "lr": 6.326152508320804e-09, "epoch": 19.871361746361746, "percentage": 99.36, "elapsed_time": "1:50:59", "remaining_time": "0:00:43", "throughput": 1033.83, "total_tokens": 6884960} +{"current_steps": 76470, "total_steps": 76960, "loss": 0.0172, "lr": 6.199257215697141e-09, "epoch": 19.87266112266112, "percentage": 99.36, "elapsed_time": "1:51:00", "remaining_time": "0:00:42", "throughput": 1033.84, "total_tokens": 6885472} +{"current_steps": 76475, "total_steps": 76960, "loss": 0.0822, "lr": 6.073647378196379e-09, "epoch": 19.8739604989605, "percentage": 99.37, "elapsed_time": "1:51:00", "remaining_time": "0:00:42", "throughput": 1033.84, "total_tokens": 6885888} +{"current_steps": 76480, "total_steps": 76960, "loss": 0.2098, "lr": 5.94932300227169e-09, "epoch": 19.875259875259875, "percentage": 99.38, "elapsed_time": "1:51:00", "remaining_time": "0:00:41", "throughput": 1033.85, "total_tokens": 6886368} +{"current_steps": 76485, "total_steps": 76960, "loss": 0.0026, "lr": 5.8262840943235085e-09, "epoch": 19.87655925155925, "percentage": 99.38, "elapsed_time": "1:51:01", "remaining_time": "0:00:41", "throughput": 1033.85, "total_tokens": 6886816} +{"current_steps": 76490, "total_steps": 76960, "loss": 0.3259, "lr": 5.7045306606801075e-09, "epoch": 19.87785862785863, "percentage": 99.39, "elapsed_time": "1:51:01", "remaining_time": "0:00:40", "throughput": 1033.85, "total_tokens": 6887248} +{"current_steps": 76495, "total_steps": 76960, "loss": 0.0005, "lr": 5.584062707597593e-09, "epoch": 19.879158004158004, "percentage": 99.4, "elapsed_time": "1:51:02", "remaining_time": "0:00:40", "throughput": 1033.86, "total_tokens": 6887728} +{"current_steps": 76500, "total_steps": 76960, "loss": 0.1159, "lr": 5.46488024127656e-09, "epoch": 19.88045738045738, "percentage": 99.4, "elapsed_time": "1:51:02", "remaining_time": "0:00:40", "throughput": 1033.86, "total_tokens": 6888160} +{"current_steps": 76505, "total_steps": 76960, "loss": 0.2307, "lr": 5.34698326784544e-09, "epoch": 19.881756756756758, "percentage": 99.41, "elapsed_time": "1:51:02", "remaining_time": "0:00:39", "throughput": 1033.87, "total_tokens": 6888640} +{"current_steps": 76510, "total_steps": 76960, "loss": 0.0098, "lr": 5.230371793368827e-09, "epoch": 19.883056133056133, "percentage": 99.42, "elapsed_time": "1:51:03", "remaining_time": "0:00:39", "throughput": 1033.87, "total_tokens": 6889072} +{"current_steps": 76515, "total_steps": 76960, "loss": 0.002, "lr": 5.115045823841924e-09, "epoch": 19.884355509355508, "percentage": 99.42, "elapsed_time": "1:51:03", "remaining_time": "0:00:38", "throughput": 1033.87, "total_tokens": 6889504} +{"current_steps": 76520, "total_steps": 76960, "loss": 0.0234, "lr": 5.001005365196098e-09, "epoch": 19.885654885654887, "percentage": 99.43, "elapsed_time": "1:51:04", "remaining_time": "0:00:38", "throughput": 1033.87, "total_tokens": 6889936} +{"current_steps": 76525, "total_steps": 76960, "loss": 0.0001, "lr": 4.888250423298879e-09, "epoch": 19.886954261954262, "percentage": 99.43, "elapsed_time": "1:51:04", "remaining_time": "0:00:37", "throughput": 1033.87, "total_tokens": 6890384} +{"current_steps": 76530, "total_steps": 76960, "loss": 0.0055, "lr": 4.776781003948405e-09, "epoch": 19.888253638253637, "percentage": 99.44, "elapsed_time": "1:51:05", "remaining_time": "0:00:37", "throughput": 1033.87, "total_tokens": 6890800} +{"current_steps": 76535, "total_steps": 76960, "loss": 0.0007, "lr": 4.666597112876203e-09, "epoch": 19.889553014553016, "percentage": 99.45, "elapsed_time": "1:51:05", "remaining_time": "0:00:37", "throughput": 1033.88, "total_tokens": 6891264} +{"current_steps": 76540, "total_steps": 76960, "loss": 0.1765, "lr": 4.557698755749962e-09, "epoch": 19.89085239085239, "percentage": 99.45, "elapsed_time": "1:51:05", "remaining_time": "0:00:36", "throughput": 1033.88, "total_tokens": 6891712} +{"current_steps": 76545, "total_steps": 76960, "loss": 0.028, "lr": 4.450085938170756e-09, "epoch": 19.892151767151766, "percentage": 99.46, "elapsed_time": "1:51:06", "remaining_time": "0:00:36", "throughput": 1033.88, "total_tokens": 6892160} +{"current_steps": 76550, "total_steps": 76960, "loss": 0.003, "lr": 4.3437586656758236e-09, "epoch": 19.893451143451145, "percentage": 99.47, "elapsed_time": "1:51:06", "remaining_time": "0:00:35", "throughput": 1033.89, "total_tokens": 6892640} +{"current_steps": 76555, "total_steps": 76960, "loss": 0.0046, "lr": 4.238716943727461e-09, "epoch": 19.89475051975052, "percentage": 99.47, "elapsed_time": "1:51:07", "remaining_time": "0:00:35", "throughput": 1033.9, "total_tokens": 6893136} +{"current_steps": 76560, "total_steps": 76960, "loss": 0.0007, "lr": 4.1349607777352305e-09, "epoch": 19.896049896049895, "percentage": 99.48, "elapsed_time": "1:51:07", "remaining_time": "0:00:34", "throughput": 1033.91, "total_tokens": 6893584} +{"current_steps": 76565, "total_steps": 76960, "loss": 0.0018, "lr": 4.032490173030978e-09, "epoch": 19.897349272349274, "percentage": 99.49, "elapsed_time": "1:51:07", "remaining_time": "0:00:34", "throughput": 1033.91, "total_tokens": 6894048} +{"current_steps": 76570, "total_steps": 76960, "loss": 0.274, "lr": 3.931305134882712e-09, "epoch": 19.89864864864865, "percentage": 99.49, "elapsed_time": "1:51:08", "remaining_time": "0:00:33", "throughput": 1033.91, "total_tokens": 6894496} +{"current_steps": 76575, "total_steps": 76960, "loss": 0.0008, "lr": 3.831405668500154e-09, "epoch": 19.899948024948024, "percentage": 99.5, "elapsed_time": "1:51:08", "remaining_time": "0:00:33", "throughput": 1033.92, "total_tokens": 6894944} +{"current_steps": 76580, "total_steps": 76960, "loss": 0.4099, "lr": 3.732791779018086e-09, "epoch": 19.901247401247403, "percentage": 99.51, "elapsed_time": "1:51:09", "remaining_time": "0:00:33", "throughput": 1033.92, "total_tokens": 6895376} +{"current_steps": 76585, "total_steps": 76960, "loss": 0.0253, "lr": 3.6354634715102255e-09, "epoch": 19.902546777546778, "percentage": 99.51, "elapsed_time": "1:51:09", "remaining_time": "0:00:32", "throughput": 1033.92, "total_tokens": 6895808} +{"current_steps": 76590, "total_steps": 76960, "loss": 0.3439, "lr": 3.5394207509781287e-09, "epoch": 19.903846153846153, "percentage": 99.52, "elapsed_time": "1:51:10", "remaining_time": "0:00:32", "throughput": 1033.92, "total_tokens": 6896256} +{"current_steps": 76595, "total_steps": 76960, "loss": 0.0131, "lr": 3.444663622365063e-09, "epoch": 19.90514553014553, "percentage": 99.53, "elapsed_time": "1:51:10", "remaining_time": "0:00:31", "throughput": 1033.93, "total_tokens": 6896736} +{"current_steps": 76600, "total_steps": 76960, "loss": 0.2191, "lr": 3.351192090544908e-09, "epoch": 19.906444906444907, "percentage": 99.53, "elapsed_time": "1:51:10", "remaining_time": "0:00:31", "throughput": 1033.94, "total_tokens": 6897216} +{"current_steps": 76605, "total_steps": 76960, "loss": 0.2251, "lr": 3.2590061603221535e-09, "epoch": 19.907744282744282, "percentage": 99.54, "elapsed_time": "1:51:11", "remaining_time": "0:00:30", "throughput": 1033.94, "total_tokens": 6897648} +{"current_steps": 76610, "total_steps": 76960, "loss": 0.1483, "lr": 3.1681058364402272e-09, "epoch": 19.909043659043657, "percentage": 99.55, "elapsed_time": "1:51:11", "remaining_time": "0:00:30", "throughput": 1033.94, "total_tokens": 6898096} +{"current_steps": 76615, "total_steps": 76960, "loss": 0.0005, "lr": 3.078491123573168e-09, "epoch": 19.910343035343036, "percentage": 99.55, "elapsed_time": "1:51:12", "remaining_time": "0:00:30", "throughput": 1033.95, "total_tokens": 6898560} +{"current_steps": 76620, "total_steps": 76960, "loss": 0.0055, "lr": 2.9901620263284026e-09, "epoch": 19.91164241164241, "percentage": 99.56, "elapsed_time": "1:51:12", "remaining_time": "0:00:29", "throughput": 1033.95, "total_tokens": 6898992} +{"current_steps": 76625, "total_steps": 76960, "loss": 0.1088, "lr": 2.9031185492522926e-09, "epoch": 19.912941787941786, "percentage": 99.56, "elapsed_time": "1:51:12", "remaining_time": "0:00:29", "throughput": 1033.95, "total_tokens": 6899424} +{"current_steps": 76630, "total_steps": 76960, "loss": 0.0001, "lr": 2.817360696819038e-09, "epoch": 19.914241164241165, "percentage": 99.57, "elapsed_time": "1:51:13", "remaining_time": "0:00:28", "throughput": 1033.95, "total_tokens": 6899872} +{"current_steps": 76635, "total_steps": 76960, "loss": 0.0016, "lr": 2.732888473441775e-09, "epoch": 19.91554054054054, "percentage": 99.58, "elapsed_time": "1:51:13", "remaining_time": "0:00:28", "throughput": 1033.95, "total_tokens": 6900288} +{"current_steps": 76640, "total_steps": 76960, "loss": 0.3209, "lr": 2.649701883461475e-09, "epoch": 19.916839916839916, "percentage": 99.58, "elapsed_time": "1:51:14", "remaining_time": "0:00:27", "throughput": 1033.96, "total_tokens": 6900784} +{"current_steps": 76645, "total_steps": 76960, "loss": 0.0545, "lr": 2.5678009311608243e-09, "epoch": 19.918139293139294, "percentage": 99.59, "elapsed_time": "1:51:14", "remaining_time": "0:00:27", "throughput": 1033.96, "total_tokens": 6901232} +{"current_steps": 76650, "total_steps": 76960, "loss": 0.0007, "lr": 2.4871856207475673e-09, "epoch": 19.91943866943867, "percentage": 99.6, "elapsed_time": "1:51:14", "remaining_time": "0:00:26", "throughput": 1033.97, "total_tokens": 6901728} +{"current_steps": 76655, "total_steps": 76960, "loss": 0.2168, "lr": 2.407855956368388e-09, "epoch": 19.920738045738045, "percentage": 99.6, "elapsed_time": "1:51:15", "remaining_time": "0:00:26", "throughput": 1033.97, "total_tokens": 6902176} +{"current_steps": 76660, "total_steps": 76960, "loss": 0.0013, "lr": 2.329811942108906e-09, "epoch": 19.922037422037423, "percentage": 99.61, "elapsed_time": "1:51:15", "remaining_time": "0:00:26", "throughput": 1033.98, "total_tokens": 6902624} +{"current_steps": 76665, "total_steps": 76960, "loss": 0.2307, "lr": 2.2530535819742514e-09, "epoch": 19.9233367983368, "percentage": 99.62, "elapsed_time": "1:51:16", "remaining_time": "0:00:25", "throughput": 1033.98, "total_tokens": 6903072} +{"current_steps": 76670, "total_steps": 76960, "loss": 0.357, "lr": 2.177580879919594e-09, "epoch": 19.924636174636174, "percentage": 99.62, "elapsed_time": "1:51:16", "remaining_time": "0:00:25", "throughput": 1033.98, "total_tokens": 6903504} +{"current_steps": 76675, "total_steps": 76960, "loss": 0.0026, "lr": 2.1033938398223872e-09, "epoch": 19.925935550935552, "percentage": 99.63, "elapsed_time": "1:51:17", "remaining_time": "0:00:24", "throughput": 1033.99, "total_tokens": 6904000} +{"current_steps": 76680, "total_steps": 76960, "loss": 0.0004, "lr": 2.0304924655017986e-09, "epoch": 19.927234927234927, "percentage": 99.64, "elapsed_time": "1:51:17", "remaining_time": "0:00:24", "throughput": 1033.99, "total_tokens": 6904432} +{"current_steps": 76685, "total_steps": 76960, "loss": 0.0289, "lr": 1.9588767607020553e-09, "epoch": 19.928534303534303, "percentage": 99.64, "elapsed_time": "1:51:17", "remaining_time": "0:00:23", "throughput": 1034.01, "total_tokens": 6904960} +{"current_steps": 76690, "total_steps": 76960, "loss": 0.0048, "lr": 1.8885467291090973e-09, "epoch": 19.92983367983368, "percentage": 99.65, "elapsed_time": "1:51:18", "remaining_time": "0:00:23", "throughput": 1034.01, "total_tokens": 6905440} +{"current_steps": 76695, "total_steps": 76960, "loss": 0.0693, "lr": 1.8195023743422523e-09, "epoch": 19.931133056133056, "percentage": 99.66, "elapsed_time": "1:51:18", "remaining_time": "0:00:23", "throughput": 1034.02, "total_tokens": 6905888} +{"current_steps": 76700, "total_steps": 76960, "loss": 0.0006, "lr": 1.7517436999486825e-09, "epoch": 19.93243243243243, "percentage": 99.66, "elapsed_time": "1:51:19", "remaining_time": "0:00:22", "throughput": 1034.02, "total_tokens": 6906352} +{"current_steps": 76705, "total_steps": 76960, "loss": 0.0036, "lr": 1.6852707094172636e-09, "epoch": 19.93373180873181, "percentage": 99.67, "elapsed_time": "1:51:19", "remaining_time": "0:00:22", "throughput": 1034.03, "total_tokens": 6906816} +{"current_steps": 76710, "total_steps": 76960, "loss": 0.0137, "lr": 1.620083406161932e-09, "epoch": 19.935031185031185, "percentage": 99.68, "elapsed_time": "1:51:19", "remaining_time": "0:00:21", "throughput": 1034.03, "total_tokens": 6907248} +{"current_steps": 76715, "total_steps": 76960, "loss": 0.0051, "lr": 1.5561817935411116e-09, "epoch": 19.93633056133056, "percentage": 99.68, "elapsed_time": "1:51:20", "remaining_time": "0:00:21", "throughput": 1034.03, "total_tokens": 6907712} +{"current_steps": 76720, "total_steps": 76960, "loss": 0.4065, "lr": 1.493565874835512e-09, "epoch": 19.93762993762994, "percentage": 99.69, "elapsed_time": "1:51:20", "remaining_time": "0:00:20", "throughput": 1034.04, "total_tokens": 6908192} +{"current_steps": 76725, "total_steps": 76960, "loss": 0.0016, "lr": 1.4322356532703308e-09, "epoch": 19.938929313929314, "percentage": 99.69, "elapsed_time": "1:51:21", "remaining_time": "0:00:20", "throughput": 1034.04, "total_tokens": 6908640} +{"current_steps": 76730, "total_steps": 76960, "loss": 0.0769, "lr": 1.3721911319958258e-09, "epoch": 19.94022869022869, "percentage": 99.7, "elapsed_time": "1:51:21", "remaining_time": "0:00:20", "throughput": 1034.05, "total_tokens": 6909088} +{"current_steps": 76735, "total_steps": 76960, "loss": 0.1907, "lr": 1.3134323141039683e-09, "epoch": 19.941528066528065, "percentage": 99.71, "elapsed_time": "1:51:22", "remaining_time": "0:00:19", "throughput": 1034.05, "total_tokens": 6909536} +{"current_steps": 76740, "total_steps": 76960, "loss": 0.1245, "lr": 1.255959202614565e-09, "epoch": 19.942827442827443, "percentage": 99.71, "elapsed_time": "1:51:22", "remaining_time": "0:00:19", "throughput": 1034.05, "total_tokens": 6910000} +{"current_steps": 76745, "total_steps": 76960, "loss": 0.0234, "lr": 1.199771800480809e-09, "epoch": 19.94412681912682, "percentage": 99.72, "elapsed_time": "1:51:22", "remaining_time": "0:00:18", "throughput": 1034.05, "total_tokens": 6910432} +{"current_steps": 76750, "total_steps": 76960, "loss": 0.1204, "lr": 1.1448701105976068e-09, "epoch": 19.945426195426194, "percentage": 99.73, "elapsed_time": "1:51:23", "remaining_time": "0:00:18", "throughput": 1034.06, "total_tokens": 6910880} +{"current_steps": 76755, "total_steps": 76960, "loss": 0.2203, "lr": 1.0912541357877004e-09, "epoch": 19.946725571725572, "percentage": 99.73, "elapsed_time": "1:51:23", "remaining_time": "0:00:17", "throughput": 1034.06, "total_tokens": 6911312} +{"current_steps": 76760, "total_steps": 76960, "loss": 0.0422, "lr": 1.0389238788072187e-09, "epoch": 19.948024948024948, "percentage": 99.74, "elapsed_time": "1:51:24", "remaining_time": "0:00:17", "throughput": 1034.07, "total_tokens": 6911792} +{"current_steps": 76765, "total_steps": 76960, "loss": 0.0007, "lr": 9.878793423456767e-10, "epoch": 19.949324324324323, "percentage": 99.75, "elapsed_time": "1:51:24", "remaining_time": "0:00:16", "throughput": 1034.07, "total_tokens": 6912240} +{"current_steps": 76770, "total_steps": 76960, "loss": 0.1742, "lr": 9.381205290315276e-10, "epoch": 19.9506237006237, "percentage": 99.75, "elapsed_time": "1:51:24", "remaining_time": "0:00:16", "throughput": 1034.07, "total_tokens": 6912672} +{"current_steps": 76775, "total_steps": 76960, "loss": 0.0017, "lr": 8.896474414238354e-10, "epoch": 19.951923076923077, "percentage": 99.76, "elapsed_time": "1:51:25", "remaining_time": "0:00:16", "throughput": 1034.08, "total_tokens": 6913152} +{"current_steps": 76780, "total_steps": 76960, "loss": 0.008, "lr": 8.424600820122752e-10, "epoch": 19.953222453222452, "percentage": 99.77, "elapsed_time": "1:51:25", "remaining_time": "0:00:15", "throughput": 1034.08, "total_tokens": 6913616} +{"current_steps": 76785, "total_steps": 76960, "loss": 0.0421, "lr": 7.965584532282355e-10, "epoch": 19.95452182952183, "percentage": 99.77, "elapsed_time": "1:51:26", "remaining_time": "0:00:15", "throughput": 1034.08, "total_tokens": 6914016} +{"current_steps": 76790, "total_steps": 76960, "loss": 0.0009, "lr": 7.519425574281647e-10, "epoch": 19.955821205821206, "percentage": 99.78, "elapsed_time": "1:51:26", "remaining_time": "0:00:14", "throughput": 1034.08, "total_tokens": 6914464} +{"current_steps": 76795, "total_steps": 76960, "loss": 0.1222, "lr": 7.086123969102243e-10, "epoch": 19.95712058212058, "percentage": 99.79, "elapsed_time": "1:51:26", "remaining_time": "0:00:14", "throughput": 1034.09, "total_tokens": 6914928} +{"current_steps": 76800, "total_steps": 76960, "loss": 0.0004, "lr": 6.665679739031871e-10, "epoch": 19.95841995841996, "percentage": 99.79, "elapsed_time": "1:51:27", "remaining_time": "0:00:13", "throughput": 1034.09, "total_tokens": 6915376} +{"current_steps": 76805, "total_steps": 76960, "loss": 0.0587, "lr": 6.258092905636614e-10, "epoch": 19.959719334719335, "percentage": 99.8, "elapsed_time": "1:51:27", "remaining_time": "0:00:13", "throughput": 1034.09, "total_tokens": 6915824} +{"current_steps": 76810, "total_steps": 76960, "loss": 0.0001, "lr": 5.863363489955198e-10, "epoch": 19.96101871101871, "percentage": 99.81, "elapsed_time": "1:51:28", "remaining_time": "0:00:13", "throughput": 1034.1, "total_tokens": 6916288} +{"current_steps": 76815, "total_steps": 76960, "loss": 0.0918, "lr": 5.481491512249193e-10, "epoch": 19.96231808731809, "percentage": 99.81, "elapsed_time": "1:51:28", "remaining_time": "0:00:12", "throughput": 1034.1, "total_tokens": 6916752} +{"current_steps": 76820, "total_steps": 76960, "loss": 0.001, "lr": 5.11247699214179e-10, "epoch": 19.963617463617464, "percentage": 99.82, "elapsed_time": "1:51:29", "remaining_time": "0:00:12", "throughput": 1034.1, "total_tokens": 6917168} +{"current_steps": 76825, "total_steps": 76960, "loss": 0.0145, "lr": 4.75631994864556e-10, "epoch": 19.96491683991684, "percentage": 99.82, "elapsed_time": "1:51:29", "remaining_time": "0:00:11", "throughput": 1034.1, "total_tokens": 6917584} +{"current_steps": 76830, "total_steps": 76960, "loss": 0.0519, "lr": 4.413020400079182e-10, "epoch": 19.966216216216218, "percentage": 99.83, "elapsed_time": "1:51:29", "remaining_time": "0:00:11", "throughput": 1034.1, "total_tokens": 6918032} +{"current_steps": 76835, "total_steps": 76960, "loss": 0.0263, "lr": 4.082578364067446e-10, "epoch": 19.967515592515593, "percentage": 99.84, "elapsed_time": "1:51:30", "remaining_time": "0:00:10", "throughput": 1034.11, "total_tokens": 6918496} +{"current_steps": 76840, "total_steps": 76960, "loss": 0.0608, "lr": 3.764993857624521e-10, "epoch": 19.968814968814968, "percentage": 99.84, "elapsed_time": "1:51:30", "remaining_time": "0:00:10", "throughput": 1034.1, "total_tokens": 6918896} +{"current_steps": 76845, "total_steps": 76960, "loss": 0.0002, "lr": 3.460266897098441e-10, "epoch": 19.970114345114347, "percentage": 99.85, "elapsed_time": "1:51:31", "remaining_time": "0:00:10", "throughput": 1034.11, "total_tokens": 6919360} +{"current_steps": 76850, "total_steps": 76960, "loss": 0.0186, "lr": 3.168397498115594e-10, "epoch": 19.97141372141372, "percentage": 99.86, "elapsed_time": "1:51:31", "remaining_time": "0:00:09", "throughput": 1034.12, "total_tokens": 6919824} +{"current_steps": 76855, "total_steps": 76960, "loss": 0.2904, "lr": 2.889385675747258e-10, "epoch": 19.972713097713097, "percentage": 99.86, "elapsed_time": "1:51:31", "remaining_time": "0:00:09", "throughput": 1034.11, "total_tokens": 6920240} +{"current_steps": 76860, "total_steps": 76960, "loss": 0.0087, "lr": 2.6232314443153106e-10, "epoch": 19.974012474012476, "percentage": 99.87, "elapsed_time": "1:51:32", "remaining_time": "0:00:08", "throughput": 1034.11, "total_tokens": 6920656} +{"current_steps": 76865, "total_steps": 76960, "loss": 0.3398, "lr": 2.3699348174754945e-10, "epoch": 19.97531185031185, "percentage": 99.88, "elapsed_time": "1:51:32", "remaining_time": "0:00:08", "throughput": 1034.11, "total_tokens": 6921104} +{"current_steps": 76870, "total_steps": 76960, "loss": 0.0002, "lr": 2.1294958083006855e-10, "epoch": 19.976611226611226, "percentage": 99.88, "elapsed_time": "1:51:33", "remaining_time": "0:00:07", "throughput": 1034.12, "total_tokens": 6921568} +{"current_steps": 76875, "total_steps": 76960, "loss": 0.0897, "lr": 1.9019144291421153e-10, "epoch": 19.977910602910605, "percentage": 99.89, "elapsed_time": "1:51:33", "remaining_time": "0:00:07", "throughput": 1034.13, "total_tokens": 6922048} +{"current_steps": 76880, "total_steps": 76960, "loss": 0.0067, "lr": 1.6871906917126367e-10, "epoch": 19.97920997920998, "percentage": 99.9, "elapsed_time": "1:51:34", "remaining_time": "0:00:06", "throughput": 1034.13, "total_tokens": 6922528} +{"current_steps": 76885, "total_steps": 76960, "loss": 0.0982, "lr": 1.4853246070589689e-10, "epoch": 19.980509355509355, "percentage": 99.9, "elapsed_time": "1:51:34", "remaining_time": "0:00:06", "throughput": 1034.14, "total_tokens": 6922976} +{"current_steps": 76890, "total_steps": 76960, "loss": 0.0093, "lr": 1.2963161855339413e-10, "epoch": 19.981808731808734, "percentage": 99.91, "elapsed_time": "1:51:34", "remaining_time": "0:00:06", "throughput": 1034.14, "total_tokens": 6923424} +{"current_steps": 76895, "total_steps": 76960, "loss": 0.0031, "lr": 1.120165436879761e-10, "epoch": 19.98310810810811, "percentage": 99.92, "elapsed_time": "1:51:35", "remaining_time": "0:00:05", "throughput": 1034.15, "total_tokens": 6923888} +{"current_steps": 76900, "total_steps": 76960, "loss": 0.0694, "lr": 9.568723701447457e-11, "epoch": 19.984407484407484, "percentage": 99.92, "elapsed_time": "1:51:35", "remaining_time": "0:00:05", "throughput": 1034.15, "total_tokens": 6924336} +{"current_steps": 76905, "total_steps": 76960, "loss": 0.1367, "lr": 8.064369937388349e-11, "epoch": 19.98570686070686, "percentage": 99.93, "elapsed_time": "1:51:36", "remaining_time": "0:00:04", "throughput": 1034.15, "total_tokens": 6924768} +{"current_steps": 76910, "total_steps": 76960, "loss": 0.0127, "lr": 6.688593154058343e-11, "epoch": 19.987006237006238, "percentage": 99.94, "elapsed_time": "1:51:36", "remaining_time": "0:00:04", "throughput": 1034.15, "total_tokens": 6925232} +{"current_steps": 76915, "total_steps": 76960, "loss": 0.0096, "lr": 5.4413934219565974e-11, "epoch": 19.988305613305613, "percentage": 99.94, "elapsed_time": "1:51:36", "remaining_time": "0:00:03", "throughput": 1034.16, "total_tokens": 6925664} +{"current_steps": 76920, "total_steps": 76960, "loss": 0.4628, "lr": 4.3227708054760504e-11, "epoch": 19.989604989604988, "percentage": 99.95, "elapsed_time": "1:51:37", "remaining_time": "0:00:03", "throughput": 1034.16, "total_tokens": 6926128} +{"current_steps": 76925, "total_steps": 76960, "loss": 0.0004, "lr": 3.3327253620707433e-11, "epoch": 19.990904365904367, "percentage": 99.95, "elapsed_time": "1:51:37", "remaining_time": "0:00:03", "throughput": 1034.16, "total_tokens": 6926576} +{"current_steps": 76930, "total_steps": 76960, "loss": 0.0002, "lr": 2.4712571428109344e-11, "epoch": 19.992203742203742, "percentage": 99.96, "elapsed_time": "1:51:38", "remaining_time": "0:00:02", "throughput": 1034.16, "total_tokens": 6927008} +{"current_steps": 76935, "total_steps": 76960, "loss": 0.0001, "lr": 1.7383661915504334e-11, "epoch": 19.993503118503117, "percentage": 99.97, "elapsed_time": "1:51:38", "remaining_time": "0:00:02", "throughput": 1034.17, "total_tokens": 6927488} +{"current_steps": 76940, "total_steps": 76960, "loss": 0.0201, "lr": 1.1340525463143791e-11, "epoch": 19.994802494802496, "percentage": 99.97, "elapsed_time": "1:51:38", "remaining_time": "0:00:01", "throughput": 1034.18, "total_tokens": 6927968} +{"current_steps": 76945, "total_steps": 76960, "loss": 0.1956, "lr": 6.583162381890162e-12, "epoch": 19.99610187110187, "percentage": 99.98, "elapsed_time": "1:51:39", "remaining_time": "0:00:01", "throughput": 1034.18, "total_tokens": 6928400} +{"current_steps": 76950, "total_steps": 76960, "loss": 0.0006, "lr": 3.111572915992511e-12, "epoch": 19.997401247401246, "percentage": 99.99, "elapsed_time": "1:51:39", "remaining_time": "0:00:00", "throughput": 1034.18, "total_tokens": 6928848} +{"current_steps": 76955, "total_steps": 76960, "loss": 0.4653, "lr": 9.2575724586208e-13, "epoch": 19.998700623700625, "percentage": 99.99, "elapsed_time": "1:51:40", "remaining_time": "0:00:00", "throughput": 1034.18, "total_tokens": 6929280} +{"current_steps": 76960, "total_steps": 76960, "loss": 0.0006, "lr": 2.5715479745613837e-14, "epoch": 20.0, "percentage": 100.0, "elapsed_time": "1:51:40", "remaining_time": "0:00:00", "throughput": 1034.17, "total_tokens": 6929680} +{"current_steps": 76960, "total_steps": 76960, "eval_loss": 0.9521387219429016, "epoch": 20.0, "percentage": 100.0, "elapsed_time": "1:51:53", "remaining_time": "0:00:00", "throughput": 1032.14, "total_tokens": 6929680} +{"current_steps": 76960, "total_steps": 76960, "epoch": 20.0, "percentage": 100.0, "elapsed_time": "1:51:55", "remaining_time": "0:00:00", "throughput": 1031.82, "total_tokens": 6929680}