{"current_steps": 5, "total_steps": 500, "loss": 1.6703, "lr": 4.99921047320825e-05, "epoch": 0.02, "percentage": 1.0, "elapsed_time": "0:00:25", "remaining_time": "0:41:32", "throughput": 2323.92, "total_tokens": 58512} {"current_steps": 10, "total_steps": 500, "loss": 1.7062, "lr": 4.996003875272438e-05, "epoch": 0.04, "percentage": 2.0, "elapsed_time": "0:00:47", "remaining_time": "0:38:34", "throughput": 2342.15, "total_tokens": 110624} {"current_steps": 15, "total_steps": 500, "loss": 1.6517, "lr": 4.990334022857932e-05, "epoch": 0.06, "percentage": 3.0, "elapsed_time": "0:01:10", "remaining_time": "0:37:52", "throughput": 2348.38, "total_tokens": 165088} {"current_steps": 20, "total_steps": 500, "loss": 1.6386, "lr": 4.982206511424534e-05, "epoch": 0.08, "percentage": 4.0, "elapsed_time": "0:01:32", "remaining_time": "0:37:07", "throughput": 2356.41, "total_tokens": 218736} {"current_steps": 25, "total_steps": 500, "loss": 1.4913, "lr": 4.971629361844785e-05, "epoch": 0.1, "percentage": 5.0, "elapsed_time": "0:01:54", "remaining_time": "0:36:08", "throughput": 2354.13, "total_tokens": 268736} {"current_steps": 30, "total_steps": 500, "loss": 1.4176, "lr": 4.958613012488324e-05, "epoch": 0.12, "percentage": 6.0, "elapsed_time": "0:02:17", "remaining_time": "0:35:47", "throughput": 2355.96, "total_tokens": 322928} {"current_steps": 35, "total_steps": 500, "loss": 1.5363, "lr": 4.943170308920484e-05, "epoch": 0.14, "percentage": 7.0, "elapsed_time": "0:02:41", "remaining_time": "0:35:39", "throughput": 2361.01, "total_tokens": 380176} {"current_steps": 40, "total_steps": 500, "loss": 1.3961, "lr": 4.925316491225265e-05, "epoch": 0.16, "percentage": 8.0, "elapsed_time": "0:03:03", "remaining_time": "0:35:14", "throughput": 2362.02, "total_tokens": 434224} {"current_steps": 45, "total_steps": 500, "loss": 1.48, "lr": 4.905069178965215e-05, "epoch": 0.18, "percentage": 9.0, "elapsed_time": "0:03:25", "remaining_time": "0:34:40", "throughput": 2362.14, "total_tokens": 485936} {"current_steps": 50, "total_steps": 500, "loss": 1.3835, "lr": 4.882448353793048e-05, "epoch": 0.2, "percentage": 10.0, "elapsed_time": "0:03:48", "remaining_time": "0:34:16", "throughput": 2363.65, "total_tokens": 540048} {"current_steps": 55, "total_steps": 500, "loss": 1.2657, "lr": 4.8574763397321614e-05, "epoch": 0.22, "percentage": 11.0, "elapsed_time": "0:04:10", "remaining_time": "0:33:43", "throughput": 2363.48, "total_tokens": 591056} {"current_steps": 60, "total_steps": 500, "loss": 1.3018, "lr": 4.8301777811455276e-05, "epoch": 0.24, "percentage": 12.0, "elapsed_time": "0:04:34", "remaining_time": "0:33:32", "throughput": 2364.55, "total_tokens": 648880} {"current_steps": 65, "total_steps": 500, "loss": 1.3696, "lr": 4.800579618414676e-05, "epoch": 0.26, "percentage": 13.0, "elapsed_time": "0:04:57", "remaining_time": "0:33:08", "throughput": 2364.23, "total_tokens": 702496} {"current_steps": 70, "total_steps": 500, "loss": 1.4257, "lr": 4.7687110613527926e-05, "epoch": 0.28, "percentage": 14.0, "elapsed_time": "0:05:18", "remaining_time": "0:32:38", "throughput": 2363.72, "total_tokens": 753456} {"current_steps": 75, "total_steps": 500, "loss": 1.4829, "lr": 4.73460356037816e-05, "epoch": 0.3, "percentage": 15.0, "elapsed_time": "0:05:41", "remaining_time": "0:32:16", "throughput": 2364.35, "total_tokens": 808176} {"current_steps": 80, "total_steps": 500, "loss": 1.2336, "lr": 4.6982907754763906e-05, "epoch": 0.32, "percentage": 16.0, "elapsed_time": "0:06:07", "remaining_time": "0:32:10", "throughput": 2365.8, "total_tokens": 869808} {"current_steps": 85, "total_steps": 500, "loss": 1.3996, "lr": 4.659808542982088e-05, "epoch": 0.34, "percentage": 17.0, "elapsed_time": "0:06:30", "remaining_time": "0:31:45", "throughput": 2366.4, "total_tokens": 923600} {"current_steps": 90, "total_steps": 500, "loss": 1.2719, "lr": 4.619194840212708e-05, "epoch": 0.36, "percentage": 18.0, "elapsed_time": "0:06:54", "remaining_time": "0:31:28", "throughput": 2367.16, "total_tokens": 981488} {"current_steps": 95, "total_steps": 500, "loss": 1.4032, "lr": 4.5764897479895317e-05, "epoch": 0.38, "percentage": 19.0, "elapsed_time": "0:07:16", "remaining_time": "0:31:02", "throughput": 2366.11, "total_tokens": 1033840} {"current_steps": 100, "total_steps": 500, "loss": 1.3374, "lr": 4.531735411082735e-05, "epoch": 0.4, "percentage": 20.0, "elapsed_time": "0:07:39", "remaining_time": "0:30:37", "throughput": 2366.33, "total_tokens": 1086960} {"current_steps": 100, "total_steps": 500, "eval_loss": 1.3060753345489502, "epoch": 0.4, "percentage": 20.0, "elapsed_time": "0:09:09", "remaining_time": "0:36:36", "throughput": 1979.04, "total_tokens": 1086960} {"current_steps": 105, "total_steps": 500, "loss": 1.3098, "lr": 4.484975996619589e-05, "epoch": 0.42, "percentage": 21.0, "elapsed_time": "0:09:32", "remaining_time": "0:35:53", "throughput": 1990.03, "total_tokens": 1139312} {"current_steps": 110, "total_steps": 500, "loss": 1.2947, "lr": 4.436257650496834e-05, "epoch": 0.44, "percentage": 22.0, "elapsed_time": "0:09:56", "remaining_time": "0:35:15", "throughput": 2005.45, "total_tokens": 1196400} {"current_steps": 115, "total_steps": 500, "loss": 1.2352, "lr": 4.3856284518402594e-05, "epoch": 0.46, "percentage": 23.0, "elapsed_time": "0:10:18", "remaining_time": "0:34:32", "throughput": 2017.99, "total_tokens": 1249008} {"current_steps": 120, "total_steps": 500, "loss": 1.3525, "lr": 4.3331383655564006e-05, "epoch": 0.48, "percentage": 24.0, "elapsed_time": "0:10:42", "remaining_time": "0:33:53", "throughput": 2030.42, "total_tokens": 1304032} {"current_steps": 125, "total_steps": 500, "loss": 1.2646, "lr": 4.278839193023214e-05, "epoch": 0.5, "percentage": 25.0, "elapsed_time": "0:11:05", "remaining_time": "0:33:15", "throughput": 2042.38, "total_tokens": 1358832} {"current_steps": 130, "total_steps": 500, "loss": 1.3183, "lr": 4.2227845209683716e-05, "epoch": 0.52, "percentage": 26.0, "elapsed_time": "0:11:26", "remaining_time": "0:32:33", "throughput": 2051.98, "total_tokens": 1408752} {"current_steps": 135, "total_steps": 500, "loss": 1.338, "lr": 4.165029668585629e-05, "epoch": 0.54, "percentage": 27.0, "elapsed_time": "0:11:48", "remaining_time": "0:31:55", "throughput": 2061.35, "total_tokens": 1460656} {"current_steps": 140, "total_steps": 500, "loss": 1.1311, "lr": 4.1056316329414616e-05, "epoch": 0.56, "percentage": 28.0, "elapsed_time": "0:12:12", "remaining_time": "0:31:24", "throughput": 2071.26, "total_tokens": 1517632} {"current_steps": 145, "total_steps": 500, "loss": 1.2694, "lr": 4.044649032725836e-05, "epoch": 0.58, "percentage": 29.0, "elapsed_time": "0:12:37", "remaining_time": "0:30:54", "throughput": 2080.96, "total_tokens": 1576320} {"current_steps": 150, "total_steps": 500, "loss": 1.2979, "lr": 3.982142050402649e-05, "epoch": 0.6, "percentage": 30.0, "elapsed_time": "0:13:00", "remaining_time": "0:30:21", "throughput": 2090.01, "total_tokens": 1631840} {"current_steps": 155, "total_steps": 500, "loss": 1.3677, "lr": 3.9181723728168916e-05, "epoch": 0.62, "percentage": 31.0, "elapsed_time": "0:13:24", "remaining_time": "0:29:49", "throughput": 2098.58, "total_tokens": 1687552} {"current_steps": 160, "total_steps": 500, "loss": 1.2401, "lr": 3.8528031303171895e-05, "epoch": 0.64, "percentage": 32.0, "elapsed_time": "0:13:47", "remaining_time": "0:29:18", "throughput": 2105.91, "total_tokens": 1742416} {"current_steps": 165, "total_steps": 500, "loss": 1.4727, "lr": 3.786098834453766e-05, "epoch": 0.66, "percentage": 33.0, "elapsed_time": "0:14:09", "remaining_time": "0:28:45", "throughput": 2112.45, "total_tokens": 1795152} {"current_steps": 170, "total_steps": 500, "loss": 1.2267, "lr": 3.718125314313331e-05, "epoch": 0.68, "percentage": 34.0, "elapsed_time": "0:14:34", "remaining_time": "0:28:17", "throughput": 2119.92, "total_tokens": 1853728} {"current_steps": 175, "total_steps": 500, "loss": 1.3349, "lr": 3.6489496515537204e-05, "epoch": 0.7, "percentage": 35.0, "elapsed_time": "0:14:56", "remaining_time": "0:27:44", "throughput": 2125.88, "total_tokens": 1905344} {"current_steps": 180, "total_steps": 500, "loss": 1.2891, "lr": 3.5786401142023975e-05, "epoch": 0.72, "percentage": 36.0, "elapsed_time": "0:15:19", "remaining_time": "0:27:15", "throughput": 2132.06, "total_tokens": 1960848} {"current_steps": 185, "total_steps": 500, "loss": 1.2462, "lr": 3.507266089284157e-05, "epoch": 0.74, "percentage": 37.0, "elapsed_time": "0:15:42", "remaining_time": "0:26:44", "throughput": 2137.93, "total_tokens": 2014432} {"current_steps": 190, "total_steps": 500, "loss": 1.3434, "lr": 3.434898014344501e-05, "epoch": 0.76, "percentage": 38.0, "elapsed_time": "0:16:04", "remaining_time": "0:26:13", "throughput": 2142.68, "total_tokens": 2066080} {"current_steps": 195, "total_steps": 500, "loss": 1.2786, "lr": 3.3616073079362926e-05, "epoch": 0.78, "percentage": 39.0, "elapsed_time": "0:16:25", "remaining_time": "0:25:41", "throughput": 2147.41, "total_tokens": 2116880} {"current_steps": 200, "total_steps": 500, "loss": 1.3909, "lr": 3.287466299138262e-05, "epoch": 0.8, "percentage": 40.0, "elapsed_time": "0:16:48", "remaining_time": "0:25:12", "throughput": 2152.34, "total_tokens": 2169920} {"current_steps": 200, "total_steps": 500, "eval_loss": 1.2780131101608276, "epoch": 0.8, "percentage": 40.0, "elapsed_time": "0:18:18", "remaining_time": "0:27:27", "throughput": 1976.11, "total_tokens": 2169920} {"current_steps": 205, "total_steps": 500, "loss": 1.3048, "lr": 3.21254815617494e-05, "epoch": 0.82, "percentage": 41.0, "elapsed_time": "0:18:42", "remaining_time": "0:26:55", "throughput": 1982.29, "total_tokens": 2224960} {"current_steps": 210, "total_steps": 500, "loss": 1.3698, "lr": 3.1369268142084556e-05, "epoch": 0.84, "percentage": 42.0, "elapsed_time": "0:19:05", "remaining_time": "0:26:22", "throughput": 1989.99, "total_tokens": 2280128} {"current_steps": 215, "total_steps": 500, "loss": 1.3298, "lr": 3.0606769023734536e-05, "epoch": 0.86, "percentage": 43.0, "elapsed_time": "0:19:31", "remaining_time": "0:25:52", "throughput": 1998.41, "total_tokens": 2340240} {"current_steps": 220, "total_steps": 500, "loss": 1.2365, "lr": 2.9838736701271514e-05, "epoch": 0.88, "percentage": 44.0, "elapsed_time": "0:19:55", "remaining_time": "0:25:21", "throughput": 2006.02, "total_tokens": 2397664} {"current_steps": 225, "total_steps": 500, "loss": 1.2446, "lr": 2.9065929129872094e-05, "epoch": 0.9, "percentage": 45.0, "elapsed_time": "0:20:16", "remaining_time": "0:24:47", "throughput": 2012.14, "total_tokens": 2448464} {"current_steps": 230, "total_steps": 500, "loss": 1.3372, "lr": 2.8289108977307067e-05, "epoch": 0.92, "percentage": 46.0, "elapsed_time": "0:20:38", "remaining_time": "0:24:13", "throughput": 2018.28, "total_tokens": 2499520} {"current_steps": 235, "total_steps": 500, "loss": 1.3568, "lr": 2.7509042871280372e-05, "epoch": 0.94, "percentage": 47.0, "elapsed_time": "0:21:00", "remaining_time": "0:23:41", "throughput": 2024.55, "total_tokens": 2552688} {"current_steps": 240, "total_steps": 500, "loss": 1.4397, "lr": 2.6726500642860154e-05, "epoch": 0.96, "percentage": 48.0, "elapsed_time": "0:21:22", "remaining_time": "0:23:09", "throughput": 2030.05, "total_tokens": 2603920} {"current_steps": 245, "total_steps": 500, "loss": 1.4108, "lr": 2.594225456674837e-05, "epoch": 0.98, "percentage": 49.0, "elapsed_time": "0:21:43", "remaining_time": "0:22:36", "throughput": 2035.3, "total_tokens": 2653088} {"current_steps": 250, "total_steps": 500, "loss": 1.3159, "lr": 2.5157078599138977e-05, "epoch": 1.0, "percentage": 50.0, "elapsed_time": "0:22:06", "remaining_time": "0:22:06", "throughput": 2040.91, "total_tokens": 2707776} {"current_steps": 255, "total_steps": 500, "loss": 1.2693, "lr": 2.4371747613916566e-05, "epoch": 1.02, "percentage": 51.0, "elapsed_time": "0:22:29", "remaining_time": "0:21:36", "throughput": 2046.54, "total_tokens": 2762608} {"current_steps": 260, "total_steps": 500, "loss": 1.2833, "lr": 2.3587036637949388e-05, "epoch": 1.04, "percentage": 52.0, "elapsed_time": "0:22:52", "remaining_time": "0:21:07", "throughput": 2051.8, "total_tokens": 2816464} {"current_steps": 265, "total_steps": 500, "loss": 1.237, "lr": 2.280372008623142e-05, "epoch": 1.06, "percentage": 53.0, "elapsed_time": "0:23:17", "remaining_time": "0:20:39", "throughput": 2057.46, "total_tokens": 2874672} {"current_steps": 270, "total_steps": 500, "loss": 1.2101, "lr": 2.2022570997628256e-05, "epoch": 1.08, "percentage": 54.0, "elapsed_time": "0:23:39", "remaining_time": "0:20:09", "throughput": 2062.05, "total_tokens": 2927408} {"current_steps": 275, "total_steps": 500, "loss": 1.2382, "lr": 2.1244360271981073e-05, "epoch": 1.1, "percentage": 55.0, "elapsed_time": "0:24:01", "remaining_time": "0:19:39", "throughput": 2066.75, "total_tokens": 2979312} {"current_steps": 280, "total_steps": 500, "loss": 1.1996, "lr": 2.0469855909321564e-05, "epoch": 1.12, "percentage": 56.0, "elapsed_time": "0:24:25", "remaining_time": "0:19:11", "throughput": 2071.92, "total_tokens": 3036720} {"current_steps": 285, "total_steps": 500, "loss": 1.3249, "lr": 1.969982225194864e-05, "epoch": 1.1400000000000001, "percentage": 57.0, "elapsed_time": "0:24:48", "remaining_time": "0:18:43", "throughput": 2076.61, "total_tokens": 3091728} {"current_steps": 290, "total_steps": 500, "loss": 1.3194, "lr": 1.893501923011482e-05, "epoch": 1.16, "percentage": 58.0, "elapsed_time": "0:25:11", "remaining_time": "0:18:14", "throughput": 2081.0, "total_tokens": 3146000} {"current_steps": 295, "total_steps": 500, "loss": 1.3347, "lr": 1.817620161206687e-05, "epoch": 1.18, "percentage": 59.0, "elapsed_time": "0:25:33", "remaining_time": "0:17:45", "throughput": 2084.81, "total_tokens": 3196272} {"current_steps": 300, "total_steps": 500, "loss": 1.3721, "lr": 1.7424118259180654e-05, "epoch": 1.2, "percentage": 60.0, "elapsed_time": "0:25:55", "remaining_time": "0:17:17", "throughput": 2089.04, "total_tokens": 3249536} {"current_steps": 300, "total_steps": 500, "eval_loss": 1.2654056549072266, "epoch": 1.2, "percentage": 60.0, "elapsed_time": "0:27:25", "remaining_time": "0:18:16", "throughput": 1975.0, "total_tokens": 3249536} {"current_steps": 305, "total_steps": 500, "loss": 1.1763, "lr": 1.6679511386925337e-05, "epoch": 1.22, "percentage": 61.0, "elapsed_time": "0:27:50", "remaining_time": "0:17:48", "throughput": 1979.27, "total_tokens": 3306672} {"current_steps": 310, "total_steps": 500, "loss": 1.2738, "lr": 1.594311583238636e-05, "epoch": 1.24, "percentage": 62.0, "elapsed_time": "0:28:12", "remaining_time": "0:17:17", "throughput": 1984.25, "total_tokens": 3359152} {"current_steps": 315, "total_steps": 500, "loss": 1.2969, "lr": 1.521565832906994e-05, "epoch": 1.26, "percentage": 63.0, "elapsed_time": "0:28:35", "remaining_time": "0:16:47", "throughput": 1989.38, "total_tokens": 3413520} {"current_steps": 320, "total_steps": 500, "loss": 1.2779, "lr": 1.4497856789704844e-05, "epoch": 1.28, "percentage": 64.0, "elapsed_time": "0:28:57", "remaining_time": "0:16:17", "throughput": 1994.07, "total_tokens": 3465600} {"current_steps": 325, "total_steps": 500, "loss": 1.1808, "lr": 1.3790419597749199e-05, "epoch": 1.3, "percentage": 65.0, "elapsed_time": "0:29:20", "remaining_time": "0:15:47", "throughput": 1998.72, "total_tokens": 3518768} {"current_steps": 330, "total_steps": 500, "loss": 1.2597, "lr": 1.309404490830152e-05, "epoch": 1.32, "percentage": 66.0, "elapsed_time": "0:29:42", "remaining_time": "0:15:18", "throughput": 2003.06, "total_tokens": 3570208} {"current_steps": 335, "total_steps": 500, "loss": 1.2347, "lr": 1.2409419959105981e-05, "epoch": 1.34, "percentage": 67.0, "elapsed_time": "0:30:04", "remaining_time": "0:14:48", "throughput": 2007.5, "total_tokens": 3622464} {"current_steps": 340, "total_steps": 500, "loss": 1.2341, "lr": 1.1737220392331644e-05, "epoch": 1.3599999999999999, "percentage": 68.0, "elapsed_time": "0:30:26", "remaining_time": "0:14:19", "throughput": 2011.86, "total_tokens": 3675248} {"current_steps": 345, "total_steps": 500, "loss": 1.2037, "lr": 1.107810958779531e-05, "epoch": 1.38, "percentage": 69.0, "elapsed_time": "0:30:52", "remaining_time": "0:13:52", "throughput": 2016.89, "total_tokens": 3735360} {"current_steps": 350, "total_steps": 500, "loss": 1.3922, "lr": 1.0432738008285603e-05, "epoch": 1.4, "percentage": 70.0, "elapsed_time": "0:31:14", "remaining_time": "0:13:23", "throughput": 2020.98, "total_tokens": 3787728} {"current_steps": 355, "total_steps": 500, "loss": 1.2707, "lr": 9.801742557634872e-06, "epoch": 1.42, "percentage": 71.0, "elapsed_time": "0:31:38", "remaining_time": "0:12:55", "throughput": 2025.54, "total_tokens": 3844768} {"current_steps": 360, "total_steps": 500, "loss": 1.2476, "lr": 9.18574595217189e-06, "epoch": 1.44, "percentage": 72.0, "elapsed_time": "0:32:01", "remaining_time": "0:12:27", "throughput": 2029.68, "total_tokens": 3900080} {"current_steps": 365, "total_steps": 500, "loss": 1.243, "lr": 8.585356106176094e-06, "epoch": 1.46, "percentage": 73.0, "elapsed_time": "0:32:25", "remaining_time": "0:11:59", "throughput": 2034.08, "total_tokens": 3958224} {"current_steps": 370, "total_steps": 500, "loss": 1.2654, "lr": 8.00116553193952e-06, "epoch": 1.48, "percentage": 74.0, "elapsed_time": "0:32:48", "remaining_time": "0:11:31", "throughput": 2038.0, "total_tokens": 4012240} {"current_steps": 375, "total_steps": 500, "loss": 1.1863, "lr": 7.433750755028773e-06, "epoch": 1.5, "percentage": 75.0, "elapsed_time": "0:33:11", "remaining_time": "0:11:03", "throughput": 2041.88, "total_tokens": 4067408} {"current_steps": 380, "total_steps": 500, "loss": 1.4472, "lr": 6.883671745323833e-06, "epoch": 1.52, "percentage": 76.0, "elapsed_time": "0:33:33", "remaining_time": "0:10:35", "throughput": 2045.29, "total_tokens": 4118544} {"current_steps": 385, "total_steps": 500, "loss": 1.3013, "lr": 6.3514713643954475e-06, "epoch": 1.54, "percentage": 77.0, "elapsed_time": "0:33:55", "remaining_time": "0:10:08", "throughput": 2048.75, "total_tokens": 4170944} {"current_steps": 390, "total_steps": 500, "loss": 1.3471, "lr": 5.837674829766257e-06, "epoch": 1.56, "percentage": 78.0, "elapsed_time": "0:34:17", "remaining_time": "0:09:40", "throughput": 2052.01, "total_tokens": 4222464} {"current_steps": 395, "total_steps": 500, "loss": 1.2894, "lr": 5.342789196584527e-06, "epoch": 1.58, "percentage": 79.0, "elapsed_time": "0:34:41", "remaining_time": "0:09:13", "throughput": 2055.79, "total_tokens": 4279648} {"current_steps": 400, "total_steps": 500, "loss": 1.2345, "lr": 4.867302857221953e-06, "epoch": 1.6, "percentage": 80.0, "elapsed_time": "0:35:06", "remaining_time": "0:08:46", "throughput": 2059.65, "total_tokens": 4339360} {"current_steps": 400, "total_steps": 500, "eval_loss": 1.259685754776001, "epoch": 1.6, "percentage": 80.0, "elapsed_time": "0:36:36", "remaining_time": "0:09:09", "throughput": 1975.49, "total_tokens": 4339360} {"current_steps": 405, "total_steps": 500, "loss": 1.2398, "lr": 4.411685059289314e-06, "epoch": 1.62, "percentage": 81.0, "elapsed_time": "0:37:01", "remaining_time": "0:08:41", "throughput": 1978.96, "total_tokens": 4396144} {"current_steps": 410, "total_steps": 500, "loss": 1.1595, "lr": 3.976385442545774e-06, "epoch": 1.6400000000000001, "percentage": 82.0, "elapsed_time": "0:37:25", "remaining_time": "0:08:12", "throughput": 1983.23, "total_tokens": 4453680} {"current_steps": 415, "total_steps": 500, "loss": 1.2997, "lr": 3.561833595158698e-06, "epoch": 1.6600000000000001, "percentage": 83.0, "elapsed_time": "0:37:48", "remaining_time": "0:07:44", "throughput": 1987.1, "total_tokens": 4506960} {"current_steps": 420, "total_steps": 500, "loss": 1.2242, "lr": 3.168438629752002e-06, "epoch": 1.6800000000000002, "percentage": 84.0, "elapsed_time": "0:38:09", "remaining_time": "0:07:16", "throughput": 1990.5, "total_tokens": 4557440} {"current_steps": 425, "total_steps": 500, "loss": 1.224, "lr": 2.7965887796613884e-06, "epoch": 1.7, "percentage": 85.0, "elapsed_time": "0:38:32", "remaining_time": "0:06:48", "throughput": 1994.31, "total_tokens": 4612192} {"current_steps": 430, "total_steps": 500, "loss": 1.2913, "lr": 2.446651015794932e-06, "epoch": 1.72, "percentage": 86.0, "elapsed_time": "0:38:55", "remaining_time": "0:06:20", "throughput": 1997.98, "total_tokens": 4666208} {"current_steps": 435, "total_steps": 500, "loss": 1.3014, "lr": 2.118970684477062e-06, "epoch": 1.74, "percentage": 87.0, "elapsed_time": "0:39:17", "remaining_time": "0:05:52", "throughput": 2001.38, "total_tokens": 4718512} {"current_steps": 440, "total_steps": 500, "loss": 1.3041, "lr": 1.8138711666334685e-06, "epoch": 1.76, "percentage": 88.0, "elapsed_time": "0:39:39", "remaining_time": "0:05:24", "throughput": 2004.53, "total_tokens": 4769296} {"current_steps": 445, "total_steps": 500, "loss": 1.341, "lr": 1.5316535586531483e-06, "epoch": 1.78, "percentage": 89.0, "elapsed_time": "0:40:01", "remaining_time": "0:04:56", "throughput": 2007.8, "total_tokens": 4821616} {"current_steps": 450, "total_steps": 500, "loss": 1.4165, "lr": 1.2725963752426379e-06, "epoch": 1.8, "percentage": 90.0, "elapsed_time": "0:40:23", "remaining_time": "0:04:29", "throughput": 2011.03, "total_tokens": 4874176} {"current_steps": 455, "total_steps": 500, "loss": 1.3572, "lr": 1.0369552745656013e-06, "epoch": 1.8199999999999998, "percentage": 91.0, "elapsed_time": "0:40:45", "remaining_time": "0:04:01", "throughput": 2014.17, "total_tokens": 4925968} {"current_steps": 460, "total_steps": 500, "loss": 1.2259, "lr": 8.249628059391251e-07, "epoch": 1.8399999999999999, "percentage": 92.0, "elapsed_time": "0:41:08", "remaining_time": "0:03:34", "throughput": 2017.54, "total_tokens": 4980480} {"current_steps": 465, "total_steps": 500, "loss": 1.239, "lr": 6.368281803355691e-07, "epoch": 1.8599999999999999, "percentage": 93.0, "elapsed_time": "0:41:30", "remaining_time": "0:03:07", "throughput": 2020.69, "total_tokens": 5033472} {"current_steps": 470, "total_steps": 500, "loss": 1.2293, "lr": 4.727370639166506e-07, "epoch": 1.88, "percentage": 94.0, "elapsed_time": "0:41:52", "remaining_time": "0:02:40", "throughput": 2023.58, "total_tokens": 5084560} {"current_steps": 475, "total_steps": 500, "loss": 1.2634, "lr": 3.328513948032991e-07, "epoch": 1.9, "percentage": 95.0, "elapsed_time": "0:42:15", "remaining_time": "0:02:13", "throughput": 2026.93, "total_tokens": 5140144} {"current_steps": 480, "total_steps": 500, "loss": 1.2197, "lr": 2.1730922326233803e-07, "epoch": 1.92, "percentage": 96.0, "elapsed_time": "0:42:39", "remaining_time": "0:01:46", "throughput": 2030.08, "total_tokens": 5195776} {"current_steps": 485, "total_steps": 500, "loss": 1.2261, "lr": 1.2622457546749567e-07, "epoch": 1.94, "percentage": 97.0, "elapsed_time": "0:43:02", "remaining_time": "0:01:19", "throughput": 2033.27, "total_tokens": 5251584} {"current_steps": 490, "total_steps": 500, "loss": 1.2766, "lr": 5.968734096936935e-08, "epoch": 1.96, "percentage": 98.0, "elapsed_time": "0:43:27", "remaining_time": "0:00:53", "throughput": 2036.49, "total_tokens": 5309184} {"current_steps": 495, "total_steps": 500, "loss": 1.2686, "lr": 1.7763183985269883e-08, "epoch": 1.98, "percentage": 99.0, "elapsed_time": "0:43:50", "remaining_time": "0:00:26", "throughput": 2039.48, "total_tokens": 5365424} {"current_steps": 500, "total_steps": 500, "loss": 1.2265, "lr": 4.934785965721167e-10, "epoch": 2.0, "percentage": 100.0, "elapsed_time": "0:44:14", "remaining_time": "0:00:00", "throughput": 2042.45, "total_tokens": 5421296} {"current_steps": 500, "total_steps": 500, "eval_loss": 1.258953332901001, "epoch": 2.0, "percentage": 100.0, "elapsed_time": "0:45:44", "remaining_time": "0:00:00", "throughput": 1975.56, "total_tokens": 5421296} {"current_steps": 500, "total_steps": 500, "epoch": 2.0, "percentage": 100.0, "elapsed_time": "0:45:45", "remaining_time": "0:00:00", "throughput": 1974.79, "total_tokens": 5421296}