|
{"current_steps": 25, "total_steps": 712, "loss": 7.1534, "lr": 3.2000000000000003e-06, "epoch": 0.14013452914798205, "percentage": 3.51, "elapsed_time": "0:04:01", "remaining_time": "1:50:44", "throughput": 1316.08, "total_tokens": 318240} |
|
{"current_steps": 50, "total_steps": 712, "loss": 1.9472, "lr": 6.533333333333334e-06, "epoch": 0.2802690582959641, "percentage": 7.02, "elapsed_time": "0:08:02", "remaining_time": "1:46:30", "throughput": 1319.26, "total_tokens": 636760} |
|
{"current_steps": 75, "total_steps": 712, "loss": 1.5046, "lr": 9.866666666666668e-06, "epoch": 0.4204035874439462, "percentage": 10.53, "elapsed_time": "0:12:04", "remaining_time": "1:42:30", "throughput": 1320.9, "total_tokens": 956520} |
|
{"current_steps": 100, "total_steps": 712, "loss": 1.3971, "lr": 1.3200000000000002e-05, "epoch": 0.5605381165919282, "percentage": 14.04, "elapsed_time": "0:16:05", "remaining_time": "1:38:30", "throughput": 1321.21, "total_tokens": 1275920} |
|
{"current_steps": 125, "total_steps": 712, "loss": 1.3768, "lr": 1.6533333333333333e-05, "epoch": 0.7006726457399103, "percentage": 17.56, "elapsed_time": "0:20:07", "remaining_time": "1:34:28", "throughput": 1321.53, "total_tokens": 1595280} |
|
{"current_steps": 150, "total_steps": 712, "loss": 1.3278, "lr": 1.9866666666666667e-05, "epoch": 0.8408071748878924, "percentage": 21.07, "elapsed_time": "0:24:08", "remaining_time": "1:30:27", "throughput": 1321.82, "total_tokens": 1914720} |
|
{"current_steps": 175, "total_steps": 712, "loss": 1.2927, "lr": 1.9910139651840497e-05, "epoch": 0.9809417040358744, "percentage": 24.58, "elapsed_time": "0:28:09", "remaining_time": "1:26:24", "throughput": 1322.18, "total_tokens": 2233680} |
|
{"current_steps": 200, "total_steps": 712, "loss": 1.2029, "lr": 1.962720313575358e-05, "epoch": 1.1177130044843049, "percentage": 28.09, "elapsed_time": "0:32:04", "remaining_time": "1:22:07", "throughput": 1322.22, "total_tokens": 2544928} |
|
{"current_steps": 225, "total_steps": 712, "loss": 1.2199, "lr": 1.915655103523529e-05, "epoch": 1.257847533632287, "percentage": 31.6, "elapsed_time": "0:36:06", "remaining_time": "1:18:08", "throughput": 1322.25, "total_tokens": 2864008} |
|
{"current_steps": 250, "total_steps": 712, "loss": 1.2112, "lr": 1.8507360338956896e-05, "epoch": 1.397982062780269, "percentage": 35.11, "elapsed_time": "0:40:07", "remaining_time": "1:14:08", "throughput": 1322.45, "total_tokens": 3183248} |
|
{"current_steps": 275, "total_steps": 712, "loss": 1.221, "lr": 1.7692289262315e-05, "epoch": 1.5381165919282511, "percentage": 38.62, "elapsed_time": "0:44:20", "remaining_time": "1:10:27", "throughput": 1316.5, "total_tokens": 3502528} |
|
{"current_steps": 300, "total_steps": 712, "loss": 1.1758, "lr": 1.6727230431791816e-05, "epoch": 1.6782511210762332, "percentage": 42.13, "elapsed_time": "0:48:21", "remaining_time": "1:06:25", "throughput": 1316.99, "total_tokens": 3821648} |
|
{"current_steps": 325, "total_steps": 712, "loss": 1.1828, "lr": 1.563100100329731e-05, "epoch": 1.8183856502242153, "percentage": 45.65, "elapsed_time": "0:52:22", "remaining_time": "1:02:21", "throughput": 1317.42, "total_tokens": 4140008} |
|
{"current_steps": 350, "total_steps": 712, "loss": 1.1948, "lr": 1.442497575670668e-05, "epoch": 1.9585201793721974, "percentage": 49.16, "elapsed_time": "0:56:23", "remaining_time": "0:58:19", "throughput": 1317.74, "total_tokens": 4458448} |
|
{"current_steps": 375, "total_steps": 712, "loss": 1.07, "lr": 1.313267032068285e-05, "epoch": 2.0952914798206277, "percentage": 52.67, "elapsed_time": "1:00:18", "remaining_time": "0:54:12", "throughput": 1318.08, "total_tokens": 4770136} |
|
{"current_steps": 400, "total_steps": 712, "loss": 1.0581, "lr": 1.1779282654255685e-05, "epoch": 2.2354260089686098, "percentage": 56.18, "elapsed_time": "1:04:19", "remaining_time": "0:50:10", "throughput": 1318.28, "total_tokens": 5087896} |
|
{"current_steps": 425, "total_steps": 712, "loss": 1.048, "lr": 1.0391201725558842e-05, "epoch": 2.375560538116592, "percentage": 59.69, "elapsed_time": "1:08:21", "remaining_time": "0:46:09", "throughput": 1318.52, "total_tokens": 5407296} |
|
{"current_steps": 450, "total_steps": 712, "loss": 1.0218, "lr": 8.99549296772945e-06, "epoch": 2.515695067264574, "percentage": 63.2, "elapsed_time": "1:12:22", "remaining_time": "0:42:08", "throughput": 1318.81, "total_tokens": 5726896} |
|
{"current_steps": 475, "total_steps": 712, "loss": 1.0206, "lr": 7.619370544785608e-06, "epoch": 2.655829596412556, "percentage": 66.71, "elapsed_time": "1:16:23", "remaining_time": "0:38:07", "throughput": 1319.13, "total_tokens": 6046856} |
|
{"current_steps": 500, "total_steps": 712, "loss": 1.0277, "lr": 6.289666717481497e-06, "epoch": 2.795964125560538, "percentage": 70.22, "elapsed_time": "1:20:25", "remaining_time": "0:34:05", "throughput": 1319.31, "total_tokens": 6366216} |
|
{"current_steps": 525, "total_steps": 712, "loss": 1.0494, "lr": 5.032308655686011e-06, "epoch": 2.93609865470852, "percentage": 73.74, "elapsed_time": "1:24:39", "remaining_time": "0:30:09", "throughput": 1316.22, "total_tokens": 6685296} |
|
{"current_steps": 550, "total_steps": 712, "loss": 0.9487, "lr": 3.8718128986350154e-06, "epoch": 3.0728699551569507, "percentage": 77.25, "elapsed_time": "1:28:34", "remaining_time": "0:26:05", "throughput": 1316.47, "total_tokens": 6996704} |
|
{"current_steps": 575, "total_steps": 712, "loss": 0.9103, "lr": 2.8308073203011667e-06, "epoch": 3.213004484304933, "percentage": 80.76, "elapsed_time": "1:32:36", "remaining_time": "0:22:03", "throughput": 1316.77, "total_tokens": 7316144} |
|
{"current_steps": 600, "total_steps": 712, "loss": 0.9102, "lr": 1.929589920817806e-06, "epoch": 3.353139013452915, "percentage": 84.27, "elapsed_time": "1:36:37", "remaining_time": "0:18:02", "throughput": 1317.02, "total_tokens": 7635704} |
|
{"current_steps": 625, "total_steps": 712, "loss": 0.9034, "lr": 1.1857330468424466e-06, "epoch": 3.493273542600897, "percentage": 87.78, "elapsed_time": "1:40:39", "remaining_time": "0:14:00", "throughput": 1317.22, "total_tokens": 7955304} |
|
{"current_steps": 650, "total_steps": 712, "loss": 0.8949, "lr": 6.137407579511212e-07, "epoch": 3.633408071748879, "percentage": 91.29, "elapsed_time": "1:44:40", "remaining_time": "0:09:59", "throughput": 1317.47, "total_tokens": 8274744} |
|
{"current_steps": 675, "total_steps": 712, "loss": 0.9073, "lr": 2.2476601988947965e-07, "epoch": 3.773542600896861, "percentage": 94.8, "elapsed_time": "1:48:42", "remaining_time": "0:05:57", "throughput": 1317.67, "total_tokens": 8594304} |
|
{"current_steps": 700, "total_steps": 712, "loss": 0.8967, "lr": 2.639323897518975e-08, "epoch": 3.913677130044843, "percentage": 98.31, "elapsed_time": "1:52:43", "remaining_time": "0:01:55", "throughput": 1317.87, "total_tokens": 8913944} |
|
{"current_steps": 712, "total_steps": 712, "epoch": 3.9809417040358746, "percentage": 100.0, "elapsed_time": "1:54:52", "remaining_time": "0:00:00", "throughput": 1315.55, "total_tokens": 9067184} |
|
|