|
{"current_steps": 5, "total_steps": 180, "loss": 0.2815, "lr": 4.990486745229364e-05, "epoch": 0.08213552361396304, "percentage": 2.78, "elapsed_time": "0:01:21", "remaining_time": "0:47:19", "throughput": 1647.4, "total_tokens": 133664} |
|
{"current_steps": 5, "total_steps": 180, "loss": 0.2811, "lr": 4.990486745229364e-05, "epoch": 0.08213552361396304, "percentage": 2.78, "elapsed_time": "0:01:20", "remaining_time": "0:46:45", "throughput": 1667.76, "total_tokens": 133664} |
|
{"current_steps": 10, "total_steps": 180, "loss": 0.176, "lr": 4.962019382530521e-05, "epoch": 0.16427104722792607, "percentage": 5.56, "elapsed_time": "0:02:39", "remaining_time": "0:45:16", "throughput": 1674.74, "total_tokens": 267600} |
|
{"current_steps": 15, "total_steps": 180, "loss": 0.114, "lr": 4.914814565722671e-05, "epoch": 0.2464065708418891, "percentage": 8.33, "elapsed_time": "0:03:59", "remaining_time": "0:43:51", "throughput": 1671.9, "total_tokens": 399936} |
|
{"current_steps": 20, "total_steps": 180, "loss": 0.0928, "lr": 4.849231551964771e-05, "epoch": 0.32854209445585214, "percentage": 11.11, "elapsed_time": "0:05:24", "remaining_time": "0:43:12", "throughput": 1671.64, "total_tokens": 541792} |
|
{"current_steps": 25, "total_steps": 180, "loss": 0.0704, "lr": 4.765769467591625e-05, "epoch": 0.4106776180698152, "percentage": 13.89, "elapsed_time": "0:06:50", "remaining_time": "0:42:22", "throughput": 1668.36, "total_tokens": 684096} |
|
{"current_steps": 30, "total_steps": 180, "loss": 0.0691, "lr": 4.665063509461097e-05, "epoch": 0.4928131416837782, "percentage": 16.67, "elapsed_time": "0:08:15", "remaining_time": "0:41:19", "throughput": 1666.73, "total_tokens": 826384} |
|
{"current_steps": 35, "total_steps": 180, "loss": 0.0707, "lr": 4.54788011072248e-05, "epoch": 0.5749486652977412, "percentage": 19.44, "elapsed_time": "0:09:35", "remaining_time": "0:39:46", "throughput": 1668.68, "total_tokens": 961104} |
|
{"current_steps": 40, "total_steps": 180, "loss": 0.066, "lr": 4.415111107797445e-05, "epoch": 0.6570841889117043, "percentage": 22.22, "elapsed_time": "0:10:57", "remaining_time": "0:38:21", "throughput": 1667.53, "total_tokens": 1096752} |
|
{"current_steps": 45, "total_steps": 180, "loss": 0.0586, "lr": 4.267766952966369e-05, "epoch": 0.7392197125256673, "percentage": 25.0, "elapsed_time": "0:12:21", "remaining_time": "0:37:05", "throughput": 1667.65, "total_tokens": 1237040} |
|
{"current_steps": 50, "total_steps": 180, "loss": 0.0535, "lr": 4.1069690242163484e-05, "epoch": 0.8213552361396304, "percentage": 27.78, "elapsed_time": "0:13:46", "remaining_time": "0:35:49", "throughput": 1663.5, "total_tokens": 1375536} |
|
{"current_steps": 55, "total_steps": 180, "loss": 0.0607, "lr": 3.933941090877615e-05, "epoch": 0.9034907597535934, "percentage": 30.56, "elapsed_time": "0:15:09", "remaining_time": "0:34:26", "throughput": 1665.64, "total_tokens": 1514560} |
|
{"current_steps": 60, "total_steps": 180, "loss": 0.0486, "lr": 3.7500000000000003e-05, "epoch": 0.9856262833675564, "percentage": 33.33, "elapsed_time": "0:16:30", "remaining_time": "0:33:01", "throughput": 1666.45, "total_tokens": 1651104} |
|
{"current_steps": 65, "total_steps": 180, "loss": 0.0563, "lr": 3.556545654351749e-05, "epoch": 1.082135523613963, "percentage": 36.11, "elapsed_time": "0:18:02", "remaining_time": "0:31:55", "throughput": 1669.38, "total_tokens": 1807056} |
|
{"current_steps": 70, "total_steps": 180, "loss": 0.0485, "lr": 3.355050358314172e-05, "epoch": 1.164271047227926, "percentage": 38.89, "elapsed_time": "0:19:24", "remaining_time": "0:30:29", "throughput": 1669.25, "total_tokens": 1943808} |
|
{"current_steps": 75, "total_steps": 180, "loss": 0.0594, "lr": 3.147047612756302e-05, "epoch": 1.2464065708418892, "percentage": 41.67, "elapsed_time": "0:20:48", "remaining_time": "0:29:07", "throughput": 1668.33, "total_tokens": 2082480} |
|
{"current_steps": 80, "total_steps": 180, "loss": 0.0374, "lr": 2.9341204441673266e-05, "epoch": 1.3285420944558521, "percentage": 44.44, "elapsed_time": "0:22:14", "remaining_time": "0:27:47", "throughput": 1667.61, "total_tokens": 2225056} |
|
{"current_steps": 85, "total_steps": 180, "loss": 0.0512, "lr": 2.717889356869146e-05, "epoch": 1.410677618069815, "percentage": 47.22, "elapsed_time": "0:23:41", "remaining_time": "0:26:28", "throughput": 1665.12, "total_tokens": 2366640} |
|
{"current_steps": 90, "total_steps": 180, "loss": 0.0513, "lr": 2.5e-05, "epoch": 1.4928131416837782, "percentage": 50.0, "elapsed_time": "0:25:01", "remaining_time": "0:25:01", "throughput": 1664.82, "total_tokens": 2499200} |
|
{"current_steps": 95, "total_steps": 180, "loss": 0.0526, "lr": 2.2821106431308544e-05, "epoch": 1.5749486652977414, "percentage": 52.78, "elapsed_time": "0:26:20", "remaining_time": "0:23:33", "throughput": 1665.69, "total_tokens": 2631856} |
|
{"current_steps": 100, "total_steps": 180, "loss": 0.0486, "lr": 2.0658795558326743e-05, "epoch": 1.6570841889117043, "percentage": 55.56, "elapsed_time": "0:27:39", "remaining_time": "0:22:07", "throughput": 1668.52, "total_tokens": 2768624} |
|
{"current_steps": 105, "total_steps": 180, "loss": 0.0471, "lr": 1.852952387243698e-05, "epoch": 1.7392197125256672, "percentage": 58.33, "elapsed_time": "0:29:00", "remaining_time": "0:20:42", "throughput": 1668.45, "total_tokens": 2903376} |
|
{"current_steps": 110, "total_steps": 180, "loss": 0.0593, "lr": 1.6449496416858284e-05, "epoch": 1.8213552361396304, "percentage": 61.11, "elapsed_time": "0:30:19", "remaining_time": "0:19:17", "throughput": 1670.64, "total_tokens": 3039504} |
|
{"current_steps": 115, "total_steps": 180, "loss": 0.0491, "lr": 1.443454345648252e-05, "epoch": 1.9034907597535935, "percentage": 63.89, "elapsed_time": "0:31:41", "remaining_time": "0:17:54", "throughput": 1671.24, "total_tokens": 3177984} |
|
{"current_steps": 120, "total_steps": 180, "loss": 0.0537, "lr": 1.2500000000000006e-05, "epoch": 1.9856262833675564, "percentage": 66.67, "elapsed_time": "0:33:01", "remaining_time": "0:16:30", "throughput": 1671.86, "total_tokens": 3312768} |
|
{"current_steps": 125, "total_steps": 180, "loss": 0.0604, "lr": 1.0660589091223855e-05, "epoch": 2.082135523613963, "percentage": 69.44, "elapsed_time": "0:34:35", "remaining_time": "0:15:13", "throughput": 1672.49, "total_tokens": 3470896} |
|
{"current_steps": 130, "total_steps": 180, "loss": 0.0535, "lr": 8.930309757836517e-06, "epoch": 2.164271047227926, "percentage": 72.22, "elapsed_time": "0:35:55", "remaining_time": "0:13:49", "throughput": 1673.15, "total_tokens": 3606352} |
|
{"current_steps": 135, "total_steps": 180, "loss": 0.0471, "lr": 7.3223304703363135e-06, "epoch": 2.246406570841889, "percentage": 75.0, "elapsed_time": "0:37:14", "remaining_time": "0:12:24", "throughput": 1674.48, "total_tokens": 3741264} |
|
{"current_steps": 140, "total_steps": 180, "loss": 0.0473, "lr": 5.848888922025553e-06, "epoch": 2.328542094455852, "percentage": 77.78, "elapsed_time": "0:38:39", "remaining_time": "0:11:02", "throughput": 1674.48, "total_tokens": 3883328} |
|
{"current_steps": 145, "total_steps": 180, "loss": 0.0475, "lr": 4.521198892775203e-06, "epoch": 2.410677618069815, "percentage": 80.56, "elapsed_time": "0:40:00", "remaining_time": "0:09:39", "throughput": 1676.17, "total_tokens": 4023344} |
|
{"current_steps": 150, "total_steps": 180, "loss": 0.0475, "lr": 3.3493649053890326e-06, "epoch": 2.4928131416837784, "percentage": 83.33, "elapsed_time": "0:41:23", "remaining_time": "0:08:16", "throughput": 1675.28, "total_tokens": 4161136} |
|
{"current_steps": 155, "total_steps": 180, "loss": 0.0447, "lr": 2.3423053240837515e-06, "epoch": 2.5749486652977414, "percentage": 86.11, "elapsed_time": "0:42:47", "remaining_time": "0:06:54", "throughput": 1674.41, "total_tokens": 4299792} |
|
{"current_steps": 160, "total_steps": 180, "loss": 0.0415, "lr": 1.5076844803522922e-06, "epoch": 2.6570841889117043, "percentage": 88.89, "elapsed_time": "0:44:13", "remaining_time": "0:05:31", "throughput": 1672.38, "total_tokens": 4437744} |
|
{"current_steps": 165, "total_steps": 180, "loss": 0.0324, "lr": 8.51854342773295e-07, "epoch": 2.739219712525667, "percentage": 91.67, "elapsed_time": "0:45:38", "remaining_time": "0:04:08", "throughput": 1670.37, "total_tokens": 4574736} |
|
{"current_steps": 170, "total_steps": 180, "loss": 0.0502, "lr": 3.7980617469479953e-07, "epoch": 2.82135523613963, "percentage": 94.44, "elapsed_time": "0:47:03", "remaining_time": "0:02:46", "throughput": 1668.71, "total_tokens": 4711904} |
|
{"current_steps": 175, "total_steps": 180, "loss": 0.0483, "lr": 9.513254770636137e-08, "epoch": 2.9034907597535935, "percentage": 97.22, "elapsed_time": "0:48:22", "remaining_time": "0:01:22", "throughput": 1669.02, "total_tokens": 4844832} |
|
{"current_steps": 180, "total_steps": 180, "loss": 0.0448, "lr": 0.0, "epoch": 2.9856262833675564, "percentage": 100.0, "elapsed_time": "0:49:41", "remaining_time": "0:00:00", "throughput": 1670.47, "total_tokens": 4981312} |
|
{"current_steps": 180, "total_steps": 180, "epoch": 2.9856262833675564, "percentage": 100.0, "elapsed_time": "0:49:43", "remaining_time": "0:00:00", "throughput": 1669.89, "total_tokens": 4981312} |
|
|