Training in progress, step 546
Browse files
model-00001-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4877660776
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f477079e5cb61b17106246e4341a760166d58b5f0b434c25a2b0934b2f0e2ef6
|
3 |
size 4877660776
|
model-00002-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4932751008
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c37c31c879dced903610f6adfb439cd92dfedf7bea7c9eeceb93689c7c434b6c
|
3 |
size 4932751008
|
model-00003-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 4330865200
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b3a6a0865e01efb8e83702b5aef85d02ddb22788ec8eddffba9906331a48b4f2
|
3 |
size 4330865200
|
model-00004-of-00004.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1089994880
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4285e63d10a79ff26f74e59bc99913be8c8955c121341f3d6d9118a41ca3f626
|
3 |
size 1089994880
|
trainer_log.jsonl
CHANGED
@@ -399,3 +399,149 @@
|
|
399 |
{"current_steps": 399, "total_steps": 546, "loss": 0.4877, "lr": 2.079220480245052e-06, "epoch": 2.180574555403557, "percentage": 73.08, "elapsed_time": "12:01:19", "remaining_time": "4:25:45"}
|
400 |
{"current_steps": 400, "total_steps": 546, "loss": 0.4802, "lr": 2.053314589791706e-06, "epoch": 2.186046511627907, "percentage": 73.26, "elapsed_time": "12:02:46", "remaining_time": "4:23:48"}
|
401 |
{"current_steps": 401, "total_steps": 546, "loss": 0.489, "lr": 2.0275293331505437e-06, "epoch": 2.1915184678522572, "percentage": 73.44, "elapsed_time": "12:07:28", "remaining_time": "4:23:03"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
399 |
{"current_steps": 399, "total_steps": 546, "loss": 0.4877, "lr": 2.079220480245052e-06, "epoch": 2.180574555403557, "percentage": 73.08, "elapsed_time": "12:01:19", "remaining_time": "4:25:45"}
|
400 |
{"current_steps": 400, "total_steps": 546, "loss": 0.4802, "lr": 2.053314589791706e-06, "epoch": 2.186046511627907, "percentage": 73.26, "elapsed_time": "12:02:46", "remaining_time": "4:23:48"}
|
401 |
{"current_steps": 401, "total_steps": 546, "loss": 0.489, "lr": 2.0275293331505437e-06, "epoch": 2.1915184678522572, "percentage": 73.44, "elapsed_time": "12:07:28", "remaining_time": "4:23:03"}
|
402 |
+
{"current_steps": 402, "total_steps": 546, "loss": 0.5028, "lr": 2.00186576593945e-06, "epoch": 2.196990424076607, "percentage": 73.63, "elapsed_time": "12:09:48", "remaining_time": "4:21:25"}
|
403 |
+
{"current_steps": 403, "total_steps": 546, "loss": 0.4967, "lr": 1.9763249387944823e-06, "epoch": 2.2024623803009575, "percentage": 73.81, "elapsed_time": "12:11:39", "remaining_time": "4:19:37"}
|
404 |
+
{"current_steps": 404, "total_steps": 546, "loss": 0.4922, "lr": 1.9509078973268645e-06, "epoch": 2.207934336525308, "percentage": 73.99, "elapsed_time": "12:13:03", "remaining_time": "4:17:39"}
|
405 |
+
{"current_steps": 405, "total_steps": 546, "loss": 0.4575, "lr": 1.9256156820801896e-06, "epoch": 2.213406292749658, "percentage": 74.18, "elapsed_time": "12:14:54", "remaining_time": "4:15:51"}
|
406 |
+
{"current_steps": 406, "total_steps": 546, "loss": 0.4652, "lr": 1.9004493284877995e-06, "epoch": 2.218878248974008, "percentage": 74.36, "elapsed_time": "12:16:25", "remaining_time": "4:13:56"}
|
407 |
+
{"current_steps": 407, "total_steps": 546, "loss": 0.4066, "lr": 1.875409866830422e-06, "epoch": 2.2243502051983586, "percentage": 74.54, "elapsed_time": "12:18:24", "remaining_time": "4:12:10"}
|
408 |
+
{"current_steps": 408, "total_steps": 546, "loss": 0.4605, "lr": 1.850498322193972e-06, "epoch": 2.2298221614227085, "percentage": 74.73, "elapsed_time": "12:20:07", "remaining_time": "4:10:20"}
|
409 |
+
{"current_steps": 409, "total_steps": 546, "loss": 0.4854, "lr": 1.8257157144275939e-06, "epoch": 2.235294117647059, "percentage": 74.91, "elapsed_time": "12:22:04", "remaining_time": "4:08:34"}
|
410 |
+
{"current_steps": 410, "total_steps": 546, "loss": 0.531, "lr": 1.8010630581019095e-06, "epoch": 2.2407660738714092, "percentage": 75.09, "elapsed_time": "12:23:31", "remaining_time": "4:06:37"}
|
411 |
+
{"current_steps": 411, "total_steps": 546, "loss": 0.5214, "lr": 1.7765413624674866e-06, "epoch": 2.246238030095759, "percentage": 75.27, "elapsed_time": "12:25:19", "remaining_time": "4:04:49"}
|
412 |
+
{"current_steps": 412, "total_steps": 546, "loss": 0.5112, "lr": 1.7521516314135112e-06, "epoch": 2.2517099863201095, "percentage": 75.46, "elapsed_time": "12:27:22", "remaining_time": "4:03:04"}
|
413 |
+
{"current_steps": 413, "total_steps": 546, "loss": 0.5079, "lr": 1.7278948634266968e-06, "epoch": 2.2571819425444595, "percentage": 75.64, "elapsed_time": "12:28:58", "remaining_time": "4:01:11"}
|
414 |
+
{"current_steps": 414, "total_steps": 546, "loss": 0.4258, "lr": 1.703772051550412e-06, "epoch": 2.26265389876881, "percentage": 75.82, "elapsed_time": "12:31:13", "remaining_time": "3:59:31"}
|
415 |
+
{"current_steps": 415, "total_steps": 546, "loss": 0.5307, "lr": 1.6797841833440143e-06, "epoch": 2.26812585499316, "percentage": 76.01, "elapsed_time": "12:32:52", "remaining_time": "3:57:39"}
|
416 |
+
{"current_steps": 416, "total_steps": 546, "loss": 0.5173, "lr": 1.6559322408424289e-06, "epoch": 2.27359781121751, "percentage": 76.19, "elapsed_time": "12:34:49", "remaining_time": "3:55:53"}
|
417 |
+
{"current_steps": 417, "total_steps": 546, "loss": 0.4889, "lr": 1.6322172005159436e-06, "epoch": 2.2790697674418605, "percentage": 76.37, "elapsed_time": "12:36:21", "remaining_time": "3:53:58"}
|
418 |
+
{"current_steps": 418, "total_steps": 546, "loss": 0.4621, "lr": 1.608640033230236e-06, "epoch": 2.2845417236662104, "percentage": 76.56, "elapsed_time": "12:37:56", "remaining_time": "3:52:05"}
|
419 |
+
{"current_steps": 419, "total_steps": 546, "loss": 0.5532, "lr": 1.5852017042066215e-06, "epoch": 2.290013679890561, "percentage": 76.74, "elapsed_time": "12:39:26", "remaining_time": "3:50:11"}
|
420 |
+
{"current_steps": 420, "total_steps": 546, "loss": 0.707, "lr": 1.5619031729825401e-06, "epoch": 2.295485636114911, "percentage": 76.92, "elapsed_time": "12:41:37", "remaining_time": "3:48:29"}
|
421 |
+
{"current_steps": 421, "total_steps": 546, "loss": 0.4628, "lr": 1.5387453933722811e-06, "epoch": 2.300957592339261, "percentage": 77.11, "elapsed_time": "12:43:25", "remaining_time": "3:46:40"}
|
422 |
+
{"current_steps": 422, "total_steps": 546, "loss": 0.5053, "lr": 1.5157293134279243e-06, "epoch": 2.3064295485636115, "percentage": 77.29, "elapsed_time": "12:45:10", "remaining_time": "3:44:50"}
|
423 |
+
{"current_steps": 423, "total_steps": 546, "loss": 0.4868, "lr": 1.492855875400534e-06, "epoch": 2.311901504787962, "percentage": 77.47, "elapsed_time": "12:46:54", "remaining_time": "3:43:00"}
|
424 |
+
{"current_steps": 424, "total_steps": 546, "loss": 0.5358, "lr": 1.4701260157015823e-06, "epoch": 2.317373461012312, "percentage": 77.66, "elapsed_time": "12:48:45", "remaining_time": "3:41:12"}
|
425 |
+
{"current_steps": 425, "total_steps": 546, "loss": 0.4804, "lr": 1.4475406648646195e-06, "epoch": 2.322845417236662, "percentage": 77.84, "elapsed_time": "12:50:36", "remaining_time": "3:39:23"}
|
426 |
+
{"current_steps": 426, "total_steps": 546, "loss": 0.5275, "lr": 1.4251007475071688e-06, "epoch": 2.3283173734610125, "percentage": 78.02, "elapsed_time": "12:52:46", "remaining_time": "3:37:40"}
|
427 |
+
{"current_steps": 427, "total_steps": 546, "loss": 0.4416, "lr": 1.402807182292879e-06, "epoch": 2.3337893296853625, "percentage": 78.21, "elapsed_time": "12:54:56", "remaining_time": "3:35:58"}
|
428 |
+
{"current_steps": 428, "total_steps": 546, "loss": 0.5521, "lr": 1.3806608818939205e-06, "epoch": 2.339261285909713, "percentage": 78.39, "elapsed_time": "12:57:07", "remaining_time": "3:34:15"}
|
429 |
+
{"current_steps": 429, "total_steps": 546, "loss": 0.5347, "lr": 1.3586627529536117e-06, "epoch": 2.3447332421340628, "percentage": 78.57, "elapsed_time": "12:58:49", "remaining_time": "3:32:24"}
|
430 |
+
{"current_steps": 430, "total_steps": 546, "loss": 0.5075, "lr": 1.3368136960493083e-06, "epoch": 2.350205198358413, "percentage": 78.75, "elapsed_time": "13:01:15", "remaining_time": "3:30:45"}
|
431 |
+
{"current_steps": 431, "total_steps": 546, "loss": 0.5016, "lr": 1.315114605655532e-06, "epoch": 2.3556771545827635, "percentage": 78.94, "elapsed_time": "13:03:04", "remaining_time": "3:28:56"}
|
432 |
+
{"current_steps": 432, "total_steps": 546, "loss": 0.4486, "lr": 1.2935663701073586e-06, "epoch": 2.3611491108071134, "percentage": 79.12, "elapsed_time": "13:05:00", "remaining_time": "3:27:09"}
|
433 |
+
{"current_steps": 433, "total_steps": 546, "loss": 0.5249, "lr": 1.2721698715640352e-06, "epoch": 2.366621067031464, "percentage": 79.3, "elapsed_time": "13:06:36", "remaining_time": "3:25:16"}
|
434 |
+
{"current_steps": 434, "total_steps": 546, "loss": 0.4806, "lr": 1.2509259859728863e-06, "epoch": 2.3720930232558137, "percentage": 79.49, "elapsed_time": "13:08:40", "remaining_time": "3:23:31"}
|
435 |
+
{"current_steps": 435, "total_steps": 546, "loss": 0.5134, "lr": 1.2298355830334346e-06, "epoch": 2.377564979480164, "percentage": 79.67, "elapsed_time": "13:10:29", "remaining_time": "3:21:42"}
|
436 |
+
{"current_steps": 436, "total_steps": 546, "loss": 0.5527, "lr": 1.2088995261618108e-06, "epoch": 2.3830369357045145, "percentage": 79.85, "elapsed_time": "13:12:05", "remaining_time": "3:19:50"}
|
437 |
+
{"current_steps": 437, "total_steps": 546, "loss": 0.6196, "lr": 1.1881186724553968e-06, "epoch": 2.3885088919288644, "percentage": 80.04, "elapsed_time": "13:14:38", "remaining_time": "3:18:12"}
|
438 |
+
{"current_steps": 438, "total_steps": 546, "loss": 0.5563, "lr": 1.167493872657739e-06, "epoch": 2.3939808481532148, "percentage": 80.22, "elapsed_time": "13:16:21", "remaining_time": "3:16:21"}
|
439 |
+
{"current_steps": 439, "total_steps": 546, "loss": 0.5389, "lr": 1.1470259711237285e-06, "epoch": 2.399452804377565, "percentage": 80.4, "elapsed_time": "13:17:50", "remaining_time": "3:14:27"}
|
440 |
+
{"current_steps": 440, "total_steps": 546, "loss": 0.56, "lr": 1.1267158057850174e-06, "epoch": 2.404924760601915, "percentage": 80.59, "elapsed_time": "13:19:26", "remaining_time": "3:12:35"}
|
441 |
+
{"current_steps": 441, "total_steps": 546, "loss": 0.5401, "lr": 1.106564208115734e-06, "epoch": 2.4103967168262654, "percentage": 80.77, "elapsed_time": "13:21:25", "remaining_time": "3:10:48"}
|
442 |
+
{"current_steps": 442, "total_steps": 546, "loss": 0.4837, "lr": 1.0865720030984268e-06, "epoch": 2.415868673050616, "percentage": 80.95, "elapsed_time": "13:22:49", "remaining_time": "3:08:54"}
|
443 |
+
{"current_steps": 443, "total_steps": 546, "loss": 0.5257, "lr": 1.066740009190304e-06, "epoch": 2.4213406292749657, "percentage": 81.14, "elapsed_time": "13:24:35", "remaining_time": "3:07:04"}
|
444 |
+
{"current_steps": 444, "total_steps": 546, "loss": 0.4895, "lr": 1.0470690382897164e-06, "epoch": 2.426812585499316, "percentage": 81.32, "elapsed_time": "13:26:29", "remaining_time": "3:05:16"}
|
445 |
+
{"current_steps": 445, "total_steps": 546, "loss": 0.4759, "lr": 1.0275598957029232e-06, "epoch": 2.432284541723666, "percentage": 81.5, "elapsed_time": "13:27:58", "remaining_time": "3:03:22"}
|
446 |
+
{"current_steps": 446, "total_steps": 546, "loss": 0.5258, "lr": 1.0082133801111294e-06, "epoch": 2.4377564979480164, "percentage": 81.68, "elapsed_time": "13:29:53", "remaining_time": "3:01:35"}
|
447 |
+
{"current_steps": 447, "total_steps": 546, "loss": 0.4596, "lr": 9.890302835377736e-07, "epoch": 2.443228454172367, "percentage": 81.87, "elapsed_time": "13:31:20", "remaining_time": "2:59:41"}
|
448 |
+
{"current_steps": 448, "total_steps": 546, "loss": 0.4904, "lr": 9.70011391316124e-07, "epoch": 2.4487004103967167, "percentage": 82.05, "elapsed_time": "13:33:09", "remaining_time": "2:57:52"}
|
449 |
+
{"current_steps": 449, "total_steps": 546, "loss": 0.5418, "lr": 9.511574820571095e-07, "epoch": 2.454172366621067, "percentage": 82.23, "elapsed_time": "13:35:01", "remaining_time": "2:56:04"}
|
450 |
+
{"current_steps": 450, "total_steps": 546, "loss": 0.5106, "lr": 9.324693276174568e-07, "epoch": 2.459644322845417, "percentage": 82.42, "elapsed_time": "13:37:16", "remaining_time": "2:54:21"}
|
451 |
+
{"current_steps": 451, "total_steps": 546, "loss": 0.5182, "lr": 9.13947693068083e-07, "epoch": 2.4651162790697674, "percentage": 82.6, "elapsed_time": "13:39:21", "remaining_time": "2:52:35"}
|
452 |
+
{"current_steps": 452, "total_steps": 546, "loss": 0.4735, "lr": 8.955933366627778e-07, "epoch": 2.4705882352941178, "percentage": 82.78, "elapsed_time": "13:41:24", "remaining_time": "2:50:49"}
|
453 |
+
{"current_steps": 453, "total_steps": 546, "loss": 0.5394, "lr": 8.774070098071669e-07, "epoch": 2.4760601915184677, "percentage": 82.97, "elapsed_time": "13:43:38", "remaining_time": "2:49:05"}
|
454 |
+
{"current_steps": 454, "total_steps": 546, "loss": 0.4599, "lr": 8.593894570279365e-07, "epoch": 2.481532147742818, "percentage": 83.15, "elapsed_time": "13:45:28", "remaining_time": "2:47:16"}
|
455 |
+
{"current_steps": 455, "total_steps": 546, "loss": 0.4669, "lr": 8.415414159423707e-07, "epoch": 2.4870041039671684, "percentage": 83.33, "elapsed_time": "13:47:16", "remaining_time": "2:45:27"}
|
456 |
+
{"current_steps": 456, "total_steps": 546, "loss": 0.4434, "lr": 8.238636172281394e-07, "epoch": 2.4924760601915183, "percentage": 83.52, "elapsed_time": "13:49:10", "remaining_time": "2:43:39"}
|
457 |
+
{"current_steps": 457, "total_steps": 546, "loss": 0.4307, "lr": 8.063567845933973e-07, "epoch": 2.4979480164158687, "percentage": 83.7, "elapsed_time": "13:50:51", "remaining_time": "2:41:48"}
|
458 |
+
{"current_steps": 458, "total_steps": 546, "loss": 0.5538, "lr": 7.890216347471408e-07, "epoch": 2.503419972640219, "percentage": 83.88, "elapsed_time": "13:53:07", "remaining_time": "2:40:04"}
|
459 |
+
{"current_steps": 459, "total_steps": 546, "loss": 0.4864, "lr": 7.718588773698871e-07, "epoch": 2.508891928864569, "percentage": 84.07, "elapsed_time": "13:55:12", "remaining_time": "2:38:18"}
|
460 |
+
{"current_steps": 460, "total_steps": 546, "loss": 0.5177, "lr": 7.548692150846021e-07, "epoch": 2.5143638850889194, "percentage": 84.25, "elapsed_time": "13:57:26", "remaining_time": "2:36:33"}
|
461 |
+
{"current_steps": 461, "total_steps": 546, "loss": 0.4806, "lr": 7.380533434279457e-07, "epoch": 2.5198358413132693, "percentage": 84.43, "elapsed_time": "13:58:50", "remaining_time": "2:34:40"}
|
462 |
+
{"current_steps": 462, "total_steps": 546, "loss": 0.458, "lr": 7.214119508217976e-07, "epoch": 2.5253077975376197, "percentage": 84.62, "elapsed_time": "14:00:30", "remaining_time": "2:32:49"}
|
463 |
+
{"current_steps": 463, "total_steps": 546, "loss": 0.4749, "lr": 7.049457185450692e-07, "epoch": 2.53077975376197, "percentage": 84.8, "elapsed_time": "14:03:02", "remaining_time": "2:31:07"}
|
464 |
+
{"current_steps": 464, "total_steps": 546, "loss": 0.717, "lr": 6.88655320705815e-07, "epoch": 2.53625170998632, "percentage": 84.98, "elapsed_time": "14:04:51", "remaining_time": "2:29:18"}
|
465 |
+
{"current_steps": 465, "total_steps": 546, "loss": 0.4695, "lr": 6.725414242136364e-07, "epoch": 2.5417236662106704, "percentage": 85.16, "elapsed_time": "14:06:12", "remaining_time": "2:27:24"}
|
466 |
+
{"current_steps": 466, "total_steps": 546, "loss": 0.4882, "lr": 6.566046887523808e-07, "epoch": 2.5471956224350203, "percentage": 85.35, "elapsed_time": "14:07:34", "remaining_time": "2:25:30"}
|
467 |
+
{"current_steps": 467, "total_steps": 546, "loss": 0.4828, "lr": 6.408457667531298e-07, "epoch": 2.5526675786593707, "percentage": 85.53, "elapsed_time": "14:09:40", "remaining_time": "2:23:44"}
|
468 |
+
{"current_steps": 468, "total_steps": 546, "loss": 0.5306, "lr": 6.252653033674927e-07, "epoch": 2.558139534883721, "percentage": 85.71, "elapsed_time": "14:11:35", "remaining_time": "2:21:55"}
|
469 |
+
{"current_steps": 469, "total_steps": 546, "loss": 0.519, "lr": 6.098639364411974e-07, "epoch": 2.5636114911080714, "percentage": 85.9, "elapsed_time": "14:13:17", "remaining_time": "2:20:05"}
|
470 |
+
{"current_steps": 470, "total_steps": 546, "loss": 0.5186, "lr": 5.946422964879706e-07, "epoch": 2.5690834473324213, "percentage": 86.08, "elapsed_time": "14:14:58", "remaining_time": "2:18:15"}
|
471 |
+
{"current_steps": 471, "total_steps": 546, "loss": 0.4709, "lr": 5.79601006663732e-07, "epoch": 2.5745554035567717, "percentage": 86.26, "elapsed_time": "14:17:03", "remaining_time": "2:16:28"}
|
472 |
+
{"current_steps": 472, "total_steps": 546, "loss": 0.4838, "lr": 5.647406827410796e-07, "epoch": 2.5800273597811216, "percentage": 86.45, "elapsed_time": "14:18:26", "remaining_time": "2:14:35"}
|
473 |
+
{"current_steps": 473, "total_steps": 546, "loss": 0.4406, "lr": 5.500619330840829e-07, "epoch": 2.585499316005472, "percentage": 86.63, "elapsed_time": "14:19:59", "remaining_time": "2:12:43"}
|
474 |
+
{"current_steps": 474, "total_steps": 546, "loss": 0.4995, "lr": 5.35565358623375e-07, "epoch": 2.5909712722298224, "percentage": 86.81, "elapsed_time": "14:21:50", "remaining_time": "2:10:54"}
|
475 |
+
{"current_steps": 475, "total_steps": 546, "loss": 0.4685, "lr": 5.212515528315504e-07, "epoch": 2.5964432284541723, "percentage": 87.0, "elapsed_time": "14:23:37", "remaining_time": "2:09:05"}
|
476 |
+
{"current_steps": 476, "total_steps": 546, "loss": 0.5057, "lr": 5.071211016988753e-07, "epoch": 2.6019151846785227, "percentage": 87.18, "elapsed_time": "14:25:15", "remaining_time": "2:07:14"}
|
477 |
+
{"current_steps": 477, "total_steps": 546, "loss": 0.4893, "lr": 4.931745837092888e-07, "epoch": 2.6073871409028726, "percentage": 87.36, "elapsed_time": "14:27:06", "remaining_time": "2:05:25"}
|
478 |
+
{"current_steps": 478, "total_steps": 546, "loss": 0.4931, "lr": 4.794125698167262e-07, "epoch": 2.612859097127223, "percentage": 87.55, "elapsed_time": "14:28:49", "remaining_time": "2:03:35"}
|
479 |
+
{"current_steps": 479, "total_steps": 546, "loss": 0.5162, "lr": 4.658356234217437e-07, "epoch": 2.6183310533515733, "percentage": 87.73, "elapsed_time": "14:30:26", "remaining_time": "2:01:45"}
|
480 |
+
{"current_steps": 480, "total_steps": 546, "loss": 0.5098, "lr": 4.5244430034845466e-07, "epoch": 2.6238030095759233, "percentage": 87.91, "elapsed_time": "14:31:50", "remaining_time": "1:59:52"}
|
481 |
+
{"current_steps": 481, "total_steps": 546, "loss": 0.5566, "lr": 4.3923914882177124e-07, "epoch": 2.6292749658002736, "percentage": 88.1, "elapsed_time": "14:33:50", "remaining_time": "1:58:05"}
|
482 |
+
{"current_steps": 482, "total_steps": 546, "loss": 0.4831, "lr": 4.262207094449633e-07, "epoch": 2.6347469220246236, "percentage": 88.28, "elapsed_time": "14:35:06", "remaining_time": "1:56:11"}
|
483 |
+
{"current_steps": 483, "total_steps": 546, "loss": 0.4815, "lr": 4.1338951517752637e-07, "epoch": 2.640218878248974, "percentage": 88.46, "elapsed_time": "14:37:09", "remaining_time": "1:54:24"}
|
484 |
+
{"current_steps": 484, "total_steps": 546, "loss": 0.4281, "lr": 4.007460913133643e-07, "epoch": 2.6456908344733243, "percentage": 88.64, "elapsed_time": "14:38:44", "remaining_time": "1:52:33"}
|
485 |
+
{"current_steps": 485, "total_steps": 546, "loss": 0.4698, "lr": 3.8829095545928177e-07, "epoch": 2.6511627906976747, "percentage": 88.83, "elapsed_time": "14:40:32", "remaining_time": "1:50:44"}
|
486 |
+
{"current_steps": 486, "total_steps": 546, "loss": 0.4481, "lr": 3.760246175137938e-07, "epoch": 2.6566347469220246, "percentage": 89.01, "elapsed_time": "14:42:35", "remaining_time": "1:48:57"}
|
487 |
+
{"current_steps": 487, "total_steps": 546, "loss": 0.4609, "lr": 3.639475796462577e-07, "epoch": 2.662106703146375, "percentage": 89.19, "elapsed_time": "14:44:45", "remaining_time": "1:47:11"}
|
488 |
+
{"current_steps": 488, "total_steps": 546, "loss": 0.4648, "lr": 3.5206033627630145e-07, "epoch": 2.667578659370725, "percentage": 89.38, "elapsed_time": "14:46:42", "remaining_time": "1:45:23"}
|
489 |
+
{"current_steps": 489, "total_steps": 546, "loss": 0.4802, "lr": 3.403633740535983e-07, "epoch": 2.6730506155950753, "percentage": 89.56, "elapsed_time": "14:48:28", "remaining_time": "1:43:33"}
|
490 |
+
{"current_steps": 490, "total_steps": 546, "loss": 0.4876, "lr": 3.2885717183793296e-07, "epoch": 2.6785225718194257, "percentage": 89.74, "elapsed_time": "14:50:14", "remaining_time": "1:41:44"}
|
491 |
+
{"current_steps": 491, "total_steps": 546, "loss": 0.5916, "lr": 3.175422006796031e-07, "epoch": 2.6839945280437756, "percentage": 89.93, "elapsed_time": "14:51:27", "remaining_time": "1:39:51"}
|
492 |
+
{"current_steps": 492, "total_steps": 546, "loss": 0.5125, "lr": 3.064189238001325e-07, "epoch": 2.689466484268126, "percentage": 90.11, "elapsed_time": "14:53:22", "remaining_time": "1:38:03"}
|
493 |
+
{"current_steps": 493, "total_steps": 546, "loss": 0.4823, "lr": 2.9548779657330605e-07, "epoch": 2.694938440492476, "percentage": 90.29, "elapsed_time": "14:54:45", "remaining_time": "1:36:11"}
|
494 |
+
{"current_steps": 494, "total_steps": 546, "loss": 0.4857, "lr": 2.847492665065349e-07, "epoch": 2.7004103967168263, "percentage": 90.48, "elapsed_time": "14:56:20", "remaining_time": "1:34:21"}
|
495 |
+
{"current_steps": 495, "total_steps": 546, "loss": 0.4717, "lr": 2.742037732225228e-07, "epoch": 2.7058823529411766, "percentage": 90.66, "elapsed_time": "14:57:36", "remaining_time": "1:32:28"}
|
496 |
+
{"current_steps": 496, "total_steps": 546, "loss": 0.4976, "lr": 2.6385174844128337e-07, "epoch": 2.7113543091655266, "percentage": 90.84, "elapsed_time": "14:59:34", "remaining_time": "1:30:40"}
|
497 |
+
{"current_steps": 497, "total_steps": 546, "loss": 0.484, "lr": 2.5369361596245366e-07, "epoch": 2.716826265389877, "percentage": 91.03, "elapsed_time": "15:01:01", "remaining_time": "1:28:49"}
|
498 |
+
{"current_steps": 498, "total_steps": 546, "loss": 0.6527, "lr": 2.4372979164795306e-07, "epoch": 2.722298221614227, "percentage": 91.21, "elapsed_time": "15:03:02", "remaining_time": "1:27:02"}
|
499 |
+
{"current_steps": 499, "total_steps": 546, "loss": 0.4795, "lr": 2.3396068340495182e-07, "epoch": 2.7277701778385772, "percentage": 91.39, "elapsed_time": "15:04:54", "remaining_time": "1:25:13"}
|
500 |
+
{"current_steps": 500, "total_steps": 546, "loss": 0.5174, "lr": 2.2438669116917612e-07, "epoch": 2.7332421340629276, "percentage": 91.58, "elapsed_time": "15:05:58", "remaining_time": "1:23:20"}
|
501 |
+
{"current_steps": 501, "total_steps": 546, "loss": 0.4473, "lr": 2.1500820688853562e-07, "epoch": 2.738714090287278, "percentage": 91.76, "elapsed_time": "15:07:34", "remaining_time": "1:21:31"}
|
502 |
+
{"current_steps": 502, "total_steps": 546, "loss": 0.4801, "lr": 2.0582561450707027e-07, "epoch": 2.744186046511628, "percentage": 91.94, "elapsed_time": "15:09:06", "remaining_time": "1:19:40"}
|
503 |
+
{"current_steps": 503, "total_steps": 546, "loss": 0.5184, "lr": 1.9683928994924383e-07, "epoch": 2.7496580027359783, "percentage": 92.12, "elapsed_time": "15:10:26", "remaining_time": "1:17:49"}
|
504 |
+
{"current_steps": 504, "total_steps": 546, "loss": 0.4947, "lr": 1.8804960110454406e-07, "epoch": 2.755129958960328, "percentage": 92.31, "elapsed_time": "15:12:41", "remaining_time": "1:16:03"}
|
505 |
+
{"current_steps": 505, "total_steps": 546, "loss": 0.5058, "lr": 1.7945690781242752e-07, "epoch": 2.7606019151846786, "percentage": 92.49, "elapsed_time": "15:14:37", "remaining_time": "1:14:15"}
|
506 |
+
{"current_steps": 506, "total_steps": 546, "loss": 0.4957, "lr": 1.7106156184758248e-07, "epoch": 2.766073871409029, "percentage": 92.67, "elapsed_time": "15:16:34", "remaining_time": "1:12:27"}
|
507 |
+
{"current_steps": 507, "total_steps": 546, "loss": 0.4932, "lr": 1.62863906905536e-07, "epoch": 2.771545827633379, "percentage": 92.86, "elapsed_time": "15:17:58", "remaining_time": "1:10:36"}
|
508 |
+
{"current_steps": 508, "total_steps": 546, "loss": 0.5382, "lr": 1.5486427858857567e-07, "epoch": 2.7770177838577292, "percentage": 93.04, "elapsed_time": "15:19:55", "remaining_time": "1:08:48"}
|
509 |
+
{"current_steps": 509, "total_steps": 546, "loss": 0.532, "lr": 1.4706300439201348e-07, "epoch": 2.782489740082079, "percentage": 93.22, "elapsed_time": "15:21:32", "remaining_time": "1:06:59"}
|
510 |
+
{"current_steps": 510, "total_steps": 546, "loss": 0.4758, "lr": 1.394604036907804e-07, "epoch": 2.7879616963064295, "percentage": 93.41, "elapsed_time": "15:23:35", "remaining_time": "1:05:11"}
|
511 |
+
{"current_steps": 511, "total_steps": 546, "loss": 0.5132, "lr": 1.320567877263479e-07, "epoch": 2.79343365253078, "percentage": 93.59, "elapsed_time": "15:25:35", "remaining_time": "1:03:23"}
|
512 |
+
{"current_steps": 512, "total_steps": 546, "loss": 0.4615, "lr": 1.2485245959398928e-07, "epoch": 2.79890560875513, "percentage": 93.77, "elapsed_time": "15:27:59", "remaining_time": "1:01:37"}
|
513 |
+
{"current_steps": 513, "total_steps": 546, "loss": 0.4846, "lr": 1.17847714230368e-07, "epoch": 2.80437756497948, "percentage": 93.96, "elapsed_time": "15:29:26", "remaining_time": "0:59:47"}
|
514 |
+
{"current_steps": 514, "total_steps": 546, "loss": 0.47, "lr": 1.1104283840146834e-07, "epoch": 2.80984952120383, "percentage": 94.14, "elapsed_time": "15:31:29", "remaining_time": "0:57:59"}
|
515 |
+
{"current_steps": 515, "total_steps": 546, "loss": 0.672, "lr": 1.044381106908493e-07, "epoch": 2.8153214774281805, "percentage": 94.32, "elapsed_time": "15:33:39", "remaining_time": "0:56:12"}
|
516 |
+
{"current_steps": 516, "total_steps": 546, "loss": 0.5008, "lr": 9.803380148824371e-08, "epoch": 2.820793433652531, "percentage": 94.51, "elapsed_time": "15:35:14", "remaining_time": "0:54:22"}
|
517 |
+
{"current_steps": 517, "total_steps": 546, "loss": 0.4817, "lr": 9.18301729784904e-08, "epoch": 2.8262653898768813, "percentage": 94.69, "elapsed_time": "15:36:40", "remaining_time": "0:52:32"}
|
518 |
+
{"current_steps": 518, "total_steps": 546, "loss": 0.5053, "lr": 8.582747913079448e-08, "epoch": 2.831737346101231, "percentage": 94.87, "elapsed_time": "15:38:40", "remaining_time": "0:50:44"}
|
519 |
+
{"current_steps": 519, "total_steps": 546, "loss": 0.4637, "lr": 8.00259656883362e-08, "epoch": 2.8372093023255816, "percentage": 95.05, "elapsed_time": "15:40:57", "remaining_time": "0:48:57"}
|
520 |
+
{"current_steps": 520, "total_steps": 546, "loss": 0.4491, "lr": 7.442587015820734e-08, "epoch": 2.8426812585499315, "percentage": 95.24, "elapsed_time": "15:43:05", "remaining_time": "0:47:09"}
|
521 |
+
{"current_steps": 521, "total_steps": 546, "loss": 0.5315, "lr": 6.902742180168953e-08, "epoch": 2.848153214774282, "percentage": 95.42, "elapsed_time": "15:44:35", "remaining_time": "0:45:19"}
|
522 |
+
{"current_steps": 522, "total_steps": 546, "loss": 0.4774, "lr": 6.38308416248673e-08, "epoch": 2.853625170998632, "percentage": 95.6, "elapsed_time": "15:46:26", "remaining_time": "0:43:30"}
|
523 |
+
{"current_steps": 523, "total_steps": 546, "loss": 0.479, "lr": 5.883634236958091e-08, "epoch": 2.859097127222982, "percentage": 95.79, "elapsed_time": "15:47:50", "remaining_time": "0:41:40"}
|
524 |
+
{"current_steps": 524, "total_steps": 546, "loss": 0.441, "lr": 5.4044128504717186e-08, "epoch": 2.8645690834473325, "percentage": 95.97, "elapsed_time": "15:50:01", "remaining_time": "0:39:53"}
|
525 |
+
{"current_steps": 525, "total_steps": 546, "loss": 0.5298, "lr": 4.945439621783843e-08, "epoch": 2.8700410396716824, "percentage": 96.15, "elapsed_time": "15:51:39", "remaining_time": "0:38:03"}
|
526 |
+
{"current_steps": 526, "total_steps": 546, "loss": 0.5647, "lr": 4.506733340714997e-08, "epoch": 2.875512995896033, "percentage": 96.34, "elapsed_time": "15:53:14", "remaining_time": "0:36:14"}
|
527 |
+
{"current_steps": 527, "total_steps": 546, "loss": 0.5675, "lr": 4.08831196738102e-08, "epoch": 2.880984952120383, "percentage": 96.52, "elapsed_time": "15:54:34", "remaining_time": "0:34:24"}
|
528 |
+
{"current_steps": 528, "total_steps": 546, "loss": 0.5109, "lr": 3.69019263145759e-08, "epoch": 2.886456908344733, "percentage": 96.7, "elapsed_time": "15:56:28", "remaining_time": "0:32:36"}
|
529 |
+
{"current_steps": 529, "total_steps": 546, "loss": 0.4531, "lr": 3.312391631479006e-08, "epoch": 2.8919288645690835, "percentage": 96.89, "elapsed_time": "15:57:48", "remaining_time": "0:30:46"}
|
530 |
+
{"current_steps": 530, "total_steps": 546, "loss": 0.5175, "lr": 2.9549244341708917e-08, "epoch": 2.8974008207934334, "percentage": 97.07, "elapsed_time": "15:58:56", "remaining_time": "0:28:56"}
|
531 |
+
{"current_steps": 531, "total_steps": 546, "loss": 0.4984, "lr": 2.6178056738170866e-08, "epoch": 2.902872777017784, "percentage": 97.25, "elapsed_time": "16:00:56", "remaining_time": "0:27:08"}
|
532 |
+
{"current_steps": 532, "total_steps": 546, "loss": 0.5347, "lr": 2.301049151660628e-08, "epoch": 2.908344733242134, "percentage": 97.44, "elapsed_time": "16:02:12", "remaining_time": "0:25:19"}
|
533 |
+
{"current_steps": 533, "total_steps": 546, "loss": 0.5113, "lr": 2.0046678353384254e-08, "epoch": 2.9138166894664845, "percentage": 97.62, "elapsed_time": "16:03:49", "remaining_time": "0:23:30"}
|
534 |
+
{"current_steps": 534, "total_steps": 546, "loss": 0.4774, "lr": 1.7286738583507935e-08, "epoch": 2.9192886456908345, "percentage": 97.8, "elapsed_time": "16:06:17", "remaining_time": "0:21:42"}
|
535 |
+
{"current_steps": 535, "total_steps": 546, "loss": 0.4891, "lr": 1.4730785195643527e-08, "epoch": 2.924760601915185, "percentage": 97.99, "elapsed_time": "16:07:51", "remaining_time": "0:19:53"}
|
536 |
+
{"current_steps": 536, "total_steps": 546, "loss": 0.4572, "lr": 1.2378922827496198e-08, "epoch": 2.9302325581395348, "percentage": 98.17, "elapsed_time": "16:09:53", "remaining_time": "0:18:05"}
|
537 |
+
{"current_steps": 537, "total_steps": 546, "loss": 0.4398, "lr": 1.0231247761528507e-08, "epoch": 2.935704514363885, "percentage": 98.35, "elapsed_time": "16:12:11", "remaining_time": "0:16:17"}
|
538 |
+
{"current_steps": 538, "total_steps": 546, "loss": 0.4239, "lr": 8.287847921013558e-09, "epoch": 2.9411764705882355, "percentage": 98.53, "elapsed_time": "16:13:40", "remaining_time": "0:14:28"}
|
539 |
+
{"current_steps": 539, "total_steps": 546, "loss": 0.5259, "lr": 6.548802866441218e-09, "epoch": 2.9466484268125854, "percentage": 98.72, "elapsed_time": "16:15:03", "remaining_time": "0:12:39"}
|
540 |
+
{"current_steps": 540, "total_steps": 546, "loss": 0.5069, "lr": 5.014183792256266e-09, "epoch": 2.952120383036936, "percentage": 98.9, "elapsed_time": "16:16:34", "remaining_time": "0:10:51"}
|
541 |
+
{"current_steps": 541, "total_steps": 546, "loss": 0.4951, "lr": 3.6840535239474063e-09, "epoch": 2.9575923392612857, "percentage": 99.08, "elapsed_time": "16:17:59", "remaining_time": "0:09:02"}
|
542 |
+
{"current_steps": 542, "total_steps": 546, "loss": 0.4817, "lr": 2.5584665154732015e-09, "epoch": 2.963064295485636, "percentage": 99.27, "elapsed_time": "16:19:49", "remaining_time": "0:07:13"}
|
543 |
+
{"current_steps": 543, "total_steps": 546, "loss": 0.5063, "lr": 1.6374688470327526e-09, "epoch": 2.9685362517099865, "percentage": 99.45, "elapsed_time": "16:21:43", "remaining_time": "0:05:25"}
|
544 |
+
{"current_steps": 544, "total_steps": 546, "loss": 0.5241, "lr": 9.210982231805388e-10, "epoch": 2.9740082079343364, "percentage": 99.63, "elapsed_time": "16:23:37", "remaining_time": "0:03:36"}
|
545 |
+
{"current_steps": 545, "total_steps": 546, "loss": 0.5268, "lr": 4.093839712815406e-10, "epoch": 2.9794801641586868, "percentage": 99.82, "elapsed_time": "16:25:33", "remaining_time": "0:01:48"}
|
546 |
+
{"current_steps": 546, "total_steps": 546, "loss": 0.4545, "lr": 1.0234704031220066e-10, "epoch": 2.9849521203830367, "percentage": 100.0, "elapsed_time": "16:27:29", "remaining_time": "0:00:00"}
|
547 |
+
{"current_steps": 546, "total_steps": 546, "epoch": 2.9849521203830367, "percentage": 100.0, "elapsed_time": "16:29:56", "remaining_time": "0:00:00"}
|