tangken333 commited on
Commit
a8c67e0
·
verified ·
1 Parent(s): ffb0da5

Training in progress, step 546

Browse files
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:70737d6237cf02beb8a7b08db5a4be41da2e9e92ae986f5bf59d2083e06c3c14
3
  size 4877660776
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f477079e5cb61b17106246e4341a760166d58b5f0b434c25a2b0934b2f0e2ef6
3
  size 4877660776
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9d11b93313511baf4fcd87dd85f0e47b787f59e76dcbd56e904a55a06e67a167
3
  size 4932751008
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c37c31c879dced903610f6adfb439cd92dfedf7bea7c9eeceb93689c7c434b6c
3
  size 4932751008
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3b4656d4974cb14cf1e406f81d31a6e3543bb8b967823c38d6b170eb6d5addfd
3
  size 4330865200
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b3a6a0865e01efb8e83702b5aef85d02ddb22788ec8eddffba9906331a48b4f2
3
  size 4330865200
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:dce24f2e897a696129e4bdac8274832ba436ce8364652529d9aecd98bec20fdf
3
  size 1089994880
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4285e63d10a79ff26f74e59bc99913be8c8955c121341f3d6d9118a41ca3f626
3
  size 1089994880
trainer_log.jsonl CHANGED
@@ -399,3 +399,149 @@
399
  {"current_steps": 399, "total_steps": 546, "loss": 0.4877, "lr": 2.079220480245052e-06, "epoch": 2.180574555403557, "percentage": 73.08, "elapsed_time": "12:01:19", "remaining_time": "4:25:45"}
400
  {"current_steps": 400, "total_steps": 546, "loss": 0.4802, "lr": 2.053314589791706e-06, "epoch": 2.186046511627907, "percentage": 73.26, "elapsed_time": "12:02:46", "remaining_time": "4:23:48"}
401
  {"current_steps": 401, "total_steps": 546, "loss": 0.489, "lr": 2.0275293331505437e-06, "epoch": 2.1915184678522572, "percentage": 73.44, "elapsed_time": "12:07:28", "remaining_time": "4:23:03"}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
399
  {"current_steps": 399, "total_steps": 546, "loss": 0.4877, "lr": 2.079220480245052e-06, "epoch": 2.180574555403557, "percentage": 73.08, "elapsed_time": "12:01:19", "remaining_time": "4:25:45"}
400
  {"current_steps": 400, "total_steps": 546, "loss": 0.4802, "lr": 2.053314589791706e-06, "epoch": 2.186046511627907, "percentage": 73.26, "elapsed_time": "12:02:46", "remaining_time": "4:23:48"}
401
  {"current_steps": 401, "total_steps": 546, "loss": 0.489, "lr": 2.0275293331505437e-06, "epoch": 2.1915184678522572, "percentage": 73.44, "elapsed_time": "12:07:28", "remaining_time": "4:23:03"}
402
+ {"current_steps": 402, "total_steps": 546, "loss": 0.5028, "lr": 2.00186576593945e-06, "epoch": 2.196990424076607, "percentage": 73.63, "elapsed_time": "12:09:48", "remaining_time": "4:21:25"}
403
+ {"current_steps": 403, "total_steps": 546, "loss": 0.4967, "lr": 1.9763249387944823e-06, "epoch": 2.2024623803009575, "percentage": 73.81, "elapsed_time": "12:11:39", "remaining_time": "4:19:37"}
404
+ {"current_steps": 404, "total_steps": 546, "loss": 0.4922, "lr": 1.9509078973268645e-06, "epoch": 2.207934336525308, "percentage": 73.99, "elapsed_time": "12:13:03", "remaining_time": "4:17:39"}
405
+ {"current_steps": 405, "total_steps": 546, "loss": 0.4575, "lr": 1.9256156820801896e-06, "epoch": 2.213406292749658, "percentage": 74.18, "elapsed_time": "12:14:54", "remaining_time": "4:15:51"}
406
+ {"current_steps": 406, "total_steps": 546, "loss": 0.4652, "lr": 1.9004493284877995e-06, "epoch": 2.218878248974008, "percentage": 74.36, "elapsed_time": "12:16:25", "remaining_time": "4:13:56"}
407
+ {"current_steps": 407, "total_steps": 546, "loss": 0.4066, "lr": 1.875409866830422e-06, "epoch": 2.2243502051983586, "percentage": 74.54, "elapsed_time": "12:18:24", "remaining_time": "4:12:10"}
408
+ {"current_steps": 408, "total_steps": 546, "loss": 0.4605, "lr": 1.850498322193972e-06, "epoch": 2.2298221614227085, "percentage": 74.73, "elapsed_time": "12:20:07", "remaining_time": "4:10:20"}
409
+ {"current_steps": 409, "total_steps": 546, "loss": 0.4854, "lr": 1.8257157144275939e-06, "epoch": 2.235294117647059, "percentage": 74.91, "elapsed_time": "12:22:04", "remaining_time": "4:08:34"}
410
+ {"current_steps": 410, "total_steps": 546, "loss": 0.531, "lr": 1.8010630581019095e-06, "epoch": 2.2407660738714092, "percentage": 75.09, "elapsed_time": "12:23:31", "remaining_time": "4:06:37"}
411
+ {"current_steps": 411, "total_steps": 546, "loss": 0.5214, "lr": 1.7765413624674866e-06, "epoch": 2.246238030095759, "percentage": 75.27, "elapsed_time": "12:25:19", "remaining_time": "4:04:49"}
412
+ {"current_steps": 412, "total_steps": 546, "loss": 0.5112, "lr": 1.7521516314135112e-06, "epoch": 2.2517099863201095, "percentage": 75.46, "elapsed_time": "12:27:22", "remaining_time": "4:03:04"}
413
+ {"current_steps": 413, "total_steps": 546, "loss": 0.5079, "lr": 1.7278948634266968e-06, "epoch": 2.2571819425444595, "percentage": 75.64, "elapsed_time": "12:28:58", "remaining_time": "4:01:11"}
414
+ {"current_steps": 414, "total_steps": 546, "loss": 0.4258, "lr": 1.703772051550412e-06, "epoch": 2.26265389876881, "percentage": 75.82, "elapsed_time": "12:31:13", "remaining_time": "3:59:31"}
415
+ {"current_steps": 415, "total_steps": 546, "loss": 0.5307, "lr": 1.6797841833440143e-06, "epoch": 2.26812585499316, "percentage": 76.01, "elapsed_time": "12:32:52", "remaining_time": "3:57:39"}
416
+ {"current_steps": 416, "total_steps": 546, "loss": 0.5173, "lr": 1.6559322408424289e-06, "epoch": 2.27359781121751, "percentage": 76.19, "elapsed_time": "12:34:49", "remaining_time": "3:55:53"}
417
+ {"current_steps": 417, "total_steps": 546, "loss": 0.4889, "lr": 1.6322172005159436e-06, "epoch": 2.2790697674418605, "percentage": 76.37, "elapsed_time": "12:36:21", "remaining_time": "3:53:58"}
418
+ {"current_steps": 418, "total_steps": 546, "loss": 0.4621, "lr": 1.608640033230236e-06, "epoch": 2.2845417236662104, "percentage": 76.56, "elapsed_time": "12:37:56", "remaining_time": "3:52:05"}
419
+ {"current_steps": 419, "total_steps": 546, "loss": 0.5532, "lr": 1.5852017042066215e-06, "epoch": 2.290013679890561, "percentage": 76.74, "elapsed_time": "12:39:26", "remaining_time": "3:50:11"}
420
+ {"current_steps": 420, "total_steps": 546, "loss": 0.707, "lr": 1.5619031729825401e-06, "epoch": 2.295485636114911, "percentage": 76.92, "elapsed_time": "12:41:37", "remaining_time": "3:48:29"}
421
+ {"current_steps": 421, "total_steps": 546, "loss": 0.4628, "lr": 1.5387453933722811e-06, "epoch": 2.300957592339261, "percentage": 77.11, "elapsed_time": "12:43:25", "remaining_time": "3:46:40"}
422
+ {"current_steps": 422, "total_steps": 546, "loss": 0.5053, "lr": 1.5157293134279243e-06, "epoch": 2.3064295485636115, "percentage": 77.29, "elapsed_time": "12:45:10", "remaining_time": "3:44:50"}
423
+ {"current_steps": 423, "total_steps": 546, "loss": 0.4868, "lr": 1.492855875400534e-06, "epoch": 2.311901504787962, "percentage": 77.47, "elapsed_time": "12:46:54", "remaining_time": "3:43:00"}
424
+ {"current_steps": 424, "total_steps": 546, "loss": 0.5358, "lr": 1.4701260157015823e-06, "epoch": 2.317373461012312, "percentage": 77.66, "elapsed_time": "12:48:45", "remaining_time": "3:41:12"}
425
+ {"current_steps": 425, "total_steps": 546, "loss": 0.4804, "lr": 1.4475406648646195e-06, "epoch": 2.322845417236662, "percentage": 77.84, "elapsed_time": "12:50:36", "remaining_time": "3:39:23"}
426
+ {"current_steps": 426, "total_steps": 546, "loss": 0.5275, "lr": 1.4251007475071688e-06, "epoch": 2.3283173734610125, "percentage": 78.02, "elapsed_time": "12:52:46", "remaining_time": "3:37:40"}
427
+ {"current_steps": 427, "total_steps": 546, "loss": 0.4416, "lr": 1.402807182292879e-06, "epoch": 2.3337893296853625, "percentage": 78.21, "elapsed_time": "12:54:56", "remaining_time": "3:35:58"}
428
+ {"current_steps": 428, "total_steps": 546, "loss": 0.5521, "lr": 1.3806608818939205e-06, "epoch": 2.339261285909713, "percentage": 78.39, "elapsed_time": "12:57:07", "remaining_time": "3:34:15"}
429
+ {"current_steps": 429, "total_steps": 546, "loss": 0.5347, "lr": 1.3586627529536117e-06, "epoch": 2.3447332421340628, "percentage": 78.57, "elapsed_time": "12:58:49", "remaining_time": "3:32:24"}
430
+ {"current_steps": 430, "total_steps": 546, "loss": 0.5075, "lr": 1.3368136960493083e-06, "epoch": 2.350205198358413, "percentage": 78.75, "elapsed_time": "13:01:15", "remaining_time": "3:30:45"}
431
+ {"current_steps": 431, "total_steps": 546, "loss": 0.5016, "lr": 1.315114605655532e-06, "epoch": 2.3556771545827635, "percentage": 78.94, "elapsed_time": "13:03:04", "remaining_time": "3:28:56"}
432
+ {"current_steps": 432, "total_steps": 546, "loss": 0.4486, "lr": 1.2935663701073586e-06, "epoch": 2.3611491108071134, "percentage": 79.12, "elapsed_time": "13:05:00", "remaining_time": "3:27:09"}
433
+ {"current_steps": 433, "total_steps": 546, "loss": 0.5249, "lr": 1.2721698715640352e-06, "epoch": 2.366621067031464, "percentage": 79.3, "elapsed_time": "13:06:36", "remaining_time": "3:25:16"}
434
+ {"current_steps": 434, "total_steps": 546, "loss": 0.4806, "lr": 1.2509259859728863e-06, "epoch": 2.3720930232558137, "percentage": 79.49, "elapsed_time": "13:08:40", "remaining_time": "3:23:31"}
435
+ {"current_steps": 435, "total_steps": 546, "loss": 0.5134, "lr": 1.2298355830334346e-06, "epoch": 2.377564979480164, "percentage": 79.67, "elapsed_time": "13:10:29", "remaining_time": "3:21:42"}
436
+ {"current_steps": 436, "total_steps": 546, "loss": 0.5527, "lr": 1.2088995261618108e-06, "epoch": 2.3830369357045145, "percentage": 79.85, "elapsed_time": "13:12:05", "remaining_time": "3:19:50"}
437
+ {"current_steps": 437, "total_steps": 546, "loss": 0.6196, "lr": 1.1881186724553968e-06, "epoch": 2.3885088919288644, "percentage": 80.04, "elapsed_time": "13:14:38", "remaining_time": "3:18:12"}
438
+ {"current_steps": 438, "total_steps": 546, "loss": 0.5563, "lr": 1.167493872657739e-06, "epoch": 2.3939808481532148, "percentage": 80.22, "elapsed_time": "13:16:21", "remaining_time": "3:16:21"}
439
+ {"current_steps": 439, "total_steps": 546, "loss": 0.5389, "lr": 1.1470259711237285e-06, "epoch": 2.399452804377565, "percentage": 80.4, "elapsed_time": "13:17:50", "remaining_time": "3:14:27"}
440
+ {"current_steps": 440, "total_steps": 546, "loss": 0.56, "lr": 1.1267158057850174e-06, "epoch": 2.404924760601915, "percentage": 80.59, "elapsed_time": "13:19:26", "remaining_time": "3:12:35"}
441
+ {"current_steps": 441, "total_steps": 546, "loss": 0.5401, "lr": 1.106564208115734e-06, "epoch": 2.4103967168262654, "percentage": 80.77, "elapsed_time": "13:21:25", "remaining_time": "3:10:48"}
442
+ {"current_steps": 442, "total_steps": 546, "loss": 0.4837, "lr": 1.0865720030984268e-06, "epoch": 2.415868673050616, "percentage": 80.95, "elapsed_time": "13:22:49", "remaining_time": "3:08:54"}
443
+ {"current_steps": 443, "total_steps": 546, "loss": 0.5257, "lr": 1.066740009190304e-06, "epoch": 2.4213406292749657, "percentage": 81.14, "elapsed_time": "13:24:35", "remaining_time": "3:07:04"}
444
+ {"current_steps": 444, "total_steps": 546, "loss": 0.4895, "lr": 1.0470690382897164e-06, "epoch": 2.426812585499316, "percentage": 81.32, "elapsed_time": "13:26:29", "remaining_time": "3:05:16"}
445
+ {"current_steps": 445, "total_steps": 546, "loss": 0.4759, "lr": 1.0275598957029232e-06, "epoch": 2.432284541723666, "percentage": 81.5, "elapsed_time": "13:27:58", "remaining_time": "3:03:22"}
446
+ {"current_steps": 446, "total_steps": 546, "loss": 0.5258, "lr": 1.0082133801111294e-06, "epoch": 2.4377564979480164, "percentage": 81.68, "elapsed_time": "13:29:53", "remaining_time": "3:01:35"}
447
+ {"current_steps": 447, "total_steps": 546, "loss": 0.4596, "lr": 9.890302835377736e-07, "epoch": 2.443228454172367, "percentage": 81.87, "elapsed_time": "13:31:20", "remaining_time": "2:59:41"}
448
+ {"current_steps": 448, "total_steps": 546, "loss": 0.4904, "lr": 9.70011391316124e-07, "epoch": 2.4487004103967167, "percentage": 82.05, "elapsed_time": "13:33:09", "remaining_time": "2:57:52"}
449
+ {"current_steps": 449, "total_steps": 546, "loss": 0.5418, "lr": 9.511574820571095e-07, "epoch": 2.454172366621067, "percentage": 82.23, "elapsed_time": "13:35:01", "remaining_time": "2:56:04"}
450
+ {"current_steps": 450, "total_steps": 546, "loss": 0.5106, "lr": 9.324693276174568e-07, "epoch": 2.459644322845417, "percentage": 82.42, "elapsed_time": "13:37:16", "remaining_time": "2:54:21"}
451
+ {"current_steps": 451, "total_steps": 546, "loss": 0.5182, "lr": 9.13947693068083e-07, "epoch": 2.4651162790697674, "percentage": 82.6, "elapsed_time": "13:39:21", "remaining_time": "2:52:35"}
452
+ {"current_steps": 452, "total_steps": 546, "loss": 0.4735, "lr": 8.955933366627778e-07, "epoch": 2.4705882352941178, "percentage": 82.78, "elapsed_time": "13:41:24", "remaining_time": "2:50:49"}
453
+ {"current_steps": 453, "total_steps": 546, "loss": 0.5394, "lr": 8.774070098071669e-07, "epoch": 2.4760601915184677, "percentage": 82.97, "elapsed_time": "13:43:38", "remaining_time": "2:49:05"}
454
+ {"current_steps": 454, "total_steps": 546, "loss": 0.4599, "lr": 8.593894570279365e-07, "epoch": 2.481532147742818, "percentage": 83.15, "elapsed_time": "13:45:28", "remaining_time": "2:47:16"}
455
+ {"current_steps": 455, "total_steps": 546, "loss": 0.4669, "lr": 8.415414159423707e-07, "epoch": 2.4870041039671684, "percentage": 83.33, "elapsed_time": "13:47:16", "remaining_time": "2:45:27"}
456
+ {"current_steps": 456, "total_steps": 546, "loss": 0.4434, "lr": 8.238636172281394e-07, "epoch": 2.4924760601915183, "percentage": 83.52, "elapsed_time": "13:49:10", "remaining_time": "2:43:39"}
457
+ {"current_steps": 457, "total_steps": 546, "loss": 0.4307, "lr": 8.063567845933973e-07, "epoch": 2.4979480164158687, "percentage": 83.7, "elapsed_time": "13:50:51", "remaining_time": "2:41:48"}
458
+ {"current_steps": 458, "total_steps": 546, "loss": 0.5538, "lr": 7.890216347471408e-07, "epoch": 2.503419972640219, "percentage": 83.88, "elapsed_time": "13:53:07", "remaining_time": "2:40:04"}
459
+ {"current_steps": 459, "total_steps": 546, "loss": 0.4864, "lr": 7.718588773698871e-07, "epoch": 2.508891928864569, "percentage": 84.07, "elapsed_time": "13:55:12", "remaining_time": "2:38:18"}
460
+ {"current_steps": 460, "total_steps": 546, "loss": 0.5177, "lr": 7.548692150846021e-07, "epoch": 2.5143638850889194, "percentage": 84.25, "elapsed_time": "13:57:26", "remaining_time": "2:36:33"}
461
+ {"current_steps": 461, "total_steps": 546, "loss": 0.4806, "lr": 7.380533434279457e-07, "epoch": 2.5198358413132693, "percentage": 84.43, "elapsed_time": "13:58:50", "remaining_time": "2:34:40"}
462
+ {"current_steps": 462, "total_steps": 546, "loss": 0.458, "lr": 7.214119508217976e-07, "epoch": 2.5253077975376197, "percentage": 84.62, "elapsed_time": "14:00:30", "remaining_time": "2:32:49"}
463
+ {"current_steps": 463, "total_steps": 546, "loss": 0.4749, "lr": 7.049457185450692e-07, "epoch": 2.53077975376197, "percentage": 84.8, "elapsed_time": "14:03:02", "remaining_time": "2:31:07"}
464
+ {"current_steps": 464, "total_steps": 546, "loss": 0.717, "lr": 6.88655320705815e-07, "epoch": 2.53625170998632, "percentage": 84.98, "elapsed_time": "14:04:51", "remaining_time": "2:29:18"}
465
+ {"current_steps": 465, "total_steps": 546, "loss": 0.4695, "lr": 6.725414242136364e-07, "epoch": 2.5417236662106704, "percentage": 85.16, "elapsed_time": "14:06:12", "remaining_time": "2:27:24"}
466
+ {"current_steps": 466, "total_steps": 546, "loss": 0.4882, "lr": 6.566046887523808e-07, "epoch": 2.5471956224350203, "percentage": 85.35, "elapsed_time": "14:07:34", "remaining_time": "2:25:30"}
467
+ {"current_steps": 467, "total_steps": 546, "loss": 0.4828, "lr": 6.408457667531298e-07, "epoch": 2.5526675786593707, "percentage": 85.53, "elapsed_time": "14:09:40", "remaining_time": "2:23:44"}
468
+ {"current_steps": 468, "total_steps": 546, "loss": 0.5306, "lr": 6.252653033674927e-07, "epoch": 2.558139534883721, "percentage": 85.71, "elapsed_time": "14:11:35", "remaining_time": "2:21:55"}
469
+ {"current_steps": 469, "total_steps": 546, "loss": 0.519, "lr": 6.098639364411974e-07, "epoch": 2.5636114911080714, "percentage": 85.9, "elapsed_time": "14:13:17", "remaining_time": "2:20:05"}
470
+ {"current_steps": 470, "total_steps": 546, "loss": 0.5186, "lr": 5.946422964879706e-07, "epoch": 2.5690834473324213, "percentage": 86.08, "elapsed_time": "14:14:58", "remaining_time": "2:18:15"}
471
+ {"current_steps": 471, "total_steps": 546, "loss": 0.4709, "lr": 5.79601006663732e-07, "epoch": 2.5745554035567717, "percentage": 86.26, "elapsed_time": "14:17:03", "remaining_time": "2:16:28"}
472
+ {"current_steps": 472, "total_steps": 546, "loss": 0.4838, "lr": 5.647406827410796e-07, "epoch": 2.5800273597811216, "percentage": 86.45, "elapsed_time": "14:18:26", "remaining_time": "2:14:35"}
473
+ {"current_steps": 473, "total_steps": 546, "loss": 0.4406, "lr": 5.500619330840829e-07, "epoch": 2.585499316005472, "percentage": 86.63, "elapsed_time": "14:19:59", "remaining_time": "2:12:43"}
474
+ {"current_steps": 474, "total_steps": 546, "loss": 0.4995, "lr": 5.35565358623375e-07, "epoch": 2.5909712722298224, "percentage": 86.81, "elapsed_time": "14:21:50", "remaining_time": "2:10:54"}
475
+ {"current_steps": 475, "total_steps": 546, "loss": 0.4685, "lr": 5.212515528315504e-07, "epoch": 2.5964432284541723, "percentage": 87.0, "elapsed_time": "14:23:37", "remaining_time": "2:09:05"}
476
+ {"current_steps": 476, "total_steps": 546, "loss": 0.5057, "lr": 5.071211016988753e-07, "epoch": 2.6019151846785227, "percentage": 87.18, "elapsed_time": "14:25:15", "remaining_time": "2:07:14"}
477
+ {"current_steps": 477, "total_steps": 546, "loss": 0.4893, "lr": 4.931745837092888e-07, "epoch": 2.6073871409028726, "percentage": 87.36, "elapsed_time": "14:27:06", "remaining_time": "2:05:25"}
478
+ {"current_steps": 478, "total_steps": 546, "loss": 0.4931, "lr": 4.794125698167262e-07, "epoch": 2.612859097127223, "percentage": 87.55, "elapsed_time": "14:28:49", "remaining_time": "2:03:35"}
479
+ {"current_steps": 479, "total_steps": 546, "loss": 0.5162, "lr": 4.658356234217437e-07, "epoch": 2.6183310533515733, "percentage": 87.73, "elapsed_time": "14:30:26", "remaining_time": "2:01:45"}
480
+ {"current_steps": 480, "total_steps": 546, "loss": 0.5098, "lr": 4.5244430034845466e-07, "epoch": 2.6238030095759233, "percentage": 87.91, "elapsed_time": "14:31:50", "remaining_time": "1:59:52"}
481
+ {"current_steps": 481, "total_steps": 546, "loss": 0.5566, "lr": 4.3923914882177124e-07, "epoch": 2.6292749658002736, "percentage": 88.1, "elapsed_time": "14:33:50", "remaining_time": "1:58:05"}
482
+ {"current_steps": 482, "total_steps": 546, "loss": 0.4831, "lr": 4.262207094449633e-07, "epoch": 2.6347469220246236, "percentage": 88.28, "elapsed_time": "14:35:06", "remaining_time": "1:56:11"}
483
+ {"current_steps": 483, "total_steps": 546, "loss": 0.4815, "lr": 4.1338951517752637e-07, "epoch": 2.640218878248974, "percentage": 88.46, "elapsed_time": "14:37:09", "remaining_time": "1:54:24"}
484
+ {"current_steps": 484, "total_steps": 546, "loss": 0.4281, "lr": 4.007460913133643e-07, "epoch": 2.6456908344733243, "percentage": 88.64, "elapsed_time": "14:38:44", "remaining_time": "1:52:33"}
485
+ {"current_steps": 485, "total_steps": 546, "loss": 0.4698, "lr": 3.8829095545928177e-07, "epoch": 2.6511627906976747, "percentage": 88.83, "elapsed_time": "14:40:32", "remaining_time": "1:50:44"}
486
+ {"current_steps": 486, "total_steps": 546, "loss": 0.4481, "lr": 3.760246175137938e-07, "epoch": 2.6566347469220246, "percentage": 89.01, "elapsed_time": "14:42:35", "remaining_time": "1:48:57"}
487
+ {"current_steps": 487, "total_steps": 546, "loss": 0.4609, "lr": 3.639475796462577e-07, "epoch": 2.662106703146375, "percentage": 89.19, "elapsed_time": "14:44:45", "remaining_time": "1:47:11"}
488
+ {"current_steps": 488, "total_steps": 546, "loss": 0.4648, "lr": 3.5206033627630145e-07, "epoch": 2.667578659370725, "percentage": 89.38, "elapsed_time": "14:46:42", "remaining_time": "1:45:23"}
489
+ {"current_steps": 489, "total_steps": 546, "loss": 0.4802, "lr": 3.403633740535983e-07, "epoch": 2.6730506155950753, "percentage": 89.56, "elapsed_time": "14:48:28", "remaining_time": "1:43:33"}
490
+ {"current_steps": 490, "total_steps": 546, "loss": 0.4876, "lr": 3.2885717183793296e-07, "epoch": 2.6785225718194257, "percentage": 89.74, "elapsed_time": "14:50:14", "remaining_time": "1:41:44"}
491
+ {"current_steps": 491, "total_steps": 546, "loss": 0.5916, "lr": 3.175422006796031e-07, "epoch": 2.6839945280437756, "percentage": 89.93, "elapsed_time": "14:51:27", "remaining_time": "1:39:51"}
492
+ {"current_steps": 492, "total_steps": 546, "loss": 0.5125, "lr": 3.064189238001325e-07, "epoch": 2.689466484268126, "percentage": 90.11, "elapsed_time": "14:53:22", "remaining_time": "1:38:03"}
493
+ {"current_steps": 493, "total_steps": 546, "loss": 0.4823, "lr": 2.9548779657330605e-07, "epoch": 2.694938440492476, "percentage": 90.29, "elapsed_time": "14:54:45", "remaining_time": "1:36:11"}
494
+ {"current_steps": 494, "total_steps": 546, "loss": 0.4857, "lr": 2.847492665065349e-07, "epoch": 2.7004103967168263, "percentage": 90.48, "elapsed_time": "14:56:20", "remaining_time": "1:34:21"}
495
+ {"current_steps": 495, "total_steps": 546, "loss": 0.4717, "lr": 2.742037732225228e-07, "epoch": 2.7058823529411766, "percentage": 90.66, "elapsed_time": "14:57:36", "remaining_time": "1:32:28"}
496
+ {"current_steps": 496, "total_steps": 546, "loss": 0.4976, "lr": 2.6385174844128337e-07, "epoch": 2.7113543091655266, "percentage": 90.84, "elapsed_time": "14:59:34", "remaining_time": "1:30:40"}
497
+ {"current_steps": 497, "total_steps": 546, "loss": 0.484, "lr": 2.5369361596245366e-07, "epoch": 2.716826265389877, "percentage": 91.03, "elapsed_time": "15:01:01", "remaining_time": "1:28:49"}
498
+ {"current_steps": 498, "total_steps": 546, "loss": 0.6527, "lr": 2.4372979164795306e-07, "epoch": 2.722298221614227, "percentage": 91.21, "elapsed_time": "15:03:02", "remaining_time": "1:27:02"}
499
+ {"current_steps": 499, "total_steps": 546, "loss": 0.4795, "lr": 2.3396068340495182e-07, "epoch": 2.7277701778385772, "percentage": 91.39, "elapsed_time": "15:04:54", "remaining_time": "1:25:13"}
500
+ {"current_steps": 500, "total_steps": 546, "loss": 0.5174, "lr": 2.2438669116917612e-07, "epoch": 2.7332421340629276, "percentage": 91.58, "elapsed_time": "15:05:58", "remaining_time": "1:23:20"}
501
+ {"current_steps": 501, "total_steps": 546, "loss": 0.4473, "lr": 2.1500820688853562e-07, "epoch": 2.738714090287278, "percentage": 91.76, "elapsed_time": "15:07:34", "remaining_time": "1:21:31"}
502
+ {"current_steps": 502, "total_steps": 546, "loss": 0.4801, "lr": 2.0582561450707027e-07, "epoch": 2.744186046511628, "percentage": 91.94, "elapsed_time": "15:09:06", "remaining_time": "1:19:40"}
503
+ {"current_steps": 503, "total_steps": 546, "loss": 0.5184, "lr": 1.9683928994924383e-07, "epoch": 2.7496580027359783, "percentage": 92.12, "elapsed_time": "15:10:26", "remaining_time": "1:17:49"}
504
+ {"current_steps": 504, "total_steps": 546, "loss": 0.4947, "lr": 1.8804960110454406e-07, "epoch": 2.755129958960328, "percentage": 92.31, "elapsed_time": "15:12:41", "remaining_time": "1:16:03"}
505
+ {"current_steps": 505, "total_steps": 546, "loss": 0.5058, "lr": 1.7945690781242752e-07, "epoch": 2.7606019151846786, "percentage": 92.49, "elapsed_time": "15:14:37", "remaining_time": "1:14:15"}
506
+ {"current_steps": 506, "total_steps": 546, "loss": 0.4957, "lr": 1.7106156184758248e-07, "epoch": 2.766073871409029, "percentage": 92.67, "elapsed_time": "15:16:34", "remaining_time": "1:12:27"}
507
+ {"current_steps": 507, "total_steps": 546, "loss": 0.4932, "lr": 1.62863906905536e-07, "epoch": 2.771545827633379, "percentage": 92.86, "elapsed_time": "15:17:58", "remaining_time": "1:10:36"}
508
+ {"current_steps": 508, "total_steps": 546, "loss": 0.5382, "lr": 1.5486427858857567e-07, "epoch": 2.7770177838577292, "percentage": 93.04, "elapsed_time": "15:19:55", "remaining_time": "1:08:48"}
509
+ {"current_steps": 509, "total_steps": 546, "loss": 0.532, "lr": 1.4706300439201348e-07, "epoch": 2.782489740082079, "percentage": 93.22, "elapsed_time": "15:21:32", "remaining_time": "1:06:59"}
510
+ {"current_steps": 510, "total_steps": 546, "loss": 0.4758, "lr": 1.394604036907804e-07, "epoch": 2.7879616963064295, "percentage": 93.41, "elapsed_time": "15:23:35", "remaining_time": "1:05:11"}
511
+ {"current_steps": 511, "total_steps": 546, "loss": 0.5132, "lr": 1.320567877263479e-07, "epoch": 2.79343365253078, "percentage": 93.59, "elapsed_time": "15:25:35", "remaining_time": "1:03:23"}
512
+ {"current_steps": 512, "total_steps": 546, "loss": 0.4615, "lr": 1.2485245959398928e-07, "epoch": 2.79890560875513, "percentage": 93.77, "elapsed_time": "15:27:59", "remaining_time": "1:01:37"}
513
+ {"current_steps": 513, "total_steps": 546, "loss": 0.4846, "lr": 1.17847714230368e-07, "epoch": 2.80437756497948, "percentage": 93.96, "elapsed_time": "15:29:26", "remaining_time": "0:59:47"}
514
+ {"current_steps": 514, "total_steps": 546, "loss": 0.47, "lr": 1.1104283840146834e-07, "epoch": 2.80984952120383, "percentage": 94.14, "elapsed_time": "15:31:29", "remaining_time": "0:57:59"}
515
+ {"current_steps": 515, "total_steps": 546, "loss": 0.672, "lr": 1.044381106908493e-07, "epoch": 2.8153214774281805, "percentage": 94.32, "elapsed_time": "15:33:39", "remaining_time": "0:56:12"}
516
+ {"current_steps": 516, "total_steps": 546, "loss": 0.5008, "lr": 9.803380148824371e-08, "epoch": 2.820793433652531, "percentage": 94.51, "elapsed_time": "15:35:14", "remaining_time": "0:54:22"}
517
+ {"current_steps": 517, "total_steps": 546, "loss": 0.4817, "lr": 9.18301729784904e-08, "epoch": 2.8262653898768813, "percentage": 94.69, "elapsed_time": "15:36:40", "remaining_time": "0:52:32"}
518
+ {"current_steps": 518, "total_steps": 546, "loss": 0.5053, "lr": 8.582747913079448e-08, "epoch": 2.831737346101231, "percentage": 94.87, "elapsed_time": "15:38:40", "remaining_time": "0:50:44"}
519
+ {"current_steps": 519, "total_steps": 546, "loss": 0.4637, "lr": 8.00259656883362e-08, "epoch": 2.8372093023255816, "percentage": 95.05, "elapsed_time": "15:40:57", "remaining_time": "0:48:57"}
520
+ {"current_steps": 520, "total_steps": 546, "loss": 0.4491, "lr": 7.442587015820734e-08, "epoch": 2.8426812585499315, "percentage": 95.24, "elapsed_time": "15:43:05", "remaining_time": "0:47:09"}
521
+ {"current_steps": 521, "total_steps": 546, "loss": 0.5315, "lr": 6.902742180168953e-08, "epoch": 2.848153214774282, "percentage": 95.42, "elapsed_time": "15:44:35", "remaining_time": "0:45:19"}
522
+ {"current_steps": 522, "total_steps": 546, "loss": 0.4774, "lr": 6.38308416248673e-08, "epoch": 2.853625170998632, "percentage": 95.6, "elapsed_time": "15:46:26", "remaining_time": "0:43:30"}
523
+ {"current_steps": 523, "total_steps": 546, "loss": 0.479, "lr": 5.883634236958091e-08, "epoch": 2.859097127222982, "percentage": 95.79, "elapsed_time": "15:47:50", "remaining_time": "0:41:40"}
524
+ {"current_steps": 524, "total_steps": 546, "loss": 0.441, "lr": 5.4044128504717186e-08, "epoch": 2.8645690834473325, "percentage": 95.97, "elapsed_time": "15:50:01", "remaining_time": "0:39:53"}
525
+ {"current_steps": 525, "total_steps": 546, "loss": 0.5298, "lr": 4.945439621783843e-08, "epoch": 2.8700410396716824, "percentage": 96.15, "elapsed_time": "15:51:39", "remaining_time": "0:38:03"}
526
+ {"current_steps": 526, "total_steps": 546, "loss": 0.5647, "lr": 4.506733340714997e-08, "epoch": 2.875512995896033, "percentage": 96.34, "elapsed_time": "15:53:14", "remaining_time": "0:36:14"}
527
+ {"current_steps": 527, "total_steps": 546, "loss": 0.5675, "lr": 4.08831196738102e-08, "epoch": 2.880984952120383, "percentage": 96.52, "elapsed_time": "15:54:34", "remaining_time": "0:34:24"}
528
+ {"current_steps": 528, "total_steps": 546, "loss": 0.5109, "lr": 3.69019263145759e-08, "epoch": 2.886456908344733, "percentage": 96.7, "elapsed_time": "15:56:28", "remaining_time": "0:32:36"}
529
+ {"current_steps": 529, "total_steps": 546, "loss": 0.4531, "lr": 3.312391631479006e-08, "epoch": 2.8919288645690835, "percentage": 96.89, "elapsed_time": "15:57:48", "remaining_time": "0:30:46"}
530
+ {"current_steps": 530, "total_steps": 546, "loss": 0.5175, "lr": 2.9549244341708917e-08, "epoch": 2.8974008207934334, "percentage": 97.07, "elapsed_time": "15:58:56", "remaining_time": "0:28:56"}
531
+ {"current_steps": 531, "total_steps": 546, "loss": 0.4984, "lr": 2.6178056738170866e-08, "epoch": 2.902872777017784, "percentage": 97.25, "elapsed_time": "16:00:56", "remaining_time": "0:27:08"}
532
+ {"current_steps": 532, "total_steps": 546, "loss": 0.5347, "lr": 2.301049151660628e-08, "epoch": 2.908344733242134, "percentage": 97.44, "elapsed_time": "16:02:12", "remaining_time": "0:25:19"}
533
+ {"current_steps": 533, "total_steps": 546, "loss": 0.5113, "lr": 2.0046678353384254e-08, "epoch": 2.9138166894664845, "percentage": 97.62, "elapsed_time": "16:03:49", "remaining_time": "0:23:30"}
534
+ {"current_steps": 534, "total_steps": 546, "loss": 0.4774, "lr": 1.7286738583507935e-08, "epoch": 2.9192886456908345, "percentage": 97.8, "elapsed_time": "16:06:17", "remaining_time": "0:21:42"}
535
+ {"current_steps": 535, "total_steps": 546, "loss": 0.4891, "lr": 1.4730785195643527e-08, "epoch": 2.924760601915185, "percentage": 97.99, "elapsed_time": "16:07:51", "remaining_time": "0:19:53"}
536
+ {"current_steps": 536, "total_steps": 546, "loss": 0.4572, "lr": 1.2378922827496198e-08, "epoch": 2.9302325581395348, "percentage": 98.17, "elapsed_time": "16:09:53", "remaining_time": "0:18:05"}
537
+ {"current_steps": 537, "total_steps": 546, "loss": 0.4398, "lr": 1.0231247761528507e-08, "epoch": 2.935704514363885, "percentage": 98.35, "elapsed_time": "16:12:11", "remaining_time": "0:16:17"}
538
+ {"current_steps": 538, "total_steps": 546, "loss": 0.4239, "lr": 8.287847921013558e-09, "epoch": 2.9411764705882355, "percentage": 98.53, "elapsed_time": "16:13:40", "remaining_time": "0:14:28"}
539
+ {"current_steps": 539, "total_steps": 546, "loss": 0.5259, "lr": 6.548802866441218e-09, "epoch": 2.9466484268125854, "percentage": 98.72, "elapsed_time": "16:15:03", "remaining_time": "0:12:39"}
540
+ {"current_steps": 540, "total_steps": 546, "loss": 0.5069, "lr": 5.014183792256266e-09, "epoch": 2.952120383036936, "percentage": 98.9, "elapsed_time": "16:16:34", "remaining_time": "0:10:51"}
541
+ {"current_steps": 541, "total_steps": 546, "loss": 0.4951, "lr": 3.6840535239474063e-09, "epoch": 2.9575923392612857, "percentage": 99.08, "elapsed_time": "16:17:59", "remaining_time": "0:09:02"}
542
+ {"current_steps": 542, "total_steps": 546, "loss": 0.4817, "lr": 2.5584665154732015e-09, "epoch": 2.963064295485636, "percentage": 99.27, "elapsed_time": "16:19:49", "remaining_time": "0:07:13"}
543
+ {"current_steps": 543, "total_steps": 546, "loss": 0.5063, "lr": 1.6374688470327526e-09, "epoch": 2.9685362517099865, "percentage": 99.45, "elapsed_time": "16:21:43", "remaining_time": "0:05:25"}
544
+ {"current_steps": 544, "total_steps": 546, "loss": 0.5241, "lr": 9.210982231805388e-10, "epoch": 2.9740082079343364, "percentage": 99.63, "elapsed_time": "16:23:37", "remaining_time": "0:03:36"}
545
+ {"current_steps": 545, "total_steps": 546, "loss": 0.5268, "lr": 4.093839712815406e-10, "epoch": 2.9794801641586868, "percentage": 99.82, "elapsed_time": "16:25:33", "remaining_time": "0:01:48"}
546
+ {"current_steps": 546, "total_steps": 546, "loss": 0.4545, "lr": 1.0234704031220066e-10, "epoch": 2.9849521203830367, "percentage": 100.0, "elapsed_time": "16:27:29", "remaining_time": "0:00:00"}
547
+ {"current_steps": 546, "total_steps": 546, "epoch": 2.9849521203830367, "percentage": 100.0, "elapsed_time": "16:29:56", "remaining_time": "0:00:00"}