Upload trainer_log.jsonl with huggingface_hub
Browse files- trainer_log.jsonl +163 -0
trainer_log.jsonl
ADDED
@@ -0,0 +1,163 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{"current_steps": 1, "total_steps": 162, "loss": 0.7616, "lr": 5.882352941176471e-07, "epoch": 0.03614457831325301, "percentage": 0.62, "elapsed_time": "0:02:00", "remaining_time": "5:23:12"}
|
2 |
+
{"current_steps": 2, "total_steps": 162, "loss": 0.7427, "lr": 1.1764705882352942e-06, "epoch": 0.07228915662650602, "percentage": 1.23, "elapsed_time": "0:04:03", "remaining_time": "5:24:40"}
|
3 |
+
{"current_steps": 3, "total_steps": 162, "loss": 0.744, "lr": 1.7647058823529414e-06, "epoch": 0.10843373493975904, "percentage": 1.85, "elapsed_time": "0:05:59", "remaining_time": "5:17:10"}
|
4 |
+
{"current_steps": 4, "total_steps": 162, "loss": 0.7432, "lr": 2.3529411764705885e-06, "epoch": 0.14457831325301204, "percentage": 2.47, "elapsed_time": "0:07:39", "remaining_time": "5:02:34"}
|
5 |
+
{"current_steps": 5, "total_steps": 162, "loss": 0.7608, "lr": 2.9411764705882355e-06, "epoch": 0.18072289156626506, "percentage": 3.09, "elapsed_time": "0:09:10", "remaining_time": "4:48:15"}
|
6 |
+
{"current_steps": 6, "total_steps": 162, "loss": 0.7493, "lr": 3.529411764705883e-06, "epoch": 0.21686746987951808, "percentage": 3.7, "elapsed_time": "0:10:50", "remaining_time": "4:41:49"}
|
7 |
+
{"current_steps": 7, "total_steps": 162, "loss": 0.7395, "lr": 4.11764705882353e-06, "epoch": 0.25301204819277107, "percentage": 4.32, "elapsed_time": "0:12:34", "remaining_time": "4:38:16"}
|
8 |
+
{"current_steps": 8, "total_steps": 162, "loss": 0.7363, "lr": 4.705882352941177e-06, "epoch": 0.2891566265060241, "percentage": 4.94, "elapsed_time": "0:14:17", "remaining_time": "4:35:14"}
|
9 |
+
{"current_steps": 9, "total_steps": 162, "loss": 0.7224, "lr": 5.294117647058824e-06, "epoch": 0.3253012048192771, "percentage": 5.56, "elapsed_time": "0:15:49", "remaining_time": "4:29:08"}
|
10 |
+
{"current_steps": 10, "total_steps": 162, "loss": 0.7079, "lr": 5.882352941176471e-06, "epoch": 0.3614457831325301, "percentage": 6.17, "elapsed_time": "0:17:29", "remaining_time": "4:25:45"}
|
11 |
+
{"current_steps": 11, "total_steps": 162, "loss": 0.6976, "lr": 6.470588235294119e-06, "epoch": 0.39759036144578314, "percentage": 6.79, "elapsed_time": "0:18:59", "remaining_time": "4:20:46"}
|
12 |
+
{"current_steps": 12, "total_steps": 162, "loss": 0.6877, "lr": 7.058823529411766e-06, "epoch": 0.43373493975903615, "percentage": 7.41, "elapsed_time": "0:20:46", "remaining_time": "4:19:38"}
|
13 |
+
{"current_steps": 13, "total_steps": 162, "loss": 0.6651, "lr": 7.647058823529411e-06, "epoch": 0.46987951807228917, "percentage": 8.02, "elapsed_time": "0:22:41", "remaining_time": "4:20:05"}
|
14 |
+
{"current_steps": 14, "total_steps": 162, "loss": 0.6765, "lr": 8.23529411764706e-06, "epoch": 0.5060240963855421, "percentage": 8.64, "elapsed_time": "0:24:46", "remaining_time": "4:21:53"}
|
15 |
+
{"current_steps": 15, "total_steps": 162, "loss": 0.6804, "lr": 8.823529411764707e-06, "epoch": 0.5421686746987951, "percentage": 9.26, "elapsed_time": "0:26:30", "remaining_time": "4:19:47"}
|
16 |
+
{"current_steps": 16, "total_steps": 162, "loss": 0.6565, "lr": 9.411764705882354e-06, "epoch": 0.5783132530120482, "percentage": 9.88, "elapsed_time": "0:28:10", "remaining_time": "4:17:04"}
|
17 |
+
{"current_steps": 17, "total_steps": 162, "loss": 0.6346, "lr": 1e-05, "epoch": 0.6144578313253012, "percentage": 10.49, "elapsed_time": "0:30:05", "remaining_time": "4:16:41"}
|
18 |
+
{"current_steps": 18, "total_steps": 162, "loss": 0.669, "lr": 9.99882649009242e-06, "epoch": 0.6506024096385542, "percentage": 11.11, "elapsed_time": "0:31:35", "remaining_time": "4:12:42"}
|
19 |
+
{"current_steps": 19, "total_steps": 162, "loss": 0.6494, "lr": 9.995306511219885e-06, "epoch": 0.6867469879518072, "percentage": 11.73, "elapsed_time": "0:33:21", "remaining_time": "4:11:00"}
|
20 |
+
{"current_steps": 20, "total_steps": 162, "loss": 0.6397, "lr": 9.989441715674422e-06, "epoch": 0.7228915662650602, "percentage": 12.35, "elapsed_time": "0:35:06", "remaining_time": "4:09:16"}
|
21 |
+
{"current_steps": 21, "total_steps": 162, "loss": 0.645, "lr": 9.981234856414306e-06, "epoch": 0.7590361445783133, "percentage": 12.96, "elapsed_time": "0:37:23", "remaining_time": "4:11:00"}
|
22 |
+
{"current_steps": 22, "total_steps": 162, "loss": 0.6516, "lr": 9.970689785771798e-06, "epoch": 0.7951807228915663, "percentage": 13.58, "elapsed_time": "0:38:56", "remaining_time": "4:07:47"}
|
23 |
+
{"current_steps": 23, "total_steps": 162, "loss": 0.6296, "lr": 9.957811453644848e-06, "epoch": 0.8313253012048193, "percentage": 14.2, "elapsed_time": "0:40:39", "remaining_time": "4:05:44"}
|
24 |
+
{"current_steps": 24, "total_steps": 162, "loss": 0.6335, "lr": 9.942605905173593e-06, "epoch": 0.8674698795180723, "percentage": 14.81, "elapsed_time": "0:42:16", "remaining_time": "4:03:07"}
|
25 |
+
{"current_steps": 25, "total_steps": 162, "loss": 0.641, "lr": 9.925080277902743e-06, "epoch": 0.9036144578313253, "percentage": 15.43, "elapsed_time": "0:44:05", "remaining_time": "4:01:39"}
|
26 |
+
{"current_steps": 26, "total_steps": 162, "loss": 0.6236, "lr": 9.905242798431196e-06, "epoch": 0.9397590361445783, "percentage": 16.05, "elapsed_time": "0:46:02", "remaining_time": "4:00:50"}
|
27 |
+
{"current_steps": 27, "total_steps": 162, "loss": 0.6434, "lr": 9.883102778550434e-06, "epoch": 0.9759036144578314, "percentage": 16.67, "elapsed_time": "0:47:52", "remaining_time": "3:59:23"}
|
28 |
+
{"current_steps": 28, "total_steps": 162, "loss": 1.2338, "lr": 9.858670610873528e-06, "epoch": 1.036144578313253, "percentage": 17.28, "elapsed_time": "0:50:05", "remaining_time": "3:59:44"}
|
29 |
+
{"current_steps": 29, "total_steps": 162, "loss": 0.5655, "lr": 9.831957763956814e-06, "epoch": 1.072289156626506, "percentage": 17.9, "elapsed_time": "0:54:21", "remaining_time": "4:09:19"}
|
30 |
+
{"current_steps": 30, "total_steps": 162, "loss": 0.5669, "lr": 9.802976776916493e-06, "epoch": 1.108433734939759, "percentage": 18.52, "elapsed_time": "0:55:57", "remaining_time": "4:06:11"}
|
31 |
+
{"current_steps": 31, "total_steps": 162, "loss": 0.5765, "lr": 9.771741253542742e-06, "epoch": 1.144578313253012, "percentage": 19.14, "elapsed_time": "0:58:07", "remaining_time": "4:05:35"}
|
32 |
+
{"current_steps": 32, "total_steps": 162, "loss": 0.5701, "lr": 9.738265855914014e-06, "epoch": 1.180722891566265, "percentage": 19.75, "elapsed_time": "0:59:48", "remaining_time": "4:02:59"}
|
33 |
+
{"current_steps": 33, "total_steps": 162, "loss": 0.5825, "lr": 9.70256629751462e-06, "epoch": 1.216867469879518, "percentage": 20.37, "elapsed_time": "1:01:32", "remaining_time": "4:00:34"}
|
34 |
+
{"current_steps": 34, "total_steps": 162, "loss": 0.5575, "lr": 9.664659335858755e-06, "epoch": 1.2530120481927711, "percentage": 20.99, "elapsed_time": "1:03:27", "remaining_time": "3:58:55"}
|
35 |
+
{"current_steps": 35, "total_steps": 162, "loss": 0.5377, "lr": 9.624562764624445e-06, "epoch": 1.2891566265060241, "percentage": 21.6, "elapsed_time": "1:05:03", "remaining_time": "3:56:04"}
|
36 |
+
{"current_steps": 36, "total_steps": 162, "loss": 0.5801, "lr": 9.582295405301131e-06, "epoch": 1.3253012048192772, "percentage": 22.22, "elapsed_time": "1:06:42", "remaining_time": "3:53:27"}
|
37 |
+
{"current_steps": 37, "total_steps": 162, "loss": 0.5462, "lr": 9.537877098354787e-06, "epoch": 1.3614457831325302, "percentage": 22.84, "elapsed_time": "1:08:24", "remaining_time": "3:51:07"}
|
38 |
+
{"current_steps": 38, "total_steps": 162, "loss": 0.5689, "lr": 9.491328693914723e-06, "epoch": 1.3975903614457832, "percentage": 23.46, "elapsed_time": "1:10:19", "remaining_time": "3:49:28"}
|
39 |
+
{"current_steps": 39, "total_steps": 162, "loss": 0.5429, "lr": 9.442672041986456e-06, "epoch": 1.4337349397590362, "percentage": 24.07, "elapsed_time": "1:11:47", "remaining_time": "3:46:26"}
|
40 |
+
{"current_steps": 40, "total_steps": 162, "loss": 0.5554, "lr": 9.391929982195233e-06, "epoch": 1.4698795180722892, "percentage": 24.69, "elapsed_time": "1:13:14", "remaining_time": "3:43:23"}
|
41 |
+
{"current_steps": 41, "total_steps": 162, "loss": 0.5513, "lr": 9.339126333065008e-06, "epoch": 1.5060240963855422, "percentage": 25.31, "elapsed_time": "1:14:47", "remaining_time": "3:40:42"}
|
42 |
+
{"current_steps": 42, "total_steps": 162, "loss": 0.5419, "lr": 9.284285880837947e-06, "epoch": 1.5421686746987953, "percentage": 25.93, "elapsed_time": "1:16:38", "remaining_time": "3:38:58"}
|
43 |
+
{"current_steps": 43, "total_steps": 162, "loss": 0.5504, "lr": 9.22743436783966e-06, "epoch": 1.5783132530120483, "percentage": 26.54, "elapsed_time": "1:18:18", "remaining_time": "3:36:43"}
|
44 |
+
{"current_steps": 44, "total_steps": 162, "loss": 0.5435, "lr": 9.168598480395653e-06, "epoch": 1.6144578313253013, "percentage": 27.16, "elapsed_time": "1:19:51", "remaining_time": "3:34:08"}
|
45 |
+
{"current_steps": 45, "total_steps": 162, "loss": 0.5437, "lr": 9.107805836304658e-06, "epoch": 1.6506024096385543, "percentage": 27.78, "elapsed_time": "1:21:32", "remaining_time": "3:32:01"}
|
46 |
+
{"current_steps": 46, "total_steps": 162, "loss": 0.5485, "lr": 9.045084971874738e-06, "epoch": 1.6867469879518073, "percentage": 28.4, "elapsed_time": "1:23:21", "remaining_time": "3:30:11"}
|
47 |
+
{"current_steps": 47, "total_steps": 162, "loss": 0.5498, "lr": 8.98046532852822e-06, "epoch": 1.7228915662650603, "percentage": 29.01, "elapsed_time": "1:25:01", "remaining_time": "3:28:03"}
|
48 |
+
{"current_steps": 48, "total_steps": 162, "loss": 0.54, "lr": 8.91397723898178e-06, "epoch": 1.7590361445783134, "percentage": 29.63, "elapsed_time": "1:26:54", "remaining_time": "3:26:25"}
|
49 |
+
{"current_steps": 49, "total_steps": 162, "loss": 0.5558, "lr": 8.845651913008145e-06, "epoch": 1.7951807228915664, "percentage": 30.25, "elapsed_time": "1:28:44", "remaining_time": "3:24:38"}
|
50 |
+
{"current_steps": 50, "total_steps": 162, "loss": 0.5356, "lr": 8.775521422786104e-06, "epoch": 1.8313253012048194, "percentage": 30.86, "elapsed_time": "1:30:17", "remaining_time": "3:22:14"}
|
51 |
+
{"current_steps": 51, "total_steps": 162, "loss": 0.532, "lr": 8.703618687845697e-06, "epoch": 1.8674698795180724, "percentage": 31.48, "elapsed_time": "1:32:20", "remaining_time": "3:20:58"}
|
52 |
+
{"current_steps": 52, "total_steps": 162, "loss": 0.5414, "lr": 8.629977459615655e-06, "epoch": 1.9036144578313254, "percentage": 32.1, "elapsed_time": "1:33:53", "remaining_time": "3:18:37"}
|
53 |
+
{"current_steps": 53, "total_steps": 162, "loss": 0.5625, "lr": 8.554632305580355e-06, "epoch": 1.9397590361445785, "percentage": 32.72, "elapsed_time": "1:35:46", "remaining_time": "3:16:57"}
|
54 |
+
{"current_steps": 54, "total_steps": 162, "loss": 0.5483, "lr": 8.477618593053693e-06, "epoch": 1.9759036144578315, "percentage": 33.33, "elapsed_time": "1:37:21", "remaining_time": "3:14:42"}
|
55 |
+
{"current_steps": 55, "total_steps": 162, "loss": 0.9698, "lr": 8.39897247257754e-06, "epoch": 2.036144578313253, "percentage": 33.95, "elapsed_time": "1:39:29", "remaining_time": "3:13:33"}
|
56 |
+
{"current_steps": 56, "total_steps": 162, "loss": 0.4964, "lr": 8.318730860952523e-06, "epoch": 2.072289156626506, "percentage": 34.57, "elapsed_time": "1:41:25", "remaining_time": "3:11:59"}
|
57 |
+
{"current_steps": 57, "total_steps": 162, "loss": 0.468, "lr": 8.23693142390914e-06, "epoch": 2.108433734939759, "percentage": 35.19, "elapsed_time": "1:45:49", "remaining_time": "3:14:57"}
|
58 |
+
{"current_steps": 58, "total_steps": 162, "loss": 0.4674, "lr": 8.153612558427311e-06, "epoch": 2.144578313253012, "percentage": 35.8, "elapsed_time": "1:47:43", "remaining_time": "3:13:08"}
|
59 |
+
{"current_steps": 59, "total_steps": 162, "loss": 0.46, "lr": 8.068813374712689e-06, "epoch": 2.180722891566265, "percentage": 36.42, "elapsed_time": "1:49:15", "remaining_time": "3:10:43"}
|
60 |
+
{"current_steps": 60, "total_steps": 162, "loss": 0.4591, "lr": 7.982573677838172e-06, "epoch": 2.216867469879518, "percentage": 37.04, "elapsed_time": "1:50:58", "remaining_time": "3:08:40"}
|
61 |
+
{"current_steps": 61, "total_steps": 162, "loss": 0.4656, "lr": 7.894933949059245e-06, "epoch": 2.253012048192771, "percentage": 37.65, "elapsed_time": "1:52:49", "remaining_time": "3:06:49"}
|
62 |
+
{"current_steps": 62, "total_steps": 162, "loss": 0.4669, "lr": 7.805935326811913e-06, "epoch": 2.289156626506024, "percentage": 38.27, "elapsed_time": "1:54:30", "remaining_time": "3:04:41"}
|
63 |
+
{"current_steps": 63, "total_steps": 162, "loss": 0.4774, "lr": 7.715619587402165e-06, "epoch": 2.325301204819277, "percentage": 38.89, "elapsed_time": "1:56:21", "remaining_time": "3:02:50"}
|
64 |
+
{"current_steps": 64, "total_steps": 162, "loss": 0.4386, "lr": 7.624029125396004e-06, "epoch": 2.36144578313253, "percentage": 39.51, "elapsed_time": "1:58:25", "remaining_time": "3:01:19"}
|
65 |
+
{"current_steps": 65, "total_steps": 162, "loss": 0.4412, "lr": 7.53120693371927e-06, "epoch": 2.397590361445783, "percentage": 40.12, "elapsed_time": "2:00:05", "remaining_time": "2:59:12"}
|
66 |
+
{"current_steps": 66, "total_steps": 162, "loss": 0.4442, "lr": 7.437196583476597e-06, "epoch": 2.433734939759036, "percentage": 40.74, "elapsed_time": "2:01:44", "remaining_time": "2:57:04"}
|
67 |
+
{"current_steps": 67, "total_steps": 162, "loss": 0.4664, "lr": 7.342042203498952e-06, "epoch": 2.4698795180722892, "percentage": 41.36, "elapsed_time": "2:03:15", "remaining_time": "2:54:45"}
|
68 |
+
{"current_steps": 68, "total_steps": 162, "loss": 0.4386, "lr": 7.245788459629397e-06, "epoch": 2.5060240963855422, "percentage": 41.98, "elapsed_time": "2:04:58", "remaining_time": "2:52:45"}
|
69 |
+
{"current_steps": 69, "total_steps": 162, "loss": 0.4406, "lr": 7.148480533756759e-06, "epoch": 2.5421686746987953, "percentage": 42.59, "elapsed_time": "2:06:22", "remaining_time": "2:50:20"}
|
70 |
+
{"current_steps": 70, "total_steps": 162, "loss": 0.4568, "lr": 7.050164102607081e-06, "epoch": 2.5783132530120483, "percentage": 43.21, "elapsed_time": "2:08:23", "remaining_time": "2:48:45"}
|
71 |
+
{"current_steps": 71, "total_steps": 162, "loss": 0.4193, "lr": 6.950885316302773e-06, "epoch": 2.6144578313253013, "percentage": 43.83, "elapsed_time": "2:10:15", "remaining_time": "2:46:57"}
|
72 |
+
{"current_steps": 72, "total_steps": 162, "loss": 0.4265, "lr": 6.850690776699574e-06, "epoch": 2.6506024096385543, "percentage": 44.44, "elapsed_time": "2:11:57", "remaining_time": "2:44:57"}
|
73 |
+
{"current_steps": 73, "total_steps": 162, "loss": 0.4544, "lr": 6.749627515511443e-06, "epoch": 2.6867469879518073, "percentage": 45.06, "elapsed_time": "2:13:34", "remaining_time": "2:42:51"}
|
74 |
+
{"current_steps": 74, "total_steps": 162, "loss": 0.435, "lr": 6.647742972233703e-06, "epoch": 2.7228915662650603, "percentage": 45.68, "elapsed_time": "2:15:00", "remaining_time": "2:40:32"}
|
75 |
+
{"current_steps": 75, "total_steps": 162, "loss": 0.4466, "lr": 6.545084971874738e-06, "epoch": 2.7590361445783134, "percentage": 46.3, "elapsed_time": "2:16:44", "remaining_time": "2:38:37"}
|
76 |
+
{"current_steps": 76, "total_steps": 162, "loss": 0.4189, "lr": 6.441701702506755e-06, "epoch": 2.7951807228915664, "percentage": 46.91, "elapsed_time": "2:18:32", "remaining_time": "2:36:46"}
|
77 |
+
{"current_steps": 77, "total_steps": 162, "loss": 0.419, "lr": 6.337641692646106e-06, "epoch": 2.8313253012048194, "percentage": 47.53, "elapsed_time": "2:20:00", "remaining_time": "2:34:33"}
|
78 |
+
{"current_steps": 78, "total_steps": 162, "loss": 0.4361, "lr": 6.2329537884738115e-06, "epoch": 2.8674698795180724, "percentage": 48.15, "elapsed_time": "2:21:42", "remaining_time": "2:32:37"}
|
79 |
+
{"current_steps": 79, "total_steps": 162, "loss": 0.4588, "lr": 6.127687130906972e-06, "epoch": 2.9036144578313254, "percentage": 48.77, "elapsed_time": "2:23:37", "remaining_time": "2:30:54"}
|
80 |
+
{"current_steps": 80, "total_steps": 162, "loss": 0.4462, "lr": 6.021891132531825e-06, "epoch": 2.9397590361445785, "percentage": 49.38, "elapsed_time": "2:25:07", "remaining_time": "2:28:45"}
|
81 |
+
{"current_steps": 81, "total_steps": 162, "loss": 0.4599, "lr": 5.915615454409281e-06, "epoch": 2.9759036144578315, "percentage": 50.0, "elapsed_time": "2:26:58", "remaining_time": "2:26:58"}
|
82 |
+
{"current_steps": 82, "total_steps": 162, "loss": 0.8681, "lr": 5.808909982763825e-06, "epoch": 3.036144578313253, "percentage": 50.62, "elapsed_time": "2:29:48", "remaining_time": "2:26:09"}
|
83 |
+
{"current_steps": 83, "total_steps": 162, "loss": 0.387, "lr": 5.701824805566722e-06, "epoch": 3.072289156626506, "percentage": 51.23, "elapsed_time": "2:31:48", "remaining_time": "2:24:29"}
|
84 |
+
{"current_steps": 84, "total_steps": 162, "loss": 0.3973, "lr": 5.594410189024533e-06, "epoch": 3.108433734939759, "percentage": 51.85, "elapsed_time": "2:33:26", "remaining_time": "2:22:28"}
|
85 |
+
{"current_steps": 85, "total_steps": 162, "loss": 0.3706, "lr": 5.4867165539839505e-06, "epoch": 3.144578313253012, "percentage": 52.47, "elapsed_time": "2:38:04", "remaining_time": "2:23:11"}
|
86 |
+
{"current_steps": 86, "total_steps": 162, "loss": 0.3647, "lr": 5.378794452264053e-06, "epoch": 3.180722891566265, "percentage": 53.09, "elapsed_time": "2:39:54", "remaining_time": "2:21:18"}
|
87 |
+
{"current_steps": 87, "total_steps": 162, "loss": 0.3568, "lr": 5.270694542927089e-06, "epoch": 3.216867469879518, "percentage": 53.7, "elapsed_time": "2:41:28", "remaining_time": "2:19:12"}
|
88 |
+
{"current_steps": 88, "total_steps": 162, "loss": 0.3512, "lr": 5.1624675684989035e-06, "epoch": 3.253012048192771, "percentage": 54.32, "elapsed_time": "2:43:36", "remaining_time": "2:17:34"}
|
89 |
+
{"current_steps": 89, "total_steps": 162, "loss": 0.3561, "lr": 5.054164331150199e-06, "epoch": 3.289156626506024, "percentage": 54.94, "elapsed_time": "2:45:38", "remaining_time": "2:15:51"}
|
90 |
+
{"current_steps": 90, "total_steps": 162, "loss": 0.358, "lr": 4.945835668849801e-06, "epoch": 3.325301204819277, "percentage": 55.56, "elapsed_time": "2:47:28", "remaining_time": "2:13:58"}
|
91 |
+
{"current_steps": 91, "total_steps": 162, "loss": 0.3673, "lr": 4.837532431501098e-06, "epoch": 3.36144578313253, "percentage": 56.17, "elapsed_time": "2:49:14", "remaining_time": "2:12:02"}
|
92 |
+
{"current_steps": 92, "total_steps": 162, "loss": 0.3534, "lr": 4.729305457072913e-06, "epoch": 3.397590361445783, "percentage": 56.79, "elapsed_time": "2:50:53", "remaining_time": "2:10:01"}
|
93 |
+
{"current_steps": 93, "total_steps": 162, "loss": 0.3623, "lr": 4.621205547735949e-06, "epoch": 3.433734939759036, "percentage": 57.41, "elapsed_time": "2:52:29", "remaining_time": "2:07:58"}
|
94 |
+
{"current_steps": 94, "total_steps": 162, "loss": 0.3408, "lr": 4.513283446016052e-06, "epoch": 3.4698795180722892, "percentage": 58.02, "elapsed_time": "2:54:00", "remaining_time": "2:05:52"}
|
95 |
+
{"current_steps": 95, "total_steps": 162, "loss": 0.3612, "lr": 4.4055898109754684e-06, "epoch": 3.5060240963855422, "percentage": 58.64, "elapsed_time": "2:55:54", "remaining_time": "2:04:03"}
|
96 |
+
{"current_steps": 96, "total_steps": 162, "loss": 0.3696, "lr": 4.298175194433279e-06, "epoch": 3.5421686746987953, "percentage": 59.26, "elapsed_time": "2:57:41", "remaining_time": "2:02:09"}
|
97 |
+
{"current_steps": 97, "total_steps": 162, "loss": 0.3652, "lr": 4.191090017236177e-06, "epoch": 3.5783132530120483, "percentage": 59.88, "elapsed_time": "2:59:21", "remaining_time": "2:00:11"}
|
98 |
+
{"current_steps": 98, "total_steps": 162, "loss": 0.3422, "lr": 4.0843845455907195e-06, "epoch": 3.6144578313253013, "percentage": 60.49, "elapsed_time": "3:00:59", "remaining_time": "1:58:12"}
|
99 |
+
{"current_steps": 99, "total_steps": 162, "loss": 0.3717, "lr": 3.9781088674681764e-06, "epoch": 3.6506024096385543, "percentage": 61.11, "elapsed_time": "3:02:36", "remaining_time": "1:56:12"}
|
100 |
+
{"current_steps": 100, "total_steps": 162, "loss": 0.3436, "lr": 3.87231286909303e-06, "epoch": 3.6867469879518073, "percentage": 61.73, "elapsed_time": "3:04:09", "remaining_time": "1:54:10"}
|
101 |
+
{"current_steps": 101, "total_steps": 162, "loss": 0.3584, "lr": 3.767046211526191e-06, "epoch": 3.7228915662650603, "percentage": 62.35, "elapsed_time": "3:05:49", "remaining_time": "1:52:13"}
|
102 |
+
{"current_steps": 102, "total_steps": 162, "loss": 0.3751, "lr": 3.662358307353897e-06, "epoch": 3.7590361445783134, "percentage": 62.96, "elapsed_time": "3:07:21", "remaining_time": "1:50:12"}
|
103 |
+
{"current_steps": 103, "total_steps": 162, "loss": 0.3578, "lr": 3.5582982974932467e-06, "epoch": 3.7951807228915664, "percentage": 63.58, "elapsed_time": "3:09:14", "remaining_time": "1:48:23"}
|
104 |
+
{"current_steps": 104, "total_steps": 162, "loss": 0.3504, "lr": 3.4549150281252635e-06, "epoch": 3.8313253012048194, "percentage": 64.2, "elapsed_time": "3:11:24", "remaining_time": "1:46:45"}
|
105 |
+
{"current_steps": 105, "total_steps": 162, "loss": 0.3371, "lr": 3.3522570277662986e-06, "epoch": 3.8674698795180724, "percentage": 64.81, "elapsed_time": "3:13:06", "remaining_time": "1:44:49"}
|
106 |
+
{"current_steps": 106, "total_steps": 162, "loss": 0.3565, "lr": 3.250372484488558e-06, "epoch": 3.9036144578313254, "percentage": 65.43, "elapsed_time": "3:14:52", "remaining_time": "1:42:56"}
|
107 |
+
{"current_steps": 107, "total_steps": 162, "loss": 0.3649, "lr": 3.149309223300428e-06, "epoch": 3.9397590361445785, "percentage": 66.05, "elapsed_time": "3:16:43", "remaining_time": "1:41:07"}
|
108 |
+
{"current_steps": 108, "total_steps": 162, "loss": 0.3413, "lr": 3.0491146836972273e-06, "epoch": 3.9759036144578315, "percentage": 66.67, "elapsed_time": "3:18:23", "remaining_time": "1:39:11"}
|
109 |
+
{"current_steps": 109, "total_steps": 162, "loss": 0.6546, "lr": 2.9498358973929197e-06, "epoch": 4.036144578313253, "percentage": 67.28, "elapsed_time": "3:20:37", "remaining_time": "1:37:33"}
|
110 |
+
{"current_steps": 110, "total_steps": 162, "loss": 0.32, "lr": 2.8515194662432423e-06, "epoch": 4.072289156626506, "percentage": 67.9, "elapsed_time": "3:22:14", "remaining_time": "1:35:36"}
|
111 |
+
{"current_steps": 111, "total_steps": 162, "loss": 0.3009, "lr": 2.7542115403706067e-06, "epoch": 4.108433734939759, "percentage": 68.52, "elapsed_time": "3:23:53", "remaining_time": "1:33:40"}
|
112 |
+
{"current_steps": 112, "total_steps": 162, "loss": 0.2888, "lr": 2.65795779650105e-06, "epoch": 4.144578313253012, "percentage": 69.14, "elapsed_time": "3:25:37", "remaining_time": "1:31:47"}
|
113 |
+
{"current_steps": 113, "total_steps": 162, "loss": 0.3289, "lr": 2.562803416523405e-06, "epoch": 4.180722891566265, "percentage": 69.75, "elapsed_time": "3:30:35", "remaining_time": "1:31:18"}
|
114 |
+
{"current_steps": 114, "total_steps": 162, "loss": 0.2918, "lr": 2.46879306628073e-06, "epoch": 4.216867469879518, "percentage": 70.37, "elapsed_time": "3:32:17", "remaining_time": "1:29:23"}
|
115 |
+
{"current_steps": 115, "total_steps": 162, "loss": 0.2918, "lr": 2.375970874603998e-06, "epoch": 4.253012048192771, "percentage": 70.99, "elapsed_time": "3:33:49", "remaining_time": "1:27:23"}
|
116 |
+
{"current_steps": 116, "total_steps": 162, "loss": 0.3083, "lr": 2.2843804125978356e-06, "epoch": 4.289156626506024, "percentage": 71.6, "elapsed_time": "3:35:36", "remaining_time": "1:25:29"}
|
117 |
+
{"current_steps": 117, "total_steps": 162, "loss": 0.2965, "lr": 2.1940646731880887e-06, "epoch": 4.325301204819277, "percentage": 72.22, "elapsed_time": "3:37:05", "remaining_time": "1:23:29"}
|
118 |
+
{"current_steps": 118, "total_steps": 162, "loss": 0.2753, "lr": 2.105066050940758e-06, "epoch": 4.36144578313253, "percentage": 72.84, "elapsed_time": "3:38:52", "remaining_time": "1:21:36"}
|
119 |
+
{"current_steps": 119, "total_steps": 162, "loss": 0.3069, "lr": 2.0174263221618307e-06, "epoch": 4.397590361445783, "percentage": 73.46, "elapsed_time": "3:40:37", "remaining_time": "1:19:43"}
|
120 |
+
{"current_steps": 120, "total_steps": 162, "loss": 0.2963, "lr": 1.931186625287313e-06, "epoch": 4.433734939759036, "percentage": 74.07, "elapsed_time": "3:42:18", "remaining_time": "1:17:48"}
|
121 |
+
{"current_steps": 121, "total_steps": 162, "loss": 0.2941, "lr": 1.8463874415726918e-06, "epoch": 4.469879518072289, "percentage": 74.69, "elapsed_time": "3:43:54", "remaining_time": "1:15:52"}
|
122 |
+
{"current_steps": 122, "total_steps": 162, "loss": 0.2933, "lr": 1.7630685760908623e-06, "epoch": 4.506024096385542, "percentage": 75.31, "elapsed_time": "3:45:53", "remaining_time": "1:14:03"}
|
123 |
+
{"current_steps": 123, "total_steps": 162, "loss": 0.312, "lr": 1.6812691390474788e-06, "epoch": 4.542168674698795, "percentage": 75.93, "elapsed_time": "3:47:44", "remaining_time": "1:12:12"}
|
124 |
+
{"current_steps": 124, "total_steps": 162, "loss": 0.2687, "lr": 1.6010275274224607e-06, "epoch": 4.578313253012048, "percentage": 76.54, "elapsed_time": "3:49:22", "remaining_time": "1:10:17"}
|
125 |
+
{"current_steps": 125, "total_steps": 162, "loss": 0.2856, "lr": 1.5223814069463077e-06, "epoch": 4.614457831325301, "percentage": 77.16, "elapsed_time": "3:51:15", "remaining_time": "1:08:27"}
|
126 |
+
{"current_steps": 126, "total_steps": 162, "loss": 0.2624, "lr": 1.4453676944196477e-06, "epoch": 4.650602409638554, "percentage": 77.78, "elapsed_time": "3:53:01", "remaining_time": "1:06:34"}
|
127 |
+
{"current_steps": 127, "total_steps": 162, "loss": 0.295, "lr": 1.370022540384347e-06, "epoch": 4.686746987951807, "percentage": 78.4, "elapsed_time": "3:54:55", "remaining_time": "1:04:44"}
|
128 |
+
{"current_steps": 128, "total_steps": 162, "loss": 0.2872, "lr": 1.296381312154305e-06, "epoch": 4.72289156626506, "percentage": 79.01, "elapsed_time": "3:56:31", "remaining_time": "1:02:49"}
|
129 |
+
{"current_steps": 129, "total_steps": 162, "loss": 0.289, "lr": 1.2244785772138972e-06, "epoch": 4.759036144578313, "percentage": 79.63, "elapsed_time": "3:58:26", "remaining_time": "1:00:59"}
|
130 |
+
{"current_steps": 130, "total_steps": 162, "loss": 0.2843, "lr": 1.1543480869918555e-06, "epoch": 4.795180722891566, "percentage": 80.25, "elapsed_time": "3:59:57", "remaining_time": "0:59:04"}
|
131 |
+
{"current_steps": 131, "total_steps": 162, "loss": 0.2841, "lr": 1.0860227610182222e-06, "epoch": 4.831325301204819, "percentage": 80.86, "elapsed_time": "4:01:48", "remaining_time": "0:57:13"}
|
132 |
+
{"current_steps": 132, "total_steps": 162, "loss": 0.2949, "lr": 1.0195346714717813e-06, "epoch": 4.867469879518072, "percentage": 81.48, "elapsed_time": "4:03:26", "remaining_time": "0:55:19"}
|
133 |
+
{"current_steps": 133, "total_steps": 162, "loss": 0.2935, "lr": 9.549150281252633e-07, "epoch": 4.903614457831325, "percentage": 82.1, "elapsed_time": "4:04:56", "remaining_time": "0:53:24"}
|
134 |
+
{"current_steps": 134, "total_steps": 162, "loss": 0.2852, "lr": 8.921941636953435e-07, "epoch": 4.9397590361445785, "percentage": 82.72, "elapsed_time": "4:06:31", "remaining_time": "0:51:30"}
|
135 |
+
{"current_steps": 135, "total_steps": 162, "loss": 0.3026, "lr": 8.314015196043501e-07, "epoch": 4.975903614457831, "percentage": 83.33, "elapsed_time": "4:08:30", "remaining_time": "0:49:42"}
|
136 |
+
{"current_steps": 136, "total_steps": 162, "loss": 0.5577, "lr": 7.725656321603414e-07, "epoch": 5.036144578313253, "percentage": 83.95, "elapsed_time": "4:11:32", "remaining_time": "0:48:05"}
|
137 |
+
{"current_steps": 137, "total_steps": 162, "loss": 0.2559, "lr": 7.157141191620548e-07, "epoch": 5.072289156626506, "percentage": 84.57, "elapsed_time": "4:13:18", "remaining_time": "0:46:13"}
|
138 |
+
{"current_steps": 138, "total_steps": 162, "loss": 0.2612, "lr": 6.60873666934993e-07, "epoch": 5.108433734939759, "percentage": 85.19, "elapsed_time": "4:15:08", "remaining_time": "0:44:22"}
|
139 |
+
{"current_steps": 139, "total_steps": 162, "loss": 0.2997, "lr": 6.080700178047688e-07, "epoch": 5.144578313253012, "percentage": 85.8, "elapsed_time": "4:16:55", "remaining_time": "0:42:30"}
|
140 |
+
{"current_steps": 140, "total_steps": 162, "loss": 0.2893, "lr": 5.573279580135438e-07, "epoch": 5.180722891566265, "percentage": 86.42, "elapsed_time": "4:18:53", "remaining_time": "0:40:41"}
|
141 |
+
{"current_steps": 141, "total_steps": 162, "loss": 0.2676, "lr": 5.086713060852788e-07, "epoch": 5.216867469879518, "percentage": 87.04, "elapsed_time": "4:23:11", "remaining_time": "0:39:11"}
|
142 |
+
{"current_steps": 142, "total_steps": 162, "loss": 0.2433, "lr": 4.6212290164521554e-07, "epoch": 5.253012048192771, "percentage": 87.65, "elapsed_time": "4:24:45", "remaining_time": "0:37:17"}
|
143 |
+
{"current_steps": 143, "total_steps": 162, "loss": 0.2898, "lr": 4.1770459469887003e-07, "epoch": 5.289156626506024, "percentage": 88.27, "elapsed_time": "4:26:26", "remaining_time": "0:35:24"}
|
144 |
+
{"current_steps": 144, "total_steps": 162, "loss": 0.2554, "lr": 3.754372353755559e-07, "epoch": 5.325301204819277, "percentage": 88.89, "elapsed_time": "4:27:59", "remaining_time": "0:33:29"}
|
145 |
+
{"current_steps": 145, "total_steps": 162, "loss": 0.2363, "lr": 3.35340664141246e-07, "epoch": 5.36144578313253, "percentage": 89.51, "elapsed_time": "4:29:40", "remaining_time": "0:31:37"}
|
146 |
+
{"current_steps": 146, "total_steps": 162, "loss": 0.2471, "lr": 2.974337024853802e-07, "epoch": 5.397590361445783, "percentage": 90.12, "elapsed_time": "4:31:14", "remaining_time": "0:29:43"}
|
147 |
+
{"current_steps": 147, "total_steps": 162, "loss": 0.2399, "lr": 2.617341440859883e-07, "epoch": 5.433734939759036, "percentage": 90.74, "elapsed_time": "4:32:40", "remaining_time": "0:27:49"}
|
148 |
+
{"current_steps": 148, "total_steps": 162, "loss": 0.2651, "lr": 2.2825874645725942e-07, "epoch": 5.469879518072289, "percentage": 91.36, "elapsed_time": "4:34:17", "remaining_time": "0:25:56"}
|
149 |
+
{"current_steps": 149, "total_steps": 162, "loss": 0.2525, "lr": 1.9702322308350675e-07, "epoch": 5.506024096385542, "percentage": 91.98, "elapsed_time": "4:36:01", "remaining_time": "0:24:04"}
|
150 |
+
{"current_steps": 150, "total_steps": 162, "loss": 0.2871, "lr": 1.6804223604318825e-07, "epoch": 5.542168674698795, "percentage": 92.59, "elapsed_time": "4:37:32", "remaining_time": "0:22:12"}
|
151 |
+
{"current_steps": 151, "total_steps": 162, "loss": 0.242, "lr": 1.413293891264722e-07, "epoch": 5.578313253012048, "percentage": 93.21, "elapsed_time": "4:39:15", "remaining_time": "0:20:20"}
|
152 |
+
{"current_steps": 152, "total_steps": 162, "loss": 0.2704, "lr": 1.1689722144956672e-07, "epoch": 5.614457831325301, "percentage": 93.83, "elapsed_time": "4:41:07", "remaining_time": "0:18:29"}
|
153 |
+
{"current_steps": 153, "total_steps": 162, "loss": 0.2681, "lr": 9.475720156880419e-08, "epoch": 5.650602409638554, "percentage": 94.44, "elapsed_time": "4:42:43", "remaining_time": "0:16:37"}
|
154 |
+
{"current_steps": 154, "total_steps": 162, "loss": 0.2789, "lr": 7.491972209725807e-08, "epoch": 5.686746987951807, "percentage": 95.06, "elapsed_time": "4:44:45", "remaining_time": "0:14:47"}
|
155 |
+
{"current_steps": 155, "total_steps": 162, "loss": 0.239, "lr": 5.739409482640956e-08, "epoch": 5.72289156626506, "percentage": 95.68, "elapsed_time": "4:46:33", "remaining_time": "0:12:56"}
|
156 |
+
{"current_steps": 156, "total_steps": 162, "loss": 0.2624, "lr": 4.2188546355153016e-08, "epoch": 5.759036144578313, "percentage": 96.3, "elapsed_time": "4:48:46", "remaining_time": "0:11:06"}
|
157 |
+
{"current_steps": 157, "total_steps": 162, "loss": 0.2616, "lr": 2.9310214228202016e-08, "epoch": 5.795180722891566, "percentage": 96.91, "elapsed_time": "4:50:29", "remaining_time": "0:09:15"}
|
158 |
+
{"current_steps": 158, "total_steps": 162, "loss": 0.2651, "lr": 1.8765143585693924e-08, "epoch": 5.831325301204819, "percentage": 97.53, "elapsed_time": "4:52:02", "remaining_time": "0:07:23"}
|
159 |
+
{"current_steps": 159, "total_steps": 162, "loss": 0.2655, "lr": 1.0558284325578038e-08, "epoch": 5.867469879518072, "percentage": 98.15, "elapsed_time": "4:53:34", "remaining_time": "0:05:32"}
|
160 |
+
{"current_steps": 160, "total_steps": 162, "loss": 0.2887, "lr": 4.69348878011644e-09, "epoch": 5.903614457831325, "percentage": 98.77, "elapsed_time": "4:55:33", "remaining_time": "0:03:41"}
|
161 |
+
{"current_steps": 161, "total_steps": 162, "loss": 0.278, "lr": 1.173509907579362e-09, "epoch": 5.9397590361445785, "percentage": 99.38, "elapsed_time": "4:57:14", "remaining_time": "0:01:50"}
|
162 |
+
{"current_steps": 162, "total_steps": 162, "loss": 0.2823, "lr": 0.0, "epoch": 5.975903614457831, "percentage": 100.0, "elapsed_time": "4:58:53", "remaining_time": "0:00:00"}
|
163 |
+
{"current_steps": 162, "total_steps": 162, "epoch": 5.975903614457831, "percentage": 100.0, "elapsed_time": "5:01:30", "remaining_time": "0:00:00"}
|