File size: 58,113 Bytes
0c4fbc9
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
{"current_steps": 1, "total_steps": 320, "loss": 0.508, "lr": 3.125e-06, "epoch": 0.00625, "percentage": 0.31, "elapsed_time": "0:00:27", "remaining_time": "2:25:16"}
{"current_steps": 2, "total_steps": 320, "loss": 0.3989, "lr": 6.25e-06, "epoch": 0.0125, "percentage": 0.62, "elapsed_time": "0:00:44", "remaining_time": "1:57:50"}
{"current_steps": 3, "total_steps": 320, "loss": 0.3526, "lr": 9.375000000000001e-06, "epoch": 0.01875, "percentage": 0.94, "elapsed_time": "0:01:01", "remaining_time": "1:48:31"}
{"current_steps": 4, "total_steps": 320, "loss": 0.3927, "lr": 1.25e-05, "epoch": 0.025, "percentage": 1.25, "elapsed_time": "0:01:18", "remaining_time": "1:43:44"}
{"current_steps": 5, "total_steps": 320, "loss": 0.3232, "lr": 1.5625e-05, "epoch": 0.03125, "percentage": 1.56, "elapsed_time": "0:01:35", "remaining_time": "1:40:47"}
{"current_steps": 6, "total_steps": 320, "loss": 0.3486, "lr": 1.8750000000000002e-05, "epoch": 0.0375, "percentage": 1.88, "elapsed_time": "0:01:53", "remaining_time": "1:38:42"}
{"current_steps": 7, "total_steps": 320, "loss": 0.3894, "lr": 2.1875e-05, "epoch": 0.04375, "percentage": 2.19, "elapsed_time": "0:02:10", "remaining_time": "1:37:07"}
{"current_steps": 8, "total_steps": 320, "loss": 0.3606, "lr": 2.5e-05, "epoch": 0.05, "percentage": 2.5, "elapsed_time": "0:02:27", "remaining_time": "1:35:52"}
{"current_steps": 9, "total_steps": 320, "loss": 0.3323, "lr": 2.8125000000000003e-05, "epoch": 0.05625, "percentage": 2.81, "elapsed_time": "0:02:44", "remaining_time": "1:34:48"}
{"current_steps": 10, "total_steps": 320, "loss": 0.3689, "lr": 3.125e-05, "epoch": 0.0625, "percentage": 3.12, "elapsed_time": "0:03:01", "remaining_time": "1:33:54"}
{"current_steps": 11, "total_steps": 320, "loss": 0.3825, "lr": 3.4375e-05, "epoch": 0.06875, "percentage": 3.44, "elapsed_time": "0:03:18", "remaining_time": "1:33:06"}
{"current_steps": 12, "total_steps": 320, "loss": 0.3368, "lr": 3.7500000000000003e-05, "epoch": 0.075, "percentage": 3.75, "elapsed_time": "0:03:35", "remaining_time": "1:32:23"}
{"current_steps": 13, "total_steps": 320, "loss": 0.3345, "lr": 4.0625000000000005e-05, "epoch": 0.08125, "percentage": 4.06, "elapsed_time": "0:03:53", "remaining_time": "1:31:44"}
{"current_steps": 14, "total_steps": 320, "loss": 0.3176, "lr": 4.375e-05, "epoch": 0.0875, "percentage": 4.38, "elapsed_time": "0:04:10", "remaining_time": "1:31:19"}
{"current_steps": 15, "total_steps": 320, "loss": 0.3136, "lr": 4.6875e-05, "epoch": 0.09375, "percentage": 4.69, "elapsed_time": "0:04:27", "remaining_time": "1:30:45"}
{"current_steps": 16, "total_steps": 320, "loss": 0.2986, "lr": 5e-05, "epoch": 0.1, "percentage": 5.0, "elapsed_time": "0:04:44", "remaining_time": "1:30:13"}
{"current_steps": 17, "total_steps": 320, "loss": 0.2691, "lr": 5.3125000000000004e-05, "epoch": 0.10625, "percentage": 5.31, "elapsed_time": "0:05:02", "remaining_time": "1:29:48"}
{"current_steps": 18, "total_steps": 320, "loss": 0.3044, "lr": 5.6250000000000005e-05, "epoch": 0.1125, "percentage": 5.62, "elapsed_time": "0:05:19", "remaining_time": "1:29:19"}
{"current_steps": 19, "total_steps": 320, "loss": 0.232, "lr": 5.9375e-05, "epoch": 0.11875, "percentage": 5.94, "elapsed_time": "0:05:36", "remaining_time": "1:28:52"}
{"current_steps": 20, "total_steps": 320, "loss": 0.237, "lr": 6.25e-05, "epoch": 0.125, "percentage": 6.25, "elapsed_time": "0:05:53", "remaining_time": "1:28:25"}
{"current_steps": 21, "total_steps": 320, "loss": 0.2708, "lr": 6.562500000000001e-05, "epoch": 0.13125, "percentage": 6.56, "elapsed_time": "0:06:10", "remaining_time": "1:28:00"}
{"current_steps": 22, "total_steps": 320, "loss": 0.2334, "lr": 6.875e-05, "epoch": 0.1375, "percentage": 6.88, "elapsed_time": "0:06:27", "remaining_time": "1:27:35"}
{"current_steps": 23, "total_steps": 320, "loss": 0.1994, "lr": 7.1875e-05, "epoch": 0.14375, "percentage": 7.19, "elapsed_time": "0:06:45", "remaining_time": "1:27:11"}
{"current_steps": 24, "total_steps": 320, "loss": 0.2253, "lr": 7.500000000000001e-05, "epoch": 0.15, "percentage": 7.5, "elapsed_time": "0:07:02", "remaining_time": "1:26:47"}
{"current_steps": 25, "total_steps": 320, "loss": 0.2677, "lr": 7.8125e-05, "epoch": 0.15625, "percentage": 7.81, "elapsed_time": "0:07:19", "remaining_time": "1:26:24"}
{"current_steps": 26, "total_steps": 320, "loss": 0.1909, "lr": 8.125000000000001e-05, "epoch": 0.1625, "percentage": 8.12, "elapsed_time": "0:07:36", "remaining_time": "1:26:01"}
{"current_steps": 27, "total_steps": 320, "loss": 0.2352, "lr": 8.4375e-05, "epoch": 0.16875, "percentage": 8.44, "elapsed_time": "0:07:53", "remaining_time": "1:25:39"}
{"current_steps": 28, "total_steps": 320, "loss": 0.2312, "lr": 8.75e-05, "epoch": 0.175, "percentage": 8.75, "elapsed_time": "0:08:10", "remaining_time": "1:25:16"}
{"current_steps": 29, "total_steps": 320, "loss": 0.2571, "lr": 9.062500000000001e-05, "epoch": 0.18125, "percentage": 9.06, "elapsed_time": "0:08:27", "remaining_time": "1:24:54"}
{"current_steps": 30, "total_steps": 320, "loss": 0.2181, "lr": 9.375e-05, "epoch": 0.1875, "percentage": 9.38, "elapsed_time": "0:08:44", "remaining_time": "1:24:33"}
{"current_steps": 31, "total_steps": 320, "loss": 0.1768, "lr": 9.687500000000001e-05, "epoch": 0.19375, "percentage": 9.69, "elapsed_time": "0:09:01", "remaining_time": "1:24:12"}
{"current_steps": 32, "total_steps": 320, "loss": 0.1995, "lr": 0.0001, "epoch": 0.2, "percentage": 10.0, "elapsed_time": "0:09:19", "remaining_time": "1:23:51"}
{"current_steps": 33, "total_steps": 320, "loss": 0.2344, "lr": 9.999702525000749e-05, "epoch": 0.20625, "percentage": 10.31, "elapsed_time": "0:09:36", "remaining_time": "1:23:30"}
{"current_steps": 34, "total_steps": 320, "loss": 0.1581, "lr": 9.998810135399546e-05, "epoch": 0.2125, "percentage": 10.62, "elapsed_time": "0:09:53", "remaining_time": "1:23:10"}
{"current_steps": 35, "total_steps": 320, "loss": 0.2129, "lr": 9.997322937381829e-05, "epoch": 0.21875, "percentage": 10.94, "elapsed_time": "0:10:10", "remaining_time": "1:22:49"}
{"current_steps": 36, "total_steps": 320, "loss": 0.1837, "lr": 9.99524110790929e-05, "epoch": 0.225, "percentage": 11.25, "elapsed_time": "0:10:27", "remaining_time": "1:22:29"}
{"current_steps": 37, "total_steps": 320, "loss": 0.1881, "lr": 9.992564894698816e-05, "epoch": 0.23125, "percentage": 11.56, "elapsed_time": "0:10:44", "remaining_time": "1:22:09"}
{"current_steps": 38, "total_steps": 320, "loss": 0.1837, "lr": 9.989294616193017e-05, "epoch": 0.2375, "percentage": 11.88, "elapsed_time": "0:11:01", "remaining_time": "1:21:49"}
{"current_steps": 39, "total_steps": 320, "loss": 0.1918, "lr": 9.985430661522333e-05, "epoch": 0.24375, "percentage": 12.19, "elapsed_time": "0:11:18", "remaining_time": "1:21:29"}
{"current_steps": 40, "total_steps": 320, "loss": 0.1823, "lr": 9.980973490458728e-05, "epoch": 0.25, "percentage": 12.5, "elapsed_time": "0:11:35", "remaining_time": "1:21:10"}
{"current_steps": 41, "total_steps": 320, "loss": 0.2191, "lr": 9.975923633360985e-05, "epoch": 0.25625, "percentage": 12.81, "elapsed_time": "0:11:52", "remaining_time": "1:20:50"}
{"current_steps": 42, "total_steps": 320, "loss": 0.1671, "lr": 9.970281691111598e-05, "epoch": 0.2625, "percentage": 13.12, "elapsed_time": "0:12:09", "remaining_time": "1:20:31"}
{"current_steps": 43, "total_steps": 320, "loss": 0.1445, "lr": 9.964048335045275e-05, "epoch": 0.26875, "percentage": 13.44, "elapsed_time": "0:12:27", "remaining_time": "1:20:12"}
{"current_steps": 44, "total_steps": 320, "loss": 0.1883, "lr": 9.957224306869053e-05, "epoch": 0.275, "percentage": 13.75, "elapsed_time": "0:12:44", "remaining_time": "1:19:54"}
{"current_steps": 45, "total_steps": 320, "loss": 0.1912, "lr": 9.949810418574039e-05, "epoch": 0.28125, "percentage": 14.06, "elapsed_time": "0:13:01", "remaining_time": "1:19:35"}
{"current_steps": 46, "total_steps": 320, "loss": 0.1781, "lr": 9.941807552338804e-05, "epoch": 0.2875, "percentage": 14.37, "elapsed_time": "0:13:18", "remaining_time": "1:19:16"}
{"current_steps": 47, "total_steps": 320, "loss": 0.1741, "lr": 9.933216660424395e-05, "epoch": 0.29375, "percentage": 14.69, "elapsed_time": "0:13:35", "remaining_time": "1:18:58"}
{"current_steps": 48, "total_steps": 320, "loss": 0.1862, "lr": 9.924038765061042e-05, "epoch": 0.3, "percentage": 15.0, "elapsed_time": "0:13:52", "remaining_time": "1:18:39"}
{"current_steps": 49, "total_steps": 320, "loss": 0.1948, "lr": 9.914274958326505e-05, "epoch": 0.30625, "percentage": 15.31, "elapsed_time": "0:14:09", "remaining_time": "1:18:21"}
{"current_steps": 50, "total_steps": 320, "loss": 0.1387, "lr": 9.903926402016153e-05, "epoch": 0.3125, "percentage": 15.62, "elapsed_time": "0:14:27", "remaining_time": "1:18:02"}
{"current_steps": 51, "total_steps": 320, "loss": 0.1897, "lr": 9.892994327504693e-05, "epoch": 0.31875, "percentage": 15.94, "elapsed_time": "0:14:44", "remaining_time": "1:17:44"}
{"current_steps": 52, "total_steps": 320, "loss": 0.1878, "lr": 9.881480035599667e-05, "epoch": 0.325, "percentage": 16.25, "elapsed_time": "0:15:01", "remaining_time": "1:17:25"}
{"current_steps": 53, "total_steps": 320, "loss": 0.194, "lr": 9.869384896386668e-05, "epoch": 0.33125, "percentage": 16.56, "elapsed_time": "0:15:18", "remaining_time": "1:17:07"}
{"current_steps": 54, "total_steps": 320, "loss": 0.1881, "lr": 9.856710349066307e-05, "epoch": 0.3375, "percentage": 16.88, "elapsed_time": "0:15:35", "remaining_time": "1:16:48"}
{"current_steps": 55, "total_steps": 320, "loss": 0.2129, "lr": 9.843457901782967e-05, "epoch": 0.34375, "percentage": 17.19, "elapsed_time": "0:15:52", "remaining_time": "1:16:30"}
{"current_steps": 56, "total_steps": 320, "loss": 0.187, "lr": 9.829629131445342e-05, "epoch": 0.35, "percentage": 17.5, "elapsed_time": "0:16:09", "remaining_time": "1:16:11"}
{"current_steps": 57, "total_steps": 320, "loss": 0.1952, "lr": 9.815225683538814e-05, "epoch": 0.35625, "percentage": 17.81, "elapsed_time": "0:16:26", "remaining_time": "1:15:53"}
{"current_steps": 58, "total_steps": 320, "loss": 0.1722, "lr": 9.800249271929645e-05, "epoch": 0.3625, "percentage": 18.12, "elapsed_time": "0:16:43", "remaining_time": "1:15:35"}
{"current_steps": 59, "total_steps": 320, "loss": 0.1852, "lr": 9.784701678661045e-05, "epoch": 0.36875, "percentage": 18.44, "elapsed_time": "0:17:01", "remaining_time": "1:15:16"}
{"current_steps": 60, "total_steps": 320, "loss": 0.1861, "lr": 9.768584753741134e-05, "epoch": 0.375, "percentage": 18.75, "elapsed_time": "0:17:18", "remaining_time": "1:14:58"}
{"current_steps": 61, "total_steps": 320, "loss": 0.1681, "lr": 9.751900414922805e-05, "epoch": 0.38125, "percentage": 19.06, "elapsed_time": "0:17:35", "remaining_time": "1:14:40"}
{"current_steps": 62, "total_steps": 320, "loss": 0.1768, "lr": 9.73465064747553e-05, "epoch": 0.3875, "percentage": 19.38, "elapsed_time": "0:17:52", "remaining_time": "1:14:22"}
{"current_steps": 63, "total_steps": 320, "loss": 0.1592, "lr": 9.716837503949127e-05, "epoch": 0.39375, "percentage": 19.69, "elapsed_time": "0:18:09", "remaining_time": "1:14:04"}
{"current_steps": 64, "total_steps": 320, "loss": 0.2007, "lr": 9.698463103929542e-05, "epoch": 0.4, "percentage": 20.0, "elapsed_time": "0:18:26", "remaining_time": "1:13:46"}
{"current_steps": 65, "total_steps": 320, "loss": 0.1499, "lr": 9.67952963378663e-05, "epoch": 0.40625, "percentage": 20.31, "elapsed_time": "0:18:43", "remaining_time": "1:13:28"}
{"current_steps": 66, "total_steps": 320, "loss": 0.1702, "lr": 9.660039346413994e-05, "epoch": 0.4125, "percentage": 20.62, "elapsed_time": "0:19:00", "remaining_time": "1:13:10"}
{"current_steps": 67, "total_steps": 320, "loss": 0.172, "lr": 9.639994560960923e-05, "epoch": 0.41875, "percentage": 20.94, "elapsed_time": "0:19:17", "remaining_time": "1:12:52"}
{"current_steps": 68, "total_steps": 320, "loss": 0.1363, "lr": 9.619397662556435e-05, "epoch": 0.425, "percentage": 21.25, "elapsed_time": "0:19:35", "remaining_time": "1:12:34"}
{"current_steps": 69, "total_steps": 320, "loss": 0.1664, "lr": 9.598251102025461e-05, "epoch": 0.43125, "percentage": 21.56, "elapsed_time": "0:19:52", "remaining_time": "1:12:16"}
{"current_steps": 70, "total_steps": 320, "loss": 0.1439, "lr": 9.576557395597236e-05, "epoch": 0.4375, "percentage": 21.88, "elapsed_time": "0:20:09", "remaining_time": "1:11:58"}
{"current_steps": 71, "total_steps": 320, "loss": 0.1526, "lr": 9.554319124605879e-05, "epoch": 0.44375, "percentage": 22.19, "elapsed_time": "0:20:26", "remaining_time": "1:11:41"}
{"current_steps": 72, "total_steps": 320, "loss": 0.1514, "lr": 9.53153893518325e-05, "epoch": 0.45, "percentage": 22.5, "elapsed_time": "0:20:43", "remaining_time": "1:11:23"}
{"current_steps": 73, "total_steps": 320, "loss": 0.1481, "lr": 9.508219537944081e-05, "epoch": 0.45625, "percentage": 22.81, "elapsed_time": "0:21:00", "remaining_time": "1:11:05"}
{"current_steps": 74, "total_steps": 320, "loss": 0.1552, "lr": 9.484363707663442e-05, "epoch": 0.4625, "percentage": 23.12, "elapsed_time": "0:21:17", "remaining_time": "1:10:48"}
{"current_steps": 75, "total_steps": 320, "loss": 0.1533, "lr": 9.459974282946571e-05, "epoch": 0.46875, "percentage": 23.44, "elapsed_time": "0:21:35", "remaining_time": "1:10:30"}
{"current_steps": 76, "total_steps": 320, "loss": 0.15, "lr": 9.435054165891109e-05, "epoch": 0.475, "percentage": 23.75, "elapsed_time": "0:21:52", "remaining_time": "1:10:12"}
{"current_steps": 77, "total_steps": 320, "loss": 0.1633, "lr": 9.409606321741775e-05, "epoch": 0.48125, "percentage": 24.06, "elapsed_time": "0:22:09", "remaining_time": "1:09:55"}
{"current_steps": 78, "total_steps": 320, "loss": 0.1675, "lr": 9.38363377853754e-05, "epoch": 0.4875, "percentage": 24.38, "elapsed_time": "0:22:26", "remaining_time": "1:09:37"}
{"current_steps": 79, "total_steps": 320, "loss": 0.1649, "lr": 9.357139626751308e-05, "epoch": 0.49375, "percentage": 24.69, "elapsed_time": "0:22:43", "remaining_time": "1:09:19"}
{"current_steps": 80, "total_steps": 320, "loss": 0.1818, "lr": 9.330127018922194e-05, "epoch": 0.5, "percentage": 25.0, "elapsed_time": "0:23:00", "remaining_time": "1:09:02"}
{"current_steps": 81, "total_steps": 320, "loss": 0.1535, "lr": 9.302599169280395e-05, "epoch": 0.50625, "percentage": 25.31, "elapsed_time": "0:23:17", "remaining_time": "1:08:44"}
{"current_steps": 82, "total_steps": 320, "loss": 0.1573, "lr": 9.274559353364734e-05, "epoch": 0.5125, "percentage": 25.62, "elapsed_time": "0:23:34", "remaining_time": "1:08:26"}
{"current_steps": 83, "total_steps": 320, "loss": 0.1552, "lr": 9.246010907632895e-05, "epoch": 0.51875, "percentage": 25.94, "elapsed_time": "0:23:51", "remaining_time": "1:08:08"}
{"current_steps": 84, "total_steps": 320, "loss": 0.1348, "lr": 9.21695722906443e-05, "epoch": 0.525, "percentage": 26.25, "elapsed_time": "0:24:08", "remaining_time": "1:07:50"}
{"current_steps": 85, "total_steps": 320, "loss": 0.1541, "lr": 9.18740177475654e-05, "epoch": 0.53125, "percentage": 26.56, "elapsed_time": "0:24:26", "remaining_time": "1:07:33"}
{"current_steps": 86, "total_steps": 320, "loss": 0.1584, "lr": 9.157348061512727e-05, "epoch": 0.5375, "percentage": 26.88, "elapsed_time": "0:24:43", "remaining_time": "1:07:15"}
{"current_steps": 87, "total_steps": 320, "loss": 0.1558, "lr": 9.126799665424319e-05, "epoch": 0.54375, "percentage": 27.19, "elapsed_time": "0:25:00", "remaining_time": "1:06:57"}
{"current_steps": 88, "total_steps": 320, "loss": 0.178, "lr": 9.09576022144496e-05, "epoch": 0.55, "percentage": 27.5, "elapsed_time": "0:25:17", "remaining_time": "1:06:39"}
{"current_steps": 89, "total_steps": 320, "loss": 0.1382, "lr": 9.064233422958077e-05, "epoch": 0.55625, "percentage": 27.81, "elapsed_time": "0:25:34", "remaining_time": "1:06:22"}
{"current_steps": 90, "total_steps": 320, "loss": 0.2028, "lr": 9.032223021337414e-05, "epoch": 0.5625, "percentage": 28.12, "elapsed_time": "0:25:51", "remaining_time": "1:06:04"}
{"current_steps": 91, "total_steps": 320, "loss": 0.1564, "lr": 8.999732825500648e-05, "epoch": 0.56875, "percentage": 28.44, "elapsed_time": "0:26:08", "remaining_time": "1:05:46"}
{"current_steps": 92, "total_steps": 320, "loss": 0.1748, "lr": 8.966766701456177e-05, "epoch": 0.575, "percentage": 28.75, "elapsed_time": "0:26:25", "remaining_time": "1:05:29"}
{"current_steps": 93, "total_steps": 320, "loss": 0.166, "lr": 8.933328571843084e-05, "epoch": 0.58125, "percentage": 29.06, "elapsed_time": "0:26:42", "remaining_time": "1:05:11"}
{"current_steps": 94, "total_steps": 320, "loss": 0.1371, "lr": 8.899422415464409e-05, "epoch": 0.5875, "percentage": 29.38, "elapsed_time": "0:26:59", "remaining_time": "1:04:54"}
{"current_steps": 95, "total_steps": 320, "loss": 0.1695, "lr": 8.865052266813685e-05, "epoch": 0.59375, "percentage": 29.69, "elapsed_time": "0:27:16", "remaining_time": "1:04:36"}
{"current_steps": 96, "total_steps": 320, "loss": 0.1397, "lr": 8.83022221559489e-05, "epoch": 0.6, "percentage": 30.0, "elapsed_time": "0:27:33", "remaining_time": "1:04:18"}
{"current_steps": 97, "total_steps": 320, "loss": 0.1475, "lr": 8.79493640623581e-05, "epoch": 0.60625, "percentage": 30.31, "elapsed_time": "0:27:50", "remaining_time": "1:04:01"}
{"current_steps": 98, "total_steps": 320, "loss": 0.1455, "lr": 8.759199037394887e-05, "epoch": 0.6125, "percentage": 30.63, "elapsed_time": "0:28:08", "remaining_time": "1:03:44"}
{"current_steps": 99, "total_steps": 320, "loss": 0.155, "lr": 8.723014361461632e-05, "epoch": 0.61875, "percentage": 30.94, "elapsed_time": "0:28:25", "remaining_time": "1:03:27"}
{"current_steps": 100, "total_steps": 320, "loss": 0.14, "lr": 8.68638668405062e-05, "epoch": 0.625, "percentage": 31.25, "elapsed_time": "0:28:43", "remaining_time": "1:03:11"}
{"current_steps": 101, "total_steps": 320, "loss": 0.1268, "lr": 8.649320363489179e-05, "epoch": 0.63125, "percentage": 31.56, "elapsed_time": "0:29:00", "remaining_time": "1:02:53"}
{"current_steps": 102, "total_steps": 320, "loss": 0.174, "lr": 8.611819810298778e-05, "epoch": 0.6375, "percentage": 31.87, "elapsed_time": "0:29:17", "remaining_time": "1:02:36"}
{"current_steps": 103, "total_steps": 320, "loss": 0.1314, "lr": 8.573889486670233e-05, "epoch": 0.64375, "percentage": 32.19, "elapsed_time": "0:29:34", "remaining_time": "1:02:19"}
{"current_steps": 104, "total_steps": 320, "loss": 0.1563, "lr": 8.535533905932738e-05, "epoch": 0.65, "percentage": 32.5, "elapsed_time": "0:29:51", "remaining_time": "1:02:01"}
{"current_steps": 105, "total_steps": 320, "loss": 0.2076, "lr": 8.496757632016836e-05, "epoch": 0.65625, "percentage": 32.81, "elapsed_time": "0:30:09", "remaining_time": "1:01:44"}
{"current_steps": 106, "total_steps": 320, "loss": 0.1516, "lr": 8.457565278911348e-05, "epoch": 0.6625, "percentage": 33.12, "elapsed_time": "0:30:26", "remaining_time": "1:01:26"}
{"current_steps": 107, "total_steps": 320, "loss": 0.163, "lr": 8.417961510114356e-05, "epoch": 0.66875, "percentage": 33.44, "elapsed_time": "0:30:43", "remaining_time": "1:01:09"}
{"current_steps": 108, "total_steps": 320, "loss": 0.1351, "lr": 8.377951038078302e-05, "epoch": 0.675, "percentage": 33.75, "elapsed_time": "0:31:00", "remaining_time": "1:00:51"}
{"current_steps": 109, "total_steps": 320, "loss": 0.1181, "lr": 8.337538623649237e-05, "epoch": 0.68125, "percentage": 34.06, "elapsed_time": "0:31:17", "remaining_time": "1:00:34"}
{"current_steps": 110, "total_steps": 320, "loss": 0.1404, "lr": 8.296729075500344e-05, "epoch": 0.6875, "percentage": 34.38, "elapsed_time": "0:31:34", "remaining_time": "1:00:16"}
{"current_steps": 111, "total_steps": 320, "loss": 0.1746, "lr": 8.255527249559746e-05, "epoch": 0.69375, "percentage": 34.69, "elapsed_time": "0:31:51", "remaining_time": "0:59:59"}
{"current_steps": 112, "total_steps": 320, "loss": 0.1724, "lr": 8.213938048432697e-05, "epoch": 0.7, "percentage": 35.0, "elapsed_time": "0:32:08", "remaining_time": "0:59:41"}
{"current_steps": 113, "total_steps": 320, "loss": 0.1469, "lr": 8.171966420818228e-05, "epoch": 0.70625, "percentage": 35.31, "elapsed_time": "0:32:25", "remaining_time": "0:59:24"}
{"current_steps": 114, "total_steps": 320, "loss": 0.1692, "lr": 8.129617360920296e-05, "epoch": 0.7125, "percentage": 35.62, "elapsed_time": "0:32:42", "remaining_time": "0:59:06"}
{"current_steps": 115, "total_steps": 320, "loss": 0.145, "lr": 8.086895907853526e-05, "epoch": 0.71875, "percentage": 35.94, "elapsed_time": "0:32:59", "remaining_time": "0:58:49"}
{"current_steps": 116, "total_steps": 320, "loss": 0.1401, "lr": 8.043807145043604e-05, "epoch": 0.725, "percentage": 36.25, "elapsed_time": "0:33:17", "remaining_time": "0:58:31"}
{"current_steps": 117, "total_steps": 320, "loss": 0.1289, "lr": 8.000356199622405e-05, "epoch": 0.73125, "percentage": 36.56, "elapsed_time": "0:33:34", "remaining_time": "0:58:14"}
{"current_steps": 118, "total_steps": 320, "loss": 0.1191, "lr": 7.956548241817912e-05, "epoch": 0.7375, "percentage": 36.88, "elapsed_time": "0:33:51", "remaining_time": "0:57:57"}
{"current_steps": 119, "total_steps": 320, "loss": 0.1679, "lr": 7.912388484339012e-05, "epoch": 0.74375, "percentage": 37.19, "elapsed_time": "0:34:08", "remaining_time": "0:57:39"}
{"current_steps": 120, "total_steps": 320, "loss": 0.1455, "lr": 7.86788218175523e-05, "epoch": 0.75, "percentage": 37.5, "elapsed_time": "0:34:25", "remaining_time": "0:57:22"}
{"current_steps": 121, "total_steps": 320, "loss": 0.1387, "lr": 7.823034629871503e-05, "epoch": 0.75625, "percentage": 37.81, "elapsed_time": "0:34:42", "remaining_time": "0:57:04"}
{"current_steps": 122, "total_steps": 320, "loss": 0.1595, "lr": 7.777851165098012e-05, "epoch": 0.7625, "percentage": 38.12, "elapsed_time": "0:34:59", "remaining_time": "0:56:47"}
{"current_steps": 123, "total_steps": 320, "loss": 0.1591, "lr": 7.732337163815217e-05, "epoch": 0.76875, "percentage": 38.44, "elapsed_time": "0:35:16", "remaining_time": "0:56:30"}
{"current_steps": 124, "total_steps": 320, "loss": 0.1623, "lr": 7.68649804173412e-05, "epoch": 0.775, "percentage": 38.75, "elapsed_time": "0:35:33", "remaining_time": "0:56:12"}
{"current_steps": 125, "total_steps": 320, "loss": 0.155, "lr": 7.64033925325184e-05, "epoch": 0.78125, "percentage": 39.06, "elapsed_time": "0:35:51", "remaining_time": "0:55:55"}
{"current_steps": 126, "total_steps": 320, "loss": 0.1524, "lr": 7.593866290802608e-05, "epoch": 0.7875, "percentage": 39.38, "elapsed_time": "0:36:08", "remaining_time": "0:55:38"}
{"current_steps": 127, "total_steps": 320, "loss": 0.1599, "lr": 7.54708468420421e-05, "epoch": 0.79375, "percentage": 39.69, "elapsed_time": "0:36:25", "remaining_time": "0:55:20"}
{"current_steps": 128, "total_steps": 320, "loss": 0.1554, "lr": 7.500000000000001e-05, "epoch": 0.8, "percentage": 40.0, "elapsed_time": "0:36:42", "remaining_time": "0:55:03"}
{"current_steps": 129, "total_steps": 320, "loss": 0.1538, "lr": 7.45261784079654e-05, "epoch": 0.80625, "percentage": 40.31, "elapsed_time": "0:36:59", "remaining_time": "0:54:46"}
{"current_steps": 130, "total_steps": 320, "loss": 0.1525, "lr": 7.404943844596939e-05, "epoch": 0.8125, "percentage": 40.62, "elapsed_time": "0:37:16", "remaining_time": "0:54:29"}
{"current_steps": 131, "total_steps": 320, "loss": 0.1478, "lr": 7.35698368412999e-05, "epoch": 0.81875, "percentage": 40.94, "elapsed_time": "0:37:33", "remaining_time": "0:54:11"}
{"current_steps": 132, "total_steps": 320, "loss": 0.1484, "lr": 7.308743066175172e-05, "epoch": 0.825, "percentage": 41.25, "elapsed_time": "0:37:50", "remaining_time": "0:53:54"}
{"current_steps": 133, "total_steps": 320, "loss": 0.124, "lr": 7.2602277308836e-05, "epoch": 0.83125, "percentage": 41.56, "elapsed_time": "0:38:08", "remaining_time": "0:53:36"}
{"current_steps": 134, "total_steps": 320, "loss": 0.1422, "lr": 7.211443451095007e-05, "epoch": 0.8375, "percentage": 41.88, "elapsed_time": "0:38:25", "remaining_time": "0:53:19"}
{"current_steps": 135, "total_steps": 320, "loss": 0.1488, "lr": 7.162396031650831e-05, "epoch": 0.84375, "percentage": 42.19, "elapsed_time": "0:38:42", "remaining_time": "0:53:02"}
{"current_steps": 136, "total_steps": 320, "loss": 0.1227, "lr": 7.113091308703498e-05, "epoch": 0.85, "percentage": 42.5, "elapsed_time": "0:38:59", "remaining_time": "0:52:44"}
{"current_steps": 137, "total_steps": 320, "loss": 0.1397, "lr": 7.063535149021973e-05, "epoch": 0.85625, "percentage": 42.81, "elapsed_time": "0:39:16", "remaining_time": "0:52:27"}
{"current_steps": 138, "total_steps": 320, "loss": 0.1489, "lr": 7.013733449293687e-05, "epoch": 0.8625, "percentage": 43.12, "elapsed_time": "0:39:33", "remaining_time": "0:52:10"}
{"current_steps": 139, "total_steps": 320, "loss": 0.1625, "lr": 6.96369213542287e-05, "epoch": 0.86875, "percentage": 43.44, "elapsed_time": "0:39:50", "remaining_time": "0:51:52"}
{"current_steps": 140, "total_steps": 320, "loss": 0.1575, "lr": 6.91341716182545e-05, "epoch": 0.875, "percentage": 43.75, "elapsed_time": "0:40:07", "remaining_time": "0:51:35"}
{"current_steps": 141, "total_steps": 320, "loss": 0.1367, "lr": 6.862914510720515e-05, "epoch": 0.88125, "percentage": 44.06, "elapsed_time": "0:40:24", "remaining_time": "0:51:18"}
{"current_steps": 142, "total_steps": 320, "loss": 0.1269, "lr": 6.812190191418508e-05, "epoch": 0.8875, "percentage": 44.38, "elapsed_time": "0:40:41", "remaining_time": "0:51:00"}
{"current_steps": 143, "total_steps": 320, "loss": 0.1653, "lr": 6.761250239606169e-05, "epoch": 0.89375, "percentage": 44.69, "elapsed_time": "0:40:58", "remaining_time": "0:50:43"}
{"current_steps": 144, "total_steps": 320, "loss": 0.163, "lr": 6.710100716628344e-05, "epoch": 0.9, "percentage": 45.0, "elapsed_time": "0:41:15", "remaining_time": "0:50:25"}
{"current_steps": 145, "total_steps": 320, "loss": 0.1372, "lr": 6.658747708766762e-05, "epoch": 0.90625, "percentage": 45.31, "elapsed_time": "0:41:32", "remaining_time": "0:50:08"}
{"current_steps": 146, "total_steps": 320, "loss": 0.1666, "lr": 6.607197326515808e-05, "epoch": 0.9125, "percentage": 45.62, "elapsed_time": "0:41:49", "remaining_time": "0:49:51"}
{"current_steps": 147, "total_steps": 320, "loss": 0.1608, "lr": 6.555455703855454e-05, "epoch": 0.91875, "percentage": 45.94, "elapsed_time": "0:42:07", "remaining_time": "0:49:34"}
{"current_steps": 148, "total_steps": 320, "loss": 0.1358, "lr": 6.503528997521366e-05, "epoch": 0.925, "percentage": 46.25, "elapsed_time": "0:42:24", "remaining_time": "0:49:16"}
{"current_steps": 149, "total_steps": 320, "loss": 0.1467, "lr": 6.451423386272312e-05, "epoch": 0.93125, "percentage": 46.56, "elapsed_time": "0:42:41", "remaining_time": "0:48:59"}
{"current_steps": 150, "total_steps": 320, "loss": 0.1602, "lr": 6.399145070154961e-05, "epoch": 0.9375, "percentage": 46.88, "elapsed_time": "0:42:58", "remaining_time": "0:48:42"}
{"current_steps": 151, "total_steps": 320, "loss": 0.1491, "lr": 6.346700269766132e-05, "epoch": 0.94375, "percentage": 47.19, "elapsed_time": "0:43:15", "remaining_time": "0:48:24"}
{"current_steps": 152, "total_steps": 320, "loss": 0.1503, "lr": 6.294095225512603e-05, "epoch": 0.95, "percentage": 47.5, "elapsed_time": "0:43:32", "remaining_time": "0:48:07"}
{"current_steps": 153, "total_steps": 320, "loss": 0.1394, "lr": 6.241336196868582e-05, "epoch": 0.95625, "percentage": 47.81, "elapsed_time": "0:43:49", "remaining_time": "0:47:50"}
{"current_steps": 154, "total_steps": 320, "loss": 0.1471, "lr": 6.188429461630866e-05, "epoch": 0.9625, "percentage": 48.12, "elapsed_time": "0:44:06", "remaining_time": "0:47:33"}
{"current_steps": 155, "total_steps": 320, "loss": 0.1163, "lr": 6.135381315171867e-05, "epoch": 0.96875, "percentage": 48.44, "elapsed_time": "0:44:24", "remaining_time": "0:47:15"}
{"current_steps": 156, "total_steps": 320, "loss": 0.1414, "lr": 6.0821980696905146e-05, "epoch": 0.975, "percentage": 48.75, "elapsed_time": "0:44:41", "remaining_time": "0:46:58"}
{"current_steps": 157, "total_steps": 320, "loss": 0.1371, "lr": 6.0288860534611745e-05, "epoch": 0.98125, "percentage": 49.06, "elapsed_time": "0:44:58", "remaining_time": "0:46:41"}
{"current_steps": 158, "total_steps": 320, "loss": 0.1591, "lr": 5.9754516100806423e-05, "epoch": 0.9875, "percentage": 49.38, "elapsed_time": "0:45:15", "remaining_time": "0:46:24"}
{"current_steps": 159, "total_steps": 320, "loss": 0.1136, "lr": 5.9219010977133173e-05, "epoch": 0.99375, "percentage": 49.69, "elapsed_time": "0:45:32", "remaining_time": "0:46:06"}
{"current_steps": 160, "total_steps": 320, "loss": 0.1355, "lr": 5.868240888334653e-05, "epoch": 1.0, "percentage": 50.0, "elapsed_time": "0:45:49", "remaining_time": "0:45:49"}
{"current_steps": 161, "total_steps": 320, "loss": 0.1389, "lr": 5.814477366972945e-05, "epoch": 1.00625, "percentage": 50.31, "elapsed_time": "0:46:06", "remaining_time": "0:45:32"}
{"current_steps": 162, "total_steps": 320, "loss": 0.1278, "lr": 5.7606169309495836e-05, "epoch": 1.0125, "percentage": 50.62, "elapsed_time": "0:46:23", "remaining_time": "0:45:15"}
{"current_steps": 163, "total_steps": 320, "loss": 0.1266, "lr": 5.706665989117839e-05, "epoch": 1.01875, "percentage": 50.94, "elapsed_time": "0:46:40", "remaining_time": "0:44:57"}
{"current_steps": 164, "total_steps": 320, "loss": 0.1344, "lr": 5.6526309611002594e-05, "epoch": 1.025, "percentage": 51.25, "elapsed_time": "0:46:58", "remaining_time": "0:44:40"}
{"current_steps": 165, "total_steps": 320, "loss": 0.11, "lr": 5.5985182765248126e-05, "epoch": 1.03125, "percentage": 51.56, "elapsed_time": "0:47:15", "remaining_time": "0:44:23"}
{"current_steps": 166, "total_steps": 320, "loss": 0.1177, "lr": 5.544334374259823e-05, "epoch": 1.0375, "percentage": 51.88, "elapsed_time": "0:47:32", "remaining_time": "0:44:05"}
{"current_steps": 167, "total_steps": 320, "loss": 0.1519, "lr": 5.490085701647805e-05, "epoch": 1.04375, "percentage": 52.19, "elapsed_time": "0:47:49", "remaining_time": "0:43:48"}
{"current_steps": 168, "total_steps": 320, "loss": 0.1388, "lr": 5.435778713738292e-05, "epoch": 1.05, "percentage": 52.5, "elapsed_time": "0:48:06", "remaining_time": "0:43:31"}
{"current_steps": 169, "total_steps": 320, "loss": 0.1315, "lr": 5.381419872519763e-05, "epoch": 1.05625, "percentage": 52.81, "elapsed_time": "0:48:23", "remaining_time": "0:43:14"}
{"current_steps": 170, "total_steps": 320, "loss": 0.1513, "lr": 5.327015646150716e-05, "epoch": 1.0625, "percentage": 53.12, "elapsed_time": "0:48:40", "remaining_time": "0:42:56"}
{"current_steps": 171, "total_steps": 320, "loss": 0.1265, "lr": 5.2725725081900325e-05, "epoch": 1.06875, "percentage": 53.44, "elapsed_time": "0:48:57", "remaining_time": "0:42:39"}
{"current_steps": 172, "total_steps": 320, "loss": 0.1346, "lr": 5.218096936826681e-05, "epoch": 1.075, "percentage": 53.75, "elapsed_time": "0:49:14", "remaining_time": "0:42:22"}
{"current_steps": 173, "total_steps": 320, "loss": 0.1129, "lr": 5.1635954141088813e-05, "epoch": 1.08125, "percentage": 54.06, "elapsed_time": "0:49:31", "remaining_time": "0:42:05"}
{"current_steps": 174, "total_steps": 320, "loss": 0.1031, "lr": 5.1090744251728064e-05, "epoch": 1.0875, "percentage": 54.37, "elapsed_time": "0:49:48", "remaining_time": "0:41:47"}
{"current_steps": 175, "total_steps": 320, "loss": 0.1093, "lr": 5.054540457470912e-05, "epoch": 1.09375, "percentage": 54.69, "elapsed_time": "0:50:05", "remaining_time": "0:41:30"}
{"current_steps": 176, "total_steps": 320, "loss": 0.1283, "lr": 5e-05, "epoch": 1.1, "percentage": 55.0, "elapsed_time": "0:50:22", "remaining_time": "0:41:13"}
{"current_steps": 177, "total_steps": 320, "loss": 0.1163, "lr": 4.945459542529089e-05, "epoch": 1.10625, "percentage": 55.31, "elapsed_time": "0:50:40", "remaining_time": "0:40:56"}
{"current_steps": 178, "total_steps": 320, "loss": 0.1188, "lr": 4.890925574827195e-05, "epoch": 1.1125, "percentage": 55.62, "elapsed_time": "0:50:57", "remaining_time": "0:40:38"}
{"current_steps": 179, "total_steps": 320, "loss": 0.1742, "lr": 4.83640458589112e-05, "epoch": 1.11875, "percentage": 55.94, "elapsed_time": "0:51:14", "remaining_time": "0:40:21"}
{"current_steps": 180, "total_steps": 320, "loss": 0.1217, "lr": 4.781903063173321e-05, "epoch": 1.125, "percentage": 56.25, "elapsed_time": "0:51:31", "remaining_time": "0:40:04"}
{"current_steps": 181, "total_steps": 320, "loss": 0.1047, "lr": 4.727427491809968e-05, "epoch": 1.13125, "percentage": 56.56, "elapsed_time": "0:51:48", "remaining_time": "0:39:47"}
{"current_steps": 182, "total_steps": 320, "loss": 0.1288, "lr": 4.6729843538492847e-05, "epoch": 1.1375, "percentage": 56.88, "elapsed_time": "0:52:05", "remaining_time": "0:39:30"}
{"current_steps": 183, "total_steps": 320, "loss": 0.1123, "lr": 4.618580127480238e-05, "epoch": 1.14375, "percentage": 57.19, "elapsed_time": "0:52:22", "remaining_time": "0:39:12"}
{"current_steps": 184, "total_steps": 320, "loss": 0.1096, "lr": 4.564221286261709e-05, "epoch": 1.15, "percentage": 57.5, "elapsed_time": "0:52:40", "remaining_time": "0:38:55"}
{"current_steps": 185, "total_steps": 320, "loss": 0.1237, "lr": 4.509914298352197e-05, "epoch": 1.15625, "percentage": 57.81, "elapsed_time": "0:52:57", "remaining_time": "0:38:38"}
{"current_steps": 186, "total_steps": 320, "loss": 0.1256, "lr": 4.4556656257401786e-05, "epoch": 1.1625, "percentage": 58.13, "elapsed_time": "0:53:14", "remaining_time": "0:38:21"}
{"current_steps": 187, "total_steps": 320, "loss": 0.087, "lr": 4.4014817234751885e-05, "epoch": 1.16875, "percentage": 58.44, "elapsed_time": "0:53:32", "remaining_time": "0:38:04"}
{"current_steps": 188, "total_steps": 320, "loss": 0.132, "lr": 4.347369038899744e-05, "epoch": 1.175, "percentage": 58.75, "elapsed_time": "0:53:49", "remaining_time": "0:37:47"}
{"current_steps": 189, "total_steps": 320, "loss": 0.1342, "lr": 4.2933340108821644e-05, "epoch": 1.18125, "percentage": 59.06, "elapsed_time": "0:54:06", "remaining_time": "0:37:30"}
{"current_steps": 190, "total_steps": 320, "loss": 0.1144, "lr": 4.239383069050417e-05, "epoch": 1.1875, "percentage": 59.38, "elapsed_time": "0:54:23", "remaining_time": "0:37:13"}
{"current_steps": 191, "total_steps": 320, "loss": 0.11, "lr": 4.185522633027057e-05, "epoch": 1.19375, "percentage": 59.69, "elapsed_time": "0:54:40", "remaining_time": "0:36:55"}
{"current_steps": 192, "total_steps": 320, "loss": 0.1256, "lr": 4.131759111665349e-05, "epoch": 1.2, "percentage": 60.0, "elapsed_time": "0:54:57", "remaining_time": "0:36:38"}
{"current_steps": 193, "total_steps": 320, "loss": 0.1387, "lr": 4.078098902286683e-05, "epoch": 1.20625, "percentage": 60.31, "elapsed_time": "0:55:15", "remaining_time": "0:36:21"}
{"current_steps": 194, "total_steps": 320, "loss": 0.1154, "lr": 4.0245483899193595e-05, "epoch": 1.2125, "percentage": 60.62, "elapsed_time": "0:55:32", "remaining_time": "0:36:04"}
{"current_steps": 195, "total_steps": 320, "loss": 0.1277, "lr": 3.971113946538826e-05, "epoch": 1.21875, "percentage": 60.94, "elapsed_time": "0:55:49", "remaining_time": "0:35:46"}
{"current_steps": 196, "total_steps": 320, "loss": 0.1245, "lr": 3.917801930309486e-05, "epoch": 1.225, "percentage": 61.25, "elapsed_time": "0:56:06", "remaining_time": "0:35:29"}
{"current_steps": 197, "total_steps": 320, "loss": 0.1149, "lr": 3.864618684828134e-05, "epoch": 1.23125, "percentage": 61.56, "elapsed_time": "0:56:23", "remaining_time": "0:35:12"}
{"current_steps": 198, "total_steps": 320, "loss": 0.1137, "lr": 3.8115705383691355e-05, "epoch": 1.2375, "percentage": 61.88, "elapsed_time": "0:56:40", "remaining_time": "0:34:55"}
{"current_steps": 199, "total_steps": 320, "loss": 0.1411, "lr": 3.758663803131418e-05, "epoch": 1.24375, "percentage": 62.19, "elapsed_time": "0:56:57", "remaining_time": "0:34:38"}
{"current_steps": 200, "total_steps": 320, "loss": 0.117, "lr": 3.705904774487396e-05, "epoch": 1.25, "percentage": 62.5, "elapsed_time": "0:57:14", "remaining_time": "0:34:20"}
{"current_steps": 200, "total_steps": 320, "eval_loss": 0.13555637001991272, "epoch": 1.25, "percentage": 62.5, "elapsed_time": "0:57:29", "remaining_time": "0:34:29"}
{"current_steps": 201, "total_steps": 320, "loss": 0.1317, "lr": 3.65329973023387e-05, "epoch": 1.25625, "percentage": 62.81, "elapsed_time": "0:57:47", "remaining_time": "0:34:13"}
{"current_steps": 202, "total_steps": 320, "loss": 0.1485, "lr": 3.60085492984504e-05, "epoch": 1.2625, "percentage": 63.12, "elapsed_time": "0:58:04", "remaining_time": "0:33:55"}
{"current_steps": 203, "total_steps": 320, "loss": 0.127, "lr": 3.5485766137276894e-05, "epoch": 1.26875, "percentage": 63.44, "elapsed_time": "0:58:22", "remaining_time": "0:33:38"}
{"current_steps": 204, "total_steps": 320, "loss": 0.1298, "lr": 3.4964710024786354e-05, "epoch": 1.275, "percentage": 63.75, "elapsed_time": "0:58:39", "remaining_time": "0:33:21"}
{"current_steps": 205, "total_steps": 320, "loss": 0.1218, "lr": 3.4445442961445464e-05, "epoch": 1.28125, "percentage": 64.06, "elapsed_time": "0:58:56", "remaining_time": "0:33:03"}
{"current_steps": 206, "total_steps": 320, "loss": 0.0911, "lr": 3.392802673484193e-05, "epoch": 1.2875, "percentage": 64.38, "elapsed_time": "0:59:13", "remaining_time": "0:32:46"}
{"current_steps": 207, "total_steps": 320, "loss": 0.1105, "lr": 3.341252291233241e-05, "epoch": 1.29375, "percentage": 64.69, "elapsed_time": "0:59:30", "remaining_time": "0:32:29"}
{"current_steps": 208, "total_steps": 320, "loss": 0.157, "lr": 3.289899283371657e-05, "epoch": 1.3, "percentage": 65.0, "elapsed_time": "0:59:47", "remaining_time": "0:32:11"}
{"current_steps": 209, "total_steps": 320, "loss": 0.1167, "lr": 3.2387497603938326e-05, "epoch": 1.30625, "percentage": 65.31, "elapsed_time": "1:00:04", "remaining_time": "0:31:54"}
{"current_steps": 210, "total_steps": 320, "loss": 0.1267, "lr": 3.1878098085814924e-05, "epoch": 1.3125, "percentage": 65.62, "elapsed_time": "1:00:21", "remaining_time": "0:31:37"}
{"current_steps": 211, "total_steps": 320, "loss": 0.1405, "lr": 3.137085489279485e-05, "epoch": 1.31875, "percentage": 65.94, "elapsed_time": "1:00:38", "remaining_time": "0:31:19"}
{"current_steps": 212, "total_steps": 320, "loss": 0.1454, "lr": 3.086582838174551e-05, "epoch": 1.325, "percentage": 66.25, "elapsed_time": "1:00:55", "remaining_time": "0:31:02"}
{"current_steps": 213, "total_steps": 320, "loss": 0.1228, "lr": 3.0363078645771303e-05, "epoch": 1.33125, "percentage": 66.56, "elapsed_time": "1:01:12", "remaining_time": "0:30:45"}
{"current_steps": 214, "total_steps": 320, "loss": 0.1155, "lr": 2.9862665507063147e-05, "epoch": 1.3375, "percentage": 66.88, "elapsed_time": "1:01:30", "remaining_time": "0:30:27"}
{"current_steps": 215, "total_steps": 320, "loss": 0.114, "lr": 2.936464850978027e-05, "epoch": 1.34375, "percentage": 67.19, "elapsed_time": "1:01:47", "remaining_time": "0:30:10"}
{"current_steps": 216, "total_steps": 320, "loss": 0.131, "lr": 2.886908691296504e-05, "epoch": 1.35, "percentage": 67.5, "elapsed_time": "1:02:04", "remaining_time": "0:29:53"}
{"current_steps": 217, "total_steps": 320, "loss": 0.118, "lr": 2.8376039683491686e-05, "epoch": 1.35625, "percentage": 67.81, "elapsed_time": "1:02:21", "remaining_time": "0:29:35"}
{"current_steps": 218, "total_steps": 320, "loss": 0.1206, "lr": 2.7885565489049946e-05, "epoch": 1.3625, "percentage": 68.12, "elapsed_time": "1:02:38", "remaining_time": "0:29:18"}
{"current_steps": 219, "total_steps": 320, "loss": 0.1196, "lr": 2.7397722691164018e-05, "epoch": 1.36875, "percentage": 68.44, "elapsed_time": "1:02:55", "remaining_time": "0:29:01"}
{"current_steps": 220, "total_steps": 320, "loss": 0.1257, "lr": 2.6912569338248315e-05, "epoch": 1.375, "percentage": 68.75, "elapsed_time": "1:03:12", "remaining_time": "0:28:43"}
{"current_steps": 221, "total_steps": 320, "loss": 0.1078, "lr": 2.6430163158700115e-05, "epoch": 1.38125, "percentage": 69.06, "elapsed_time": "1:03:29", "remaining_time": "0:28:26"}
{"current_steps": 222, "total_steps": 320, "loss": 0.1039, "lr": 2.595056155403063e-05, "epoch": 1.3875, "percentage": 69.38, "elapsed_time": "1:03:47", "remaining_time": "0:28:09"}
{"current_steps": 223, "total_steps": 320, "loss": 0.1044, "lr": 2.54738215920346e-05, "epoch": 1.39375, "percentage": 69.69, "elapsed_time": "1:04:04", "remaining_time": "0:27:52"}
{"current_steps": 224, "total_steps": 320, "loss": 0.1152, "lr": 2.500000000000001e-05, "epoch": 1.4, "percentage": 70.0, "elapsed_time": "1:04:21", "remaining_time": "0:27:34"}
{"current_steps": 225, "total_steps": 320, "loss": 0.1234, "lr": 2.4529153157957913e-05, "epoch": 1.40625, "percentage": 70.31, "elapsed_time": "1:04:38", "remaining_time": "0:27:17"}
{"current_steps": 226, "total_steps": 320, "loss": 0.1193, "lr": 2.4061337091973918e-05, "epoch": 1.4125, "percentage": 70.62, "elapsed_time": "1:04:55", "remaining_time": "0:27:00"}
{"current_steps": 227, "total_steps": 320, "loss": 0.1452, "lr": 2.3596607467481603e-05, "epoch": 1.41875, "percentage": 70.94, "elapsed_time": "1:05:12", "remaining_time": "0:26:43"}
{"current_steps": 228, "total_steps": 320, "loss": 0.0936, "lr": 2.3135019582658802e-05, "epoch": 1.425, "percentage": 71.25, "elapsed_time": "1:05:29", "remaining_time": "0:26:25"}
{"current_steps": 229, "total_steps": 320, "loss": 0.1194, "lr": 2.2676628361847836e-05, "epoch": 1.43125, "percentage": 71.56, "elapsed_time": "1:05:46", "remaining_time": "0:26:08"}
{"current_steps": 230, "total_steps": 320, "loss": 0.1328, "lr": 2.2221488349019903e-05, "epoch": 1.4375, "percentage": 71.88, "elapsed_time": "1:06:04", "remaining_time": "0:25:51"}
{"current_steps": 231, "total_steps": 320, "loss": 0.1079, "lr": 2.176965370128498e-05, "epoch": 1.44375, "percentage": 72.19, "elapsed_time": "1:06:21", "remaining_time": "0:25:33"}
{"current_steps": 232, "total_steps": 320, "loss": 0.1225, "lr": 2.132117818244771e-05, "epoch": 1.45, "percentage": 72.5, "elapsed_time": "1:06:38", "remaining_time": "0:25:16"}
{"current_steps": 233, "total_steps": 320, "loss": 0.1521, "lr": 2.08761151566099e-05, "epoch": 1.45625, "percentage": 72.81, "elapsed_time": "1:06:55", "remaining_time": "0:24:59"}
{"current_steps": 234, "total_steps": 320, "loss": 0.1214, "lr": 2.0434517581820896e-05, "epoch": 1.4625, "percentage": 73.12, "elapsed_time": "1:07:12", "remaining_time": "0:24:42"}
{"current_steps": 235, "total_steps": 320, "loss": 0.1305, "lr": 1.999643800377596e-05, "epoch": 1.46875, "percentage": 73.44, "elapsed_time": "1:07:29", "remaining_time": "0:24:24"}
{"current_steps": 236, "total_steps": 320, "loss": 0.1259, "lr": 1.9561928549563968e-05, "epoch": 1.475, "percentage": 73.75, "elapsed_time": "1:07:46", "remaining_time": "0:24:07"}
{"current_steps": 237, "total_steps": 320, "loss": 0.1313, "lr": 1.913104092146476e-05, "epoch": 1.48125, "percentage": 74.06, "elapsed_time": "1:08:03", "remaining_time": "0:23:50"}
{"current_steps": 238, "total_steps": 320, "loss": 0.1082, "lr": 1.8703826390797048e-05, "epoch": 1.4875, "percentage": 74.38, "elapsed_time": "1:08:20", "remaining_time": "0:23:32"}
{"current_steps": 239, "total_steps": 320, "loss": 0.1254, "lr": 1.8280335791817733e-05, "epoch": 1.49375, "percentage": 74.69, "elapsed_time": "1:08:37", "remaining_time": "0:23:15"}
{"current_steps": 240, "total_steps": 320, "loss": 0.0976, "lr": 1.7860619515673033e-05, "epoch": 1.5, "percentage": 75.0, "elapsed_time": "1:08:54", "remaining_time": "0:22:58"}
{"current_steps": 241, "total_steps": 320, "loss": 0.118, "lr": 1.7444727504402553e-05, "epoch": 1.50625, "percentage": 75.31, "elapsed_time": "1:09:12", "remaining_time": "0:22:41"}
{"current_steps": 242, "total_steps": 320, "loss": 0.1221, "lr": 1.703270924499656e-05, "epoch": 1.5125, "percentage": 75.62, "elapsed_time": "1:09:29", "remaining_time": "0:22:23"}
{"current_steps": 243, "total_steps": 320, "loss": 0.1415, "lr": 1.662461376350764e-05, "epoch": 1.51875, "percentage": 75.94, "elapsed_time": "1:09:46", "remaining_time": "0:22:06"}
{"current_steps": 244, "total_steps": 320, "loss": 0.1241, "lr": 1.622048961921699e-05, "epoch": 1.525, "percentage": 76.25, "elapsed_time": "1:10:03", "remaining_time": "0:21:49"}
{"current_steps": 245, "total_steps": 320, "loss": 0.1109, "lr": 1.5820384898856434e-05, "epoch": 1.53125, "percentage": 76.56, "elapsed_time": "1:10:20", "remaining_time": "0:21:31"}
{"current_steps": 246, "total_steps": 320, "loss": 0.1171, "lr": 1.5424347210886538e-05, "epoch": 1.5375, "percentage": 76.88, "elapsed_time": "1:10:37", "remaining_time": "0:21:14"}
{"current_steps": 247, "total_steps": 320, "loss": 0.1087, "lr": 1.5032423679831642e-05, "epoch": 1.54375, "percentage": 77.19, "elapsed_time": "1:10:54", "remaining_time": "0:20:57"}
{"current_steps": 248, "total_steps": 320, "loss": 0.1228, "lr": 1.4644660940672627e-05, "epoch": 1.55, "percentage": 77.5, "elapsed_time": "1:11:11", "remaining_time": "0:20:40"}
{"current_steps": 249, "total_steps": 320, "loss": 0.1217, "lr": 1.4261105133297692e-05, "epoch": 1.55625, "percentage": 77.81, "elapsed_time": "1:11:28", "remaining_time": "0:20:22"}
{"current_steps": 250, "total_steps": 320, "loss": 0.1114, "lr": 1.3881801897012225e-05, "epoch": 1.5625, "percentage": 78.12, "elapsed_time": "1:11:46", "remaining_time": "0:20:05"}
{"current_steps": 251, "total_steps": 320, "loss": 0.1022, "lr": 1.3506796365108232e-05, "epoch": 1.56875, "percentage": 78.44, "elapsed_time": "1:12:03", "remaining_time": "0:19:48"}
{"current_steps": 252, "total_steps": 320, "loss": 0.1114, "lr": 1.3136133159493802e-05, "epoch": 1.575, "percentage": 78.75, "elapsed_time": "1:12:20", "remaining_time": "0:19:31"}
{"current_steps": 253, "total_steps": 320, "loss": 0.1183, "lr": 1.2769856385383688e-05, "epoch": 1.58125, "percentage": 79.06, "elapsed_time": "1:12:37", "remaining_time": "0:19:13"}
{"current_steps": 254, "total_steps": 320, "loss": 0.1152, "lr": 1.2408009626051137e-05, "epoch": 1.5875, "percentage": 79.38, "elapsed_time": "1:12:54", "remaining_time": "0:18:56"}
{"current_steps": 255, "total_steps": 320, "loss": 0.0925, "lr": 1.2050635937641908e-05, "epoch": 1.59375, "percentage": 79.69, "elapsed_time": "1:13:11", "remaining_time": "0:18:39"}
{"current_steps": 256, "total_steps": 320, "loss": 0.1283, "lr": 1.1697777844051105e-05, "epoch": 1.6, "percentage": 80.0, "elapsed_time": "1:13:28", "remaining_time": "0:18:22"}
{"current_steps": 257, "total_steps": 320, "loss": 0.13, "lr": 1.134947733186315e-05, "epoch": 1.60625, "percentage": 80.31, "elapsed_time": "1:13:46", "remaining_time": "0:18:04"}
{"current_steps": 258, "total_steps": 320, "loss": 0.1107, "lr": 1.100577584535592e-05, "epoch": 1.6125, "percentage": 80.62, "elapsed_time": "1:14:03", "remaining_time": "0:17:47"}
{"current_steps": 259, "total_steps": 320, "loss": 0.1061, "lr": 1.0666714281569151e-05, "epoch": 1.61875, "percentage": 80.94, "elapsed_time": "1:14:20", "remaining_time": "0:17:30"}
{"current_steps": 260, "total_steps": 320, "loss": 0.1151, "lr": 1.0332332985438248e-05, "epoch": 1.625, "percentage": 81.25, "elapsed_time": "1:14:37", "remaining_time": "0:17:13"}
{"current_steps": 261, "total_steps": 320, "loss": 0.1288, "lr": 1.000267174499352e-05, "epoch": 1.63125, "percentage": 81.56, "elapsed_time": "1:14:54", "remaining_time": "0:16:55"}
{"current_steps": 262, "total_steps": 320, "loss": 0.1096, "lr": 9.677769786625867e-06, "epoch": 1.6375, "percentage": 81.88, "elapsed_time": "1:15:11", "remaining_time": "0:16:38"}
{"current_steps": 263, "total_steps": 320, "loss": 0.0998, "lr": 9.357665770419244e-06, "epoch": 1.64375, "percentage": 82.19, "elapsed_time": "1:15:28", "remaining_time": "0:16:21"}
{"current_steps": 264, "total_steps": 320, "loss": 0.1083, "lr": 9.042397785550405e-06, "epoch": 1.65, "percentage": 82.5, "elapsed_time": "1:15:45", "remaining_time": "0:16:04"}
{"current_steps": 265, "total_steps": 320, "loss": 0.118, "lr": 8.732003345756811e-06, "epoch": 1.65625, "percentage": 82.81, "elapsed_time": "1:16:02", "remaining_time": "0:15:46"}
{"current_steps": 266, "total_steps": 320, "loss": 0.1088, "lr": 8.426519384872733e-06, "epoch": 1.6625, "percentage": 83.12, "elapsed_time": "1:16:19", "remaining_time": "0:15:29"}
{"current_steps": 267, "total_steps": 320, "loss": 0.1239, "lr": 8.125982252434611e-06, "epoch": 1.66875, "percentage": 83.44, "elapsed_time": "1:16:36", "remaining_time": "0:15:12"}
{"current_steps": 268, "total_steps": 320, "loss": 0.1164, "lr": 7.830427709355725e-06, "epoch": 1.675, "percentage": 83.75, "elapsed_time": "1:16:54", "remaining_time": "0:14:55"}
{"current_steps": 269, "total_steps": 320, "loss": 0.0855, "lr": 7.539890923671062e-06, "epoch": 1.68125, "percentage": 84.06, "elapsed_time": "1:17:11", "remaining_time": "0:14:38"}
{"current_steps": 270, "total_steps": 320, "loss": 0.1395, "lr": 7.2544064663526815e-06, "epoch": 1.6875, "percentage": 84.38, "elapsed_time": "1:17:28", "remaining_time": "0:14:20"}
{"current_steps": 271, "total_steps": 320, "loss": 0.1081, "lr": 6.974008307196056e-06, "epoch": 1.69375, "percentage": 84.69, "elapsed_time": "1:17:45", "remaining_time": "0:14:03"}
{"current_steps": 272, "total_steps": 320, "loss": 0.1358, "lr": 6.698729810778065e-06, "epoch": 1.7, "percentage": 85.0, "elapsed_time": "1:18:02", "remaining_time": "0:13:46"}
{"current_steps": 273, "total_steps": 320, "loss": 0.1208, "lr": 6.428603732486937e-06, "epoch": 1.70625, "percentage": 85.31, "elapsed_time": "1:18:20", "remaining_time": "0:13:29"}
{"current_steps": 274, "total_steps": 320, "loss": 0.1208, "lr": 6.163662214624616e-06, "epoch": 1.7125, "percentage": 85.62, "elapsed_time": "1:18:37", "remaining_time": "0:13:11"}
{"current_steps": 275, "total_steps": 320, "loss": 0.0961, "lr": 5.903936782582253e-06, "epoch": 1.71875, "percentage": 85.94, "elapsed_time": "1:18:54", "remaining_time": "0:12:54"}
{"current_steps": 276, "total_steps": 320, "loss": 0.1328, "lr": 5.649458341088915e-06, "epoch": 1.725, "percentage": 86.25, "elapsed_time": "1:19:11", "remaining_time": "0:12:37"}
{"current_steps": 277, "total_steps": 320, "loss": 0.1137, "lr": 5.400257170534295e-06, "epoch": 1.73125, "percentage": 86.56, "elapsed_time": "1:19:28", "remaining_time": "0:12:20"}
{"current_steps": 278, "total_steps": 320, "loss": 0.0963, "lr": 5.156362923365588e-06, "epoch": 1.7375, "percentage": 86.88, "elapsed_time": "1:19:46", "remaining_time": "0:12:03"}
{"current_steps": 279, "total_steps": 320, "loss": 0.1299, "lr": 4.917804620559202e-06, "epoch": 1.74375, "percentage": 87.19, "elapsed_time": "1:20:03", "remaining_time": "0:11:45"}
{"current_steps": 280, "total_steps": 320, "loss": 0.1003, "lr": 4.684610648167503e-06, "epoch": 1.75, "percentage": 87.5, "elapsed_time": "1:20:20", "remaining_time": "0:11:28"}
{"current_steps": 281, "total_steps": 320, "loss": 0.1005, "lr": 4.456808753941205e-06, "epoch": 1.75625, "percentage": 87.81, "elapsed_time": "1:20:37", "remaining_time": "0:11:11"}
{"current_steps": 282, "total_steps": 320, "loss": 0.1184, "lr": 4.234426044027645e-06, "epoch": 1.7625, "percentage": 88.12, "elapsed_time": "1:20:54", "remaining_time": "0:10:54"}
{"current_steps": 283, "total_steps": 320, "loss": 0.1083, "lr": 4.017488979745387e-06, "epoch": 1.76875, "percentage": 88.44, "elapsed_time": "1:21:11", "remaining_time": "0:10:36"}
{"current_steps": 284, "total_steps": 320, "loss": 0.1349, "lr": 3.8060233744356633e-06, "epoch": 1.775, "percentage": 88.75, "elapsed_time": "1:21:28", "remaining_time": "0:10:19"}
{"current_steps": 285, "total_steps": 320, "loss": 0.1189, "lr": 3.600054390390778e-06, "epoch": 1.78125, "percentage": 89.06, "elapsed_time": "1:21:45", "remaining_time": "0:10:02"}
{"current_steps": 286, "total_steps": 320, "loss": 0.1124, "lr": 3.3996065358600782e-06, "epoch": 1.7875, "percentage": 89.38, "elapsed_time": "1:22:03", "remaining_time": "0:09:45"}
{"current_steps": 287, "total_steps": 320, "loss": 0.1242, "lr": 3.2047036621337236e-06, "epoch": 1.79375, "percentage": 89.69, "elapsed_time": "1:22:20", "remaining_time": "0:09:28"}
{"current_steps": 288, "total_steps": 320, "loss": 0.1269, "lr": 3.0153689607045845e-06, "epoch": 1.8, "percentage": 90.0, "elapsed_time": "1:22:37", "remaining_time": "0:09:10"}
{"current_steps": 289, "total_steps": 320, "loss": 0.108, "lr": 2.8316249605087386e-06, "epoch": 1.80625, "percentage": 90.31, "elapsed_time": "1:22:54", "remaining_time": "0:08:53"}
{"current_steps": 290, "total_steps": 320, "loss": 0.104, "lr": 2.653493525244721e-06, "epoch": 1.8125, "percentage": 90.62, "elapsed_time": "1:23:11", "remaining_time": "0:08:36"}
{"current_steps": 291, "total_steps": 320, "loss": 0.1227, "lr": 2.4809958507719444e-06, "epoch": 1.81875, "percentage": 90.94, "elapsed_time": "1:23:28", "remaining_time": "0:08:19"}
{"current_steps": 292, "total_steps": 320, "loss": 0.1122, "lr": 2.314152462588659e-06, "epoch": 1.825, "percentage": 91.25, "elapsed_time": "1:23:45", "remaining_time": "0:08:01"}
{"current_steps": 293, "total_steps": 320, "loss": 0.1206, "lr": 2.152983213389559e-06, "epoch": 1.83125, "percentage": 91.56, "elapsed_time": "1:24:02", "remaining_time": "0:07:44"}
{"current_steps": 294, "total_steps": 320, "loss": 0.0849, "lr": 1.99750728070357e-06, "epoch": 1.8375, "percentage": 91.88, "elapsed_time": "1:24:19", "remaining_time": "0:07:27"}
{"current_steps": 295, "total_steps": 320, "loss": 0.1168, "lr": 1.8477431646118648e-06, "epoch": 1.84375, "percentage": 92.19, "elapsed_time": "1:24:36", "remaining_time": "0:07:10"}
{"current_steps": 296, "total_steps": 320, "loss": 0.1002, "lr": 1.70370868554659e-06, "epoch": 1.85, "percentage": 92.5, "elapsed_time": "1:24:53", "remaining_time": "0:06:53"}
{"current_steps": 297, "total_steps": 320, "loss": 0.1204, "lr": 1.565420982170346e-06, "epoch": 1.85625, "percentage": 92.81, "elapsed_time": "1:25:11", "remaining_time": "0:06:35"}
{"current_steps": 298, "total_steps": 320, "loss": 0.1052, "lr": 1.4328965093369283e-06, "epoch": 1.8625, "percentage": 93.12, "elapsed_time": "1:25:28", "remaining_time": "0:06:18"}
{"current_steps": 299, "total_steps": 320, "loss": 0.1185, "lr": 1.3061510361333185e-06, "epoch": 1.86875, "percentage": 93.44, "elapsed_time": "1:25:45", "remaining_time": "0:06:01"}
{"current_steps": 300, "total_steps": 320, "loss": 0.1372, "lr": 1.1851996440033319e-06, "epoch": 1.875, "percentage": 93.75, "elapsed_time": "1:26:02", "remaining_time": "0:05:44"}
{"current_steps": 301, "total_steps": 320, "loss": 0.1374, "lr": 1.0700567249530834e-06, "epoch": 1.88125, "percentage": 94.06, "elapsed_time": "1:27:49", "remaining_time": "0:05:32"}
{"current_steps": 302, "total_steps": 320, "loss": 0.1265, "lr": 9.607359798384785e-07, "epoch": 1.8875, "percentage": 94.38, "elapsed_time": "1:28:07", "remaining_time": "0:05:15"}
{"current_steps": 303, "total_steps": 320, "loss": 0.1156, "lr": 8.572504167349449e-07, "epoch": 1.89375, "percentage": 94.69, "elapsed_time": "1:28:24", "remaining_time": "0:04:57"}
{"current_steps": 304, "total_steps": 320, "loss": 0.1131, "lr": 7.596123493895991e-07, "epoch": 1.9, "percentage": 95.0, "elapsed_time": "1:28:41", "remaining_time": "0:04:40"}
{"current_steps": 305, "total_steps": 320, "loss": 0.1212, "lr": 6.678333957560512e-07, "epoch": 1.90625, "percentage": 95.31, "elapsed_time": "1:28:58", "remaining_time": "0:04:22"}
{"current_steps": 306, "total_steps": 320, "loss": 0.1249, "lr": 5.81924476611967e-07, "epoch": 1.9125, "percentage": 95.62, "elapsed_time": "1:29:16", "remaining_time": "0:04:05"}
{"current_steps": 307, "total_steps": 320, "loss": 0.1123, "lr": 5.018958142596065e-07, "epoch": 1.91875, "percentage": 95.94, "elapsed_time": "1:29:33", "remaining_time": "0:03:47"}
{"current_steps": 308, "total_steps": 320, "loss": 0.1017, "lr": 4.277569313094809e-07, "epoch": 1.925, "percentage": 96.25, "elapsed_time": "1:29:50", "remaining_time": "0:03:30"}
{"current_steps": 309, "total_steps": 320, "loss": 0.1265, "lr": 3.59516649547248e-07, "epoch": 1.93125, "percentage": 96.56, "elapsed_time": "1:30:07", "remaining_time": "0:03:12"}
{"current_steps": 310, "total_steps": 320, "loss": 0.139, "lr": 2.971830888840177e-07, "epoch": 1.9375, "percentage": 96.88, "elapsed_time": "1:30:24", "remaining_time": "0:02:54"}
{"current_steps": 311, "total_steps": 320, "loss": 0.1015, "lr": 2.407636663901591e-07, "epoch": 1.94375, "percentage": 97.19, "elapsed_time": "1:30:42", "remaining_time": "0:02:37"}
{"current_steps": 312, "total_steps": 320, "loss": 0.1294, "lr": 1.9026509541272275e-07, "epoch": 1.95, "percentage": 97.5, "elapsed_time": "1:30:59", "remaining_time": "0:02:19"}
{"current_steps": 313, "total_steps": 320, "loss": 0.1282, "lr": 1.4569338477666838e-07, "epoch": 1.95625, "percentage": 97.81, "elapsed_time": "1:31:16", "remaining_time": "0:02:02"}
{"current_steps": 314, "total_steps": 320, "loss": 0.1103, "lr": 1.0705383806982606e-07, "epoch": 1.9625, "percentage": 98.12, "elapsed_time": "1:31:33", "remaining_time": "0:01:44"}
{"current_steps": 315, "total_steps": 320, "loss": 0.1114, "lr": 7.43510530118452e-08, "epoch": 1.96875, "percentage": 98.44, "elapsed_time": "1:31:51", "remaining_time": "0:01:27"}
{"current_steps": 316, "total_steps": 320, "loss": 0.1202, "lr": 4.7588920907110094e-08, "epoch": 1.975, "percentage": 98.75, "elapsed_time": "1:32:08", "remaining_time": "0:01:09"}
{"current_steps": 317, "total_steps": 320, "loss": 0.1172, "lr": 2.6770626181715773e-08, "epoch": 1.98125, "percentage": 99.06, "elapsed_time": "1:32:25", "remaining_time": "0:00:52"}
{"current_steps": 318, "total_steps": 320, "loss": 0.1239, "lr": 1.189864600454338e-08, "epoch": 1.9875, "percentage": 99.38, "elapsed_time": "1:32:42", "remaining_time": "0:00:34"}
{"current_steps": 319, "total_steps": 320, "loss": 0.1275, "lr": 2.974749992512571e-09, "epoch": 1.99375, "percentage": 99.69, "elapsed_time": "1:32:59", "remaining_time": "0:00:17"}
{"current_steps": 320, "total_steps": 320, "loss": 0.1243, "lr": 0.0, "epoch": 2.0, "percentage": 100.0, "elapsed_time": "1:33:16", "remaining_time": "0:00:00"}
{"current_steps": 320, "total_steps": 320, "epoch": 2.0, "percentage": 100.0, "elapsed_time": "1:35:10", "remaining_time": "0:00:00"}