alinerodrigues commited on
Commit
31fac2e
·
1 Parent(s): d4d10c2

End of training

Browse files
Files changed (4) hide show
  1. all_results.json +17 -0
  2. eval_results.json +11 -0
  3. train_results.json +9 -0
  4. trainer_state.json +1414 -0
all_results.json ADDED
@@ -0,0 +1,17 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 117.0,
3
+ "eval_cer": 0.17969062784349407,
4
+ "eval_loss": 0.5485906004905701,
5
+ "eval_per": 0.3386834620073141,
6
+ "eval_runtime": 16.5773,
7
+ "eval_samples": 542,
8
+ "eval_samples_per_second": 32.695,
9
+ "eval_steps_per_second": 4.102,
10
+ "eval_wer": 0.35107679804957337,
11
+ "total_flos": 1.462030946643386e+19,
12
+ "train_loss": 1.771814914558979,
13
+ "train_runtime": 12938.9921,
14
+ "train_samples": 448,
15
+ "train_samples_per_second": 5.194,
16
+ "train_steps_per_second": 0.162
17
+ }
eval_results.json ADDED
@@ -0,0 +1,11 @@
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 117.0,
3
+ "eval_cer": 0.17969062784349407,
4
+ "eval_loss": 0.5485906004905701,
5
+ "eval_per": 0.3386834620073141,
6
+ "eval_runtime": 16.5773,
7
+ "eval_samples": 542,
8
+ "eval_samples_per_second": 32.695,
9
+ "eval_steps_per_second": 4.102,
10
+ "eval_wer": 0.35107679804957337
11
+ }
train_results.json ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 117.0,
3
+ "total_flos": 1.462030946643386e+19,
4
+ "train_loss": 1.771814914558979,
5
+ "train_runtime": 12938.9921,
6
+ "train_samples": 448,
7
+ "train_samples_per_second": 5.194,
8
+ "train_steps_per_second": 0.162
9
+ }
trainer_state.json ADDED
@@ -0,0 +1,1414 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "best_metric": 0.5485906004905701,
3
+ "best_model_checkpoint": "wav2vec2-large-xlsr-coraa-exp-17/checkpoint-1358",
4
+ "epoch": 117.0,
5
+ "global_step": 1638,
6
+ "is_hyper_param_search": false,
7
+ "is_local_process_zero": true,
8
+ "is_world_process_zero": true,
9
+ "log_history": [
10
+ {
11
+ "epoch": 0.07,
12
+ "learning_rate": 0.0,
13
+ "loss": 38.4208,
14
+ "step": 1
15
+ },
16
+ {
17
+ "epoch": 1.0,
18
+ "eval_cer": 1.2145950864422201,
19
+ "eval_loss": 41.80952453613281,
20
+ "eval_per": 1.0056887444128404,
21
+ "eval_runtime": 16.4211,
22
+ "eval_samples_per_second": 33.006,
23
+ "eval_steps_per_second": 4.141,
24
+ "eval_wer": 1.0056887444128404,
25
+ "step": 14
26
+ },
27
+ {
28
+ "epoch": 2.0,
29
+ "eval_cer": 0.9618562329390354,
30
+ "eval_loss": 12.287281036376953,
31
+ "eval_per": 1.0,
32
+ "eval_runtime": 16.3942,
33
+ "eval_samples_per_second": 33.06,
34
+ "eval_steps_per_second": 4.148,
35
+ "eval_wer": 1.0,
36
+ "step": 28
37
+ },
38
+ {
39
+ "epoch": 3.0,
40
+ "eval_cer": 0.9618562329390354,
41
+ "eval_loss": 4.809342861175537,
42
+ "eval_per": 1.0,
43
+ "eval_runtime": 17.8009,
44
+ "eval_samples_per_second": 30.448,
45
+ "eval_steps_per_second": 3.82,
46
+ "eval_wer": 1.0,
47
+ "step": 42
48
+ },
49
+ {
50
+ "epoch": 4.0,
51
+ "eval_cer": 0.9618562329390354,
52
+ "eval_loss": 3.9737813472747803,
53
+ "eval_per": 1.0,
54
+ "eval_runtime": 16.1587,
55
+ "eval_samples_per_second": 33.542,
56
+ "eval_steps_per_second": 4.208,
57
+ "eval_wer": 1.0,
58
+ "step": 56
59
+ },
60
+ {
61
+ "epoch": 5.0,
62
+ "eval_cer": 0.9618562329390354,
63
+ "eval_loss": 3.6683900356292725,
64
+ "eval_per": 1.0,
65
+ "eval_runtime": 17.3608,
66
+ "eval_samples_per_second": 31.22,
67
+ "eval_steps_per_second": 3.917,
68
+ "eval_wer": 1.0,
69
+ "step": 70
70
+ },
71
+ {
72
+ "epoch": 6.0,
73
+ "eval_cer": 0.9618562329390354,
74
+ "eval_loss": 3.5007262229919434,
75
+ "eval_per": 1.0,
76
+ "eval_runtime": 16.8377,
77
+ "eval_samples_per_second": 32.19,
78
+ "eval_steps_per_second": 4.039,
79
+ "eval_wer": 1.0,
80
+ "step": 84
81
+ },
82
+ {
83
+ "epoch": 7.0,
84
+ "eval_cer": 0.9618562329390354,
85
+ "eval_loss": 3.3854148387908936,
86
+ "eval_per": 1.0,
87
+ "eval_runtime": 15.8896,
88
+ "eval_samples_per_second": 34.11,
89
+ "eval_steps_per_second": 4.28,
90
+ "eval_wer": 1.0,
91
+ "step": 98
92
+ },
93
+ {
94
+ "epoch": 7.14,
95
+ "learning_rate": 3.853775853775854e-05,
96
+ "loss": 11.8009,
97
+ "step": 100
98
+ },
99
+ {
100
+ "epoch": 8.0,
101
+ "eval_cer": 0.9618562329390354,
102
+ "eval_loss": 3.450645923614502,
103
+ "eval_per": 1.0,
104
+ "eval_runtime": 16.3597,
105
+ "eval_samples_per_second": 33.13,
106
+ "eval_steps_per_second": 4.157,
107
+ "eval_wer": 1.0,
108
+ "step": 112
109
+ },
110
+ {
111
+ "epoch": 9.0,
112
+ "eval_cer": 0.9618562329390354,
113
+ "eval_loss": 3.178906202316284,
114
+ "eval_per": 1.0,
115
+ "eval_runtime": 16.1702,
116
+ "eval_samples_per_second": 33.519,
117
+ "eval_steps_per_second": 4.205,
118
+ "eval_wer": 1.0,
119
+ "step": 126
120
+ },
121
+ {
122
+ "epoch": 10.0,
123
+ "eval_cer": 0.9618562329390354,
124
+ "eval_loss": 3.1274373531341553,
125
+ "eval_per": 1.0,
126
+ "eval_runtime": 16.9804,
127
+ "eval_samples_per_second": 31.919,
128
+ "eval_steps_per_second": 4.005,
129
+ "eval_wer": 1.0,
130
+ "step": 140
131
+ },
132
+ {
133
+ "epoch": 11.0,
134
+ "eval_cer": 0.9618562329390354,
135
+ "eval_loss": 3.1624248027801514,
136
+ "eval_per": 1.0,
137
+ "eval_runtime": 16.0626,
138
+ "eval_samples_per_second": 33.743,
139
+ "eval_steps_per_second": 4.233,
140
+ "eval_wer": 1.0,
141
+ "step": 154
142
+ },
143
+ {
144
+ "epoch": 12.0,
145
+ "eval_cer": 0.9618562329390354,
146
+ "eval_loss": 3.1065869331359863,
147
+ "eval_per": 1.0,
148
+ "eval_runtime": 15.7377,
149
+ "eval_samples_per_second": 34.44,
150
+ "eval_steps_per_second": 4.321,
151
+ "eval_wer": 1.0,
152
+ "step": 168
153
+ },
154
+ {
155
+ "epoch": 13.0,
156
+ "eval_cer": 0.9618562329390354,
157
+ "eval_loss": 3.0579798221588135,
158
+ "eval_per": 1.0,
159
+ "eval_runtime": 16.1086,
160
+ "eval_samples_per_second": 33.647,
161
+ "eval_steps_per_second": 4.221,
162
+ "eval_wer": 1.0,
163
+ "step": 182
164
+ },
165
+ {
166
+ "epoch": 14.0,
167
+ "eval_cer": 0.9618562329390354,
168
+ "eval_loss": 3.0477194786071777,
169
+ "eval_per": 1.0,
170
+ "eval_runtime": 17.7392,
171
+ "eval_samples_per_second": 30.554,
172
+ "eval_steps_per_second": 3.833,
173
+ "eval_wer": 1.0,
174
+ "step": 196
175
+ },
176
+ {
177
+ "epoch": 14.29,
178
+ "learning_rate": 3.6613756613756616e-05,
179
+ "loss": 3.0395,
180
+ "step": 200
181
+ },
182
+ {
183
+ "epoch": 15.0,
184
+ "eval_cer": 0.9618562329390354,
185
+ "eval_loss": 3.051933526992798,
186
+ "eval_per": 1.0,
187
+ "eval_runtime": 16.5102,
188
+ "eval_samples_per_second": 32.828,
189
+ "eval_steps_per_second": 4.119,
190
+ "eval_wer": 1.0,
191
+ "step": 210
192
+ },
193
+ {
194
+ "epoch": 16.0,
195
+ "eval_cer": 0.9618562329390354,
196
+ "eval_loss": 3.0363881587982178,
197
+ "eval_per": 1.0,
198
+ "eval_runtime": 16.6774,
199
+ "eval_samples_per_second": 32.499,
200
+ "eval_steps_per_second": 4.077,
201
+ "eval_wer": 1.0,
202
+ "step": 224
203
+ },
204
+ {
205
+ "epoch": 17.0,
206
+ "eval_cer": 0.9618562329390354,
207
+ "eval_loss": 3.015160083770752,
208
+ "eval_per": 1.0,
209
+ "eval_runtime": 17.0522,
210
+ "eval_samples_per_second": 31.785,
211
+ "eval_steps_per_second": 3.988,
212
+ "eval_wer": 1.0,
213
+ "step": 238
214
+ },
215
+ {
216
+ "epoch": 18.0,
217
+ "eval_cer": 0.9618562329390354,
218
+ "eval_loss": 3.0166876316070557,
219
+ "eval_per": 1.0,
220
+ "eval_runtime": 16.1958,
221
+ "eval_samples_per_second": 33.465,
222
+ "eval_steps_per_second": 4.199,
223
+ "eval_wer": 1.0,
224
+ "step": 252
225
+ },
226
+ {
227
+ "epoch": 19.0,
228
+ "eval_cer": 0.9618562329390354,
229
+ "eval_loss": 3.0129683017730713,
230
+ "eval_per": 1.0,
231
+ "eval_runtime": 17.0594,
232
+ "eval_samples_per_second": 31.771,
233
+ "eval_steps_per_second": 3.986,
234
+ "eval_wer": 1.0,
235
+ "step": 266
236
+ },
237
+ {
238
+ "epoch": 20.0,
239
+ "eval_cer": 0.9618562329390354,
240
+ "eval_loss": 3.0103399753570557,
241
+ "eval_per": 1.0,
242
+ "eval_runtime": 16.6483,
243
+ "eval_samples_per_second": 32.556,
244
+ "eval_steps_per_second": 4.084,
245
+ "eval_wer": 1.0,
246
+ "step": 280
247
+ },
248
+ {
249
+ "epoch": 21.0,
250
+ "eval_cer": 0.9618562329390354,
251
+ "eval_loss": 2.9993834495544434,
252
+ "eval_per": 1.0,
253
+ "eval_runtime": 16.1419,
254
+ "eval_samples_per_second": 33.577,
255
+ "eval_steps_per_second": 4.213,
256
+ "eval_wer": 1.0,
257
+ "step": 294
258
+ },
259
+ {
260
+ "epoch": 21.43,
261
+ "learning_rate": 3.468975468975469e-05,
262
+ "loss": 2.9424,
263
+ "step": 300
264
+ },
265
+ {
266
+ "epoch": 22.0,
267
+ "eval_cer": 0.9618562329390354,
268
+ "eval_loss": 2.999858856201172,
269
+ "eval_per": 1.0,
270
+ "eval_runtime": 16.4633,
271
+ "eval_samples_per_second": 32.922,
272
+ "eval_steps_per_second": 4.13,
273
+ "eval_wer": 1.0,
274
+ "step": 308
275
+ },
276
+ {
277
+ "epoch": 23.0,
278
+ "eval_cer": 0.9618562329390354,
279
+ "eval_loss": 3.000885486602783,
280
+ "eval_per": 1.0,
281
+ "eval_runtime": 16.4157,
282
+ "eval_samples_per_second": 33.017,
283
+ "eval_steps_per_second": 4.142,
284
+ "eval_wer": 1.0,
285
+ "step": 322
286
+ },
287
+ {
288
+ "epoch": 24.0,
289
+ "eval_cer": 0.9618562329390354,
290
+ "eval_loss": 3.002438545227051,
291
+ "eval_per": 1.0,
292
+ "eval_runtime": 16.3396,
293
+ "eval_samples_per_second": 33.171,
294
+ "eval_steps_per_second": 4.162,
295
+ "eval_wer": 1.0,
296
+ "step": 336
297
+ },
298
+ {
299
+ "epoch": 25.0,
300
+ "eval_cer": 0.9618562329390354,
301
+ "eval_loss": 3.000091552734375,
302
+ "eval_per": 1.0,
303
+ "eval_runtime": 16.2524,
304
+ "eval_samples_per_second": 33.349,
305
+ "eval_steps_per_second": 4.184,
306
+ "eval_wer": 1.0,
307
+ "step": 350
308
+ },
309
+ {
310
+ "epoch": 26.0,
311
+ "eval_cer": 0.9618562329390354,
312
+ "eval_loss": 2.989057779312134,
313
+ "eval_per": 1.0,
314
+ "eval_runtime": 16.9129,
315
+ "eval_samples_per_second": 32.047,
316
+ "eval_steps_per_second": 4.021,
317
+ "eval_wer": 1.0,
318
+ "step": 364
319
+ },
320
+ {
321
+ "epoch": 27.0,
322
+ "eval_cer": 0.9618562329390354,
323
+ "eval_loss": 2.988072633743286,
324
+ "eval_per": 1.0,
325
+ "eval_runtime": 16.8979,
326
+ "eval_samples_per_second": 32.075,
327
+ "eval_steps_per_second": 4.024,
328
+ "eval_wer": 1.0,
329
+ "step": 378
330
+ },
331
+ {
332
+ "epoch": 28.0,
333
+ "eval_cer": 0.9618562329390354,
334
+ "eval_loss": 2.97031569480896,
335
+ "eval_per": 1.0,
336
+ "eval_runtime": 16.5706,
337
+ "eval_samples_per_second": 32.708,
338
+ "eval_steps_per_second": 4.104,
339
+ "eval_wer": 1.0,
340
+ "step": 392
341
+ },
342
+ {
343
+ "epoch": 28.57,
344
+ "learning_rate": 3.276575276575277e-05,
345
+ "loss": 2.9154,
346
+ "step": 400
347
+ },
348
+ {
349
+ "epoch": 29.0,
350
+ "eval_cer": 0.9618562329390354,
351
+ "eval_loss": 2.9531471729278564,
352
+ "eval_per": 1.0,
353
+ "eval_runtime": 16.0162,
354
+ "eval_samples_per_second": 33.841,
355
+ "eval_steps_per_second": 4.246,
356
+ "eval_wer": 1.0,
357
+ "step": 406
358
+ },
359
+ {
360
+ "epoch": 30.0,
361
+ "eval_cer": 0.9618562329390354,
362
+ "eval_loss": 2.920755624771118,
363
+ "eval_per": 1.0,
364
+ "eval_runtime": 16.2922,
365
+ "eval_samples_per_second": 33.267,
366
+ "eval_steps_per_second": 4.174,
367
+ "eval_wer": 1.0,
368
+ "step": 420
369
+ },
370
+ {
371
+ "epoch": 31.0,
372
+ "eval_cer": 0.9618562329390354,
373
+ "eval_loss": 2.898137331008911,
374
+ "eval_per": 1.0,
375
+ "eval_runtime": 16.1037,
376
+ "eval_samples_per_second": 33.657,
377
+ "eval_steps_per_second": 4.223,
378
+ "eval_wer": 1.0,
379
+ "step": 434
380
+ },
381
+ {
382
+ "epoch": 32.0,
383
+ "eval_cer": 0.9618562329390354,
384
+ "eval_loss": 2.8320581912994385,
385
+ "eval_per": 1.0,
386
+ "eval_runtime": 16.1007,
387
+ "eval_samples_per_second": 33.663,
388
+ "eval_steps_per_second": 4.223,
389
+ "eval_wer": 1.0,
390
+ "step": 448
391
+ },
392
+ {
393
+ "epoch": 33.0,
394
+ "eval_cer": 0.9618562329390354,
395
+ "eval_loss": 2.7583184242248535,
396
+ "eval_per": 1.0,
397
+ "eval_runtime": 16.3232,
398
+ "eval_samples_per_second": 33.204,
399
+ "eval_steps_per_second": 4.166,
400
+ "eval_wer": 1.0,
401
+ "step": 462
402
+ },
403
+ {
404
+ "epoch": 34.0,
405
+ "eval_cer": 0.9616014558689718,
406
+ "eval_loss": 2.6405322551727295,
407
+ "eval_per": 1.0,
408
+ "eval_runtime": 16.4064,
409
+ "eval_samples_per_second": 33.036,
410
+ "eval_steps_per_second": 4.145,
411
+ "eval_wer": 1.0,
412
+ "step": 476
413
+ },
414
+ {
415
+ "epoch": 35.0,
416
+ "eval_cer": 0.8832029117379436,
417
+ "eval_loss": 2.5071756839752197,
418
+ "eval_per": 1.0,
419
+ "eval_runtime": 16.3137,
420
+ "eval_samples_per_second": 33.224,
421
+ "eval_steps_per_second": 4.168,
422
+ "eval_wer": 1.0,
423
+ "step": 490
424
+ },
425
+ {
426
+ "epoch": 35.71,
427
+ "learning_rate": 3.0841750841750846e-05,
428
+ "loss": 2.7552,
429
+ "step": 500
430
+ },
431
+ {
432
+ "epoch": 36.0,
433
+ "eval_cer": 0.6144131028207461,
434
+ "eval_loss": 2.1546847820281982,
435
+ "eval_per": 1.0,
436
+ "eval_runtime": 16.1444,
437
+ "eval_samples_per_second": 33.572,
438
+ "eval_steps_per_second": 4.212,
439
+ "eval_wer": 1.0,
440
+ "step": 504
441
+ },
442
+ {
443
+ "epoch": 37.0,
444
+ "eval_cer": 0.49958143767060964,
445
+ "eval_loss": 1.7564772367477417,
446
+ "eval_per": 1.0,
447
+ "eval_runtime": 16.6494,
448
+ "eval_samples_per_second": 32.554,
449
+ "eval_steps_per_second": 4.084,
450
+ "eval_wer": 1.0,
451
+ "step": 518
452
+ },
453
+ {
454
+ "epoch": 38.0,
455
+ "eval_cer": 0.40651501364877163,
456
+ "eval_loss": 1.460233211517334,
457
+ "eval_per": 1.0,
458
+ "eval_runtime": 16.6864,
459
+ "eval_samples_per_second": 32.482,
460
+ "eval_steps_per_second": 4.075,
461
+ "eval_wer": 1.0,
462
+ "step": 532
463
+ },
464
+ {
465
+ "epoch": 39.0,
466
+ "eval_cer": 0.36578707916287534,
467
+ "eval_loss": 1.2268937826156616,
468
+ "eval_per": 0.9892320195042665,
469
+ "eval_runtime": 16.8505,
470
+ "eval_samples_per_second": 32.165,
471
+ "eval_steps_per_second": 4.035,
472
+ "eval_wer": 0.989638358390898,
473
+ "step": 546
474
+ },
475
+ {
476
+ "epoch": 40.0,
477
+ "eval_cer": 0.3204731574158326,
478
+ "eval_loss": 1.0905884504318237,
479
+ "eval_per": 0.8833807395367737,
480
+ "eval_runtime": 16.8204,
481
+ "eval_samples_per_second": 32.223,
482
+ "eval_steps_per_second": 4.043,
483
+ "eval_wer": 0.8880536367330354,
484
+ "step": 560
485
+ },
486
+ {
487
+ "epoch": 41.0,
488
+ "eval_cer": 0.26314831665150135,
489
+ "eval_loss": 0.9941390752792358,
490
+ "eval_per": 0.6603006907761073,
491
+ "eval_runtime": 16.4361,
492
+ "eval_samples_per_second": 32.976,
493
+ "eval_steps_per_second": 4.137,
494
+ "eval_wer": 0.6771637545713125,
495
+ "step": 574
496
+ },
497
+ {
498
+ "epoch": 42.0,
499
+ "eval_cer": 0.23221110100090991,
500
+ "eval_loss": 0.9132717847824097,
501
+ "eval_per": 0.5154408776919951,
502
+ "eval_runtime": 16.9668,
503
+ "eval_samples_per_second": 31.945,
504
+ "eval_steps_per_second": 4.008,
505
+ "eval_wer": 0.5422592442096709,
506
+ "step": 588
507
+ },
508
+ {
509
+ "epoch": 42.86,
510
+ "learning_rate": 2.8917748917748916e-05,
511
+ "loss": 1.4599,
512
+ "step": 600
513
+ },
514
+ {
515
+ "epoch": 43.0,
516
+ "eval_cer": 0.22413102820746134,
517
+ "eval_loss": 0.8487069010734558,
518
+ "eval_per": 0.48821617228768793,
519
+ "eval_runtime": 16.6557,
520
+ "eval_samples_per_second": 32.541,
521
+ "eval_steps_per_second": 4.083,
522
+ "eval_wer": 0.5142218610321008,
523
+ "step": 602
524
+ },
525
+ {
526
+ "epoch": 44.0,
527
+ "eval_cer": 0.22074613284804367,
528
+ "eval_loss": 0.8211185336112976,
529
+ "eval_per": 0.46261682242990654,
530
+ "eval_runtime": 16.0355,
531
+ "eval_samples_per_second": 33.8,
532
+ "eval_steps_per_second": 4.241,
533
+ "eval_wer": 0.48984152783421375,
534
+ "step": 616
535
+ },
536
+ {
537
+ "epoch": 45.0,
538
+ "eval_cer": 0.214049135577798,
539
+ "eval_loss": 0.7671909332275391,
540
+ "eval_per": 0.4518488419341731,
541
+ "eval_runtime": 16.1929,
542
+ "eval_samples_per_second": 33.471,
543
+ "eval_steps_per_second": 4.199,
544
+ "eval_wer": 0.48029256399837467,
545
+ "step": 630
546
+ },
547
+ {
548
+ "epoch": 46.0,
549
+ "eval_cer": 0.2092083712465878,
550
+ "eval_loss": 0.7431579828262329,
551
+ "eval_per": 0.44453474197480697,
552
+ "eval_runtime": 16.359,
553
+ "eval_samples_per_second": 33.132,
554
+ "eval_steps_per_second": 4.157,
555
+ "eval_wer": 0.4707436001625356,
556
+ "step": 644
557
+ },
558
+ {
559
+ "epoch": 47.0,
560
+ "eval_cer": 0.2059326660600546,
561
+ "eval_loss": 0.7389556765556335,
562
+ "eval_per": 0.42624949207639173,
563
+ "eval_runtime": 16.6785,
564
+ "eval_samples_per_second": 32.497,
565
+ "eval_steps_per_second": 4.077,
566
+ "eval_wer": 0.44920763917106865,
567
+ "step": 658
568
+ },
569
+ {
570
+ "epoch": 48.0,
571
+ "eval_cer": 0.2011282984531392,
572
+ "eval_loss": 0.699397087097168,
573
+ "eval_per": 0.41060544494108087,
574
+ "eval_runtime": 16.5887,
575
+ "eval_samples_per_second": 32.673,
576
+ "eval_steps_per_second": 4.099,
577
+ "eval_wer": 0.43478260869565216,
578
+ "step": 672
579
+ },
580
+ {
581
+ "epoch": 49.0,
582
+ "eval_cer": 0.19909008189262967,
583
+ "eval_loss": 0.6998735070228577,
584
+ "eval_per": 0.3998374644453474,
585
+ "eval_runtime": 16.3728,
586
+ "eval_samples_per_second": 33.104,
587
+ "eval_steps_per_second": 4.153,
588
+ "eval_wer": 0.4229987809833401,
589
+ "step": 686
590
+ },
591
+ {
592
+ "epoch": 50.0,
593
+ "learning_rate": 2.6993746993746993e-05,
594
+ "loss": 0.7585,
595
+ "step": 700
596
+ },
597
+ {
598
+ "epoch": 50.0,
599
+ "eval_cer": 0.19588717015468607,
600
+ "eval_loss": 0.6737520098686218,
601
+ "eval_per": 0.38825680617635105,
602
+ "eval_runtime": 16.7385,
603
+ "eval_samples_per_second": 32.38,
604
+ "eval_steps_per_second": 4.062,
605
+ "eval_wer": 0.4122308004876067,
606
+ "step": 700
607
+ },
608
+ {
609
+ "epoch": 51.0,
610
+ "eval_cer": 0.19628753412192904,
611
+ "eval_loss": 0.6696569919586182,
612
+ "eval_per": 0.38581877285656235,
613
+ "eval_runtime": 16.5913,
614
+ "eval_samples_per_second": 32.668,
615
+ "eval_steps_per_second": 4.099,
616
+ "eval_wer": 0.4093864282811865,
617
+ "step": 714
618
+ },
619
+ {
620
+ "epoch": 52.0,
621
+ "eval_cer": 0.19963603275705186,
622
+ "eval_loss": 0.6706883907318115,
623
+ "eval_per": 0.39536773669240144,
624
+ "eval_runtime": 18.473,
625
+ "eval_samples_per_second": 29.34,
626
+ "eval_steps_per_second": 3.681,
627
+ "eval_wer": 0.41629418935392115,
628
+ "step": 728
629
+ },
630
+ {
631
+ "epoch": 53.0,
632
+ "eval_cer": 0.19417652411282985,
633
+ "eval_loss": 0.6397454738616943,
634
+ "eval_per": 0.38317757009345793,
635
+ "eval_runtime": 16.3057,
636
+ "eval_samples_per_second": 33.24,
637
+ "eval_steps_per_second": 4.17,
638
+ "eval_wer": 0.40308817553839904,
639
+ "step": 742
640
+ },
641
+ {
642
+ "epoch": 54.0,
643
+ "eval_cer": 0.19388535031847134,
644
+ "eval_loss": 0.6293218731880188,
645
+ "eval_per": 0.38358390898008937,
646
+ "eval_runtime": 16.6245,
647
+ "eval_samples_per_second": 32.603,
648
+ "eval_steps_per_second": 4.09,
649
+ "eval_wer": 0.4039008533116619,
650
+ "step": 756
651
+ },
652
+ {
653
+ "epoch": 55.0,
654
+ "eval_cer": 0.19457688808007279,
655
+ "eval_loss": 0.6479354500770569,
656
+ "eval_per": 0.3852092645266152,
657
+ "eval_runtime": 17.0356,
658
+ "eval_samples_per_second": 31.816,
659
+ "eval_steps_per_second": 3.992,
660
+ "eval_wer": 0.4026818366517676,
661
+ "step": 770
662
+ },
663
+ {
664
+ "epoch": 56.0,
665
+ "eval_cer": 0.19344858962693356,
666
+ "eval_loss": 0.6307466626167297,
667
+ "eval_per": 0.38216172287687933,
668
+ "eval_runtime": 15.9943,
669
+ "eval_samples_per_second": 33.887,
670
+ "eval_steps_per_second": 4.252,
671
+ "eval_wer": 0.39821210889882164,
672
+ "step": 784
673
+ },
674
+ {
675
+ "epoch": 57.0,
676
+ "eval_cer": 0.190828025477707,
677
+ "eval_loss": 0.6166068911552429,
678
+ "eval_per": 0.36733035351483134,
679
+ "eval_runtime": 18.3763,
680
+ "eval_samples_per_second": 29.495,
681
+ "eval_steps_per_second": 3.7,
682
+ "eval_wer": 0.3843965867533523,
683
+ "step": 798
684
+ },
685
+ {
686
+ "epoch": 57.14,
687
+ "learning_rate": 2.506974506974507e-05,
688
+ "loss": 0.5473,
689
+ "step": 800
690
+ },
691
+ {
692
+ "epoch": 58.0,
693
+ "eval_cer": 0.19064604185623293,
694
+ "eval_loss": 0.6098698377609253,
695
+ "eval_per": 0.3707842340511987,
696
+ "eval_runtime": 17.7821,
697
+ "eval_samples_per_second": 30.48,
698
+ "eval_steps_per_second": 3.824,
699
+ "eval_wer": 0.3860219422998781,
700
+ "step": 812
701
+ },
702
+ {
703
+ "epoch": 59.0,
704
+ "eval_cer": 0.19039126478616925,
705
+ "eval_loss": 0.6007358431816101,
706
+ "eval_per": 0.3730190979276717,
707
+ "eval_runtime": 17.0728,
708
+ "eval_samples_per_second": 31.746,
709
+ "eval_steps_per_second": 3.983,
710
+ "eval_wer": 0.386834620073141,
711
+ "step": 826
712
+ },
713
+ {
714
+ "epoch": 60.0,
715
+ "eval_cer": 0.19275705186533212,
716
+ "eval_loss": 0.6191249489784241,
717
+ "eval_per": 0.3744412840308818,
718
+ "eval_runtime": 16.4977,
719
+ "eval_samples_per_second": 32.853,
720
+ "eval_steps_per_second": 4.122,
721
+ "eval_wer": 0.3884599756196668,
722
+ "step": 840
723
+ },
724
+ {
725
+ "epoch": 61.0,
726
+ "eval_cer": 0.1891901728844404,
727
+ "eval_loss": 0.6014622449874878,
728
+ "eval_per": 0.3732222673709874,
729
+ "eval_runtime": 16.6101,
730
+ "eval_samples_per_second": 32.631,
731
+ "eval_steps_per_second": 4.094,
732
+ "eval_wer": 0.3884599756196668,
733
+ "step": 854
734
+ },
735
+ {
736
+ "epoch": 62.0,
737
+ "eval_cer": 0.19017288444040037,
738
+ "eval_loss": 0.5964884757995605,
739
+ "eval_per": 0.36875253961804144,
740
+ "eval_runtime": 17.8493,
741
+ "eval_samples_per_second": 30.365,
742
+ "eval_steps_per_second": 3.81,
743
+ "eval_wer": 0.3837870784234051,
744
+ "step": 868
745
+ },
746
+ {
747
+ "epoch": 63.0,
748
+ "eval_cer": 0.19042766151046406,
749
+ "eval_loss": 0.5926450490951538,
750
+ "eval_per": 0.3667208451848842,
751
+ "eval_runtime": 17.884,
752
+ "eval_samples_per_second": 30.306,
753
+ "eval_steps_per_second": 3.802,
754
+ "eval_wer": 0.38256806176351077,
755
+ "step": 882
756
+ },
757
+ {
758
+ "epoch": 64.0,
759
+ "eval_cer": 0.19210191082802547,
760
+ "eval_loss": 0.6187658905982971,
761
+ "eval_per": 0.376472978464039,
762
+ "eval_runtime": 17.0859,
763
+ "eval_samples_per_second": 31.722,
764
+ "eval_steps_per_second": 3.98,
765
+ "eval_wer": 0.39211702559934986,
766
+ "step": 896
767
+ },
768
+ {
769
+ "epoch": 64.29,
770
+ "learning_rate": 2.3145743145743147e-05,
771
+ "loss": 0.443,
772
+ "step": 900
773
+ },
774
+ {
775
+ "epoch": 65.0,
776
+ "eval_cer": 0.1891537761601456,
777
+ "eval_loss": 0.5834715366363525,
778
+ "eval_per": 0.36895570906135716,
779
+ "eval_runtime": 16.6058,
780
+ "eval_samples_per_second": 32.639,
781
+ "eval_steps_per_second": 4.095,
782
+ "eval_wer": 0.3829744006501422,
783
+ "step": 910
784
+ },
785
+ {
786
+ "epoch": 66.0,
787
+ "eval_cer": 0.1902820746132848,
788
+ "eval_loss": 0.5914222598075867,
789
+ "eval_per": 0.3722064201544088,
790
+ "eval_runtime": 17.2325,
791
+ "eval_samples_per_second": 31.452,
792
+ "eval_steps_per_second": 3.946,
793
+ "eval_wer": 0.38703778951645673,
794
+ "step": 924
795
+ },
796
+ {
797
+ "epoch": 67.0,
798
+ "eval_cer": 0.1875523202911738,
799
+ "eval_loss": 0.582801878452301,
800
+ "eval_per": 0.36265745631856966,
801
+ "eval_runtime": 16.3441,
802
+ "eval_samples_per_second": 33.162,
803
+ "eval_steps_per_second": 4.161,
804
+ "eval_wer": 0.3778951645672491,
805
+ "step": 938
806
+ },
807
+ {
808
+ "epoch": 68.0,
809
+ "eval_cer": 0.1857324840764331,
810
+ "eval_loss": 0.5744664072990417,
811
+ "eval_per": 0.35757822023567654,
812
+ "eval_runtime": 17.4764,
813
+ "eval_samples_per_second": 31.013,
814
+ "eval_steps_per_second": 3.891,
815
+ "eval_wer": 0.3722064201544088,
816
+ "step": 952
817
+ },
818
+ {
819
+ "epoch": 69.0,
820
+ "eval_cer": 0.18817106460418562,
821
+ "eval_loss": 0.5785911083221436,
822
+ "eval_per": 0.3632669646485169,
823
+ "eval_runtime": 16.8602,
824
+ "eval_samples_per_second": 32.147,
825
+ "eval_steps_per_second": 4.033,
826
+ "eval_wer": 0.3795205201137749,
827
+ "step": 966
828
+ },
829
+ {
830
+ "epoch": 70.0,
831
+ "eval_cer": 0.1884258416742493,
832
+ "eval_loss": 0.5868948698043823,
833
+ "eval_per": 0.36042259244209673,
834
+ "eval_runtime": 16.384,
835
+ "eval_samples_per_second": 33.081,
836
+ "eval_steps_per_second": 4.15,
837
+ "eval_wer": 0.37505079236082894,
838
+ "step": 980
839
+ },
840
+ {
841
+ "epoch": 71.0,
842
+ "eval_cer": 0.18878980891719746,
843
+ "eval_loss": 0.592288076877594,
844
+ "eval_per": 0.3596099146688338,
845
+ "eval_runtime": 16.4263,
846
+ "eval_samples_per_second": 32.996,
847
+ "eval_steps_per_second": 4.14,
848
+ "eval_wer": 0.37525396180414466,
849
+ "step": 994
850
+ },
851
+ {
852
+ "epoch": 71.43,
853
+ "learning_rate": 2.1221741221741224e-05,
854
+ "loss": 0.3564,
855
+ "step": 1000
856
+ },
857
+ {
858
+ "epoch": 72.0,
859
+ "eval_cer": 0.18587807097361236,
860
+ "eval_loss": 0.5706638097763062,
861
+ "eval_per": 0.35778138967899226,
862
+ "eval_runtime": 16.3727,
863
+ "eval_samples_per_second": 33.104,
864
+ "eval_steps_per_second": 4.153,
865
+ "eval_wer": 0.37139374238114586,
866
+ "step": 1008
867
+ },
868
+ {
869
+ "epoch": 73.0,
870
+ "eval_cer": 0.1856960873521383,
871
+ "eval_loss": 0.5733203887939453,
872
+ "eval_per": 0.35514018691588783,
873
+ "eval_runtime": 16.1456,
874
+ "eval_samples_per_second": 33.569,
875
+ "eval_steps_per_second": 4.212,
876
+ "eval_wer": 0.3699715562779358,
877
+ "step": 1022
878
+ },
879
+ {
880
+ "epoch": 74.0,
881
+ "eval_cer": 0.1854413102820746,
882
+ "eval_loss": 0.5731407403945923,
883
+ "eval_per": 0.35656237301909793,
884
+ "eval_runtime": 16.2817,
885
+ "eval_samples_per_second": 33.289,
886
+ "eval_steps_per_second": 4.176,
887
+ "eval_wer": 0.370581064607883,
888
+ "step": 1036
889
+ },
890
+ {
891
+ "epoch": 75.0,
892
+ "eval_cer": 0.18467697907188352,
893
+ "eval_loss": 0.5643908381462097,
894
+ "eval_per": 0.3531084924827306,
895
+ "eval_runtime": 16.6661,
896
+ "eval_samples_per_second": 32.521,
897
+ "eval_steps_per_second": 4.08,
898
+ "eval_wer": 0.3669240146281999,
899
+ "step": 1050
900
+ },
901
+ {
902
+ "epoch": 76.0,
903
+ "eval_cer": 0.18522292993630574,
904
+ "eval_loss": 0.5660921335220337,
905
+ "eval_per": 0.3555465258025193,
906
+ "eval_runtime": 16.5118,
907
+ "eval_samples_per_second": 32.825,
908
+ "eval_steps_per_second": 4.118,
909
+ "eval_wer": 0.37017472572125154,
910
+ "step": 1064
911
+ },
912
+ {
913
+ "epoch": 77.0,
914
+ "eval_cer": 0.18474977252047317,
915
+ "eval_loss": 0.5705360174179077,
916
+ "eval_per": 0.3512799674928891,
917
+ "eval_runtime": 17.1186,
918
+ "eval_samples_per_second": 31.661,
919
+ "eval_steps_per_second": 3.972,
920
+ "eval_wer": 0.3675335229581471,
921
+ "step": 1078
922
+ },
923
+ {
924
+ "epoch": 78.0,
925
+ "eval_cer": 0.1835122838944495,
926
+ "eval_loss": 0.5630640983581543,
927
+ "eval_per": 0.35270215359609913,
928
+ "eval_runtime": 17.2728,
929
+ "eval_samples_per_second": 31.379,
930
+ "eval_steps_per_second": 3.937,
931
+ "eval_wer": 0.3671271840715156,
932
+ "step": 1092
933
+ },
934
+ {
935
+ "epoch": 78.57,
936
+ "learning_rate": 1.92977392977393e-05,
937
+ "loss": 0.3456,
938
+ "step": 1100
939
+ },
940
+ {
941
+ "epoch": 79.0,
942
+ "eval_cer": 0.18311191992720655,
943
+ "eval_loss": 0.5674863457679749,
944
+ "eval_per": 0.35026412027631043,
945
+ "eval_runtime": 16.31,
946
+ "eval_samples_per_second": 33.231,
947
+ "eval_steps_per_second": 4.169,
948
+ "eval_wer": 0.3650954896383584,
949
+ "step": 1106
950
+ },
951
+ {
952
+ "epoch": 80.0,
953
+ "eval_cer": 0.1846041856232939,
954
+ "eval_loss": 0.5696778297424316,
955
+ "eval_per": 0.35067045916294187,
956
+ "eval_runtime": 16.3755,
957
+ "eval_samples_per_second": 33.098,
958
+ "eval_steps_per_second": 4.153,
959
+ "eval_wer": 0.3644859813084112,
960
+ "step": 1120
961
+ },
962
+ {
963
+ "epoch": 81.0,
964
+ "eval_cer": 0.18409463148316652,
965
+ "eval_loss": 0.5643677711486816,
966
+ "eval_per": 0.34924827305973183,
967
+ "eval_runtime": 16.3983,
968
+ "eval_samples_per_second": 33.052,
969
+ "eval_steps_per_second": 4.147,
970
+ "eval_wer": 0.36306379520520116,
971
+ "step": 1134
972
+ },
973
+ {
974
+ "epoch": 82.0,
975
+ "eval_cer": 0.1843494085532302,
976
+ "eval_loss": 0.56571364402771,
977
+ "eval_per": 0.34802925639983745,
978
+ "eval_runtime": 16.5291,
979
+ "eval_samples_per_second": 32.791,
980
+ "eval_steps_per_second": 4.114,
981
+ "eval_wer": 0.36265745631856966,
982
+ "step": 1148
983
+ },
984
+ {
985
+ "epoch": 83.0,
986
+ "eval_cer": 0.1875523202911738,
987
+ "eval_loss": 0.5830783247947693,
988
+ "eval_per": 0.3522958147094677,
989
+ "eval_runtime": 16.4238,
990
+ "eval_samples_per_second": 33.001,
991
+ "eval_steps_per_second": 4.14,
992
+ "eval_wer": 0.36793986184477856,
993
+ "step": 1162
994
+ },
995
+ {
996
+ "epoch": 84.0,
997
+ "eval_cer": 0.1861692447679709,
998
+ "eval_loss": 0.5823647975921631,
999
+ "eval_per": 0.3522958147094677,
1000
+ "eval_runtime": 17.5122,
1001
+ "eval_samples_per_second": 30.95,
1002
+ "eval_steps_per_second": 3.883,
1003
+ "eval_wer": 0.3659081674116213,
1004
+ "step": 1176
1005
+ },
1006
+ {
1007
+ "epoch": 85.0,
1008
+ "eval_cer": 0.18333030027297542,
1009
+ "eval_loss": 0.5567490458488464,
1010
+ "eval_per": 0.3508736286062576,
1011
+ "eval_runtime": 16.4517,
1012
+ "eval_samples_per_second": 32.945,
1013
+ "eval_steps_per_second": 4.133,
1014
+ "eval_wer": 0.36529865908167414,
1015
+ "step": 1190
1016
+ },
1017
+ {
1018
+ "epoch": 85.71,
1019
+ "learning_rate": 1.7373737373737375e-05,
1020
+ "loss": 0.3073,
1021
+ "step": 1200
1022
+ },
1023
+ {
1024
+ "epoch": 86.0,
1025
+ "eval_cer": 0.1851501364877161,
1026
+ "eval_loss": 0.5755050778388977,
1027
+ "eval_per": 0.35067045916294187,
1028
+ "eval_runtime": 17.6602,
1029
+ "eval_samples_per_second": 30.691,
1030
+ "eval_steps_per_second": 3.85,
1031
+ "eval_wer": 0.36489232019504264,
1032
+ "step": 1204
1033
+ },
1034
+ {
1035
+ "epoch": 87.0,
1036
+ "eval_cer": 0.18289353958143767,
1037
+ "eval_loss": 0.5590367913246155,
1038
+ "eval_per": 0.3449817147501016,
1039
+ "eval_runtime": 16.7556,
1040
+ "eval_samples_per_second": 32.347,
1041
+ "eval_steps_per_second": 4.058,
1042
+ "eval_wer": 0.3585940674522552,
1043
+ "step": 1218
1044
+ },
1045
+ {
1046
+ "epoch": 88.0,
1047
+ "eval_cer": 0.18347588717015467,
1048
+ "eval_loss": 0.5662943720817566,
1049
+ "eval_per": 0.34802925639983745,
1050
+ "eval_runtime": 16.6011,
1051
+ "eval_samples_per_second": 32.649,
1052
+ "eval_steps_per_second": 4.096,
1053
+ "eval_wer": 0.3610321007720439,
1054
+ "step": 1232
1055
+ },
1056
+ {
1057
+ "epoch": 89.0,
1058
+ "eval_cer": 0.18507734303912649,
1059
+ "eval_loss": 0.5733785629272461,
1060
+ "eval_per": 0.3468102397399431,
1061
+ "eval_runtime": 16.1986,
1062
+ "eval_samples_per_second": 33.46,
1063
+ "eval_steps_per_second": 4.198,
1064
+ "eval_wer": 0.3618447785453068,
1065
+ "step": 1246
1066
+ },
1067
+ {
1068
+ "epoch": 90.0,
1069
+ "eval_cer": 0.18303912647861692,
1070
+ "eval_loss": 0.5656831860542297,
1071
+ "eval_per": 0.34579439252336447,
1072
+ "eval_runtime": 16.3772,
1073
+ "eval_samples_per_second": 33.095,
1074
+ "eval_steps_per_second": 4.152,
1075
+ "eval_wer": 0.36021942299878096,
1076
+ "step": 1260
1077
+ },
1078
+ {
1079
+ "epoch": 91.0,
1080
+ "eval_cer": 0.18278434940855323,
1081
+ "eval_loss": 0.5650802850723267,
1082
+ "eval_per": 0.3441690369768387,
1083
+ "eval_runtime": 17.4779,
1084
+ "eval_samples_per_second": 31.011,
1085
+ "eval_steps_per_second": 3.891,
1086
+ "eval_wer": 0.35778138967899226,
1087
+ "step": 1274
1088
+ },
1089
+ {
1090
+ "epoch": 92.0,
1091
+ "eval_cer": 0.18202001819836214,
1092
+ "eval_loss": 0.5608470439910889,
1093
+ "eval_per": 0.3415278342137342,
1094
+ "eval_runtime": 16.5014,
1095
+ "eval_samples_per_second": 32.846,
1096
+ "eval_steps_per_second": 4.121,
1097
+ "eval_wer": 0.35574969524583505,
1098
+ "step": 1288
1099
+ },
1100
+ {
1101
+ "epoch": 92.86,
1102
+ "learning_rate": 1.544973544973545e-05,
1103
+ "loss": 0.2836,
1104
+ "step": 1300
1105
+ },
1106
+ {
1107
+ "epoch": 93.0,
1108
+ "eval_cer": 0.18067333939945404,
1109
+ "eval_loss": 0.5504541993141174,
1110
+ "eval_per": 0.3388866314506298,
1111
+ "eval_runtime": 16.701,
1112
+ "eval_samples_per_second": 32.453,
1113
+ "eval_steps_per_second": 4.072,
1114
+ "eval_wer": 0.3524989841527834,
1115
+ "step": 1302
1116
+ },
1117
+ {
1118
+ "epoch": 94.0,
1119
+ "eval_cer": 0.17979981801637854,
1120
+ "eval_loss": 0.5494620203971863,
1121
+ "eval_per": 0.33746444534741976,
1122
+ "eval_runtime": 17.2521,
1123
+ "eval_samples_per_second": 31.416,
1124
+ "eval_steps_per_second": 3.942,
1125
+ "eval_wer": 0.3500609508329947,
1126
+ "step": 1316
1127
+ },
1128
+ {
1129
+ "epoch": 95.0,
1130
+ "eval_cer": 0.1816196542311192,
1131
+ "eval_loss": 0.5693331360816956,
1132
+ "eval_per": 0.34315318976026005,
1133
+ "eval_runtime": 16.3033,
1134
+ "eval_samples_per_second": 33.245,
1135
+ "eval_steps_per_second": 4.171,
1136
+ "eval_wer": 0.35574969524583505,
1137
+ "step": 1330
1138
+ },
1139
+ {
1140
+ "epoch": 96.0,
1141
+ "eval_cer": 0.1822020018198362,
1142
+ "eval_loss": 0.5638025999069214,
1143
+ "eval_per": 0.34173100365705,
1144
+ "eval_runtime": 16.8945,
1145
+ "eval_samples_per_second": 32.081,
1146
+ "eval_steps_per_second": 4.025,
1147
+ "eval_wer": 0.3563592035757822,
1148
+ "step": 1344
1149
+ },
1150
+ {
1151
+ "epoch": 97.0,
1152
+ "eval_cer": 0.17969062784349407,
1153
+ "eval_loss": 0.5485906004905701,
1154
+ "eval_per": 0.3386834620073141,
1155
+ "eval_runtime": 16.6823,
1156
+ "eval_samples_per_second": 32.489,
1157
+ "eval_steps_per_second": 4.076,
1158
+ "eval_wer": 0.35107679804957337,
1159
+ "step": 1358
1160
+ },
1161
+ {
1162
+ "epoch": 98.0,
1163
+ "eval_cer": 0.18096451319381257,
1164
+ "eval_loss": 0.5618489980697632,
1165
+ "eval_per": 0.3415278342137342,
1166
+ "eval_runtime": 16.6547,
1167
+ "eval_samples_per_second": 32.543,
1168
+ "eval_steps_per_second": 4.083,
1169
+ "eval_wer": 0.3545306785859407,
1170
+ "step": 1372
1171
+ },
1172
+ {
1173
+ "epoch": 99.0,
1174
+ "eval_cer": 0.1799818016378526,
1175
+ "eval_loss": 0.5637105703353882,
1176
+ "eval_per": 0.33990247866720846,
1177
+ "eval_runtime": 16.8199,
1178
+ "eval_samples_per_second": 32.224,
1179
+ "eval_steps_per_second": 4.043,
1180
+ "eval_wer": 0.3514831369362048,
1181
+ "step": 1386
1182
+ },
1183
+ {
1184
+ "epoch": 100.0,
1185
+ "learning_rate": 1.3525733525733527e-05,
1186
+ "loss": 0.2502,
1187
+ "step": 1400
1188
+ },
1189
+ {
1190
+ "epoch": 100.0,
1191
+ "eval_cer": 0.1810373066424022,
1192
+ "eval_loss": 0.5658114552497864,
1193
+ "eval_per": 0.3437626980902072,
1194
+ "eval_runtime": 16.859,
1195
+ "eval_samples_per_second": 32.149,
1196
+ "eval_steps_per_second": 4.033,
1197
+ "eval_wer": 0.3555465258025193,
1198
+ "step": 1400
1199
+ },
1200
+ {
1201
+ "epoch": 101.0,
1202
+ "eval_cer": 0.17954504094631482,
1203
+ "eval_loss": 0.552661657333374,
1204
+ "eval_per": 0.3411214953271028,
1205
+ "eval_runtime": 17.0552,
1206
+ "eval_samples_per_second": 31.779,
1207
+ "eval_steps_per_second": 3.987,
1208
+ "eval_wer": 0.3524989841527834,
1209
+ "step": 1414
1210
+ },
1211
+ {
1212
+ "epoch": 102.0,
1213
+ "eval_cer": 0.18067333939945404,
1214
+ "eval_loss": 0.5701059699058533,
1215
+ "eval_per": 0.343965867533523,
1216
+ "eval_runtime": 17.649,
1217
+ "eval_samples_per_second": 30.71,
1218
+ "eval_steps_per_second": 3.853,
1219
+ "eval_wer": 0.3561560341324665,
1220
+ "step": 1428
1221
+ },
1222
+ {
1223
+ "epoch": 103.0,
1224
+ "eval_cer": 0.17936305732484076,
1225
+ "eval_loss": 0.554296612739563,
1226
+ "eval_per": 0.3388866314506298,
1227
+ "eval_runtime": 16.2178,
1228
+ "eval_samples_per_second": 33.42,
1229
+ "eval_steps_per_second": 4.193,
1230
+ "eval_wer": 0.34965461194636327,
1231
+ "step": 1442
1232
+ },
1233
+ {
1234
+ "epoch": 104.0,
1235
+ "eval_cer": 0.18034576888080073,
1236
+ "eval_loss": 0.5659683346748352,
1237
+ "eval_per": 0.33990247866720846,
1238
+ "eval_runtime": 16.8247,
1239
+ "eval_samples_per_second": 32.214,
1240
+ "eval_steps_per_second": 4.042,
1241
+ "eval_wer": 0.3508736286062576,
1242
+ "step": 1456
1243
+ },
1244
+ {
1245
+ "epoch": 105.0,
1246
+ "eval_cer": 0.17950864422202,
1247
+ "eval_loss": 0.5542871952056885,
1248
+ "eval_per": 0.33990247866720846,
1249
+ "eval_runtime": 16.8641,
1250
+ "eval_samples_per_second": 32.139,
1251
+ "eval_steps_per_second": 4.032,
1252
+ "eval_wer": 0.3500609508329947,
1253
+ "step": 1470
1254
+ },
1255
+ {
1256
+ "epoch": 106.0,
1257
+ "eval_cer": 0.181656050955414,
1258
+ "eval_loss": 0.5742031931877136,
1259
+ "eval_per": 0.34315318976026005,
1260
+ "eval_runtime": 16.2772,
1261
+ "eval_samples_per_second": 33.298,
1262
+ "eval_steps_per_second": 4.178,
1263
+ "eval_wer": 0.3547338480292564,
1264
+ "step": 1484
1265
+ },
1266
+ {
1267
+ "epoch": 107.0,
1268
+ "eval_cer": 0.178926296633303,
1269
+ "eval_loss": 0.5526788830757141,
1270
+ "eval_per": 0.33502641202763106,
1271
+ "eval_runtime": 16.3123,
1272
+ "eval_samples_per_second": 33.227,
1273
+ "eval_steps_per_second": 4.169,
1274
+ "eval_wer": 0.34538805363673303,
1275
+ "step": 1498
1276
+ },
1277
+ {
1278
+ "epoch": 107.14,
1279
+ "learning_rate": 1.1601731601731604e-05,
1280
+ "loss": 0.2368,
1281
+ "step": 1500
1282
+ },
1283
+ {
1284
+ "epoch": 108.0,
1285
+ "eval_cer": 0.178926296633303,
1286
+ "eval_loss": 0.5576502084732056,
1287
+ "eval_per": 0.3378707842340512,
1288
+ "eval_runtime": 16.2769,
1289
+ "eval_samples_per_second": 33.299,
1290
+ "eval_steps_per_second": 4.178,
1291
+ "eval_wer": 0.34965461194636327,
1292
+ "step": 1512
1293
+ },
1294
+ {
1295
+ "epoch": 109.0,
1296
+ "eval_cer": 0.1788898999090082,
1297
+ "eval_loss": 0.5539444088935852,
1298
+ "eval_per": 0.3356359203575782,
1299
+ "eval_runtime": 17.6723,
1300
+ "eval_samples_per_second": 30.669,
1301
+ "eval_steps_per_second": 3.848,
1302
+ "eval_wer": 0.3451848841934173,
1303
+ "step": 1526
1304
+ },
1305
+ {
1306
+ "epoch": 110.0,
1307
+ "eval_cer": 0.18020018198362148,
1308
+ "eval_loss": 0.5699580311775208,
1309
+ "eval_per": 0.34173100365705,
1310
+ "eval_runtime": 16.5072,
1311
+ "eval_samples_per_second": 32.834,
1312
+ "eval_steps_per_second": 4.119,
1313
+ "eval_wer": 0.35168630637952053,
1314
+ "step": 1540
1315
+ },
1316
+ {
1317
+ "epoch": 111.0,
1318
+ "eval_cer": 0.17939945404913557,
1319
+ "eval_loss": 0.5626676678657532,
1320
+ "eval_per": 0.33969930922389274,
1321
+ "eval_runtime": 16.5149,
1322
+ "eval_samples_per_second": 32.819,
1323
+ "eval_steps_per_second": 4.117,
1324
+ "eval_wer": 0.3500609508329947,
1325
+ "step": 1554
1326
+ },
1327
+ {
1328
+ "epoch": 112.0,
1329
+ "eval_cer": 0.17965423111919926,
1330
+ "eval_loss": 0.5622020363807678,
1331
+ "eval_per": 0.3405119869971556,
1332
+ "eval_runtime": 18.514,
1333
+ "eval_samples_per_second": 29.275,
1334
+ "eval_steps_per_second": 3.673,
1335
+ "eval_wer": 0.34965461194636327,
1336
+ "step": 1568
1337
+ },
1338
+ {
1339
+ "epoch": 113.0,
1340
+ "eval_cer": 0.18005459508644223,
1341
+ "eval_loss": 0.570824146270752,
1342
+ "eval_per": 0.3403088175538399,
1343
+ "eval_runtime": 16.7958,
1344
+ "eval_samples_per_second": 32.27,
1345
+ "eval_steps_per_second": 4.049,
1346
+ "eval_wer": 0.34945144250304755,
1347
+ "step": 1582
1348
+ },
1349
+ {
1350
+ "epoch": 114.0,
1351
+ "eval_cer": 0.18045495905368517,
1352
+ "eval_loss": 0.5732950568199158,
1353
+ "eval_per": 0.3401056481105242,
1354
+ "eval_runtime": 17.5602,
1355
+ "eval_samples_per_second": 30.865,
1356
+ "eval_steps_per_second": 3.872,
1357
+ "eval_wer": 0.35107679804957337,
1358
+ "step": 1596
1359
+ },
1360
+ {
1361
+ "epoch": 114.29,
1362
+ "learning_rate": 9.677729677729679e-06,
1363
+ "loss": 0.2288,
1364
+ "step": 1600
1365
+ },
1366
+ {
1367
+ "epoch": 115.0,
1368
+ "eval_cer": 0.17950864422202,
1369
+ "eval_loss": 0.5614627599716187,
1370
+ "eval_per": 0.3386834620073141,
1371
+ "eval_runtime": 18.0091,
1372
+ "eval_samples_per_second": 30.096,
1373
+ "eval_steps_per_second": 3.776,
1374
+ "eval_wer": 0.34863876472978467,
1375
+ "step": 1610
1376
+ },
1377
+ {
1378
+ "epoch": 116.0,
1379
+ "eval_cer": 0.1808553230209281,
1380
+ "eval_loss": 0.5741183757781982,
1381
+ "eval_per": 0.33969930922389274,
1382
+ "eval_runtime": 16.588,
1383
+ "eval_samples_per_second": 32.674,
1384
+ "eval_steps_per_second": 4.099,
1385
+ "eval_wer": 0.34965461194636327,
1386
+ "step": 1624
1387
+ },
1388
+ {
1389
+ "epoch": 117.0,
1390
+ "eval_cer": 0.17958143767060963,
1391
+ "eval_loss": 0.5609710812568665,
1392
+ "eval_per": 0.33726127590410404,
1393
+ "eval_runtime": 16.4333,
1394
+ "eval_samples_per_second": 32.982,
1395
+ "eval_steps_per_second": 4.138,
1396
+ "eval_wer": 0.3459975619666802,
1397
+ "step": 1638
1398
+ },
1399
+ {
1400
+ "epoch": 117.0,
1401
+ "step": 1638,
1402
+ "total_flos": 1.462030946643386e+19,
1403
+ "train_loss": 1.771814914558979,
1404
+ "train_runtime": 12938.9921,
1405
+ "train_samples_per_second": 5.194,
1406
+ "train_steps_per_second": 0.162
1407
+ }
1408
+ ],
1409
+ "max_steps": 2100,
1410
+ "num_train_epochs": 150,
1411
+ "total_flos": 1.462030946643386e+19,
1412
+ "trial_name": null,
1413
+ "trial_params": null
1414
+ }