|
{ |
|
"best_metric": 0.564974844455719, |
|
"best_model_checkpoint": "wav2vec2-large-xlsr-coraa-exp-12/checkpoint-1498", |
|
"epoch": 127.0, |
|
"global_step": 1778, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.07, |
|
"learning_rate": 3e-05, |
|
"loss": 37.6216, |
|
"step": 1 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 23.20707130432129, |
|
"eval_runtime": 53.2412, |
|
"eval_samples_per_second": 10.18, |
|
"eval_steps_per_second": 1.277, |
|
"eval_wer": 1.0, |
|
"step": 14 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 6.9366374015808105, |
|
"eval_runtime": 52.8966, |
|
"eval_samples_per_second": 10.246, |
|
"eval_steps_per_second": 1.286, |
|
"eval_wer": 1.0, |
|
"step": 28 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 4.42495059967041, |
|
"eval_runtime": 53.0892, |
|
"eval_samples_per_second": 10.209, |
|
"eval_steps_per_second": 1.281, |
|
"eval_wer": 1.0, |
|
"step": 42 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.915421962738037, |
|
"eval_runtime": 52.9638, |
|
"eval_samples_per_second": 10.233, |
|
"eval_steps_per_second": 1.284, |
|
"eval_wer": 1.0, |
|
"step": 56 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.684857130050659, |
|
"eval_runtime": 53.3885, |
|
"eval_samples_per_second": 10.152, |
|
"eval_steps_per_second": 1.274, |
|
"eval_wer": 1.0, |
|
"step": 70 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.52828049659729, |
|
"eval_runtime": 52.9774, |
|
"eval_samples_per_second": 10.231, |
|
"eval_steps_per_second": 1.284, |
|
"eval_wer": 1.0, |
|
"step": 84 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.371574640274048, |
|
"eval_runtime": 53.0413, |
|
"eval_samples_per_second": 10.218, |
|
"eval_steps_per_second": 1.282, |
|
"eval_wer": 1.0, |
|
"step": 98 |
|
}, |
|
{ |
|
"epoch": 7.14, |
|
"learning_rate": 2.862857142857143e-05, |
|
"loss": 8.823, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.265662670135498, |
|
"eval_runtime": 52.9677, |
|
"eval_samples_per_second": 10.233, |
|
"eval_steps_per_second": 1.284, |
|
"eval_wer": 1.0, |
|
"step": 112 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.1796252727508545, |
|
"eval_runtime": 53.0173, |
|
"eval_samples_per_second": 10.223, |
|
"eval_steps_per_second": 1.283, |
|
"eval_wer": 1.0, |
|
"step": 126 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.156822919845581, |
|
"eval_runtime": 52.9813, |
|
"eval_samples_per_second": 10.23, |
|
"eval_steps_per_second": 1.283, |
|
"eval_wer": 1.0, |
|
"step": 140 |
|
}, |
|
{ |
|
"epoch": 11.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.1071083545684814, |
|
"eval_runtime": 52.9255, |
|
"eval_samples_per_second": 10.241, |
|
"eval_steps_per_second": 1.285, |
|
"eval_wer": 1.0, |
|
"step": 154 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.0891101360321045, |
|
"eval_runtime": 53.0174, |
|
"eval_samples_per_second": 10.223, |
|
"eval_steps_per_second": 1.283, |
|
"eval_wer": 1.0, |
|
"step": 168 |
|
}, |
|
{ |
|
"epoch": 13.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.058786153793335, |
|
"eval_runtime": 53.0158, |
|
"eval_samples_per_second": 10.223, |
|
"eval_steps_per_second": 1.283, |
|
"eval_wer": 1.0, |
|
"step": 182 |
|
}, |
|
{ |
|
"epoch": 14.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.042229175567627, |
|
"eval_runtime": 53.05, |
|
"eval_samples_per_second": 10.217, |
|
"eval_steps_per_second": 1.282, |
|
"eval_wer": 1.0, |
|
"step": 196 |
|
}, |
|
{ |
|
"epoch": 14.29, |
|
"learning_rate": 2.72e-05, |
|
"loss": 3.0574, |
|
"step": 200 |
|
}, |
|
{ |
|
"epoch": 15.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.038764238357544, |
|
"eval_runtime": 52.9184, |
|
"eval_samples_per_second": 10.242, |
|
"eval_steps_per_second": 1.285, |
|
"eval_wer": 1.0, |
|
"step": 210 |
|
}, |
|
{ |
|
"epoch": 16.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.0324084758758545, |
|
"eval_runtime": 53.3043, |
|
"eval_samples_per_second": 10.168, |
|
"eval_steps_per_second": 1.276, |
|
"eval_wer": 1.0, |
|
"step": 224 |
|
}, |
|
{ |
|
"epoch": 17.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.025251865386963, |
|
"eval_runtime": 52.9716, |
|
"eval_samples_per_second": 10.232, |
|
"eval_steps_per_second": 1.284, |
|
"eval_wer": 1.0, |
|
"step": 238 |
|
}, |
|
{ |
|
"epoch": 18.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.010026454925537, |
|
"eval_runtime": 52.9941, |
|
"eval_samples_per_second": 10.228, |
|
"eval_steps_per_second": 1.283, |
|
"eval_wer": 1.0, |
|
"step": 252 |
|
}, |
|
{ |
|
"epoch": 19.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.0079331398010254, |
|
"eval_runtime": 52.9545, |
|
"eval_samples_per_second": 10.235, |
|
"eval_steps_per_second": 1.284, |
|
"eval_wer": 1.0, |
|
"step": 266 |
|
}, |
|
{ |
|
"epoch": 20.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.0150105953216553, |
|
"eval_runtime": 52.9312, |
|
"eval_samples_per_second": 10.24, |
|
"eval_steps_per_second": 1.285, |
|
"eval_wer": 1.0, |
|
"step": 280 |
|
}, |
|
{ |
|
"epoch": 21.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.0032567977905273, |
|
"eval_runtime": 52.9575, |
|
"eval_samples_per_second": 10.235, |
|
"eval_steps_per_second": 1.284, |
|
"eval_wer": 1.0, |
|
"step": 294 |
|
}, |
|
{ |
|
"epoch": 21.43, |
|
"learning_rate": 2.5771428571428574e-05, |
|
"loss": 2.95, |
|
"step": 300 |
|
}, |
|
{ |
|
"epoch": 22.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 2.999887466430664, |
|
"eval_runtime": 52.9429, |
|
"eval_samples_per_second": 10.237, |
|
"eval_steps_per_second": 1.284, |
|
"eval_wer": 1.0, |
|
"step": 308 |
|
}, |
|
{ |
|
"epoch": 23.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 2.9940125942230225, |
|
"eval_runtime": 52.9557, |
|
"eval_samples_per_second": 10.235, |
|
"eval_steps_per_second": 1.284, |
|
"eval_wer": 1.0, |
|
"step": 322 |
|
}, |
|
{ |
|
"epoch": 24.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 2.9982004165649414, |
|
"eval_runtime": 53.3517, |
|
"eval_samples_per_second": 10.159, |
|
"eval_steps_per_second": 1.275, |
|
"eval_wer": 1.0, |
|
"step": 336 |
|
}, |
|
{ |
|
"epoch": 25.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.0212087631225586, |
|
"eval_runtime": 52.917, |
|
"eval_samples_per_second": 10.242, |
|
"eval_steps_per_second": 1.285, |
|
"eval_wer": 1.0, |
|
"step": 350 |
|
}, |
|
{ |
|
"epoch": 26.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 2.995063543319702, |
|
"eval_runtime": 52.9179, |
|
"eval_samples_per_second": 10.242, |
|
"eval_steps_per_second": 1.285, |
|
"eval_wer": 1.0, |
|
"step": 364 |
|
}, |
|
{ |
|
"epoch": 27.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 2.989276885986328, |
|
"eval_runtime": 52.9648, |
|
"eval_samples_per_second": 10.233, |
|
"eval_steps_per_second": 1.284, |
|
"eval_wer": 1.0, |
|
"step": 378 |
|
}, |
|
{ |
|
"epoch": 28.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 2.990724802017212, |
|
"eval_runtime": 52.9049, |
|
"eval_samples_per_second": 10.245, |
|
"eval_steps_per_second": 1.285, |
|
"eval_wer": 1.0, |
|
"step": 392 |
|
}, |
|
{ |
|
"epoch": 28.57, |
|
"learning_rate": 2.434285714285714e-05, |
|
"loss": 2.9233, |
|
"step": 400 |
|
}, |
|
{ |
|
"epoch": 29.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 2.9889469146728516, |
|
"eval_runtime": 53.0796, |
|
"eval_samples_per_second": 10.211, |
|
"eval_steps_per_second": 1.281, |
|
"eval_wer": 1.0, |
|
"step": 406 |
|
}, |
|
{ |
|
"epoch": 30.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 2.9812769889831543, |
|
"eval_runtime": 53.0284, |
|
"eval_samples_per_second": 10.221, |
|
"eval_steps_per_second": 1.282, |
|
"eval_wer": 1.0, |
|
"step": 420 |
|
}, |
|
{ |
|
"epoch": 31.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 2.9795358180999756, |
|
"eval_runtime": 53.6697, |
|
"eval_samples_per_second": 10.099, |
|
"eval_steps_per_second": 1.267, |
|
"eval_wer": 1.0, |
|
"step": 434 |
|
}, |
|
{ |
|
"epoch": 32.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 2.9633467197418213, |
|
"eval_runtime": 53.1489, |
|
"eval_samples_per_second": 10.198, |
|
"eval_steps_per_second": 1.279, |
|
"eval_wer": 1.0, |
|
"step": 448 |
|
}, |
|
{ |
|
"epoch": 33.0, |
|
"eval_cer": 0.9585441310282075, |
|
"eval_loss": 2.9652762413024902, |
|
"eval_runtime": 53.0687, |
|
"eval_samples_per_second": 10.213, |
|
"eval_steps_per_second": 1.281, |
|
"eval_wer": 1.0, |
|
"step": 462 |
|
}, |
|
{ |
|
"epoch": 34.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 2.9050323963165283, |
|
"eval_runtime": 53.1009, |
|
"eval_samples_per_second": 10.207, |
|
"eval_steps_per_second": 1.281, |
|
"eval_wer": 1.0, |
|
"step": 476 |
|
}, |
|
{ |
|
"epoch": 35.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 2.8805932998657227, |
|
"eval_runtime": 53.2017, |
|
"eval_samples_per_second": 10.188, |
|
"eval_steps_per_second": 1.278, |
|
"eval_wer": 1.0, |
|
"step": 490 |
|
}, |
|
{ |
|
"epoch": 35.71, |
|
"learning_rate": 2.2914285714285714e-05, |
|
"loss": 2.8852, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 36.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 2.822971820831299, |
|
"eval_runtime": 53.1752, |
|
"eval_samples_per_second": 10.193, |
|
"eval_steps_per_second": 1.279, |
|
"eval_wer": 1.0, |
|
"step": 504 |
|
}, |
|
{ |
|
"epoch": 37.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 2.780466318130493, |
|
"eval_runtime": 53.2177, |
|
"eval_samples_per_second": 10.185, |
|
"eval_steps_per_second": 1.278, |
|
"eval_wer": 1.0, |
|
"step": 518 |
|
}, |
|
{ |
|
"epoch": 38.0, |
|
"eval_cer": 0.9571974522292994, |
|
"eval_loss": 2.70436954498291, |
|
"eval_runtime": 53.1033, |
|
"eval_samples_per_second": 10.207, |
|
"eval_steps_per_second": 1.281, |
|
"eval_wer": 1.0, |
|
"step": 532 |
|
}, |
|
{ |
|
"epoch": 39.0, |
|
"eval_cer": 0.9558507734303913, |
|
"eval_loss": 2.6560797691345215, |
|
"eval_runtime": 53.1469, |
|
"eval_samples_per_second": 10.198, |
|
"eval_steps_per_second": 1.279, |
|
"eval_wer": 1.0, |
|
"step": 546 |
|
}, |
|
{ |
|
"epoch": 40.0, |
|
"eval_cer": 0.9254231119199272, |
|
"eval_loss": 2.547485828399658, |
|
"eval_runtime": 53.1445, |
|
"eval_samples_per_second": 10.199, |
|
"eval_steps_per_second": 1.28, |
|
"eval_wer": 1.0, |
|
"step": 560 |
|
}, |
|
{ |
|
"epoch": 41.0, |
|
"eval_cer": 0.7458416742493176, |
|
"eval_loss": 2.333609104156494, |
|
"eval_runtime": 53.2579, |
|
"eval_samples_per_second": 10.177, |
|
"eval_steps_per_second": 1.277, |
|
"eval_wer": 1.0, |
|
"step": 574 |
|
}, |
|
{ |
|
"epoch": 42.0, |
|
"eval_cer": 0.5467879890809827, |
|
"eval_loss": 2.069585084915161, |
|
"eval_runtime": 53.2259, |
|
"eval_samples_per_second": 10.183, |
|
"eval_steps_per_second": 1.278, |
|
"eval_wer": 1.0, |
|
"step": 588 |
|
}, |
|
{ |
|
"epoch": 42.86, |
|
"learning_rate": 2.1485714285714284e-05, |
|
"loss": 2.5339, |
|
"step": 600 |
|
}, |
|
{ |
|
"epoch": 43.0, |
|
"eval_cer": 0.49714285714285716, |
|
"eval_loss": 1.7759531736373901, |
|
"eval_runtime": 53.69, |
|
"eval_samples_per_second": 10.095, |
|
"eval_steps_per_second": 1.267, |
|
"eval_wer": 1.0, |
|
"step": 602 |
|
}, |
|
{ |
|
"epoch": 44.0, |
|
"eval_cer": 0.4545950864422202, |
|
"eval_loss": 1.5432746410369873, |
|
"eval_runtime": 53.2888, |
|
"eval_samples_per_second": 10.171, |
|
"eval_steps_per_second": 1.276, |
|
"eval_wer": 1.0, |
|
"step": 616 |
|
}, |
|
{ |
|
"epoch": 45.0, |
|
"eval_cer": 0.4066606005459509, |
|
"eval_loss": 1.352888584136963, |
|
"eval_runtime": 53.6434, |
|
"eval_samples_per_second": 10.104, |
|
"eval_steps_per_second": 1.268, |
|
"eval_wer": 1.0, |
|
"step": 630 |
|
}, |
|
{ |
|
"epoch": 46.0, |
|
"eval_cer": 0.38340309372156506, |
|
"eval_loss": 1.214944839477539, |
|
"eval_runtime": 53.2877, |
|
"eval_samples_per_second": 10.171, |
|
"eval_steps_per_second": 1.276, |
|
"eval_wer": 0.9997968305566842, |
|
"step": 644 |
|
}, |
|
{ |
|
"epoch": 47.0, |
|
"eval_cer": 0.35781619654231117, |
|
"eval_loss": 1.0925143957138062, |
|
"eval_runtime": 53.2174, |
|
"eval_samples_per_second": 10.185, |
|
"eval_steps_per_second": 1.278, |
|
"eval_wer": 0.9943112555871597, |
|
"step": 658 |
|
}, |
|
{ |
|
"epoch": 48.0, |
|
"eval_cer": 0.3129390354868062, |
|
"eval_loss": 1.023630976676941, |
|
"eval_runtime": 53.2114, |
|
"eval_samples_per_second": 10.186, |
|
"eval_steps_per_second": 1.278, |
|
"eval_wer": 0.8953677366924014, |
|
"step": 672 |
|
}, |
|
{ |
|
"epoch": 49.0, |
|
"eval_cer": 0.26227479526842584, |
|
"eval_loss": 0.9525313377380371, |
|
"eval_runtime": 53.2409, |
|
"eval_samples_per_second": 10.18, |
|
"eval_steps_per_second": 1.277, |
|
"eval_wer": 0.7062169849654611, |
|
"step": 686 |
|
}, |
|
{ |
|
"epoch": 50.0, |
|
"learning_rate": 2.0057142857142858e-05, |
|
"loss": 1.3395, |
|
"step": 700 |
|
}, |
|
{ |
|
"epoch": 50.0, |
|
"eval_cer": 0.22009099181073705, |
|
"eval_loss": 0.8921615481376648, |
|
"eval_runtime": 53.2916, |
|
"eval_samples_per_second": 10.17, |
|
"eval_steps_per_second": 1.276, |
|
"eval_wer": 0.5062982527427875, |
|
"step": 700 |
|
}, |
|
{ |
|
"epoch": 51.0, |
|
"eval_cer": 0.21150136487716106, |
|
"eval_loss": 0.8068466782569885, |
|
"eval_runtime": 53.2081, |
|
"eval_samples_per_second": 10.186, |
|
"eval_steps_per_second": 1.278, |
|
"eval_wer": 0.47744819179195447, |
|
"step": 714 |
|
}, |
|
{ |
|
"epoch": 52.0, |
|
"eval_cer": 0.20764331210191084, |
|
"eval_loss": 0.7931560277938843, |
|
"eval_runtime": 53.422, |
|
"eval_samples_per_second": 10.146, |
|
"eval_steps_per_second": 1.273, |
|
"eval_wer": 0.45530272247054043, |
|
"step": 728 |
|
}, |
|
{ |
|
"epoch": 53.0, |
|
"eval_cer": 0.20658780709736124, |
|
"eval_loss": 0.7725641131401062, |
|
"eval_runtime": 53.3035, |
|
"eval_samples_per_second": 10.168, |
|
"eval_steps_per_second": 1.276, |
|
"eval_wer": 0.4453474197480699, |
|
"step": 742 |
|
}, |
|
{ |
|
"epoch": 54.0, |
|
"eval_cer": 0.2026569608735214, |
|
"eval_loss": 0.755141019821167, |
|
"eval_runtime": 53.6653, |
|
"eval_samples_per_second": 10.1, |
|
"eval_steps_per_second": 1.267, |
|
"eval_wer": 0.4339699309223893, |
|
"step": 756 |
|
}, |
|
{ |
|
"epoch": 55.0, |
|
"eval_cer": 0.20385805277525024, |
|
"eval_loss": 0.7420439720153809, |
|
"eval_runtime": 53.1999, |
|
"eval_samples_per_second": 10.188, |
|
"eval_steps_per_second": 1.278, |
|
"eval_wer": 0.4305160503860219, |
|
"step": 770 |
|
}, |
|
{ |
|
"epoch": 56.0, |
|
"eval_cer": 0.2008371246587807, |
|
"eval_loss": 0.7146174311637878, |
|
"eval_runtime": 53.5808, |
|
"eval_samples_per_second": 10.116, |
|
"eval_steps_per_second": 1.269, |
|
"eval_wer": 0.42117025599349855, |
|
"step": 784 |
|
}, |
|
{ |
|
"epoch": 57.0, |
|
"eval_cer": 0.195705186533212, |
|
"eval_loss": 0.6767785549163818, |
|
"eval_runtime": 53.1793, |
|
"eval_samples_per_second": 10.192, |
|
"eval_steps_per_second": 1.279, |
|
"eval_wer": 0.4095895977245022, |
|
"step": 798 |
|
}, |
|
{ |
|
"epoch": 57.14, |
|
"learning_rate": 1.8628571428571428e-05, |
|
"loss": 0.7419, |
|
"step": 800 |
|
}, |
|
{ |
|
"epoch": 58.0, |
|
"eval_cer": 0.1961783439490446, |
|
"eval_loss": 0.6767465472221375, |
|
"eval_runtime": 53.2804, |
|
"eval_samples_per_second": 10.173, |
|
"eval_steps_per_second": 1.276, |
|
"eval_wer": 0.40796424217797644, |
|
"step": 812 |
|
}, |
|
{ |
|
"epoch": 59.0, |
|
"eval_cer": 0.19712465878070973, |
|
"eval_loss": 0.6708809733390808, |
|
"eval_runtime": 53.3292, |
|
"eval_samples_per_second": 10.163, |
|
"eval_steps_per_second": 1.275, |
|
"eval_wer": 0.4069483949613978, |
|
"step": 826 |
|
}, |
|
{ |
|
"epoch": 60.0, |
|
"eval_cer": 0.19665150136487716, |
|
"eval_loss": 0.6790570020675659, |
|
"eval_runtime": 53.2448, |
|
"eval_samples_per_second": 10.179, |
|
"eval_steps_per_second": 1.277, |
|
"eval_wer": 0.4024786672084518, |
|
"step": 840 |
|
}, |
|
{ |
|
"epoch": 61.0, |
|
"eval_cer": 0.19381255686988172, |
|
"eval_loss": 0.6560342311859131, |
|
"eval_runtime": 53.279, |
|
"eval_samples_per_second": 10.173, |
|
"eval_steps_per_second": 1.276, |
|
"eval_wer": 0.4028850060950833, |
|
"step": 854 |
|
}, |
|
{ |
|
"epoch": 62.0, |
|
"eval_cer": 0.19392174704276616, |
|
"eval_loss": 0.6473817229270935, |
|
"eval_runtime": 53.2557, |
|
"eval_samples_per_second": 10.177, |
|
"eval_steps_per_second": 1.277, |
|
"eval_wer": 0.3976026005688744, |
|
"step": 868 |
|
}, |
|
{ |
|
"epoch": 63.0, |
|
"eval_cer": 0.19414012738853503, |
|
"eval_loss": 0.6583911180496216, |
|
"eval_runtime": 53.2562, |
|
"eval_samples_per_second": 10.177, |
|
"eval_steps_per_second": 1.277, |
|
"eval_wer": 0.39821210889882164, |
|
"step": 882 |
|
}, |
|
{ |
|
"epoch": 64.0, |
|
"eval_cer": 0.19381255686988172, |
|
"eval_loss": 0.6618856191635132, |
|
"eval_runtime": 53.4299, |
|
"eval_samples_per_second": 10.144, |
|
"eval_steps_per_second": 1.273, |
|
"eval_wer": 0.39597724502234866, |
|
"step": 896 |
|
}, |
|
{ |
|
"epoch": 64.29, |
|
"learning_rate": 1.72e-05, |
|
"loss": 0.5254, |
|
"step": 900 |
|
}, |
|
{ |
|
"epoch": 65.0, |
|
"eval_cer": 0.19363057324840766, |
|
"eval_loss": 0.6513723134994507, |
|
"eval_runtime": 53.2194, |
|
"eval_samples_per_second": 10.184, |
|
"eval_steps_per_second": 1.278, |
|
"eval_wer": 0.3923201950426656, |
|
"step": 910 |
|
}, |
|
{ |
|
"epoch": 66.0, |
|
"eval_cer": 0.19148316651501365, |
|
"eval_loss": 0.6362853050231934, |
|
"eval_runtime": 53.25, |
|
"eval_samples_per_second": 10.178, |
|
"eval_steps_per_second": 1.277, |
|
"eval_wer": 0.3874441284030882, |
|
"step": 924 |
|
}, |
|
{ |
|
"epoch": 67.0, |
|
"eval_cer": 0.19002729754322112, |
|
"eval_loss": 0.6173312067985535, |
|
"eval_runtime": 53.2465, |
|
"eval_samples_per_second": 10.179, |
|
"eval_steps_per_second": 1.277, |
|
"eval_wer": 0.3797236895570906, |
|
"step": 938 |
|
}, |
|
{ |
|
"epoch": 68.0, |
|
"eval_cer": 0.19177434030937215, |
|
"eval_loss": 0.6283513307571411, |
|
"eval_runtime": 53.1947, |
|
"eval_samples_per_second": 10.189, |
|
"eval_steps_per_second": 1.278, |
|
"eval_wer": 0.38866314506298255, |
|
"step": 952 |
|
}, |
|
{ |
|
"epoch": 69.0, |
|
"eval_cer": 0.18966333030027296, |
|
"eval_loss": 0.6152955293655396, |
|
"eval_runtime": 53.1902, |
|
"eval_samples_per_second": 10.19, |
|
"eval_steps_per_second": 1.278, |
|
"eval_wer": 0.3766761479073547, |
|
"step": 966 |
|
}, |
|
{ |
|
"epoch": 70.0, |
|
"eval_cer": 0.18787989080982712, |
|
"eval_loss": 0.6083645820617676, |
|
"eval_runtime": 53.1965, |
|
"eval_samples_per_second": 10.189, |
|
"eval_steps_per_second": 1.278, |
|
"eval_wer": 0.37362860625761884, |
|
"step": 980 |
|
}, |
|
{ |
|
"epoch": 71.0, |
|
"eval_cer": 0.1899909008189263, |
|
"eval_loss": 0.6196299195289612, |
|
"eval_runtime": 53.1375, |
|
"eval_samples_per_second": 10.2, |
|
"eval_steps_per_second": 1.28, |
|
"eval_wer": 0.3772856562373019, |
|
"step": 994 |
|
}, |
|
{ |
|
"epoch": 71.43, |
|
"learning_rate": 1.577142857142857e-05, |
|
"loss": 0.4219, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 72.0, |
|
"eval_cer": 0.18988171064604187, |
|
"eval_loss": 0.6074672341346741, |
|
"eval_runtime": 53.2378, |
|
"eval_samples_per_second": 10.181, |
|
"eval_steps_per_second": 1.277, |
|
"eval_wer": 0.3730190979276717, |
|
"step": 1008 |
|
}, |
|
{ |
|
"epoch": 73.0, |
|
"eval_cer": 0.1883894449499545, |
|
"eval_loss": 0.6016885042190552, |
|
"eval_runtime": 53.2097, |
|
"eval_samples_per_second": 10.186, |
|
"eval_steps_per_second": 1.278, |
|
"eval_wer": 0.37119057293783014, |
|
"step": 1022 |
|
}, |
|
{ |
|
"epoch": 74.0, |
|
"eval_cer": 0.18722474977252046, |
|
"eval_loss": 0.5947157740592957, |
|
"eval_runtime": 53.1687, |
|
"eval_samples_per_second": 10.194, |
|
"eval_steps_per_second": 1.279, |
|
"eval_wer": 0.3693620479479886, |
|
"step": 1036 |
|
}, |
|
{ |
|
"epoch": 75.0, |
|
"eval_cer": 0.1889353958143767, |
|
"eval_loss": 0.5974624752998352, |
|
"eval_runtime": 53.2006, |
|
"eval_samples_per_second": 10.188, |
|
"eval_steps_per_second": 1.278, |
|
"eval_wer": 0.3695652173913043, |
|
"step": 1050 |
|
}, |
|
{ |
|
"epoch": 76.0, |
|
"eval_cer": 0.18868061874431302, |
|
"eval_loss": 0.6020309925079346, |
|
"eval_runtime": 53.2351, |
|
"eval_samples_per_second": 10.181, |
|
"eval_steps_per_second": 1.277, |
|
"eval_wer": 0.37281592848435596, |
|
"step": 1064 |
|
}, |
|
{ |
|
"epoch": 77.0, |
|
"eval_cer": 0.1891537761601456, |
|
"eval_loss": 0.5994043946266174, |
|
"eval_runtime": 53.1703, |
|
"eval_samples_per_second": 10.194, |
|
"eval_steps_per_second": 1.279, |
|
"eval_wer": 0.37037789516456726, |
|
"step": 1078 |
|
}, |
|
{ |
|
"epoch": 78.0, |
|
"eval_cer": 0.18773430391264787, |
|
"eval_loss": 0.5821866393089294, |
|
"eval_runtime": 53.6598, |
|
"eval_samples_per_second": 10.101, |
|
"eval_steps_per_second": 1.267, |
|
"eval_wer": 0.3715969118244616, |
|
"step": 1092 |
|
}, |
|
{ |
|
"epoch": 78.57, |
|
"learning_rate": 1.4342857142857143e-05, |
|
"loss": 0.385, |
|
"step": 1100 |
|
}, |
|
{ |
|
"epoch": 79.0, |
|
"eval_cer": 0.18929936305732484, |
|
"eval_loss": 0.6073063015937805, |
|
"eval_runtime": 53.2561, |
|
"eval_samples_per_second": 10.177, |
|
"eval_steps_per_second": 1.277, |
|
"eval_wer": 0.374238114587566, |
|
"step": 1106 |
|
}, |
|
{ |
|
"epoch": 80.0, |
|
"eval_cer": 0.18740673339399455, |
|
"eval_loss": 0.6028934121131897, |
|
"eval_runtime": 53.1886, |
|
"eval_samples_per_second": 10.19, |
|
"eval_steps_per_second": 1.278, |
|
"eval_wer": 0.37281592848435596, |
|
"step": 1120 |
|
}, |
|
{ |
|
"epoch": 81.0, |
|
"eval_cer": 0.18682438580527752, |
|
"eval_loss": 0.5961212515830994, |
|
"eval_runtime": 53.2244, |
|
"eval_samples_per_second": 10.183, |
|
"eval_steps_per_second": 1.278, |
|
"eval_wer": 0.3699715562779358, |
|
"step": 1134 |
|
}, |
|
{ |
|
"epoch": 82.0, |
|
"eval_cer": 0.1870427661510464, |
|
"eval_loss": 0.6032407283782959, |
|
"eval_runtime": 53.2843, |
|
"eval_samples_per_second": 10.172, |
|
"eval_steps_per_second": 1.276, |
|
"eval_wer": 0.37017472572125154, |
|
"step": 1148 |
|
}, |
|
{ |
|
"epoch": 83.0, |
|
"eval_cer": 0.1889353958143767, |
|
"eval_loss": 0.611492395401001, |
|
"eval_runtime": 53.1834, |
|
"eval_samples_per_second": 10.191, |
|
"eval_steps_per_second": 1.279, |
|
"eval_wer": 0.3722064201544088, |
|
"step": 1162 |
|
}, |
|
{ |
|
"epoch": 84.0, |
|
"eval_cer": 0.18831665150136487, |
|
"eval_loss": 0.6018120646476746, |
|
"eval_runtime": 53.2232, |
|
"eval_samples_per_second": 10.184, |
|
"eval_steps_per_second": 1.278, |
|
"eval_wer": 0.36895570906135716, |
|
"step": 1176 |
|
}, |
|
{ |
|
"epoch": 85.0, |
|
"eval_cer": 0.18547770700636942, |
|
"eval_loss": 0.5824325084686279, |
|
"eval_runtime": 53.2981, |
|
"eval_samples_per_second": 10.169, |
|
"eval_steps_per_second": 1.276, |
|
"eval_wer": 0.36651767574156846, |
|
"step": 1190 |
|
}, |
|
{ |
|
"epoch": 85.71, |
|
"learning_rate": 1.2914285714285713e-05, |
|
"loss": 0.3463, |
|
"step": 1200 |
|
}, |
|
{ |
|
"epoch": 86.0, |
|
"eval_cer": 0.18660600545950864, |
|
"eval_loss": 0.5985358953475952, |
|
"eval_runtime": 53.1709, |
|
"eval_samples_per_second": 10.194, |
|
"eval_steps_per_second": 1.279, |
|
"eval_wer": 0.3669240146281999, |
|
"step": 1204 |
|
}, |
|
{ |
|
"epoch": 87.0, |
|
"eval_cer": 0.18609645131938127, |
|
"eval_loss": 0.5833200812339783, |
|
"eval_runtime": 53.1104, |
|
"eval_samples_per_second": 10.205, |
|
"eval_steps_per_second": 1.28, |
|
"eval_wer": 0.3669240146281999, |
|
"step": 1218 |
|
}, |
|
{ |
|
"epoch": 88.0, |
|
"eval_cer": 0.1861692447679709, |
|
"eval_loss": 0.5775151252746582, |
|
"eval_runtime": 53.1027, |
|
"eval_samples_per_second": 10.207, |
|
"eval_steps_per_second": 1.281, |
|
"eval_wer": 0.3636733035351483, |
|
"step": 1232 |
|
}, |
|
{ |
|
"epoch": 89.0, |
|
"eval_cer": 0.18496815286624205, |
|
"eval_loss": 0.5746987462043762, |
|
"eval_runtime": 53.0756, |
|
"eval_samples_per_second": 10.212, |
|
"eval_steps_per_second": 1.281, |
|
"eval_wer": 0.36062576188541245, |
|
"step": 1246 |
|
}, |
|
{ |
|
"epoch": 90.0, |
|
"eval_cer": 0.18507734303912649, |
|
"eval_loss": 0.5784278512001038, |
|
"eval_runtime": 53.0821, |
|
"eval_samples_per_second": 10.211, |
|
"eval_steps_per_second": 1.281, |
|
"eval_wer": 0.36387647297846404, |
|
"step": 1260 |
|
}, |
|
{ |
|
"epoch": 91.0, |
|
"eval_cer": 0.18580527752502274, |
|
"eval_loss": 0.5841168165206909, |
|
"eval_runtime": 53.1168, |
|
"eval_samples_per_second": 10.204, |
|
"eval_steps_per_second": 1.28, |
|
"eval_wer": 0.36042259244209673, |
|
"step": 1274 |
|
}, |
|
{ |
|
"epoch": 92.0, |
|
"eval_cer": 0.18496815286624205, |
|
"eval_loss": 0.5761845707893372, |
|
"eval_runtime": 53.1679, |
|
"eval_samples_per_second": 10.194, |
|
"eval_steps_per_second": 1.279, |
|
"eval_wer": 0.36550182852498986, |
|
"step": 1288 |
|
}, |
|
{ |
|
"epoch": 92.86, |
|
"learning_rate": 1.1485714285714285e-05, |
|
"loss": 0.3237, |
|
"step": 1300 |
|
}, |
|
{ |
|
"epoch": 93.0, |
|
"eval_cer": 0.1854049135577798, |
|
"eval_loss": 0.5835999846458435, |
|
"eval_runtime": 53.1013, |
|
"eval_samples_per_second": 10.207, |
|
"eval_steps_per_second": 1.281, |
|
"eval_wer": 0.3598130841121495, |
|
"step": 1302 |
|
}, |
|
{ |
|
"epoch": 94.0, |
|
"eval_cer": 0.18409463148316652, |
|
"eval_loss": 0.576073408126831, |
|
"eval_runtime": 53.509, |
|
"eval_samples_per_second": 10.129, |
|
"eval_steps_per_second": 1.271, |
|
"eval_wer": 0.3587972368955709, |
|
"step": 1316 |
|
}, |
|
{ |
|
"epoch": 95.0, |
|
"eval_cer": 0.1848225659690628, |
|
"eval_loss": 0.5822096467018127, |
|
"eval_runtime": 53.2494, |
|
"eval_samples_per_second": 10.179, |
|
"eval_steps_per_second": 1.277, |
|
"eval_wer": 0.3596099146688338, |
|
"step": 1330 |
|
}, |
|
{ |
|
"epoch": 96.0, |
|
"eval_cer": 0.18496815286624205, |
|
"eval_loss": 0.5886383652687073, |
|
"eval_runtime": 53.1468, |
|
"eval_samples_per_second": 10.198, |
|
"eval_steps_per_second": 1.279, |
|
"eval_wer": 0.35920357578220236, |
|
"step": 1344 |
|
}, |
|
{ |
|
"epoch": 97.0, |
|
"eval_cer": 0.1830027297543221, |
|
"eval_loss": 0.5695921182632446, |
|
"eval_runtime": 53.2532, |
|
"eval_samples_per_second": 10.178, |
|
"eval_steps_per_second": 1.277, |
|
"eval_wer": 0.3573750507923608, |
|
"step": 1358 |
|
}, |
|
{ |
|
"epoch": 98.0, |
|
"eval_cer": 0.18358507734303914, |
|
"eval_loss": 0.5794330835342407, |
|
"eval_runtime": 53.1395, |
|
"eval_samples_per_second": 10.2, |
|
"eval_steps_per_second": 1.28, |
|
"eval_wer": 0.3587972368955709, |
|
"step": 1372 |
|
}, |
|
{ |
|
"epoch": 99.0, |
|
"eval_cer": 0.18365787079162876, |
|
"eval_loss": 0.5768290758132935, |
|
"eval_runtime": 53.1965, |
|
"eval_samples_per_second": 10.189, |
|
"eval_steps_per_second": 1.278, |
|
"eval_wer": 0.3569687119057294, |
|
"step": 1386 |
|
}, |
|
{ |
|
"epoch": 100.0, |
|
"learning_rate": 1.0057142857142857e-05, |
|
"loss": 0.2799, |
|
"step": 1400 |
|
}, |
|
{ |
|
"epoch": 100.0, |
|
"eval_cer": 0.18442220200181983, |
|
"eval_loss": 0.5836793184280396, |
|
"eval_runtime": 53.2358, |
|
"eval_samples_per_second": 10.181, |
|
"eval_steps_per_second": 1.277, |
|
"eval_wer": 0.35778138967899226, |
|
"step": 1400 |
|
}, |
|
{ |
|
"epoch": 101.0, |
|
"eval_cer": 0.18263876251137398, |
|
"eval_loss": 0.5696985721588135, |
|
"eval_runtime": 53.2164, |
|
"eval_samples_per_second": 10.185, |
|
"eval_steps_per_second": 1.278, |
|
"eval_wer": 0.3524989841527834, |
|
"step": 1414 |
|
}, |
|
{ |
|
"epoch": 102.0, |
|
"eval_cer": 0.18336669699727023, |
|
"eval_loss": 0.5795508027076721, |
|
"eval_runtime": 53.1474, |
|
"eval_samples_per_second": 10.198, |
|
"eval_steps_per_second": 1.279, |
|
"eval_wer": 0.35656237301909793, |
|
"step": 1428 |
|
}, |
|
{ |
|
"epoch": 103.0, |
|
"eval_cer": 0.18249317561419473, |
|
"eval_loss": 0.571198046207428, |
|
"eval_runtime": 53.193, |
|
"eval_samples_per_second": 10.189, |
|
"eval_steps_per_second": 1.278, |
|
"eval_wer": 0.3549370174725721, |
|
"step": 1442 |
|
}, |
|
{ |
|
"epoch": 104.0, |
|
"eval_cer": 0.18289353958143767, |
|
"eval_loss": 0.5795718431472778, |
|
"eval_runtime": 53.0944, |
|
"eval_samples_per_second": 10.208, |
|
"eval_steps_per_second": 1.281, |
|
"eval_wer": 0.3555465258025193, |
|
"step": 1456 |
|
}, |
|
{ |
|
"epoch": 105.0, |
|
"eval_cer": 0.1835122838944495, |
|
"eval_loss": 0.5758859515190125, |
|
"eval_runtime": 53.062, |
|
"eval_samples_per_second": 10.214, |
|
"eval_steps_per_second": 1.282, |
|
"eval_wer": 0.35534335635920355, |
|
"step": 1470 |
|
}, |
|
{ |
|
"epoch": 106.0, |
|
"eval_cer": 0.18307552320291173, |
|
"eval_loss": 0.5749973058700562, |
|
"eval_runtime": 53.2134, |
|
"eval_samples_per_second": 10.185, |
|
"eval_steps_per_second": 1.278, |
|
"eval_wer": 0.3561560341324665, |
|
"step": 1484 |
|
}, |
|
{ |
|
"epoch": 107.0, |
|
"eval_cer": 0.18231119199272067, |
|
"eval_loss": 0.564974844455719, |
|
"eval_runtime": 53.1418, |
|
"eval_samples_per_second": 10.199, |
|
"eval_steps_per_second": 1.28, |
|
"eval_wer": 0.35270215359609913, |
|
"step": 1498 |
|
}, |
|
{ |
|
"epoch": 107.14, |
|
"learning_rate": 8.628571428571429e-06, |
|
"loss": 0.2674, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 108.0, |
|
"eval_cer": 0.18231119199272067, |
|
"eval_loss": 0.5676841139793396, |
|
"eval_runtime": 53.12, |
|
"eval_samples_per_second": 10.203, |
|
"eval_steps_per_second": 1.28, |
|
"eval_wer": 0.349857781389679, |
|
"step": 1512 |
|
}, |
|
{ |
|
"epoch": 109.0, |
|
"eval_cer": 0.18263876251137398, |
|
"eval_loss": 0.5698859691619873, |
|
"eval_runtime": 53.173, |
|
"eval_samples_per_second": 10.193, |
|
"eval_steps_per_second": 1.279, |
|
"eval_wer": 0.35412433969930923, |
|
"step": 1526 |
|
}, |
|
{ |
|
"epoch": 110.0, |
|
"eval_cer": 0.1837306642402184, |
|
"eval_loss": 0.5779122710227966, |
|
"eval_runtime": 53.1485, |
|
"eval_samples_per_second": 10.198, |
|
"eval_steps_per_second": 1.279, |
|
"eval_wer": 0.3555465258025193, |
|
"step": 1540 |
|
}, |
|
{ |
|
"epoch": 111.0, |
|
"eval_cer": 0.18336669699727023, |
|
"eval_loss": 0.5792039036750793, |
|
"eval_runtime": 53.5286, |
|
"eval_samples_per_second": 10.125, |
|
"eval_steps_per_second": 1.27, |
|
"eval_wer": 0.35514018691588783, |
|
"step": 1554 |
|
}, |
|
{ |
|
"epoch": 112.0, |
|
"eval_cer": 0.18289353958143767, |
|
"eval_loss": 0.5696908831596375, |
|
"eval_runtime": 53.1508, |
|
"eval_samples_per_second": 10.197, |
|
"eval_steps_per_second": 1.279, |
|
"eval_wer": 0.3573750507923608, |
|
"step": 1568 |
|
}, |
|
{ |
|
"epoch": 113.0, |
|
"eval_cer": 0.18394904458598726, |
|
"eval_loss": 0.5852411389350891, |
|
"eval_runtime": 53.0856, |
|
"eval_samples_per_second": 10.21, |
|
"eval_steps_per_second": 1.281, |
|
"eval_wer": 0.35900040633888664, |
|
"step": 1582 |
|
}, |
|
{ |
|
"epoch": 114.0, |
|
"eval_cer": 0.18289353958143767, |
|
"eval_loss": 0.5735089778900146, |
|
"eval_runtime": 53.149, |
|
"eval_samples_per_second": 10.198, |
|
"eval_steps_per_second": 1.279, |
|
"eval_wer": 0.3537180008126778, |
|
"step": 1596 |
|
}, |
|
{ |
|
"epoch": 114.29, |
|
"learning_rate": 7.2e-06, |
|
"loss": 0.2611, |
|
"step": 1600 |
|
}, |
|
{ |
|
"epoch": 115.0, |
|
"eval_cer": 0.18318471337579617, |
|
"eval_loss": 0.577383279800415, |
|
"eval_runtime": 53.1629, |
|
"eval_samples_per_second": 10.195, |
|
"eval_steps_per_second": 1.279, |
|
"eval_wer": 0.3545306785859407, |
|
"step": 1610 |
|
}, |
|
{ |
|
"epoch": 116.0, |
|
"eval_cer": 0.1840582347588717, |
|
"eval_loss": 0.5835606455802917, |
|
"eval_runtime": 53.1573, |
|
"eval_samples_per_second": 10.196, |
|
"eval_steps_per_second": 1.279, |
|
"eval_wer": 0.3555465258025193, |
|
"step": 1624 |
|
}, |
|
{ |
|
"epoch": 117.0, |
|
"eval_cer": 0.18322111010009098, |
|
"eval_loss": 0.5749671459197998, |
|
"eval_runtime": 53.1768, |
|
"eval_samples_per_second": 10.192, |
|
"eval_steps_per_second": 1.279, |
|
"eval_wer": 0.35168630637952053, |
|
"step": 1638 |
|
}, |
|
{ |
|
"epoch": 118.0, |
|
"eval_cer": 0.18245677888989992, |
|
"eval_loss": 0.5771631598472595, |
|
"eval_runtime": 53.195, |
|
"eval_samples_per_second": 10.189, |
|
"eval_steps_per_second": 1.278, |
|
"eval_wer": 0.35209264526615197, |
|
"step": 1652 |
|
}, |
|
{ |
|
"epoch": 119.0, |
|
"eval_cer": 0.18307552320291173, |
|
"eval_loss": 0.5793441534042358, |
|
"eval_runtime": 53.2698, |
|
"eval_samples_per_second": 10.175, |
|
"eval_steps_per_second": 1.277, |
|
"eval_wer": 0.35209264526615197, |
|
"step": 1666 |
|
}, |
|
{ |
|
"epoch": 120.0, |
|
"eval_cer": 0.18282074613284804, |
|
"eval_loss": 0.575577974319458, |
|
"eval_runtime": 53.2251, |
|
"eval_samples_per_second": 10.183, |
|
"eval_steps_per_second": 1.278, |
|
"eval_wer": 0.35168630637952053, |
|
"step": 1680 |
|
}, |
|
{ |
|
"epoch": 121.0, |
|
"eval_cer": 0.1830027297543221, |
|
"eval_loss": 0.5794119834899902, |
|
"eval_runtime": 53.1856, |
|
"eval_samples_per_second": 10.191, |
|
"eval_steps_per_second": 1.279, |
|
"eval_wer": 0.35168630637952053, |
|
"step": 1694 |
|
}, |
|
{ |
|
"epoch": 121.43, |
|
"learning_rate": 5.7714285714285715e-06, |
|
"loss": 0.2476, |
|
"step": 1700 |
|
}, |
|
{ |
|
"epoch": 122.0, |
|
"eval_cer": 0.18274795268425842, |
|
"eval_loss": 0.5718653202056885, |
|
"eval_runtime": 53.2426, |
|
"eval_samples_per_second": 10.18, |
|
"eval_steps_per_second": 1.277, |
|
"eval_wer": 0.35209264526615197, |
|
"step": 1708 |
|
}, |
|
{ |
|
"epoch": 123.0, |
|
"eval_cer": 0.1830027297543221, |
|
"eval_loss": 0.5803536772727966, |
|
"eval_runtime": 53.2083, |
|
"eval_samples_per_second": 10.186, |
|
"eval_steps_per_second": 1.278, |
|
"eval_wer": 0.35432750914262495, |
|
"step": 1722 |
|
}, |
|
{ |
|
"epoch": 124.0, |
|
"eval_cer": 0.18249317561419473, |
|
"eval_loss": 0.5728517174720764, |
|
"eval_runtime": 53.1988, |
|
"eval_samples_per_second": 10.188, |
|
"eval_steps_per_second": 1.278, |
|
"eval_wer": 0.3539211702559935, |
|
"step": 1736 |
|
}, |
|
{ |
|
"epoch": 125.0, |
|
"eval_cer": 0.18318471337579617, |
|
"eval_loss": 0.5873575806617737, |
|
"eval_runtime": 53.0805, |
|
"eval_samples_per_second": 10.211, |
|
"eval_steps_per_second": 1.281, |
|
"eval_wer": 0.35188947582283625, |
|
"step": 1750 |
|
}, |
|
{ |
|
"epoch": 126.0, |
|
"eval_cer": 0.18260236578707917, |
|
"eval_loss": 0.5776769518852234, |
|
"eval_runtime": 53.1869, |
|
"eval_samples_per_second": 10.19, |
|
"eval_steps_per_second": 1.279, |
|
"eval_wer": 0.35331166192604635, |
|
"step": 1764 |
|
}, |
|
{ |
|
"epoch": 127.0, |
|
"eval_cer": 0.18223839854413104, |
|
"eval_loss": 0.5761721730232239, |
|
"eval_runtime": 53.4852, |
|
"eval_samples_per_second": 10.134, |
|
"eval_steps_per_second": 1.271, |
|
"eval_wer": 0.3531084924827306, |
|
"step": 1778 |
|
}, |
|
{ |
|
"epoch": 127.0, |
|
"step": 1778, |
|
"total_flos": 1.5870191391607497e+19, |
|
"train_loss": 1.6193932103091606, |
|
"train_runtime": 26266.2725, |
|
"train_samples_per_second": 2.558, |
|
"train_steps_per_second": 0.08 |
|
} |
|
], |
|
"max_steps": 2100, |
|
"num_train_epochs": 150, |
|
"total_flos": 1.5870191391607497e+19, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|