|
{ |
|
"best_metric": 0.556138277053833, |
|
"best_model_checkpoint": "wav2vec2-large-xlsr-coraa-exp-13/checkpoint-1736", |
|
"epoch": 144.0, |
|
"global_step": 2016, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.07, |
|
"learning_rate": 3e-05, |
|
"loss": 38.268, |
|
"step": 1 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"eval_cer": 0.9430027297543221, |
|
"eval_loss": 32.05844497680664, |
|
"eval_runtime": 53.1315, |
|
"eval_samples_per_second": 10.201, |
|
"eval_steps_per_second": 1.28, |
|
"eval_wer": 1.0, |
|
"step": 14 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 10.376302719116211, |
|
"eval_runtime": 52.6044, |
|
"eval_samples_per_second": 10.303, |
|
"eval_steps_per_second": 1.293, |
|
"eval_wer": 1.0, |
|
"step": 28 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 4.8976359367370605, |
|
"eval_runtime": 52.7604, |
|
"eval_samples_per_second": 10.273, |
|
"eval_steps_per_second": 1.289, |
|
"eval_wer": 1.0, |
|
"step": 42 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 4.040638446807861, |
|
"eval_runtime": 53.2305, |
|
"eval_samples_per_second": 10.182, |
|
"eval_steps_per_second": 1.277, |
|
"eval_wer": 1.0, |
|
"step": 56 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.7469818592071533, |
|
"eval_runtime": 52.5947, |
|
"eval_samples_per_second": 10.305, |
|
"eval_steps_per_second": 1.293, |
|
"eval_wer": 1.0, |
|
"step": 70 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.5903122425079346, |
|
"eval_runtime": 52.8025, |
|
"eval_samples_per_second": 10.265, |
|
"eval_steps_per_second": 1.288, |
|
"eval_wer": 1.0, |
|
"step": 84 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.474977493286133, |
|
"eval_runtime": 52.6757, |
|
"eval_samples_per_second": 10.289, |
|
"eval_steps_per_second": 1.291, |
|
"eval_wer": 1.0, |
|
"step": 98 |
|
}, |
|
{ |
|
"epoch": 7.14, |
|
"learning_rate": 2.862857142857143e-05, |
|
"loss": 10.1654, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.3405568599700928, |
|
"eval_runtime": 52.6172, |
|
"eval_samples_per_second": 10.301, |
|
"eval_steps_per_second": 1.292, |
|
"eval_wer": 1.0, |
|
"step": 112 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.226734161376953, |
|
"eval_runtime": 52.664, |
|
"eval_samples_per_second": 10.292, |
|
"eval_steps_per_second": 1.291, |
|
"eval_wer": 1.0, |
|
"step": 126 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.1887271404266357, |
|
"eval_runtime": 52.6591, |
|
"eval_samples_per_second": 10.293, |
|
"eval_steps_per_second": 1.291, |
|
"eval_wer": 1.0, |
|
"step": 140 |
|
}, |
|
{ |
|
"epoch": 11.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.130089521408081, |
|
"eval_runtime": 53.0211, |
|
"eval_samples_per_second": 10.222, |
|
"eval_steps_per_second": 1.283, |
|
"eval_wer": 1.0, |
|
"step": 154 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.1045610904693604, |
|
"eval_runtime": 52.5606, |
|
"eval_samples_per_second": 10.312, |
|
"eval_steps_per_second": 1.294, |
|
"eval_wer": 1.0, |
|
"step": 168 |
|
}, |
|
{ |
|
"epoch": 13.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.090874433517456, |
|
"eval_runtime": 52.5759, |
|
"eval_samples_per_second": 10.309, |
|
"eval_steps_per_second": 1.293, |
|
"eval_wer": 1.0, |
|
"step": 182 |
|
}, |
|
{ |
|
"epoch": 14.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.0602762699127197, |
|
"eval_runtime": 52.7319, |
|
"eval_samples_per_second": 10.278, |
|
"eval_steps_per_second": 1.29, |
|
"eval_wer": 1.0, |
|
"step": 196 |
|
}, |
|
{ |
|
"epoch": 14.29, |
|
"learning_rate": 2.72e-05, |
|
"loss": 3.0823, |
|
"step": 200 |
|
}, |
|
{ |
|
"epoch": 15.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.0584146976470947, |
|
"eval_runtime": 52.6179, |
|
"eval_samples_per_second": 10.301, |
|
"eval_steps_per_second": 1.292, |
|
"eval_wer": 1.0, |
|
"step": 210 |
|
}, |
|
{ |
|
"epoch": 16.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.0485479831695557, |
|
"eval_runtime": 52.7143, |
|
"eval_samples_per_second": 10.282, |
|
"eval_steps_per_second": 1.29, |
|
"eval_wer": 1.0, |
|
"step": 224 |
|
}, |
|
{ |
|
"epoch": 17.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.046433925628662, |
|
"eval_runtime": 52.6205, |
|
"eval_samples_per_second": 10.3, |
|
"eval_steps_per_second": 1.292, |
|
"eval_wer": 1.0, |
|
"step": 238 |
|
}, |
|
{ |
|
"epoch": 18.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.024200916290283, |
|
"eval_runtime": 52.7522, |
|
"eval_samples_per_second": 10.274, |
|
"eval_steps_per_second": 1.289, |
|
"eval_wer": 1.0, |
|
"step": 252 |
|
}, |
|
{ |
|
"epoch": 19.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.0237276554107666, |
|
"eval_runtime": 52.648, |
|
"eval_samples_per_second": 10.295, |
|
"eval_steps_per_second": 1.292, |
|
"eval_wer": 1.0, |
|
"step": 266 |
|
}, |
|
{ |
|
"epoch": 20.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.0304243564605713, |
|
"eval_runtime": 52.7771, |
|
"eval_samples_per_second": 10.27, |
|
"eval_steps_per_second": 1.288, |
|
"eval_wer": 1.0, |
|
"step": 280 |
|
}, |
|
{ |
|
"epoch": 21.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.0118603706359863, |
|
"eval_runtime": 52.6742, |
|
"eval_samples_per_second": 10.29, |
|
"eval_steps_per_second": 1.291, |
|
"eval_wer": 1.0, |
|
"step": 294 |
|
}, |
|
{ |
|
"epoch": 21.43, |
|
"learning_rate": 2.5771428571428574e-05, |
|
"loss": 2.9562, |
|
"step": 300 |
|
}, |
|
{ |
|
"epoch": 22.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.014829158782959, |
|
"eval_runtime": 52.6427, |
|
"eval_samples_per_second": 10.296, |
|
"eval_steps_per_second": 1.292, |
|
"eval_wer": 1.0, |
|
"step": 308 |
|
}, |
|
{ |
|
"epoch": 23.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.0060625076293945, |
|
"eval_runtime": 52.7555, |
|
"eval_samples_per_second": 10.274, |
|
"eval_steps_per_second": 1.289, |
|
"eval_wer": 1.0, |
|
"step": 322 |
|
}, |
|
{ |
|
"epoch": 24.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.0041589736938477, |
|
"eval_runtime": 52.7518, |
|
"eval_samples_per_second": 10.275, |
|
"eval_steps_per_second": 1.289, |
|
"eval_wer": 1.0, |
|
"step": 336 |
|
}, |
|
{ |
|
"epoch": 25.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.003258228302002, |
|
"eval_runtime": 52.9828, |
|
"eval_samples_per_second": 10.23, |
|
"eval_steps_per_second": 1.283, |
|
"eval_wer": 1.0, |
|
"step": 350 |
|
}, |
|
{ |
|
"epoch": 26.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.0028507709503174, |
|
"eval_runtime": 52.639, |
|
"eval_samples_per_second": 10.297, |
|
"eval_steps_per_second": 1.292, |
|
"eval_wer": 1.0, |
|
"step": 364 |
|
}, |
|
{ |
|
"epoch": 27.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.008204460144043, |
|
"eval_runtime": 52.7037, |
|
"eval_samples_per_second": 10.284, |
|
"eval_steps_per_second": 1.29, |
|
"eval_wer": 1.0, |
|
"step": 378 |
|
}, |
|
{ |
|
"epoch": 28.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 2.9955995082855225, |
|
"eval_runtime": 52.6334, |
|
"eval_samples_per_second": 10.298, |
|
"eval_steps_per_second": 1.292, |
|
"eval_wer": 1.0, |
|
"step": 392 |
|
}, |
|
{ |
|
"epoch": 28.57, |
|
"learning_rate": 2.434285714285714e-05, |
|
"loss": 2.9262, |
|
"step": 400 |
|
}, |
|
{ |
|
"epoch": 29.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 2.994765043258667, |
|
"eval_runtime": 52.6138, |
|
"eval_samples_per_second": 10.301, |
|
"eval_steps_per_second": 1.292, |
|
"eval_wer": 1.0, |
|
"step": 406 |
|
}, |
|
{ |
|
"epoch": 30.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 2.998243808746338, |
|
"eval_runtime": 52.831, |
|
"eval_samples_per_second": 10.259, |
|
"eval_steps_per_second": 1.287, |
|
"eval_wer": 1.0, |
|
"step": 420 |
|
}, |
|
{ |
|
"epoch": 31.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 2.996180295944214, |
|
"eval_runtime": 52.6837, |
|
"eval_samples_per_second": 10.288, |
|
"eval_steps_per_second": 1.291, |
|
"eval_wer": 1.0, |
|
"step": 434 |
|
}, |
|
{ |
|
"epoch": 32.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 2.9930543899536133, |
|
"eval_runtime": 53.1611, |
|
"eval_samples_per_second": 10.195, |
|
"eval_steps_per_second": 1.279, |
|
"eval_wer": 1.0, |
|
"step": 448 |
|
}, |
|
{ |
|
"epoch": 33.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 2.9809184074401855, |
|
"eval_runtime": 52.778, |
|
"eval_samples_per_second": 10.269, |
|
"eval_steps_per_second": 1.288, |
|
"eval_wer": 1.0, |
|
"step": 462 |
|
}, |
|
{ |
|
"epoch": 34.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 2.980422019958496, |
|
"eval_runtime": 52.6744, |
|
"eval_samples_per_second": 10.29, |
|
"eval_steps_per_second": 1.291, |
|
"eval_wer": 1.0, |
|
"step": 476 |
|
}, |
|
{ |
|
"epoch": 35.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 2.9742188453674316, |
|
"eval_runtime": 52.6886, |
|
"eval_samples_per_second": 10.287, |
|
"eval_steps_per_second": 1.291, |
|
"eval_wer": 1.0, |
|
"step": 490 |
|
}, |
|
{ |
|
"epoch": 35.71, |
|
"learning_rate": 2.2914285714285714e-05, |
|
"loss": 2.9125, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 36.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 2.95219349861145, |
|
"eval_runtime": 52.7664, |
|
"eval_samples_per_second": 10.272, |
|
"eval_steps_per_second": 1.289, |
|
"eval_wer": 1.0, |
|
"step": 504 |
|
}, |
|
{ |
|
"epoch": 37.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 2.9014649391174316, |
|
"eval_runtime": 52.6811, |
|
"eval_samples_per_second": 10.288, |
|
"eval_steps_per_second": 1.291, |
|
"eval_wer": 1.0, |
|
"step": 518 |
|
}, |
|
{ |
|
"epoch": 38.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 2.852219581604004, |
|
"eval_runtime": 52.7271, |
|
"eval_samples_per_second": 10.279, |
|
"eval_steps_per_second": 1.29, |
|
"eval_wer": 1.0, |
|
"step": 532 |
|
}, |
|
{ |
|
"epoch": 39.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 2.828482151031494, |
|
"eval_runtime": 52.6182, |
|
"eval_samples_per_second": 10.301, |
|
"eval_steps_per_second": 1.292, |
|
"eval_wer": 1.0, |
|
"step": 546 |
|
}, |
|
{ |
|
"epoch": 40.0, |
|
"eval_cer": 0.9614558689717926, |
|
"eval_loss": 2.729363441467285, |
|
"eval_runtime": 52.6938, |
|
"eval_samples_per_second": 10.286, |
|
"eval_steps_per_second": 1.29, |
|
"eval_wer": 1.0, |
|
"step": 560 |
|
}, |
|
{ |
|
"epoch": 41.0, |
|
"eval_cer": 0.9605095541401274, |
|
"eval_loss": 2.6491127014160156, |
|
"eval_runtime": 53.1167, |
|
"eval_samples_per_second": 10.204, |
|
"eval_steps_per_second": 1.28, |
|
"eval_wer": 1.0, |
|
"step": 574 |
|
}, |
|
{ |
|
"epoch": 42.0, |
|
"eval_cer": 0.8949590536851684, |
|
"eval_loss": 2.4882705211639404, |
|
"eval_runtime": 52.7981, |
|
"eval_samples_per_second": 10.266, |
|
"eval_steps_per_second": 1.288, |
|
"eval_wer": 1.0, |
|
"step": 588 |
|
}, |
|
{ |
|
"epoch": 42.86, |
|
"learning_rate": 2.1485714285714284e-05, |
|
"loss": 2.7205, |
|
"step": 600 |
|
}, |
|
{ |
|
"epoch": 43.0, |
|
"eval_cer": 0.836505914467698, |
|
"eval_loss": 2.3630661964416504, |
|
"eval_runtime": 52.7032, |
|
"eval_samples_per_second": 10.284, |
|
"eval_steps_per_second": 1.29, |
|
"eval_wer": 1.0, |
|
"step": 602 |
|
}, |
|
{ |
|
"epoch": 44.0, |
|
"eval_cer": 0.607424931756142, |
|
"eval_loss": 2.054628610610962, |
|
"eval_runtime": 52.7506, |
|
"eval_samples_per_second": 10.275, |
|
"eval_steps_per_second": 1.289, |
|
"eval_wer": 1.0, |
|
"step": 616 |
|
}, |
|
{ |
|
"epoch": 45.0, |
|
"eval_cer": 0.5147952684258417, |
|
"eval_loss": 1.7867237329483032, |
|
"eval_runtime": 53.2436, |
|
"eval_samples_per_second": 10.18, |
|
"eval_steps_per_second": 1.277, |
|
"eval_wer": 1.0, |
|
"step": 630 |
|
}, |
|
{ |
|
"epoch": 46.0, |
|
"eval_cer": 0.4532120109190173, |
|
"eval_loss": 1.5452687740325928, |
|
"eval_runtime": 52.8784, |
|
"eval_samples_per_second": 10.25, |
|
"eval_steps_per_second": 1.286, |
|
"eval_wer": 1.0, |
|
"step": 644 |
|
}, |
|
{ |
|
"epoch": 47.0, |
|
"eval_cer": 0.40640582347588716, |
|
"eval_loss": 1.3553940057754517, |
|
"eval_runtime": 52.7768, |
|
"eval_samples_per_second": 10.27, |
|
"eval_steps_per_second": 1.288, |
|
"eval_wer": 0.9989841527834213, |
|
"step": 658 |
|
}, |
|
{ |
|
"epoch": 48.0, |
|
"eval_cer": 0.3669881710646042, |
|
"eval_loss": 1.201612114906311, |
|
"eval_runtime": 52.8752, |
|
"eval_samples_per_second": 10.251, |
|
"eval_steps_per_second": 1.286, |
|
"eval_wer": 0.982933766761479, |
|
"step": 672 |
|
}, |
|
{ |
|
"epoch": 49.0, |
|
"eval_cer": 0.3167242948134668, |
|
"eval_loss": 1.0777251720428467, |
|
"eval_runtime": 52.8059, |
|
"eval_samples_per_second": 10.264, |
|
"eval_steps_per_second": 1.288, |
|
"eval_wer": 0.8805363673303536, |
|
"step": 686 |
|
}, |
|
{ |
|
"epoch": 50.0, |
|
"learning_rate": 2.0057142857142858e-05, |
|
"loss": 1.6469, |
|
"step": 700 |
|
}, |
|
{ |
|
"epoch": 50.0, |
|
"eval_cer": 0.2594358507734304, |
|
"eval_loss": 0.978954017162323, |
|
"eval_runtime": 52.919, |
|
"eval_samples_per_second": 10.242, |
|
"eval_steps_per_second": 1.285, |
|
"eval_wer": 0.7029662738724096, |
|
"step": 700 |
|
}, |
|
{ |
|
"epoch": 51.0, |
|
"eval_cer": 0.22238398544131027, |
|
"eval_loss": 0.8961830735206604, |
|
"eval_runtime": 52.8398, |
|
"eval_samples_per_second": 10.257, |
|
"eval_steps_per_second": 1.287, |
|
"eval_wer": 0.5270215359609914, |
|
"step": 714 |
|
}, |
|
{ |
|
"epoch": 52.0, |
|
"eval_cer": 0.21757961783439492, |
|
"eval_loss": 0.8428747653961182, |
|
"eval_runtime": 52.8781, |
|
"eval_samples_per_second": 10.25, |
|
"eval_steps_per_second": 1.286, |
|
"eval_wer": 0.4973587972368956, |
|
"step": 728 |
|
}, |
|
{ |
|
"epoch": 53.0, |
|
"eval_cer": 0.2089171974522293, |
|
"eval_loss": 0.8158747553825378, |
|
"eval_runtime": 53.3812, |
|
"eval_samples_per_second": 10.153, |
|
"eval_steps_per_second": 1.274, |
|
"eval_wer": 0.4658675335229581, |
|
"step": 742 |
|
}, |
|
{ |
|
"epoch": 54.0, |
|
"eval_cer": 0.20658780709736124, |
|
"eval_loss": 0.7980368137359619, |
|
"eval_runtime": 52.8695, |
|
"eval_samples_per_second": 10.252, |
|
"eval_steps_per_second": 1.286, |
|
"eval_wer": 0.4512393336042259, |
|
"step": 756 |
|
}, |
|
{ |
|
"epoch": 55.0, |
|
"eval_cer": 0.20440400363967243, |
|
"eval_loss": 0.7540920376777649, |
|
"eval_runtime": 52.8272, |
|
"eval_samples_per_second": 10.26, |
|
"eval_steps_per_second": 1.287, |
|
"eval_wer": 0.4441284030881755, |
|
"step": 770 |
|
}, |
|
{ |
|
"epoch": 56.0, |
|
"eval_cer": 0.20152866242038217, |
|
"eval_loss": 0.7299144864082336, |
|
"eval_runtime": 52.846, |
|
"eval_samples_per_second": 10.256, |
|
"eval_steps_per_second": 1.287, |
|
"eval_wer": 0.42726533929297034, |
|
"step": 784 |
|
}, |
|
{ |
|
"epoch": 57.0, |
|
"eval_cer": 0.1964331210191083, |
|
"eval_loss": 0.7077798843383789, |
|
"eval_runtime": 52.7856, |
|
"eval_samples_per_second": 10.268, |
|
"eval_steps_per_second": 1.288, |
|
"eval_wer": 0.40918325883787077, |
|
"step": 798 |
|
}, |
|
{ |
|
"epoch": 57.14, |
|
"learning_rate": 1.8628571428571428e-05, |
|
"loss": 0.7997, |
|
"step": 800 |
|
}, |
|
{ |
|
"epoch": 58.0, |
|
"eval_cer": 0.1973430391264786, |
|
"eval_loss": 0.7078654170036316, |
|
"eval_runtime": 52.7848, |
|
"eval_samples_per_second": 10.268, |
|
"eval_steps_per_second": 1.288, |
|
"eval_wer": 0.4110117838277123, |
|
"step": 812 |
|
}, |
|
{ |
|
"epoch": 59.0, |
|
"eval_cer": 0.19832575068243857, |
|
"eval_loss": 0.6861252784729004, |
|
"eval_runtime": 52.8203, |
|
"eval_samples_per_second": 10.261, |
|
"eval_steps_per_second": 1.287, |
|
"eval_wer": 0.41365298659081673, |
|
"step": 826 |
|
}, |
|
{ |
|
"epoch": 60.0, |
|
"eval_cer": 0.1975250227479527, |
|
"eval_loss": 0.7035004496574402, |
|
"eval_runtime": 53.0259, |
|
"eval_samples_per_second": 10.221, |
|
"eval_steps_per_second": 1.282, |
|
"eval_wer": 0.4010564811052418, |
|
"step": 840 |
|
}, |
|
{ |
|
"epoch": 61.0, |
|
"eval_cer": 0.19417652411282985, |
|
"eval_loss": 0.6675873398780823, |
|
"eval_runtime": 52.839, |
|
"eval_samples_per_second": 10.258, |
|
"eval_steps_per_second": 1.287, |
|
"eval_wer": 0.4000406338886631, |
|
"step": 854 |
|
}, |
|
{ |
|
"epoch": 62.0, |
|
"eval_cer": 0.19366696997270247, |
|
"eval_loss": 0.6562079787254333, |
|
"eval_runtime": 52.8072, |
|
"eval_samples_per_second": 10.264, |
|
"eval_steps_per_second": 1.288, |
|
"eval_wer": 0.3980089394555059, |
|
"step": 868 |
|
}, |
|
{ |
|
"epoch": 63.0, |
|
"eval_cer": 0.1910828025477707, |
|
"eval_loss": 0.6579793691635132, |
|
"eval_runtime": 52.8351, |
|
"eval_samples_per_second": 10.258, |
|
"eval_steps_per_second": 1.287, |
|
"eval_wer": 0.38500609508329947, |
|
"step": 882 |
|
}, |
|
{ |
|
"epoch": 64.0, |
|
"eval_cer": 0.19253867151956325, |
|
"eval_loss": 0.6642553806304932, |
|
"eval_runtime": 52.8162, |
|
"eval_samples_per_second": 10.262, |
|
"eval_steps_per_second": 1.287, |
|
"eval_wer": 0.39110117838277125, |
|
"step": 896 |
|
}, |
|
{ |
|
"epoch": 64.29, |
|
"learning_rate": 1.72e-05, |
|
"loss": 0.5379, |
|
"step": 900 |
|
}, |
|
{ |
|
"epoch": 65.0, |
|
"eval_cer": 0.19282984531392175, |
|
"eval_loss": 0.6532391309738159, |
|
"eval_runtime": 52.87, |
|
"eval_samples_per_second": 10.252, |
|
"eval_steps_per_second": 1.286, |
|
"eval_wer": 0.39292970337261274, |
|
"step": 910 |
|
}, |
|
{ |
|
"epoch": 66.0, |
|
"eval_cer": 0.19064604185623293, |
|
"eval_loss": 0.6483404040336609, |
|
"eval_runtime": 52.7892, |
|
"eval_samples_per_second": 10.267, |
|
"eval_steps_per_second": 1.288, |
|
"eval_wer": 0.3866314506298253, |
|
"step": 924 |
|
}, |
|
{ |
|
"epoch": 67.0, |
|
"eval_cer": 0.18696997270245677, |
|
"eval_loss": 0.6266820430755615, |
|
"eval_runtime": 53.3837, |
|
"eval_samples_per_second": 10.153, |
|
"eval_steps_per_second": 1.274, |
|
"eval_wer": 0.3756603006907761, |
|
"step": 938 |
|
}, |
|
{ |
|
"epoch": 68.0, |
|
"eval_cer": 0.18798908098271155, |
|
"eval_loss": 0.6296297907829285, |
|
"eval_runtime": 52.8207, |
|
"eval_samples_per_second": 10.261, |
|
"eval_steps_per_second": 1.287, |
|
"eval_wer": 0.3793173506704592, |
|
"step": 952 |
|
}, |
|
{ |
|
"epoch": 69.0, |
|
"eval_cer": 0.19020928116469518, |
|
"eval_loss": 0.6414676904678345, |
|
"eval_runtime": 52.8153, |
|
"eval_samples_per_second": 10.262, |
|
"eval_steps_per_second": 1.288, |
|
"eval_wer": 0.37850467289719625, |
|
"step": 966 |
|
}, |
|
{ |
|
"epoch": 70.0, |
|
"eval_cer": 0.18846223839854412, |
|
"eval_loss": 0.6227236986160278, |
|
"eval_runtime": 52.8625, |
|
"eval_samples_per_second": 10.253, |
|
"eval_steps_per_second": 1.286, |
|
"eval_wer": 0.3746444534741975, |
|
"step": 980 |
|
}, |
|
{ |
|
"epoch": 71.0, |
|
"eval_cer": 0.1878434940855323, |
|
"eval_loss": 0.6213016510009766, |
|
"eval_runtime": 52.7591, |
|
"eval_samples_per_second": 10.273, |
|
"eval_steps_per_second": 1.289, |
|
"eval_wer": 0.37383177570093457, |
|
"step": 994 |
|
}, |
|
{ |
|
"epoch": 71.43, |
|
"learning_rate": 1.577142857142857e-05, |
|
"loss": 0.4372, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 72.0, |
|
"eval_cer": 0.18718835304822565, |
|
"eval_loss": 0.6110479831695557, |
|
"eval_runtime": 52.7876, |
|
"eval_samples_per_second": 10.268, |
|
"eval_steps_per_second": 1.288, |
|
"eval_wer": 0.37261275904104024, |
|
"step": 1008 |
|
}, |
|
{ |
|
"epoch": 73.0, |
|
"eval_cer": 0.1861692447679709, |
|
"eval_loss": 0.6018897294998169, |
|
"eval_runtime": 52.8613, |
|
"eval_samples_per_second": 10.253, |
|
"eval_steps_per_second": 1.286, |
|
"eval_wer": 0.3695652173913043, |
|
"step": 1022 |
|
}, |
|
{ |
|
"epoch": 74.0, |
|
"eval_cer": 0.18671519563239308, |
|
"eval_loss": 0.6036959290504456, |
|
"eval_runtime": 53.2023, |
|
"eval_samples_per_second": 10.188, |
|
"eval_steps_per_second": 1.278, |
|
"eval_wer": 0.3722064201544088, |
|
"step": 1036 |
|
}, |
|
{ |
|
"epoch": 75.0, |
|
"eval_cer": 0.188098271155596, |
|
"eval_loss": 0.5993600487709045, |
|
"eval_runtime": 52.8215, |
|
"eval_samples_per_second": 10.261, |
|
"eval_steps_per_second": 1.287, |
|
"eval_wer": 0.3657049979683056, |
|
"step": 1050 |
|
}, |
|
{ |
|
"epoch": 76.0, |
|
"eval_cer": 0.18806187443130118, |
|
"eval_loss": 0.6083250641822815, |
|
"eval_runtime": 52.971, |
|
"eval_samples_per_second": 10.232, |
|
"eval_steps_per_second": 1.284, |
|
"eval_wer": 0.37037789516456726, |
|
"step": 1064 |
|
}, |
|
{ |
|
"epoch": 77.0, |
|
"eval_cer": 0.1864968152866242, |
|
"eval_loss": 0.5837586522102356, |
|
"eval_runtime": 53.4695, |
|
"eval_samples_per_second": 10.137, |
|
"eval_steps_per_second": 1.272, |
|
"eval_wer": 0.3695652173913043, |
|
"step": 1078 |
|
}, |
|
{ |
|
"epoch": 78.0, |
|
"eval_cer": 0.18547770700636942, |
|
"eval_loss": 0.5794845819473267, |
|
"eval_runtime": 52.8335, |
|
"eval_samples_per_second": 10.259, |
|
"eval_steps_per_second": 1.287, |
|
"eval_wer": 0.3718000812677773, |
|
"step": 1092 |
|
}, |
|
{ |
|
"epoch": 78.57, |
|
"learning_rate": 1.4342857142857143e-05, |
|
"loss": 0.3912, |
|
"step": 1100 |
|
}, |
|
{ |
|
"epoch": 79.0, |
|
"eval_cer": 0.18773430391264787, |
|
"eval_loss": 0.6201197504997253, |
|
"eval_runtime": 52.909, |
|
"eval_samples_per_second": 10.244, |
|
"eval_steps_per_second": 1.285, |
|
"eval_wer": 0.37139374238114586, |
|
"step": 1106 |
|
}, |
|
{ |
|
"epoch": 80.0, |
|
"eval_cer": 0.1854413102820746, |
|
"eval_loss": 0.5914958715438843, |
|
"eval_runtime": 52.8551, |
|
"eval_samples_per_second": 10.254, |
|
"eval_steps_per_second": 1.287, |
|
"eval_wer": 0.366111336854937, |
|
"step": 1120 |
|
}, |
|
{ |
|
"epoch": 81.0, |
|
"eval_cer": 0.18427661510464058, |
|
"eval_loss": 0.5893952250480652, |
|
"eval_runtime": 52.9037, |
|
"eval_samples_per_second": 10.245, |
|
"eval_steps_per_second": 1.285, |
|
"eval_wer": 0.3650954896383584, |
|
"step": 1134 |
|
}, |
|
{ |
|
"epoch": 82.0, |
|
"eval_cer": 0.18591446769790718, |
|
"eval_loss": 0.5993715524673462, |
|
"eval_runtime": 52.7967, |
|
"eval_samples_per_second": 10.266, |
|
"eval_steps_per_second": 1.288, |
|
"eval_wer": 0.3681430312880943, |
|
"step": 1148 |
|
}, |
|
{ |
|
"epoch": 83.0, |
|
"eval_cer": 0.18642402183803458, |
|
"eval_loss": 0.6001280546188354, |
|
"eval_runtime": 52.869, |
|
"eval_samples_per_second": 10.252, |
|
"eval_steps_per_second": 1.286, |
|
"eval_wer": 0.36550182852498986, |
|
"step": 1162 |
|
}, |
|
{ |
|
"epoch": 84.0, |
|
"eval_cer": 0.1864968152866242, |
|
"eval_loss": 0.6007617115974426, |
|
"eval_runtime": 52.8415, |
|
"eval_samples_per_second": 10.257, |
|
"eval_steps_per_second": 1.287, |
|
"eval_wer": 0.36529865908167414, |
|
"step": 1176 |
|
}, |
|
{ |
|
"epoch": 85.0, |
|
"eval_cer": 0.18322111010009098, |
|
"eval_loss": 0.5769873857498169, |
|
"eval_runtime": 52.8264, |
|
"eval_samples_per_second": 10.26, |
|
"eval_steps_per_second": 1.287, |
|
"eval_wer": 0.36021942299878096, |
|
"step": 1190 |
|
}, |
|
{ |
|
"epoch": 85.71, |
|
"learning_rate": 1.2914285714285713e-05, |
|
"loss": 0.3485, |
|
"step": 1200 |
|
}, |
|
{ |
|
"epoch": 86.0, |
|
"eval_cer": 0.18358507734303914, |
|
"eval_loss": 0.5905404686927795, |
|
"eval_runtime": 52.731, |
|
"eval_samples_per_second": 10.279, |
|
"eval_steps_per_second": 1.29, |
|
"eval_wer": 0.35656237301909793, |
|
"step": 1204 |
|
}, |
|
{ |
|
"epoch": 87.0, |
|
"eval_cer": 0.18278434940855323, |
|
"eval_loss": 0.5810394287109375, |
|
"eval_runtime": 52.802, |
|
"eval_samples_per_second": 10.265, |
|
"eval_steps_per_second": 1.288, |
|
"eval_wer": 0.35798455912230803, |
|
"step": 1218 |
|
}, |
|
{ |
|
"epoch": 88.0, |
|
"eval_cer": 0.1829663330300273, |
|
"eval_loss": 0.5765053033828735, |
|
"eval_runtime": 53.0488, |
|
"eval_samples_per_second": 10.217, |
|
"eval_steps_per_second": 1.282, |
|
"eval_wer": 0.3583908980089395, |
|
"step": 1232 |
|
}, |
|
{ |
|
"epoch": 89.0, |
|
"eval_cer": 0.18453139217470427, |
|
"eval_loss": 0.5901545286178589, |
|
"eval_runtime": 52.796, |
|
"eval_samples_per_second": 10.266, |
|
"eval_steps_per_second": 1.288, |
|
"eval_wer": 0.36407964242177976, |
|
"step": 1246 |
|
}, |
|
{ |
|
"epoch": 90.0, |
|
"eval_cer": 0.18307552320291173, |
|
"eval_loss": 0.581239640712738, |
|
"eval_runtime": 52.8224, |
|
"eval_samples_per_second": 10.261, |
|
"eval_steps_per_second": 1.287, |
|
"eval_wer": 0.36143843965867534, |
|
"step": 1260 |
|
}, |
|
{ |
|
"epoch": 91.0, |
|
"eval_cer": 0.18438580527752502, |
|
"eval_loss": 0.5965577960014343, |
|
"eval_runtime": 52.9107, |
|
"eval_samples_per_second": 10.244, |
|
"eval_steps_per_second": 1.285, |
|
"eval_wer": 0.3585940674522552, |
|
"step": 1274 |
|
}, |
|
{ |
|
"epoch": 92.0, |
|
"eval_cer": 0.18223839854413104, |
|
"eval_loss": 0.5686241388320923, |
|
"eval_runtime": 53.3712, |
|
"eval_samples_per_second": 10.155, |
|
"eval_steps_per_second": 1.274, |
|
"eval_wer": 0.35574969524583505, |
|
"step": 1288 |
|
}, |
|
{ |
|
"epoch": 92.86, |
|
"learning_rate": 1.1485714285714285e-05, |
|
"loss": 0.3234, |
|
"step": 1300 |
|
}, |
|
{ |
|
"epoch": 93.0, |
|
"eval_cer": 0.18282074613284804, |
|
"eval_loss": 0.5839269161224365, |
|
"eval_runtime": 52.8855, |
|
"eval_samples_per_second": 10.249, |
|
"eval_steps_per_second": 1.286, |
|
"eval_wer": 0.35534335635920355, |
|
"step": 1302 |
|
}, |
|
{ |
|
"epoch": 94.0, |
|
"eval_cer": 0.18198362147406733, |
|
"eval_loss": 0.5765420198440552, |
|
"eval_runtime": 52.892, |
|
"eval_samples_per_second": 10.247, |
|
"eval_steps_per_second": 1.286, |
|
"eval_wer": 0.35534335635920355, |
|
"step": 1316 |
|
}, |
|
{ |
|
"epoch": 95.0, |
|
"eval_cer": 0.18202001819836214, |
|
"eval_loss": 0.5779678225517273, |
|
"eval_runtime": 52.8619, |
|
"eval_samples_per_second": 10.253, |
|
"eval_steps_per_second": 1.286, |
|
"eval_wer": 0.35656237301909793, |
|
"step": 1330 |
|
}, |
|
{ |
|
"epoch": 96.0, |
|
"eval_cer": 0.18343949044585986, |
|
"eval_loss": 0.5862200260162354, |
|
"eval_runtime": 52.9527, |
|
"eval_samples_per_second": 10.236, |
|
"eval_steps_per_second": 1.284, |
|
"eval_wer": 0.3596099146688338, |
|
"step": 1344 |
|
}, |
|
{ |
|
"epoch": 97.0, |
|
"eval_cer": 0.18209281164695176, |
|
"eval_loss": 0.5701762437820435, |
|
"eval_runtime": 52.8493, |
|
"eval_samples_per_second": 10.256, |
|
"eval_steps_per_second": 1.287, |
|
"eval_wer": 0.3555465258025193, |
|
"step": 1358 |
|
}, |
|
{ |
|
"epoch": 98.0, |
|
"eval_cer": 0.18205641492265695, |
|
"eval_loss": 0.5787171721458435, |
|
"eval_runtime": 52.8738, |
|
"eval_samples_per_second": 10.251, |
|
"eval_steps_per_second": 1.286, |
|
"eval_wer": 0.3547338480292564, |
|
"step": 1372 |
|
}, |
|
{ |
|
"epoch": 99.0, |
|
"eval_cer": 0.1823839854413103, |
|
"eval_loss": 0.5766745209693909, |
|
"eval_runtime": 52.9499, |
|
"eval_samples_per_second": 10.236, |
|
"eval_steps_per_second": 1.284, |
|
"eval_wer": 0.3531084924827306, |
|
"step": 1386 |
|
}, |
|
{ |
|
"epoch": 100.0, |
|
"learning_rate": 1.0057142857142857e-05, |
|
"loss": 0.2803, |
|
"step": 1400 |
|
}, |
|
{ |
|
"epoch": 100.0, |
|
"eval_cer": 0.18183803457688807, |
|
"eval_loss": 0.5778467655181885, |
|
"eval_runtime": 53.096, |
|
"eval_samples_per_second": 10.208, |
|
"eval_steps_per_second": 1.281, |
|
"eval_wer": 0.3569687119057294, |
|
"step": 1400 |
|
}, |
|
{ |
|
"epoch": 101.0, |
|
"eval_cer": 0.18172884440400364, |
|
"eval_loss": 0.5759402513504028, |
|
"eval_runtime": 53.4646, |
|
"eval_samples_per_second": 10.138, |
|
"eval_steps_per_second": 1.272, |
|
"eval_wer": 0.35432750914262495, |
|
"step": 1414 |
|
}, |
|
{ |
|
"epoch": 102.0, |
|
"eval_cer": 0.1823839854413103, |
|
"eval_loss": 0.5838054418563843, |
|
"eval_runtime": 53.0092, |
|
"eval_samples_per_second": 10.225, |
|
"eval_steps_per_second": 1.283, |
|
"eval_wer": 0.3571718813490451, |
|
"step": 1428 |
|
}, |
|
{ |
|
"epoch": 103.0, |
|
"eval_cer": 0.18154686078252957, |
|
"eval_loss": 0.569597065448761, |
|
"eval_runtime": 53.1914, |
|
"eval_samples_per_second": 10.19, |
|
"eval_steps_per_second": 1.278, |
|
"eval_wer": 0.35412433969930923, |
|
"step": 1442 |
|
}, |
|
{ |
|
"epoch": 104.0, |
|
"eval_cer": 0.18202001819836214, |
|
"eval_loss": 0.5723647475242615, |
|
"eval_runtime": 52.9421, |
|
"eval_samples_per_second": 10.238, |
|
"eval_steps_per_second": 1.284, |
|
"eval_wer": 0.35412433969930923, |
|
"step": 1456 |
|
}, |
|
{ |
|
"epoch": 105.0, |
|
"eval_cer": 0.18202001819836214, |
|
"eval_loss": 0.5698366165161133, |
|
"eval_runtime": 53.0166, |
|
"eval_samples_per_second": 10.223, |
|
"eval_steps_per_second": 1.283, |
|
"eval_wer": 0.35432750914262495, |
|
"step": 1470 |
|
}, |
|
{ |
|
"epoch": 106.0, |
|
"eval_cer": 0.1816196542311192, |
|
"eval_loss": 0.5727118253707886, |
|
"eval_runtime": 52.9397, |
|
"eval_samples_per_second": 10.238, |
|
"eval_steps_per_second": 1.284, |
|
"eval_wer": 0.3522958147094677, |
|
"step": 1484 |
|
}, |
|
{ |
|
"epoch": 107.0, |
|
"eval_cer": 0.1808553230209281, |
|
"eval_loss": 0.5609294176101685, |
|
"eval_runtime": 53.3257, |
|
"eval_samples_per_second": 10.164, |
|
"eval_steps_per_second": 1.275, |
|
"eval_wer": 0.35107679804957337, |
|
"step": 1498 |
|
}, |
|
{ |
|
"epoch": 107.14, |
|
"learning_rate": 8.628571428571429e-06, |
|
"loss": 0.2718, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 108.0, |
|
"eval_cer": 0.18070973612374885, |
|
"eval_loss": 0.5654597282409668, |
|
"eval_runtime": 52.8748, |
|
"eval_samples_per_second": 10.251, |
|
"eval_steps_per_second": 1.286, |
|
"eval_wer": 0.34965461194636327, |
|
"step": 1512 |
|
}, |
|
{ |
|
"epoch": 109.0, |
|
"eval_cer": 0.18158325750682439, |
|
"eval_loss": 0.5761396884918213, |
|
"eval_runtime": 52.7804, |
|
"eval_samples_per_second": 10.269, |
|
"eval_steps_per_second": 1.288, |
|
"eval_wer": 0.35351483136936207, |
|
"step": 1526 |
|
}, |
|
{ |
|
"epoch": 110.0, |
|
"eval_cer": 0.18147406733393995, |
|
"eval_loss": 0.5753419995307922, |
|
"eval_runtime": 52.7887, |
|
"eval_samples_per_second": 10.267, |
|
"eval_steps_per_second": 1.288, |
|
"eval_wer": 0.3522958147094677, |
|
"step": 1540 |
|
}, |
|
{ |
|
"epoch": 111.0, |
|
"eval_cer": 0.18049135577797998, |
|
"eval_loss": 0.5703160762786865, |
|
"eval_runtime": 52.7573, |
|
"eval_samples_per_second": 10.273, |
|
"eval_steps_per_second": 1.289, |
|
"eval_wer": 0.35026412027631043, |
|
"step": 1554 |
|
}, |
|
{ |
|
"epoch": 112.0, |
|
"eval_cer": 0.18020018198362148, |
|
"eval_loss": 0.5622747540473938, |
|
"eval_runtime": 52.7621, |
|
"eval_samples_per_second": 10.273, |
|
"eval_steps_per_second": 1.289, |
|
"eval_wer": 0.34701340918325885, |
|
"step": 1568 |
|
}, |
|
{ |
|
"epoch": 113.0, |
|
"eval_cer": 0.18129208371246588, |
|
"eval_loss": 0.5722905993461609, |
|
"eval_runtime": 52.84, |
|
"eval_samples_per_second": 10.257, |
|
"eval_steps_per_second": 1.287, |
|
"eval_wer": 0.35107679804957337, |
|
"step": 1582 |
|
}, |
|
{ |
|
"epoch": 114.0, |
|
"eval_cer": 0.18030937215650591, |
|
"eval_loss": 0.5607832670211792, |
|
"eval_runtime": 52.8599, |
|
"eval_samples_per_second": 10.254, |
|
"eval_steps_per_second": 1.286, |
|
"eval_wer": 0.34863876472978467, |
|
"step": 1596 |
|
}, |
|
{ |
|
"epoch": 114.29, |
|
"learning_rate": 7.2e-06, |
|
"loss": 0.2614, |
|
"step": 1600 |
|
}, |
|
{ |
|
"epoch": 115.0, |
|
"eval_cer": 0.18089171974522292, |
|
"eval_loss": 0.5612644553184509, |
|
"eval_runtime": 52.8176, |
|
"eval_samples_per_second": 10.262, |
|
"eval_steps_per_second": 1.287, |
|
"eval_wer": 0.35107679804957337, |
|
"step": 1610 |
|
}, |
|
{ |
|
"epoch": 116.0, |
|
"eval_cer": 0.18172884440400364, |
|
"eval_loss": 0.5742478370666504, |
|
"eval_runtime": 52.8139, |
|
"eval_samples_per_second": 10.262, |
|
"eval_steps_per_second": 1.288, |
|
"eval_wer": 0.35331166192604635, |
|
"step": 1624 |
|
}, |
|
{ |
|
"epoch": 117.0, |
|
"eval_cer": 0.18172884440400364, |
|
"eval_loss": 0.5715382695198059, |
|
"eval_runtime": 52.8096, |
|
"eval_samples_per_second": 10.263, |
|
"eval_steps_per_second": 1.288, |
|
"eval_wer": 0.3522958147094677, |
|
"step": 1638 |
|
}, |
|
{ |
|
"epoch": 118.0, |
|
"eval_cer": 0.18169244767970882, |
|
"eval_loss": 0.5695165395736694, |
|
"eval_runtime": 52.7498, |
|
"eval_samples_per_second": 10.275, |
|
"eval_steps_per_second": 1.289, |
|
"eval_wer": 0.35331166192604635, |
|
"step": 1652 |
|
}, |
|
{ |
|
"epoch": 119.0, |
|
"eval_cer": 0.18245677888989992, |
|
"eval_loss": 0.571264386177063, |
|
"eval_runtime": 52.7339, |
|
"eval_samples_per_second": 10.278, |
|
"eval_steps_per_second": 1.289, |
|
"eval_wer": 0.3531084924827306, |
|
"step": 1666 |
|
}, |
|
{ |
|
"epoch": 120.0, |
|
"eval_cer": 0.18205641492265695, |
|
"eval_loss": 0.5664474368095398, |
|
"eval_runtime": 52.8509, |
|
"eval_samples_per_second": 10.255, |
|
"eval_steps_per_second": 1.287, |
|
"eval_wer": 0.35331166192604635, |
|
"step": 1680 |
|
}, |
|
{ |
|
"epoch": 121.0, |
|
"eval_cer": 0.1821656050955414, |
|
"eval_loss": 0.5716355443000793, |
|
"eval_runtime": 52.7551, |
|
"eval_samples_per_second": 10.274, |
|
"eval_steps_per_second": 1.289, |
|
"eval_wer": 0.3531084924827306, |
|
"step": 1694 |
|
}, |
|
{ |
|
"epoch": 121.43, |
|
"learning_rate": 5.7714285714285715e-06, |
|
"loss": 0.2463, |
|
"step": 1700 |
|
}, |
|
{ |
|
"epoch": 122.0, |
|
"eval_cer": 0.18100090991810738, |
|
"eval_loss": 0.568006694316864, |
|
"eval_runtime": 52.7861, |
|
"eval_samples_per_second": 10.268, |
|
"eval_steps_per_second": 1.288, |
|
"eval_wer": 0.347622917513206, |
|
"step": 1708 |
|
}, |
|
{ |
|
"epoch": 123.0, |
|
"eval_cer": 0.18169244767970882, |
|
"eval_loss": 0.5760354399681091, |
|
"eval_runtime": 52.8132, |
|
"eval_samples_per_second": 10.263, |
|
"eval_steps_per_second": 1.288, |
|
"eval_wer": 0.35270215359609913, |
|
"step": 1722 |
|
}, |
|
{ |
|
"epoch": 124.0, |
|
"eval_cer": 0.1802729754322111, |
|
"eval_loss": 0.556138277053833, |
|
"eval_runtime": 52.7767, |
|
"eval_samples_per_second": 10.27, |
|
"eval_steps_per_second": 1.288, |
|
"eval_wer": 0.34559122308004875, |
|
"step": 1736 |
|
}, |
|
{ |
|
"epoch": 125.0, |
|
"eval_cer": 0.18118289353958145, |
|
"eval_loss": 0.5698420405387878, |
|
"eval_runtime": 52.7433, |
|
"eval_samples_per_second": 10.276, |
|
"eval_steps_per_second": 1.289, |
|
"eval_wer": 0.34782608695652173, |
|
"step": 1750 |
|
}, |
|
{ |
|
"epoch": 126.0, |
|
"eval_cer": 0.18111010009099182, |
|
"eval_loss": 0.5667452216148376, |
|
"eval_runtime": 52.7698, |
|
"eval_samples_per_second": 10.271, |
|
"eval_steps_per_second": 1.289, |
|
"eval_wer": 0.34823242584315317, |
|
"step": 1764 |
|
}, |
|
{ |
|
"epoch": 127.0, |
|
"eval_cer": 0.1813284804367607, |
|
"eval_loss": 0.5677050948143005, |
|
"eval_runtime": 52.7873, |
|
"eval_samples_per_second": 10.268, |
|
"eval_steps_per_second": 1.288, |
|
"eval_wer": 0.34782608695652173, |
|
"step": 1778 |
|
}, |
|
{ |
|
"epoch": 128.0, |
|
"eval_cer": 0.18045495905368517, |
|
"eval_loss": 0.5681147575378418, |
|
"eval_runtime": 53.1709, |
|
"eval_samples_per_second": 10.194, |
|
"eval_steps_per_second": 1.279, |
|
"eval_wer": 0.34457537586347015, |
|
"step": 1792 |
|
}, |
|
{ |
|
"epoch": 128.57, |
|
"learning_rate": 4.342857142857143e-06, |
|
"loss": 0.2477, |
|
"step": 1800 |
|
}, |
|
{ |
|
"epoch": 129.0, |
|
"eval_cer": 0.18089171974522292, |
|
"eval_loss": 0.5665947794914246, |
|
"eval_runtime": 52.9379, |
|
"eval_samples_per_second": 10.238, |
|
"eval_steps_per_second": 1.285, |
|
"eval_wer": 0.34701340918325885, |
|
"step": 1806 |
|
}, |
|
{ |
|
"epoch": 130.0, |
|
"eval_cer": 0.18041856232939035, |
|
"eval_loss": 0.5696049928665161, |
|
"eval_runtime": 52.7984, |
|
"eval_samples_per_second": 10.265, |
|
"eval_steps_per_second": 1.288, |
|
"eval_wer": 0.34579439252336447, |
|
"step": 1820 |
|
}, |
|
{ |
|
"epoch": 131.0, |
|
"eval_cer": 0.1810373066424022, |
|
"eval_loss": 0.5704218149185181, |
|
"eval_runtime": 52.8548, |
|
"eval_samples_per_second": 10.255, |
|
"eval_steps_per_second": 1.287, |
|
"eval_wer": 0.34782608695652173, |
|
"step": 1834 |
|
}, |
|
{ |
|
"epoch": 132.0, |
|
"eval_cer": 0.18078252957233848, |
|
"eval_loss": 0.5655524134635925, |
|
"eval_runtime": 52.9545, |
|
"eval_samples_per_second": 10.235, |
|
"eval_steps_per_second": 1.284, |
|
"eval_wer": 0.34701340918325885, |
|
"step": 1848 |
|
}, |
|
{ |
|
"epoch": 133.0, |
|
"eval_cer": 0.18070973612374885, |
|
"eval_loss": 0.5696657299995422, |
|
"eval_runtime": 52.865, |
|
"eval_samples_per_second": 10.253, |
|
"eval_steps_per_second": 1.286, |
|
"eval_wer": 0.34721657862657457, |
|
"step": 1862 |
|
}, |
|
{ |
|
"epoch": 134.0, |
|
"eval_cer": 0.18096451319381257, |
|
"eval_loss": 0.5716409683227539, |
|
"eval_runtime": 52.8035, |
|
"eval_samples_per_second": 10.264, |
|
"eval_steps_per_second": 1.288, |
|
"eval_wer": 0.34721657862657457, |
|
"step": 1876 |
|
}, |
|
{ |
|
"epoch": 135.0, |
|
"eval_cer": 0.18096451319381257, |
|
"eval_loss": 0.5742436647415161, |
|
"eval_runtime": 52.961, |
|
"eval_samples_per_second": 10.234, |
|
"eval_steps_per_second": 1.284, |
|
"eval_wer": 0.3484355952864689, |
|
"step": 1890 |
|
}, |
|
{ |
|
"epoch": 135.71, |
|
"learning_rate": 2.9142857142857142e-06, |
|
"loss": 0.221, |
|
"step": 1900 |
|
}, |
|
{ |
|
"epoch": 136.0, |
|
"eval_cer": 0.18074613284804367, |
|
"eval_loss": 0.567115306854248, |
|
"eval_runtime": 52.8477, |
|
"eval_samples_per_second": 10.256, |
|
"eval_steps_per_second": 1.287, |
|
"eval_wer": 0.34721657862657457, |
|
"step": 1904 |
|
}, |
|
{ |
|
"epoch": 137.0, |
|
"eval_cer": 0.18096451319381257, |
|
"eval_loss": 0.5669675469398499, |
|
"eval_runtime": 52.9196, |
|
"eval_samples_per_second": 10.242, |
|
"eval_steps_per_second": 1.285, |
|
"eval_wer": 0.3462007314099959, |
|
"step": 1918 |
|
}, |
|
{ |
|
"epoch": 138.0, |
|
"eval_cer": 0.18100090991810738, |
|
"eval_loss": 0.5674601793289185, |
|
"eval_runtime": 53.2148, |
|
"eval_samples_per_second": 10.185, |
|
"eval_steps_per_second": 1.278, |
|
"eval_wer": 0.3459975619666802, |
|
"step": 1932 |
|
}, |
|
{ |
|
"epoch": 139.0, |
|
"eval_cer": 0.18100090991810738, |
|
"eval_loss": 0.5703522562980652, |
|
"eval_runtime": 53.4902, |
|
"eval_samples_per_second": 10.133, |
|
"eval_steps_per_second": 1.271, |
|
"eval_wer": 0.3462007314099959, |
|
"step": 1946 |
|
}, |
|
{ |
|
"epoch": 140.0, |
|
"eval_cer": 0.1808189262966333, |
|
"eval_loss": 0.5675067901611328, |
|
"eval_runtime": 53.2601, |
|
"eval_samples_per_second": 10.176, |
|
"eval_steps_per_second": 1.277, |
|
"eval_wer": 0.34579439252336447, |
|
"step": 1960 |
|
}, |
|
{ |
|
"epoch": 141.0, |
|
"eval_cer": 0.1800181983621474, |
|
"eval_loss": 0.5617998838424683, |
|
"eval_runtime": 53.8381, |
|
"eval_samples_per_second": 10.067, |
|
"eval_steps_per_second": 1.263, |
|
"eval_wer": 0.3443722064201544, |
|
"step": 1974 |
|
}, |
|
{ |
|
"epoch": 142.0, |
|
"eval_cer": 0.1799818016378526, |
|
"eval_loss": 0.563258171081543, |
|
"eval_runtime": 53.4467, |
|
"eval_samples_per_second": 10.141, |
|
"eval_steps_per_second": 1.272, |
|
"eval_wer": 0.34538805363673303, |
|
"step": 1988 |
|
}, |
|
{ |
|
"epoch": 142.86, |
|
"learning_rate": 1.4857142857142858e-06, |
|
"loss": 0.2217, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 143.0, |
|
"eval_cer": 0.18067333939945404, |
|
"eval_loss": 0.5663711428642273, |
|
"eval_runtime": 53.0769, |
|
"eval_samples_per_second": 10.212, |
|
"eval_steps_per_second": 1.281, |
|
"eval_wer": 0.34559122308004875, |
|
"step": 2002 |
|
}, |
|
{ |
|
"epoch": 144.0, |
|
"eval_cer": 0.18100090991810738, |
|
"eval_loss": 0.5682144165039062, |
|
"eval_runtime": 53.3453, |
|
"eval_samples_per_second": 10.16, |
|
"eval_steps_per_second": 1.275, |
|
"eval_wer": 0.3462007314099959, |
|
"step": 2016 |
|
}, |
|
{ |
|
"epoch": 144.0, |
|
"step": 2016, |
|
"total_flos": 1.799432351021922e+19, |
|
"train_loss": 1.5532687327691488, |
|
"train_runtime": 29581.7912, |
|
"train_samples_per_second": 2.272, |
|
"train_steps_per_second": 0.071 |
|
} |
|
], |
|
"max_steps": 2100, |
|
"num_train_epochs": 150, |
|
"total_flos": 1.799432351021922e+19, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|