|
{ |
|
"best_metric": 0.5552828907966614, |
|
"best_model_checkpoint": "wav2vec2-large-xlsr-coraa-exp-9/checkpoint-1512", |
|
"epoch": 128.0, |
|
"global_step": 1792, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.07, |
|
"learning_rate": 3e-05, |
|
"loss": 37.5508, |
|
"step": 1 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 23.137550354003906, |
|
"eval_runtime": 52.9452, |
|
"eval_samples_per_second": 10.237, |
|
"eval_steps_per_second": 1.284, |
|
"eval_wer": 1.0, |
|
"step": 14 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 6.50360107421875, |
|
"eval_runtime": 52.53, |
|
"eval_samples_per_second": 10.318, |
|
"eval_steps_per_second": 1.294, |
|
"eval_wer": 1.0, |
|
"step": 28 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 4.391931056976318, |
|
"eval_runtime": 52.983, |
|
"eval_samples_per_second": 10.23, |
|
"eval_steps_per_second": 1.283, |
|
"eval_wer": 1.0, |
|
"step": 42 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.944124221801758, |
|
"eval_runtime": 52.4812, |
|
"eval_samples_per_second": 10.328, |
|
"eval_steps_per_second": 1.296, |
|
"eval_wer": 1.0, |
|
"step": 56 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.730649709701538, |
|
"eval_runtime": 52.6687, |
|
"eval_samples_per_second": 10.291, |
|
"eval_steps_per_second": 1.291, |
|
"eval_wer": 1.0, |
|
"step": 70 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.5761733055114746, |
|
"eval_runtime": 52.4991, |
|
"eval_samples_per_second": 10.324, |
|
"eval_steps_per_second": 1.295, |
|
"eval_wer": 1.0, |
|
"step": 84 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.4128713607788086, |
|
"eval_runtime": 52.9491, |
|
"eval_samples_per_second": 10.236, |
|
"eval_steps_per_second": 1.284, |
|
"eval_wer": 1.0, |
|
"step": 98 |
|
}, |
|
{ |
|
"epoch": 7.14, |
|
"learning_rate": 2.8614285714285714e-05, |
|
"loss": 8.6902, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.285918951034546, |
|
"eval_runtime": 52.5221, |
|
"eval_samples_per_second": 10.319, |
|
"eval_steps_per_second": 1.295, |
|
"eval_wer": 1.0, |
|
"step": 112 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.219179391860962, |
|
"eval_runtime": 53.0718, |
|
"eval_samples_per_second": 10.213, |
|
"eval_steps_per_second": 1.281, |
|
"eval_wer": 1.0, |
|
"step": 126 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.1479437351226807, |
|
"eval_runtime": 52.485, |
|
"eval_samples_per_second": 10.327, |
|
"eval_steps_per_second": 1.296, |
|
"eval_wer": 1.0, |
|
"step": 140 |
|
}, |
|
{ |
|
"epoch": 11.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.106292963027954, |
|
"eval_runtime": 52.586, |
|
"eval_samples_per_second": 10.307, |
|
"eval_steps_per_second": 1.293, |
|
"eval_wer": 1.0, |
|
"step": 154 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.0896878242492676, |
|
"eval_runtime": 52.4874, |
|
"eval_samples_per_second": 10.326, |
|
"eval_steps_per_second": 1.296, |
|
"eval_wer": 1.0, |
|
"step": 168 |
|
}, |
|
{ |
|
"epoch": 13.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.084855794906616, |
|
"eval_runtime": 52.6206, |
|
"eval_samples_per_second": 10.3, |
|
"eval_steps_per_second": 1.292, |
|
"eval_wer": 1.0, |
|
"step": 182 |
|
}, |
|
{ |
|
"epoch": 14.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.048473596572876, |
|
"eval_runtime": 52.5487, |
|
"eval_samples_per_second": 10.314, |
|
"eval_steps_per_second": 1.294, |
|
"eval_wer": 1.0, |
|
"step": 196 |
|
}, |
|
{ |
|
"epoch": 14.29, |
|
"learning_rate": 2.7185714285714287e-05, |
|
"loss": 3.059, |
|
"step": 200 |
|
}, |
|
{ |
|
"epoch": 15.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.0495524406433105, |
|
"eval_runtime": 52.5935, |
|
"eval_samples_per_second": 10.305, |
|
"eval_steps_per_second": 1.293, |
|
"eval_wer": 1.0, |
|
"step": 210 |
|
}, |
|
{ |
|
"epoch": 16.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.0509705543518066, |
|
"eval_runtime": 52.5135, |
|
"eval_samples_per_second": 10.321, |
|
"eval_steps_per_second": 1.295, |
|
"eval_wer": 1.0, |
|
"step": 224 |
|
}, |
|
{ |
|
"epoch": 17.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.042844533920288, |
|
"eval_runtime": 52.5458, |
|
"eval_samples_per_second": 10.315, |
|
"eval_steps_per_second": 1.294, |
|
"eval_wer": 1.0, |
|
"step": 238 |
|
}, |
|
{ |
|
"epoch": 18.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.033111572265625, |
|
"eval_runtime": 52.5883, |
|
"eval_samples_per_second": 10.306, |
|
"eval_steps_per_second": 1.293, |
|
"eval_wer": 1.0, |
|
"step": 252 |
|
}, |
|
{ |
|
"epoch": 19.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.035349130630493, |
|
"eval_runtime": 52.5405, |
|
"eval_samples_per_second": 10.316, |
|
"eval_steps_per_second": 1.294, |
|
"eval_wer": 1.0, |
|
"step": 266 |
|
}, |
|
{ |
|
"epoch": 20.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.0217459201812744, |
|
"eval_runtime": 52.6413, |
|
"eval_samples_per_second": 10.296, |
|
"eval_steps_per_second": 1.292, |
|
"eval_wer": 1.0, |
|
"step": 280 |
|
}, |
|
{ |
|
"epoch": 21.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.0107431411743164, |
|
"eval_runtime": 52.5958, |
|
"eval_samples_per_second": 10.305, |
|
"eval_steps_per_second": 1.293, |
|
"eval_wer": 1.0, |
|
"step": 294 |
|
}, |
|
{ |
|
"epoch": 21.43, |
|
"learning_rate": 2.5757142857142857e-05, |
|
"loss": 2.9492, |
|
"step": 300 |
|
}, |
|
{ |
|
"epoch": 22.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 3.0068299770355225, |
|
"eval_runtime": 52.8053, |
|
"eval_samples_per_second": 10.264, |
|
"eval_steps_per_second": 1.288, |
|
"eval_wer": 1.0, |
|
"step": 308 |
|
}, |
|
{ |
|
"epoch": 23.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 2.9949989318847656, |
|
"eval_runtime": 52.5717, |
|
"eval_samples_per_second": 10.31, |
|
"eval_steps_per_second": 1.293, |
|
"eval_wer": 1.0, |
|
"step": 322 |
|
}, |
|
{ |
|
"epoch": 24.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 2.989611864089966, |
|
"eval_runtime": 53.0076, |
|
"eval_samples_per_second": 10.225, |
|
"eval_steps_per_second": 1.283, |
|
"eval_wer": 1.0, |
|
"step": 336 |
|
}, |
|
{ |
|
"epoch": 25.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 2.9687271118164062, |
|
"eval_runtime": 52.6125, |
|
"eval_samples_per_second": 10.302, |
|
"eval_steps_per_second": 1.292, |
|
"eval_wer": 1.0, |
|
"step": 350 |
|
}, |
|
{ |
|
"epoch": 26.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 2.947374105453491, |
|
"eval_runtime": 52.5637, |
|
"eval_samples_per_second": 10.311, |
|
"eval_steps_per_second": 1.294, |
|
"eval_wer": 1.0, |
|
"step": 364 |
|
}, |
|
{ |
|
"epoch": 27.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 2.9414024353027344, |
|
"eval_runtime": 52.648, |
|
"eval_samples_per_second": 10.295, |
|
"eval_steps_per_second": 1.292, |
|
"eval_wer": 1.0, |
|
"step": 378 |
|
}, |
|
{ |
|
"epoch": 28.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 2.84250807762146, |
|
"eval_runtime": 52.5712, |
|
"eval_samples_per_second": 10.31, |
|
"eval_steps_per_second": 1.293, |
|
"eval_wer": 1.0, |
|
"step": 392 |
|
}, |
|
{ |
|
"epoch": 28.57, |
|
"learning_rate": 2.432857142857143e-05, |
|
"loss": 2.8892, |
|
"step": 400 |
|
}, |
|
{ |
|
"epoch": 29.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 2.7813332080841064, |
|
"eval_runtime": 52.64, |
|
"eval_samples_per_second": 10.296, |
|
"eval_steps_per_second": 1.292, |
|
"eval_wer": 1.0, |
|
"step": 406 |
|
}, |
|
{ |
|
"epoch": 30.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 2.7269773483276367, |
|
"eval_runtime": 52.5989, |
|
"eval_samples_per_second": 10.304, |
|
"eval_steps_per_second": 1.293, |
|
"eval_wer": 1.0, |
|
"step": 420 |
|
}, |
|
{ |
|
"epoch": 31.0, |
|
"eval_cer": 0.9606187443130119, |
|
"eval_loss": 2.6644980907440186, |
|
"eval_runtime": 52.6591, |
|
"eval_samples_per_second": 10.293, |
|
"eval_steps_per_second": 1.291, |
|
"eval_wer": 1.0, |
|
"step": 434 |
|
}, |
|
{ |
|
"epoch": 32.0, |
|
"eval_cer": 0.9138853503184713, |
|
"eval_loss": 2.5593061447143555, |
|
"eval_runtime": 52.5942, |
|
"eval_samples_per_second": 10.305, |
|
"eval_steps_per_second": 1.293, |
|
"eval_wer": 1.0, |
|
"step": 448 |
|
}, |
|
{ |
|
"epoch": 33.0, |
|
"eval_cer": 0.7002729754322111, |
|
"eval_loss": 2.3229565620422363, |
|
"eval_runtime": 53.1245, |
|
"eval_samples_per_second": 10.202, |
|
"eval_steps_per_second": 1.28, |
|
"eval_wer": 1.0, |
|
"step": 462 |
|
}, |
|
{ |
|
"epoch": 34.0, |
|
"eval_cer": 0.535796178343949, |
|
"eval_loss": 1.9706292152404785, |
|
"eval_runtime": 52.7199, |
|
"eval_samples_per_second": 10.281, |
|
"eval_steps_per_second": 1.29, |
|
"eval_wer": 1.0, |
|
"step": 476 |
|
}, |
|
{ |
|
"epoch": 35.0, |
|
"eval_cer": 0.45481346678798906, |
|
"eval_loss": 1.7085232734680176, |
|
"eval_runtime": 52.7281, |
|
"eval_samples_per_second": 10.279, |
|
"eval_steps_per_second": 1.29, |
|
"eval_wer": 0.9997968305566842, |
|
"step": 490 |
|
}, |
|
{ |
|
"epoch": 35.71, |
|
"learning_rate": 2.29e-05, |
|
"loss": 2.3937, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 36.0, |
|
"eval_cer": 0.4063694267515924, |
|
"eval_loss": 1.449361801147461, |
|
"eval_runtime": 52.6273, |
|
"eval_samples_per_second": 10.299, |
|
"eval_steps_per_second": 1.292, |
|
"eval_wer": 1.0, |
|
"step": 504 |
|
}, |
|
{ |
|
"epoch": 37.0, |
|
"eval_cer": 0.38471337579617837, |
|
"eval_loss": 1.286526083946228, |
|
"eval_runtime": 52.7236, |
|
"eval_samples_per_second": 10.28, |
|
"eval_steps_per_second": 1.29, |
|
"eval_wer": 1.0, |
|
"step": 518 |
|
}, |
|
{ |
|
"epoch": 38.0, |
|
"eval_cer": 0.3659326660600546, |
|
"eval_loss": 1.1509252786636353, |
|
"eval_runtime": 52.6429, |
|
"eval_samples_per_second": 10.296, |
|
"eval_steps_per_second": 1.292, |
|
"eval_wer": 0.9947175944737912, |
|
"step": 532 |
|
}, |
|
{ |
|
"epoch": 39.0, |
|
"eval_cer": 0.3182893539581438, |
|
"eval_loss": 1.0466662645339966, |
|
"eval_runtime": 52.7531, |
|
"eval_samples_per_second": 10.274, |
|
"eval_steps_per_second": 1.289, |
|
"eval_wer": 0.903088175538399, |
|
"step": 546 |
|
}, |
|
{ |
|
"epoch": 40.0, |
|
"eval_cer": 0.24043676069153777, |
|
"eval_loss": 0.9831815361976624, |
|
"eval_runtime": 52.6494, |
|
"eval_samples_per_second": 10.295, |
|
"eval_steps_per_second": 1.292, |
|
"eval_wer": 0.5960991466883381, |
|
"step": 560 |
|
}, |
|
{ |
|
"epoch": 41.0, |
|
"eval_cer": 0.22227479526842583, |
|
"eval_loss": 0.892058789730072, |
|
"eval_runtime": 53.2461, |
|
"eval_samples_per_second": 10.179, |
|
"eval_steps_per_second": 1.277, |
|
"eval_wer": 0.5048760666395774, |
|
"step": 574 |
|
}, |
|
{ |
|
"epoch": 42.0, |
|
"eval_cer": 0.21233848953594175, |
|
"eval_loss": 0.8306074738502502, |
|
"eval_runtime": 52.8348, |
|
"eval_samples_per_second": 10.258, |
|
"eval_steps_per_second": 1.287, |
|
"eval_wer": 0.4687119057293783, |
|
"step": 588 |
|
}, |
|
{ |
|
"epoch": 42.86, |
|
"learning_rate": 2.1471428571428574e-05, |
|
"loss": 1.0877, |
|
"step": 600 |
|
}, |
|
{ |
|
"epoch": 43.0, |
|
"eval_cer": 0.20880800727934487, |
|
"eval_loss": 0.8016981482505798, |
|
"eval_runtime": 52.6157, |
|
"eval_samples_per_second": 10.301, |
|
"eval_steps_per_second": 1.292, |
|
"eval_wer": 0.45631856968711904, |
|
"step": 602 |
|
}, |
|
{ |
|
"epoch": 44.0, |
|
"eval_cer": 0.2045859872611465, |
|
"eval_loss": 0.7715625166893005, |
|
"eval_runtime": 52.6399, |
|
"eval_samples_per_second": 10.296, |
|
"eval_steps_per_second": 1.292, |
|
"eval_wer": 0.4404713531084925, |
|
"step": 616 |
|
}, |
|
{ |
|
"epoch": 45.0, |
|
"eval_cer": 0.2053867151956324, |
|
"eval_loss": 0.7693753838539124, |
|
"eval_runtime": 52.708, |
|
"eval_samples_per_second": 10.283, |
|
"eval_steps_per_second": 1.29, |
|
"eval_wer": 0.4406745225518082, |
|
"step": 630 |
|
}, |
|
{ |
|
"epoch": 46.0, |
|
"eval_cer": 0.20367606915377617, |
|
"eval_loss": 0.7451383471488953, |
|
"eval_runtime": 52.7002, |
|
"eval_samples_per_second": 10.285, |
|
"eval_steps_per_second": 1.29, |
|
"eval_wer": 0.4315318976026006, |
|
"step": 644 |
|
}, |
|
{ |
|
"epoch": 47.0, |
|
"eval_cer": 0.19956323930846223, |
|
"eval_loss": 0.7111817598342896, |
|
"eval_runtime": 53.2448, |
|
"eval_samples_per_second": 10.179, |
|
"eval_steps_per_second": 1.277, |
|
"eval_wer": 0.42503047541649736, |
|
"step": 658 |
|
}, |
|
{ |
|
"epoch": 48.0, |
|
"eval_cer": 0.19581437670609644, |
|
"eval_loss": 0.7007989883422852, |
|
"eval_runtime": 52.7775, |
|
"eval_samples_per_second": 10.27, |
|
"eval_steps_per_second": 1.288, |
|
"eval_wer": 0.41162129215765947, |
|
"step": 672 |
|
}, |
|
{ |
|
"epoch": 49.0, |
|
"eval_cer": 0.19799818016378526, |
|
"eval_loss": 0.7140166163444519, |
|
"eval_runtime": 52.6495, |
|
"eval_samples_per_second": 10.294, |
|
"eval_steps_per_second": 1.292, |
|
"eval_wer": 0.40572937830150346, |
|
"step": 686 |
|
}, |
|
{ |
|
"epoch": 50.0, |
|
"learning_rate": 2.004285714285714e-05, |
|
"loss": 0.6292, |
|
"step": 700 |
|
}, |
|
{ |
|
"epoch": 50.0, |
|
"eval_cer": 0.19883530482256598, |
|
"eval_loss": 0.7207656502723694, |
|
"eval_runtime": 52.6919, |
|
"eval_samples_per_second": 10.286, |
|
"eval_steps_per_second": 1.291, |
|
"eval_wer": 0.41141812271434375, |
|
"step": 700 |
|
}, |
|
{ |
|
"epoch": 51.0, |
|
"eval_cer": 0.19366696997270247, |
|
"eval_loss": 0.6675068140029907, |
|
"eval_runtime": 52.8778, |
|
"eval_samples_per_second": 10.25, |
|
"eval_steps_per_second": 1.286, |
|
"eval_wer": 0.40329134498171476, |
|
"step": 714 |
|
}, |
|
{ |
|
"epoch": 52.0, |
|
"eval_cer": 0.19384895359417653, |
|
"eval_loss": 0.6650232672691345, |
|
"eval_runtime": 52.6583, |
|
"eval_samples_per_second": 10.293, |
|
"eval_steps_per_second": 1.291, |
|
"eval_wer": 0.4014628199918732, |
|
"step": 728 |
|
}, |
|
{ |
|
"epoch": 53.0, |
|
"eval_cer": 0.1937761601455869, |
|
"eval_loss": 0.6550155878067017, |
|
"eval_runtime": 52.7667, |
|
"eval_samples_per_second": 10.272, |
|
"eval_steps_per_second": 1.289, |
|
"eval_wer": 0.4012596505485575, |
|
"step": 742 |
|
}, |
|
{ |
|
"epoch": 54.0, |
|
"eval_cer": 0.19315741583257506, |
|
"eval_loss": 0.6477207541465759, |
|
"eval_runtime": 52.6665, |
|
"eval_samples_per_second": 10.291, |
|
"eval_steps_per_second": 1.291, |
|
"eval_wer": 0.3990247866720845, |
|
"step": 756 |
|
}, |
|
{ |
|
"epoch": 55.0, |
|
"eval_cer": 0.19319381255686988, |
|
"eval_loss": 0.6361698508262634, |
|
"eval_runtime": 52.6325, |
|
"eval_samples_per_second": 10.298, |
|
"eval_steps_per_second": 1.292, |
|
"eval_wer": 0.39597724502234866, |
|
"step": 770 |
|
}, |
|
{ |
|
"epoch": 56.0, |
|
"eval_cer": 0.192975432211101, |
|
"eval_loss": 0.632267951965332, |
|
"eval_runtime": 52.7108, |
|
"eval_samples_per_second": 10.283, |
|
"eval_steps_per_second": 1.29, |
|
"eval_wer": 0.39191385615603413, |
|
"step": 784 |
|
}, |
|
{ |
|
"epoch": 57.0, |
|
"eval_cer": 0.19206551410373066, |
|
"eval_loss": 0.626406192779541, |
|
"eval_runtime": 52.675, |
|
"eval_samples_per_second": 10.29, |
|
"eval_steps_per_second": 1.291, |
|
"eval_wer": 0.38703778951645673, |
|
"step": 798 |
|
}, |
|
{ |
|
"epoch": 57.14, |
|
"learning_rate": 1.8614285714285715e-05, |
|
"loss": 0.4739, |
|
"step": 800 |
|
}, |
|
{ |
|
"epoch": 58.0, |
|
"eval_cer": 0.19210191082802547, |
|
"eval_loss": 0.6290065050125122, |
|
"eval_runtime": 52.661, |
|
"eval_samples_per_second": 10.292, |
|
"eval_steps_per_second": 1.291, |
|
"eval_wer": 0.38724095895977245, |
|
"step": 812 |
|
}, |
|
{ |
|
"epoch": 59.0, |
|
"eval_cer": 0.19253867151956325, |
|
"eval_loss": 0.6206580400466919, |
|
"eval_runtime": 52.6443, |
|
"eval_samples_per_second": 10.296, |
|
"eval_steps_per_second": 1.292, |
|
"eval_wer": 0.38642828118650957, |
|
"step": 826 |
|
}, |
|
{ |
|
"epoch": 60.0, |
|
"eval_cer": 0.19184713375796178, |
|
"eval_loss": 0.6177613735198975, |
|
"eval_runtime": 52.6855, |
|
"eval_samples_per_second": 10.287, |
|
"eval_steps_per_second": 1.291, |
|
"eval_wer": 0.38581877285656235, |
|
"step": 840 |
|
}, |
|
{ |
|
"epoch": 61.0, |
|
"eval_cer": 0.19177434030937215, |
|
"eval_loss": 0.6217214465141296, |
|
"eval_runtime": 53.1515, |
|
"eval_samples_per_second": 10.197, |
|
"eval_steps_per_second": 1.279, |
|
"eval_wer": 0.3860219422998781, |
|
"step": 854 |
|
}, |
|
{ |
|
"epoch": 62.0, |
|
"eval_cer": 0.1899545040946315, |
|
"eval_loss": 0.6078172922134399, |
|
"eval_runtime": 52.6994, |
|
"eval_samples_per_second": 10.285, |
|
"eval_steps_per_second": 1.29, |
|
"eval_wer": 0.37992685900040635, |
|
"step": 868 |
|
}, |
|
{ |
|
"epoch": 63.0, |
|
"eval_cer": 0.1889353958143767, |
|
"eval_loss": 0.6072229146957397, |
|
"eval_runtime": 52.8038, |
|
"eval_samples_per_second": 10.264, |
|
"eval_steps_per_second": 1.288, |
|
"eval_wer": 0.3780983340105648, |
|
"step": 882 |
|
}, |
|
{ |
|
"epoch": 64.0, |
|
"eval_cer": 0.18831665150136487, |
|
"eval_loss": 0.6067555546760559, |
|
"eval_runtime": 52.6766, |
|
"eval_samples_per_second": 10.289, |
|
"eval_steps_per_second": 1.291, |
|
"eval_wer": 0.37606663957740755, |
|
"step": 896 |
|
}, |
|
{ |
|
"epoch": 64.29, |
|
"learning_rate": 1.7185714285714285e-05, |
|
"loss": 0.3855, |
|
"step": 900 |
|
}, |
|
{ |
|
"epoch": 65.0, |
|
"eval_cer": 0.1870427661510464, |
|
"eval_loss": 0.5944907665252686, |
|
"eval_runtime": 52.7345, |
|
"eval_samples_per_second": 10.278, |
|
"eval_steps_per_second": 1.289, |
|
"eval_wer": 0.3748476229175132, |
|
"step": 910 |
|
}, |
|
{ |
|
"epoch": 66.0, |
|
"eval_cer": 0.1899545040946315, |
|
"eval_loss": 0.6194169521331787, |
|
"eval_runtime": 52.7092, |
|
"eval_samples_per_second": 10.283, |
|
"eval_steps_per_second": 1.29, |
|
"eval_wer": 0.37992685900040635, |
|
"step": 924 |
|
}, |
|
{ |
|
"epoch": 67.0, |
|
"eval_cer": 0.18846223839854412, |
|
"eval_loss": 0.6044437289237976, |
|
"eval_runtime": 52.6167, |
|
"eval_samples_per_second": 10.301, |
|
"eval_steps_per_second": 1.292, |
|
"eval_wer": 0.3793173506704592, |
|
"step": 938 |
|
}, |
|
{ |
|
"epoch": 68.0, |
|
"eval_cer": 0.18798908098271155, |
|
"eval_loss": 0.5945860147476196, |
|
"eval_runtime": 52.6643, |
|
"eval_samples_per_second": 10.292, |
|
"eval_steps_per_second": 1.291, |
|
"eval_wer": 0.37505079236082894, |
|
"step": 952 |
|
}, |
|
{ |
|
"epoch": 69.0, |
|
"eval_cer": 0.18798908098271155, |
|
"eval_loss": 0.6115556955337524, |
|
"eval_runtime": 52.6187, |
|
"eval_samples_per_second": 10.301, |
|
"eval_steps_per_second": 1.292, |
|
"eval_wer": 0.37139374238114586, |
|
"step": 966 |
|
}, |
|
{ |
|
"epoch": 70.0, |
|
"eval_cer": 0.18609645131938127, |
|
"eval_loss": 0.5876884460449219, |
|
"eval_runtime": 52.6386, |
|
"eval_samples_per_second": 10.297, |
|
"eval_steps_per_second": 1.292, |
|
"eval_wer": 0.36793986184477856, |
|
"step": 980 |
|
}, |
|
{ |
|
"epoch": 71.0, |
|
"eval_cer": 0.18627843494085533, |
|
"eval_loss": 0.5861026048660278, |
|
"eval_runtime": 52.6444, |
|
"eval_samples_per_second": 10.296, |
|
"eval_steps_per_second": 1.292, |
|
"eval_wer": 0.36793986184477856, |
|
"step": 994 |
|
}, |
|
{ |
|
"epoch": 71.43, |
|
"learning_rate": 1.5757142857142858e-05, |
|
"loss": 0.3302, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 72.0, |
|
"eval_cer": 0.18562329390354868, |
|
"eval_loss": 0.580510139465332, |
|
"eval_runtime": 52.6419, |
|
"eval_samples_per_second": 10.296, |
|
"eval_steps_per_second": 1.292, |
|
"eval_wer": 0.3685493701747257, |
|
"step": 1008 |
|
}, |
|
{ |
|
"epoch": 73.0, |
|
"eval_cer": 0.1862056414922657, |
|
"eval_loss": 0.586155354976654, |
|
"eval_runtime": 52.6421, |
|
"eval_samples_per_second": 10.296, |
|
"eval_steps_per_second": 1.292, |
|
"eval_wer": 0.37139374238114586, |
|
"step": 1022 |
|
}, |
|
{ |
|
"epoch": 74.0, |
|
"eval_cer": 0.18656960873521383, |
|
"eval_loss": 0.5920763611793518, |
|
"eval_runtime": 52.6765, |
|
"eval_samples_per_second": 10.289, |
|
"eval_steps_per_second": 1.291, |
|
"eval_wer": 0.372003250711093, |
|
"step": 1036 |
|
}, |
|
{ |
|
"epoch": 75.0, |
|
"eval_cer": 0.185368516833485, |
|
"eval_loss": 0.5692393779754639, |
|
"eval_runtime": 52.7333, |
|
"eval_samples_per_second": 10.278, |
|
"eval_steps_per_second": 1.29, |
|
"eval_wer": 0.36834620073141, |
|
"step": 1050 |
|
}, |
|
{ |
|
"epoch": 76.0, |
|
"eval_cer": 0.18777070063694268, |
|
"eval_loss": 0.5922245979309082, |
|
"eval_runtime": 52.7512, |
|
"eval_samples_per_second": 10.275, |
|
"eval_steps_per_second": 1.289, |
|
"eval_wer": 0.37017472572125154, |
|
"step": 1064 |
|
}, |
|
{ |
|
"epoch": 77.0, |
|
"eval_cer": 0.18828025477707006, |
|
"eval_loss": 0.6105178594589233, |
|
"eval_runtime": 52.65, |
|
"eval_samples_per_second": 10.294, |
|
"eval_steps_per_second": 1.292, |
|
"eval_wer": 0.3709874034945144, |
|
"step": 1078 |
|
}, |
|
{ |
|
"epoch": 78.0, |
|
"eval_cer": 0.18558689717925386, |
|
"eval_loss": 0.5873062014579773, |
|
"eval_runtime": 53.0336, |
|
"eval_samples_per_second": 10.22, |
|
"eval_steps_per_second": 1.282, |
|
"eval_wer": 0.36834620073141, |
|
"step": 1092 |
|
}, |
|
{ |
|
"epoch": 78.57, |
|
"learning_rate": 1.4328571428571428e-05, |
|
"loss": 0.3046, |
|
"step": 1100 |
|
}, |
|
{ |
|
"epoch": 79.0, |
|
"eval_cer": 0.18587807097361236, |
|
"eval_loss": 0.5825892090797424, |
|
"eval_runtime": 52.7458, |
|
"eval_samples_per_second": 10.276, |
|
"eval_steps_per_second": 1.289, |
|
"eval_wer": 0.3681430312880943, |
|
"step": 1106 |
|
}, |
|
{ |
|
"epoch": 80.0, |
|
"eval_cer": 0.18445859872611464, |
|
"eval_loss": 0.5792315006256104, |
|
"eval_runtime": 53.1292, |
|
"eval_samples_per_second": 10.202, |
|
"eval_steps_per_second": 1.28, |
|
"eval_wer": 0.3632669646485169, |
|
"step": 1120 |
|
}, |
|
{ |
|
"epoch": 81.0, |
|
"eval_cer": 0.18347588717015467, |
|
"eval_loss": 0.5737511515617371, |
|
"eval_runtime": 52.6677, |
|
"eval_samples_per_second": 10.291, |
|
"eval_steps_per_second": 1.291, |
|
"eval_wer": 0.3610321007720439, |
|
"step": 1134 |
|
}, |
|
{ |
|
"epoch": 82.0, |
|
"eval_cer": 0.1843130118289354, |
|
"eval_loss": 0.579399585723877, |
|
"eval_runtime": 53.0003, |
|
"eval_samples_per_second": 10.226, |
|
"eval_steps_per_second": 1.283, |
|
"eval_wer": 0.36245428687525394, |
|
"step": 1148 |
|
}, |
|
{ |
|
"epoch": 83.0, |
|
"eval_cer": 0.18289353958143767, |
|
"eval_loss": 0.5766276121139526, |
|
"eval_runtime": 52.6724, |
|
"eval_samples_per_second": 10.29, |
|
"eval_steps_per_second": 1.291, |
|
"eval_wer": 0.3563592035757822, |
|
"step": 1162 |
|
}, |
|
{ |
|
"epoch": 84.0, |
|
"eval_cer": 0.1830027297543221, |
|
"eval_loss": 0.5745117664337158, |
|
"eval_runtime": 52.7431, |
|
"eval_samples_per_second": 10.276, |
|
"eval_steps_per_second": 1.289, |
|
"eval_wer": 0.35778138967899226, |
|
"step": 1176 |
|
}, |
|
{ |
|
"epoch": 85.0, |
|
"eval_cer": 0.18140127388535032, |
|
"eval_loss": 0.561495840549469, |
|
"eval_runtime": 52.6016, |
|
"eval_samples_per_second": 10.304, |
|
"eval_steps_per_second": 1.293, |
|
"eval_wer": 0.3555465258025193, |
|
"step": 1190 |
|
}, |
|
{ |
|
"epoch": 85.71, |
|
"learning_rate": 1.29e-05, |
|
"loss": 0.2927, |
|
"step": 1200 |
|
}, |
|
{ |
|
"epoch": 86.0, |
|
"eval_cer": 0.18282074613284804, |
|
"eval_loss": 0.5853651762008667, |
|
"eval_runtime": 52.6345, |
|
"eval_samples_per_second": 10.297, |
|
"eval_steps_per_second": 1.292, |
|
"eval_wer": 0.36143843965867534, |
|
"step": 1204 |
|
}, |
|
{ |
|
"epoch": 87.0, |
|
"eval_cer": 0.1835122838944495, |
|
"eval_loss": 0.5817971229553223, |
|
"eval_runtime": 52.7194, |
|
"eval_samples_per_second": 10.281, |
|
"eval_steps_per_second": 1.29, |
|
"eval_wer": 0.36245428687525394, |
|
"step": 1218 |
|
}, |
|
{ |
|
"epoch": 88.0, |
|
"eval_cer": 0.18154686078252957, |
|
"eval_loss": 0.5613023638725281, |
|
"eval_runtime": 52.6918, |
|
"eval_samples_per_second": 10.286, |
|
"eval_steps_per_second": 1.291, |
|
"eval_wer": 0.35778138967899226, |
|
"step": 1232 |
|
}, |
|
{ |
|
"epoch": 89.0, |
|
"eval_cer": 0.18125568698817107, |
|
"eval_loss": 0.5661023259162903, |
|
"eval_runtime": 52.6276, |
|
"eval_samples_per_second": 10.299, |
|
"eval_steps_per_second": 1.292, |
|
"eval_wer": 0.3549370174725721, |
|
"step": 1246 |
|
}, |
|
{ |
|
"epoch": 90.0, |
|
"eval_cer": 0.18202001819836214, |
|
"eval_loss": 0.5794751048088074, |
|
"eval_runtime": 52.7536, |
|
"eval_samples_per_second": 10.274, |
|
"eval_steps_per_second": 1.289, |
|
"eval_wer": 0.36042259244209673, |
|
"step": 1260 |
|
}, |
|
{ |
|
"epoch": 91.0, |
|
"eval_cer": 0.18020018198362148, |
|
"eval_loss": 0.5604133605957031, |
|
"eval_runtime": 52.6351, |
|
"eval_samples_per_second": 10.297, |
|
"eval_steps_per_second": 1.292, |
|
"eval_wer": 0.35209264526615197, |
|
"step": 1274 |
|
}, |
|
{ |
|
"epoch": 92.0, |
|
"eval_cer": 0.1821656050955414, |
|
"eval_loss": 0.5738141536712646, |
|
"eval_runtime": 52.6638, |
|
"eval_samples_per_second": 10.292, |
|
"eval_steps_per_second": 1.291, |
|
"eval_wer": 0.35900040633888664, |
|
"step": 1288 |
|
}, |
|
{ |
|
"epoch": 92.86, |
|
"learning_rate": 1.1471428571428572e-05, |
|
"loss": 0.2576, |
|
"step": 1300 |
|
}, |
|
{ |
|
"epoch": 93.0, |
|
"eval_cer": 0.18140127388535032, |
|
"eval_loss": 0.5658465623855591, |
|
"eval_runtime": 52.9846, |
|
"eval_samples_per_second": 10.229, |
|
"eval_steps_per_second": 1.283, |
|
"eval_wer": 0.3573750507923608, |
|
"step": 1302 |
|
}, |
|
{ |
|
"epoch": 94.0, |
|
"eval_cer": 0.1808189262966333, |
|
"eval_loss": 0.5620054006576538, |
|
"eval_runtime": 52.617, |
|
"eval_samples_per_second": 10.301, |
|
"eval_steps_per_second": 1.292, |
|
"eval_wer": 0.35107679804957337, |
|
"step": 1316 |
|
}, |
|
{ |
|
"epoch": 95.0, |
|
"eval_cer": 0.18100090991810738, |
|
"eval_loss": 0.5709471106529236, |
|
"eval_runtime": 52.6962, |
|
"eval_samples_per_second": 10.285, |
|
"eval_steps_per_second": 1.29, |
|
"eval_wer": 0.35412433969930923, |
|
"step": 1330 |
|
}, |
|
{ |
|
"epoch": 96.0, |
|
"eval_cer": 0.1799454049135578, |
|
"eval_loss": 0.5674740076065063, |
|
"eval_runtime": 52.6892, |
|
"eval_samples_per_second": 10.287, |
|
"eval_steps_per_second": 1.291, |
|
"eval_wer": 0.35026412027631043, |
|
"step": 1344 |
|
}, |
|
{ |
|
"epoch": 97.0, |
|
"eval_cer": 0.18151046405823476, |
|
"eval_loss": 0.5788221955299377, |
|
"eval_runtime": 53.0799, |
|
"eval_samples_per_second": 10.211, |
|
"eval_steps_per_second": 1.281, |
|
"eval_wer": 0.3549370174725721, |
|
"step": 1358 |
|
}, |
|
{ |
|
"epoch": 98.0, |
|
"eval_cer": 0.18096451319381257, |
|
"eval_loss": 0.5730317234992981, |
|
"eval_runtime": 52.5988, |
|
"eval_samples_per_second": 10.304, |
|
"eval_steps_per_second": 1.293, |
|
"eval_wer": 0.3524989841527834, |
|
"step": 1372 |
|
}, |
|
{ |
|
"epoch": 99.0, |
|
"eval_cer": 0.1802729754322111, |
|
"eval_loss": 0.5693602561950684, |
|
"eval_runtime": 52.6503, |
|
"eval_samples_per_second": 10.294, |
|
"eval_steps_per_second": 1.292, |
|
"eval_wer": 0.35107679804957337, |
|
"step": 1386 |
|
}, |
|
{ |
|
"epoch": 100.0, |
|
"learning_rate": 1.0042857142857144e-05, |
|
"loss": 0.2273, |
|
"step": 1400 |
|
}, |
|
{ |
|
"epoch": 100.0, |
|
"eval_cer": 0.18070973612374885, |
|
"eval_loss": 0.5747684240341187, |
|
"eval_runtime": 52.7106, |
|
"eval_samples_per_second": 10.283, |
|
"eval_steps_per_second": 1.29, |
|
"eval_wer": 0.35270215359609913, |
|
"step": 1400 |
|
}, |
|
{ |
|
"epoch": 101.0, |
|
"eval_cer": 0.17965423111919926, |
|
"eval_loss": 0.5688263773918152, |
|
"eval_runtime": 52.691, |
|
"eval_samples_per_second": 10.286, |
|
"eval_steps_per_second": 1.291, |
|
"eval_wer": 0.3512799674928891, |
|
"step": 1414 |
|
}, |
|
{ |
|
"epoch": 102.0, |
|
"eval_cer": 0.18045495905368517, |
|
"eval_loss": 0.5767450332641602, |
|
"eval_runtime": 52.6967, |
|
"eval_samples_per_second": 10.285, |
|
"eval_steps_per_second": 1.29, |
|
"eval_wer": 0.35534335635920355, |
|
"step": 1428 |
|
}, |
|
{ |
|
"epoch": 103.0, |
|
"eval_cer": 0.18118289353958145, |
|
"eval_loss": 0.5758454203605652, |
|
"eval_runtime": 52.6575, |
|
"eval_samples_per_second": 10.293, |
|
"eval_steps_per_second": 1.291, |
|
"eval_wer": 0.35290532303941485, |
|
"step": 1442 |
|
}, |
|
{ |
|
"epoch": 104.0, |
|
"eval_cer": 0.17929026387625113, |
|
"eval_loss": 0.5641180872917175, |
|
"eval_runtime": 52.7234, |
|
"eval_samples_per_second": 10.28, |
|
"eval_steps_per_second": 1.29, |
|
"eval_wer": 0.35067045916294187, |
|
"step": 1456 |
|
}, |
|
{ |
|
"epoch": 105.0, |
|
"eval_cer": 0.178926296633303, |
|
"eval_loss": 0.5628452897071838, |
|
"eval_runtime": 52.9721, |
|
"eval_samples_per_second": 10.232, |
|
"eval_steps_per_second": 1.284, |
|
"eval_wer": 0.34945144250304755, |
|
"step": 1470 |
|
}, |
|
{ |
|
"epoch": 106.0, |
|
"eval_cer": 0.1788898999090082, |
|
"eval_loss": 0.5728613138198853, |
|
"eval_runtime": 52.6612, |
|
"eval_samples_per_second": 10.292, |
|
"eval_steps_per_second": 1.291, |
|
"eval_wer": 0.3466070702966274, |
|
"step": 1484 |
|
}, |
|
{ |
|
"epoch": 107.0, |
|
"eval_cer": 0.17983621474067335, |
|
"eval_loss": 0.5722076892852783, |
|
"eval_runtime": 52.7987, |
|
"eval_samples_per_second": 10.265, |
|
"eval_steps_per_second": 1.288, |
|
"eval_wer": 0.34965461194636327, |
|
"step": 1498 |
|
}, |
|
{ |
|
"epoch": 107.14, |
|
"learning_rate": 8.614285714285714e-06, |
|
"loss": 0.2181, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 108.0, |
|
"eval_cer": 0.17881710646041857, |
|
"eval_loss": 0.5552828907966614, |
|
"eval_runtime": 52.6793, |
|
"eval_samples_per_second": 10.289, |
|
"eval_steps_per_second": 1.291, |
|
"eval_wer": 0.3466070702966274, |
|
"step": 1512 |
|
}, |
|
{ |
|
"epoch": 109.0, |
|
"eval_cer": 0.1792174704276615, |
|
"eval_loss": 0.5581598877906799, |
|
"eval_runtime": 52.8837, |
|
"eval_samples_per_second": 10.249, |
|
"eval_steps_per_second": 1.286, |
|
"eval_wer": 0.3484355952864689, |
|
"step": 1526 |
|
}, |
|
{ |
|
"epoch": 110.0, |
|
"eval_cer": 0.18020018198362148, |
|
"eval_loss": 0.5701535940170288, |
|
"eval_runtime": 52.7198, |
|
"eval_samples_per_second": 10.281, |
|
"eval_steps_per_second": 1.29, |
|
"eval_wer": 0.35209264526615197, |
|
"step": 1540 |
|
}, |
|
{ |
|
"epoch": 111.0, |
|
"eval_cer": 0.17976342129208372, |
|
"eval_loss": 0.5691486597061157, |
|
"eval_runtime": 52.7934, |
|
"eval_samples_per_second": 10.266, |
|
"eval_steps_per_second": 1.288, |
|
"eval_wer": 0.35046728971962615, |
|
"step": 1554 |
|
}, |
|
{ |
|
"epoch": 112.0, |
|
"eval_cer": 0.17856232939035488, |
|
"eval_loss": 0.560352087020874, |
|
"eval_runtime": 52.6568, |
|
"eval_samples_per_second": 10.293, |
|
"eval_steps_per_second": 1.291, |
|
"eval_wer": 0.34701340918325885, |
|
"step": 1568 |
|
}, |
|
{ |
|
"epoch": 113.0, |
|
"eval_cer": 0.17950864422202, |
|
"eval_loss": 0.5661062002182007, |
|
"eval_runtime": 52.8124, |
|
"eval_samples_per_second": 10.263, |
|
"eval_steps_per_second": 1.288, |
|
"eval_wer": 0.34823242584315317, |
|
"step": 1582 |
|
}, |
|
{ |
|
"epoch": 114.0, |
|
"eval_cer": 0.17961783439490445, |
|
"eval_loss": 0.5682941675186157, |
|
"eval_runtime": 52.7057, |
|
"eval_samples_per_second": 10.284, |
|
"eval_steps_per_second": 1.29, |
|
"eval_wer": 0.35107679804957337, |
|
"step": 1596 |
|
}, |
|
{ |
|
"epoch": 114.29, |
|
"learning_rate": 7.185714285714286e-06, |
|
"loss": 0.2171, |
|
"step": 1600 |
|
}, |
|
{ |
|
"epoch": 115.0, |
|
"eval_cer": 0.17979981801637854, |
|
"eval_loss": 0.573845624923706, |
|
"eval_runtime": 52.7754, |
|
"eval_samples_per_second": 10.27, |
|
"eval_steps_per_second": 1.288, |
|
"eval_wer": 0.3508736286062576, |
|
"step": 1610 |
|
}, |
|
{ |
|
"epoch": 116.0, |
|
"eval_cer": 0.17932666060054595, |
|
"eval_loss": 0.5730240941047668, |
|
"eval_runtime": 52.7098, |
|
"eval_samples_per_second": 10.283, |
|
"eval_steps_per_second": 1.29, |
|
"eval_wer": 0.34579439252336447, |
|
"step": 1624 |
|
}, |
|
{ |
|
"epoch": 117.0, |
|
"eval_cer": 0.178926296633303, |
|
"eval_loss": 0.5704598426818848, |
|
"eval_runtime": 52.6695, |
|
"eval_samples_per_second": 10.291, |
|
"eval_steps_per_second": 1.291, |
|
"eval_wer": 0.34559122308004875, |
|
"step": 1638 |
|
}, |
|
{ |
|
"epoch": 118.0, |
|
"eval_cer": 0.17961783439490445, |
|
"eval_loss": 0.5813525319099426, |
|
"eval_runtime": 53.1651, |
|
"eval_samples_per_second": 10.195, |
|
"eval_steps_per_second": 1.279, |
|
"eval_wer": 0.3466070702966274, |
|
"step": 1652 |
|
}, |
|
{ |
|
"epoch": 119.0, |
|
"eval_cer": 0.17907188353048226, |
|
"eval_loss": 0.5714964866638184, |
|
"eval_runtime": 52.764, |
|
"eval_samples_per_second": 10.272, |
|
"eval_steps_per_second": 1.289, |
|
"eval_wer": 0.3441690369768387, |
|
"step": 1666 |
|
}, |
|
{ |
|
"epoch": 120.0, |
|
"eval_cer": 0.17976342129208372, |
|
"eval_loss": 0.5720311403274536, |
|
"eval_runtime": 53.0408, |
|
"eval_samples_per_second": 10.219, |
|
"eval_steps_per_second": 1.282, |
|
"eval_wer": 0.34701340918325885, |
|
"step": 1680 |
|
}, |
|
{ |
|
"epoch": 121.0, |
|
"eval_cer": 0.17969062784349407, |
|
"eval_loss": 0.5768777132034302, |
|
"eval_runtime": 52.7851, |
|
"eval_samples_per_second": 10.268, |
|
"eval_steps_per_second": 1.288, |
|
"eval_wer": 0.34701340918325885, |
|
"step": 1694 |
|
}, |
|
{ |
|
"epoch": 121.43, |
|
"learning_rate": 5.7571428571428574e-06, |
|
"loss": 0.1986, |
|
"step": 1700 |
|
}, |
|
{ |
|
"epoch": 122.0, |
|
"eval_cer": 0.1791810737033667, |
|
"eval_loss": 0.571117639541626, |
|
"eval_runtime": 52.9656, |
|
"eval_samples_per_second": 10.233, |
|
"eval_steps_per_second": 1.284, |
|
"eval_wer": 0.3464039008533117, |
|
"step": 1708 |
|
}, |
|
{ |
|
"epoch": 123.0, |
|
"eval_cer": 0.17903548680618744, |
|
"eval_loss": 0.5728168487548828, |
|
"eval_runtime": 52.927, |
|
"eval_samples_per_second": 10.241, |
|
"eval_steps_per_second": 1.285, |
|
"eval_wer": 0.3441690369768387, |
|
"step": 1722 |
|
}, |
|
{ |
|
"epoch": 124.0, |
|
"eval_cer": 0.17830755232029116, |
|
"eval_loss": 0.5667761564254761, |
|
"eval_runtime": 52.78, |
|
"eval_samples_per_second": 10.269, |
|
"eval_steps_per_second": 1.288, |
|
"eval_wer": 0.3449817147501016, |
|
"step": 1736 |
|
}, |
|
{ |
|
"epoch": 125.0, |
|
"eval_cer": 0.17969062784349407, |
|
"eval_loss": 0.5855135321617126, |
|
"eval_runtime": 52.7911, |
|
"eval_samples_per_second": 10.267, |
|
"eval_steps_per_second": 1.288, |
|
"eval_wer": 0.3484355952864689, |
|
"step": 1750 |
|
}, |
|
{ |
|
"epoch": 126.0, |
|
"eval_cer": 0.17827115559599635, |
|
"eval_loss": 0.5667468905448914, |
|
"eval_runtime": 52.8968, |
|
"eval_samples_per_second": 10.246, |
|
"eval_steps_per_second": 1.286, |
|
"eval_wer": 0.3427468508736286, |
|
"step": 1764 |
|
}, |
|
{ |
|
"epoch": 127.0, |
|
"eval_cer": 0.1788898999090082, |
|
"eval_loss": 0.5710840821266174, |
|
"eval_runtime": 52.7705, |
|
"eval_samples_per_second": 10.271, |
|
"eval_steps_per_second": 1.289, |
|
"eval_wer": 0.3459975619666802, |
|
"step": 1778 |
|
}, |
|
{ |
|
"epoch": 128.0, |
|
"eval_cer": 0.1781255686988171, |
|
"eval_loss": 0.5681577920913696, |
|
"eval_runtime": 52.7919, |
|
"eval_samples_per_second": 10.267, |
|
"eval_steps_per_second": 1.288, |
|
"eval_wer": 0.3443722064201544, |
|
"step": 1792 |
|
}, |
|
{ |
|
"epoch": 128.0, |
|
"step": 1792, |
|
"total_flos": 1.5995217836155625e+19, |
|
"train_loss": 1.3990157055003303, |
|
"train_runtime": 26333.2616, |
|
"train_samples_per_second": 2.552, |
|
"train_steps_per_second": 0.08 |
|
} |
|
], |
|
"max_steps": 2100, |
|
"num_train_epochs": 150, |
|
"total_flos": 1.5995217836155625e+19, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|