wav2vec2-large-xlsr-coraa-exp-9 / trainer_state.json
alinerodrigues's picture
End of training
167ee21
{
"best_metric": 0.5552828907966614,
"best_model_checkpoint": "wav2vec2-large-xlsr-coraa-exp-9/checkpoint-1512",
"epoch": 128.0,
"global_step": 1792,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.07,
"learning_rate": 3e-05,
"loss": 37.5508,
"step": 1
},
{
"epoch": 1.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 23.137550354003906,
"eval_runtime": 52.9452,
"eval_samples_per_second": 10.237,
"eval_steps_per_second": 1.284,
"eval_wer": 1.0,
"step": 14
},
{
"epoch": 2.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 6.50360107421875,
"eval_runtime": 52.53,
"eval_samples_per_second": 10.318,
"eval_steps_per_second": 1.294,
"eval_wer": 1.0,
"step": 28
},
{
"epoch": 3.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 4.391931056976318,
"eval_runtime": 52.983,
"eval_samples_per_second": 10.23,
"eval_steps_per_second": 1.283,
"eval_wer": 1.0,
"step": 42
},
{
"epoch": 4.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 3.944124221801758,
"eval_runtime": 52.4812,
"eval_samples_per_second": 10.328,
"eval_steps_per_second": 1.296,
"eval_wer": 1.0,
"step": 56
},
{
"epoch": 5.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 3.730649709701538,
"eval_runtime": 52.6687,
"eval_samples_per_second": 10.291,
"eval_steps_per_second": 1.291,
"eval_wer": 1.0,
"step": 70
},
{
"epoch": 6.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 3.5761733055114746,
"eval_runtime": 52.4991,
"eval_samples_per_second": 10.324,
"eval_steps_per_second": 1.295,
"eval_wer": 1.0,
"step": 84
},
{
"epoch": 7.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 3.4128713607788086,
"eval_runtime": 52.9491,
"eval_samples_per_second": 10.236,
"eval_steps_per_second": 1.284,
"eval_wer": 1.0,
"step": 98
},
{
"epoch": 7.14,
"learning_rate": 2.8614285714285714e-05,
"loss": 8.6902,
"step": 100
},
{
"epoch": 8.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 3.285918951034546,
"eval_runtime": 52.5221,
"eval_samples_per_second": 10.319,
"eval_steps_per_second": 1.295,
"eval_wer": 1.0,
"step": 112
},
{
"epoch": 9.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 3.219179391860962,
"eval_runtime": 53.0718,
"eval_samples_per_second": 10.213,
"eval_steps_per_second": 1.281,
"eval_wer": 1.0,
"step": 126
},
{
"epoch": 10.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 3.1479437351226807,
"eval_runtime": 52.485,
"eval_samples_per_second": 10.327,
"eval_steps_per_second": 1.296,
"eval_wer": 1.0,
"step": 140
},
{
"epoch": 11.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 3.106292963027954,
"eval_runtime": 52.586,
"eval_samples_per_second": 10.307,
"eval_steps_per_second": 1.293,
"eval_wer": 1.0,
"step": 154
},
{
"epoch": 12.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 3.0896878242492676,
"eval_runtime": 52.4874,
"eval_samples_per_second": 10.326,
"eval_steps_per_second": 1.296,
"eval_wer": 1.0,
"step": 168
},
{
"epoch": 13.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 3.084855794906616,
"eval_runtime": 52.6206,
"eval_samples_per_second": 10.3,
"eval_steps_per_second": 1.292,
"eval_wer": 1.0,
"step": 182
},
{
"epoch": 14.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 3.048473596572876,
"eval_runtime": 52.5487,
"eval_samples_per_second": 10.314,
"eval_steps_per_second": 1.294,
"eval_wer": 1.0,
"step": 196
},
{
"epoch": 14.29,
"learning_rate": 2.7185714285714287e-05,
"loss": 3.059,
"step": 200
},
{
"epoch": 15.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 3.0495524406433105,
"eval_runtime": 52.5935,
"eval_samples_per_second": 10.305,
"eval_steps_per_second": 1.293,
"eval_wer": 1.0,
"step": 210
},
{
"epoch": 16.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 3.0509705543518066,
"eval_runtime": 52.5135,
"eval_samples_per_second": 10.321,
"eval_steps_per_second": 1.295,
"eval_wer": 1.0,
"step": 224
},
{
"epoch": 17.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 3.042844533920288,
"eval_runtime": 52.5458,
"eval_samples_per_second": 10.315,
"eval_steps_per_second": 1.294,
"eval_wer": 1.0,
"step": 238
},
{
"epoch": 18.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 3.033111572265625,
"eval_runtime": 52.5883,
"eval_samples_per_second": 10.306,
"eval_steps_per_second": 1.293,
"eval_wer": 1.0,
"step": 252
},
{
"epoch": 19.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 3.035349130630493,
"eval_runtime": 52.5405,
"eval_samples_per_second": 10.316,
"eval_steps_per_second": 1.294,
"eval_wer": 1.0,
"step": 266
},
{
"epoch": 20.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 3.0217459201812744,
"eval_runtime": 52.6413,
"eval_samples_per_second": 10.296,
"eval_steps_per_second": 1.292,
"eval_wer": 1.0,
"step": 280
},
{
"epoch": 21.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 3.0107431411743164,
"eval_runtime": 52.5958,
"eval_samples_per_second": 10.305,
"eval_steps_per_second": 1.293,
"eval_wer": 1.0,
"step": 294
},
{
"epoch": 21.43,
"learning_rate": 2.5757142857142857e-05,
"loss": 2.9492,
"step": 300
},
{
"epoch": 22.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 3.0068299770355225,
"eval_runtime": 52.8053,
"eval_samples_per_second": 10.264,
"eval_steps_per_second": 1.288,
"eval_wer": 1.0,
"step": 308
},
{
"epoch": 23.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 2.9949989318847656,
"eval_runtime": 52.5717,
"eval_samples_per_second": 10.31,
"eval_steps_per_second": 1.293,
"eval_wer": 1.0,
"step": 322
},
{
"epoch": 24.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 2.989611864089966,
"eval_runtime": 53.0076,
"eval_samples_per_second": 10.225,
"eval_steps_per_second": 1.283,
"eval_wer": 1.0,
"step": 336
},
{
"epoch": 25.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 2.9687271118164062,
"eval_runtime": 52.6125,
"eval_samples_per_second": 10.302,
"eval_steps_per_second": 1.292,
"eval_wer": 1.0,
"step": 350
},
{
"epoch": 26.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 2.947374105453491,
"eval_runtime": 52.5637,
"eval_samples_per_second": 10.311,
"eval_steps_per_second": 1.294,
"eval_wer": 1.0,
"step": 364
},
{
"epoch": 27.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 2.9414024353027344,
"eval_runtime": 52.648,
"eval_samples_per_second": 10.295,
"eval_steps_per_second": 1.292,
"eval_wer": 1.0,
"step": 378
},
{
"epoch": 28.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 2.84250807762146,
"eval_runtime": 52.5712,
"eval_samples_per_second": 10.31,
"eval_steps_per_second": 1.293,
"eval_wer": 1.0,
"step": 392
},
{
"epoch": 28.57,
"learning_rate": 2.432857142857143e-05,
"loss": 2.8892,
"step": 400
},
{
"epoch": 29.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 2.7813332080841064,
"eval_runtime": 52.64,
"eval_samples_per_second": 10.296,
"eval_steps_per_second": 1.292,
"eval_wer": 1.0,
"step": 406
},
{
"epoch": 30.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 2.7269773483276367,
"eval_runtime": 52.5989,
"eval_samples_per_second": 10.304,
"eval_steps_per_second": 1.293,
"eval_wer": 1.0,
"step": 420
},
{
"epoch": 31.0,
"eval_cer": 0.9606187443130119,
"eval_loss": 2.6644980907440186,
"eval_runtime": 52.6591,
"eval_samples_per_second": 10.293,
"eval_steps_per_second": 1.291,
"eval_wer": 1.0,
"step": 434
},
{
"epoch": 32.0,
"eval_cer": 0.9138853503184713,
"eval_loss": 2.5593061447143555,
"eval_runtime": 52.5942,
"eval_samples_per_second": 10.305,
"eval_steps_per_second": 1.293,
"eval_wer": 1.0,
"step": 448
},
{
"epoch": 33.0,
"eval_cer": 0.7002729754322111,
"eval_loss": 2.3229565620422363,
"eval_runtime": 53.1245,
"eval_samples_per_second": 10.202,
"eval_steps_per_second": 1.28,
"eval_wer": 1.0,
"step": 462
},
{
"epoch": 34.0,
"eval_cer": 0.535796178343949,
"eval_loss": 1.9706292152404785,
"eval_runtime": 52.7199,
"eval_samples_per_second": 10.281,
"eval_steps_per_second": 1.29,
"eval_wer": 1.0,
"step": 476
},
{
"epoch": 35.0,
"eval_cer": 0.45481346678798906,
"eval_loss": 1.7085232734680176,
"eval_runtime": 52.7281,
"eval_samples_per_second": 10.279,
"eval_steps_per_second": 1.29,
"eval_wer": 0.9997968305566842,
"step": 490
},
{
"epoch": 35.71,
"learning_rate": 2.29e-05,
"loss": 2.3937,
"step": 500
},
{
"epoch": 36.0,
"eval_cer": 0.4063694267515924,
"eval_loss": 1.449361801147461,
"eval_runtime": 52.6273,
"eval_samples_per_second": 10.299,
"eval_steps_per_second": 1.292,
"eval_wer": 1.0,
"step": 504
},
{
"epoch": 37.0,
"eval_cer": 0.38471337579617837,
"eval_loss": 1.286526083946228,
"eval_runtime": 52.7236,
"eval_samples_per_second": 10.28,
"eval_steps_per_second": 1.29,
"eval_wer": 1.0,
"step": 518
},
{
"epoch": 38.0,
"eval_cer": 0.3659326660600546,
"eval_loss": 1.1509252786636353,
"eval_runtime": 52.6429,
"eval_samples_per_second": 10.296,
"eval_steps_per_second": 1.292,
"eval_wer": 0.9947175944737912,
"step": 532
},
{
"epoch": 39.0,
"eval_cer": 0.3182893539581438,
"eval_loss": 1.0466662645339966,
"eval_runtime": 52.7531,
"eval_samples_per_second": 10.274,
"eval_steps_per_second": 1.289,
"eval_wer": 0.903088175538399,
"step": 546
},
{
"epoch": 40.0,
"eval_cer": 0.24043676069153777,
"eval_loss": 0.9831815361976624,
"eval_runtime": 52.6494,
"eval_samples_per_second": 10.295,
"eval_steps_per_second": 1.292,
"eval_wer": 0.5960991466883381,
"step": 560
},
{
"epoch": 41.0,
"eval_cer": 0.22227479526842583,
"eval_loss": 0.892058789730072,
"eval_runtime": 53.2461,
"eval_samples_per_second": 10.179,
"eval_steps_per_second": 1.277,
"eval_wer": 0.5048760666395774,
"step": 574
},
{
"epoch": 42.0,
"eval_cer": 0.21233848953594175,
"eval_loss": 0.8306074738502502,
"eval_runtime": 52.8348,
"eval_samples_per_second": 10.258,
"eval_steps_per_second": 1.287,
"eval_wer": 0.4687119057293783,
"step": 588
},
{
"epoch": 42.86,
"learning_rate": 2.1471428571428574e-05,
"loss": 1.0877,
"step": 600
},
{
"epoch": 43.0,
"eval_cer": 0.20880800727934487,
"eval_loss": 0.8016981482505798,
"eval_runtime": 52.6157,
"eval_samples_per_second": 10.301,
"eval_steps_per_second": 1.292,
"eval_wer": 0.45631856968711904,
"step": 602
},
{
"epoch": 44.0,
"eval_cer": 0.2045859872611465,
"eval_loss": 0.7715625166893005,
"eval_runtime": 52.6399,
"eval_samples_per_second": 10.296,
"eval_steps_per_second": 1.292,
"eval_wer": 0.4404713531084925,
"step": 616
},
{
"epoch": 45.0,
"eval_cer": 0.2053867151956324,
"eval_loss": 0.7693753838539124,
"eval_runtime": 52.708,
"eval_samples_per_second": 10.283,
"eval_steps_per_second": 1.29,
"eval_wer": 0.4406745225518082,
"step": 630
},
{
"epoch": 46.0,
"eval_cer": 0.20367606915377617,
"eval_loss": 0.7451383471488953,
"eval_runtime": 52.7002,
"eval_samples_per_second": 10.285,
"eval_steps_per_second": 1.29,
"eval_wer": 0.4315318976026006,
"step": 644
},
{
"epoch": 47.0,
"eval_cer": 0.19956323930846223,
"eval_loss": 0.7111817598342896,
"eval_runtime": 53.2448,
"eval_samples_per_second": 10.179,
"eval_steps_per_second": 1.277,
"eval_wer": 0.42503047541649736,
"step": 658
},
{
"epoch": 48.0,
"eval_cer": 0.19581437670609644,
"eval_loss": 0.7007989883422852,
"eval_runtime": 52.7775,
"eval_samples_per_second": 10.27,
"eval_steps_per_second": 1.288,
"eval_wer": 0.41162129215765947,
"step": 672
},
{
"epoch": 49.0,
"eval_cer": 0.19799818016378526,
"eval_loss": 0.7140166163444519,
"eval_runtime": 52.6495,
"eval_samples_per_second": 10.294,
"eval_steps_per_second": 1.292,
"eval_wer": 0.40572937830150346,
"step": 686
},
{
"epoch": 50.0,
"learning_rate": 2.004285714285714e-05,
"loss": 0.6292,
"step": 700
},
{
"epoch": 50.0,
"eval_cer": 0.19883530482256598,
"eval_loss": 0.7207656502723694,
"eval_runtime": 52.6919,
"eval_samples_per_second": 10.286,
"eval_steps_per_second": 1.291,
"eval_wer": 0.41141812271434375,
"step": 700
},
{
"epoch": 51.0,
"eval_cer": 0.19366696997270247,
"eval_loss": 0.6675068140029907,
"eval_runtime": 52.8778,
"eval_samples_per_second": 10.25,
"eval_steps_per_second": 1.286,
"eval_wer": 0.40329134498171476,
"step": 714
},
{
"epoch": 52.0,
"eval_cer": 0.19384895359417653,
"eval_loss": 0.6650232672691345,
"eval_runtime": 52.6583,
"eval_samples_per_second": 10.293,
"eval_steps_per_second": 1.291,
"eval_wer": 0.4014628199918732,
"step": 728
},
{
"epoch": 53.0,
"eval_cer": 0.1937761601455869,
"eval_loss": 0.6550155878067017,
"eval_runtime": 52.7667,
"eval_samples_per_second": 10.272,
"eval_steps_per_second": 1.289,
"eval_wer": 0.4012596505485575,
"step": 742
},
{
"epoch": 54.0,
"eval_cer": 0.19315741583257506,
"eval_loss": 0.6477207541465759,
"eval_runtime": 52.6665,
"eval_samples_per_second": 10.291,
"eval_steps_per_second": 1.291,
"eval_wer": 0.3990247866720845,
"step": 756
},
{
"epoch": 55.0,
"eval_cer": 0.19319381255686988,
"eval_loss": 0.6361698508262634,
"eval_runtime": 52.6325,
"eval_samples_per_second": 10.298,
"eval_steps_per_second": 1.292,
"eval_wer": 0.39597724502234866,
"step": 770
},
{
"epoch": 56.0,
"eval_cer": 0.192975432211101,
"eval_loss": 0.632267951965332,
"eval_runtime": 52.7108,
"eval_samples_per_second": 10.283,
"eval_steps_per_second": 1.29,
"eval_wer": 0.39191385615603413,
"step": 784
},
{
"epoch": 57.0,
"eval_cer": 0.19206551410373066,
"eval_loss": 0.626406192779541,
"eval_runtime": 52.675,
"eval_samples_per_second": 10.29,
"eval_steps_per_second": 1.291,
"eval_wer": 0.38703778951645673,
"step": 798
},
{
"epoch": 57.14,
"learning_rate": 1.8614285714285715e-05,
"loss": 0.4739,
"step": 800
},
{
"epoch": 58.0,
"eval_cer": 0.19210191082802547,
"eval_loss": 0.6290065050125122,
"eval_runtime": 52.661,
"eval_samples_per_second": 10.292,
"eval_steps_per_second": 1.291,
"eval_wer": 0.38724095895977245,
"step": 812
},
{
"epoch": 59.0,
"eval_cer": 0.19253867151956325,
"eval_loss": 0.6206580400466919,
"eval_runtime": 52.6443,
"eval_samples_per_second": 10.296,
"eval_steps_per_second": 1.292,
"eval_wer": 0.38642828118650957,
"step": 826
},
{
"epoch": 60.0,
"eval_cer": 0.19184713375796178,
"eval_loss": 0.6177613735198975,
"eval_runtime": 52.6855,
"eval_samples_per_second": 10.287,
"eval_steps_per_second": 1.291,
"eval_wer": 0.38581877285656235,
"step": 840
},
{
"epoch": 61.0,
"eval_cer": 0.19177434030937215,
"eval_loss": 0.6217214465141296,
"eval_runtime": 53.1515,
"eval_samples_per_second": 10.197,
"eval_steps_per_second": 1.279,
"eval_wer": 0.3860219422998781,
"step": 854
},
{
"epoch": 62.0,
"eval_cer": 0.1899545040946315,
"eval_loss": 0.6078172922134399,
"eval_runtime": 52.6994,
"eval_samples_per_second": 10.285,
"eval_steps_per_second": 1.29,
"eval_wer": 0.37992685900040635,
"step": 868
},
{
"epoch": 63.0,
"eval_cer": 0.1889353958143767,
"eval_loss": 0.6072229146957397,
"eval_runtime": 52.8038,
"eval_samples_per_second": 10.264,
"eval_steps_per_second": 1.288,
"eval_wer": 0.3780983340105648,
"step": 882
},
{
"epoch": 64.0,
"eval_cer": 0.18831665150136487,
"eval_loss": 0.6067555546760559,
"eval_runtime": 52.6766,
"eval_samples_per_second": 10.289,
"eval_steps_per_second": 1.291,
"eval_wer": 0.37606663957740755,
"step": 896
},
{
"epoch": 64.29,
"learning_rate": 1.7185714285714285e-05,
"loss": 0.3855,
"step": 900
},
{
"epoch": 65.0,
"eval_cer": 0.1870427661510464,
"eval_loss": 0.5944907665252686,
"eval_runtime": 52.7345,
"eval_samples_per_second": 10.278,
"eval_steps_per_second": 1.289,
"eval_wer": 0.3748476229175132,
"step": 910
},
{
"epoch": 66.0,
"eval_cer": 0.1899545040946315,
"eval_loss": 0.6194169521331787,
"eval_runtime": 52.7092,
"eval_samples_per_second": 10.283,
"eval_steps_per_second": 1.29,
"eval_wer": 0.37992685900040635,
"step": 924
},
{
"epoch": 67.0,
"eval_cer": 0.18846223839854412,
"eval_loss": 0.6044437289237976,
"eval_runtime": 52.6167,
"eval_samples_per_second": 10.301,
"eval_steps_per_second": 1.292,
"eval_wer": 0.3793173506704592,
"step": 938
},
{
"epoch": 68.0,
"eval_cer": 0.18798908098271155,
"eval_loss": 0.5945860147476196,
"eval_runtime": 52.6643,
"eval_samples_per_second": 10.292,
"eval_steps_per_second": 1.291,
"eval_wer": 0.37505079236082894,
"step": 952
},
{
"epoch": 69.0,
"eval_cer": 0.18798908098271155,
"eval_loss": 0.6115556955337524,
"eval_runtime": 52.6187,
"eval_samples_per_second": 10.301,
"eval_steps_per_second": 1.292,
"eval_wer": 0.37139374238114586,
"step": 966
},
{
"epoch": 70.0,
"eval_cer": 0.18609645131938127,
"eval_loss": 0.5876884460449219,
"eval_runtime": 52.6386,
"eval_samples_per_second": 10.297,
"eval_steps_per_second": 1.292,
"eval_wer": 0.36793986184477856,
"step": 980
},
{
"epoch": 71.0,
"eval_cer": 0.18627843494085533,
"eval_loss": 0.5861026048660278,
"eval_runtime": 52.6444,
"eval_samples_per_second": 10.296,
"eval_steps_per_second": 1.292,
"eval_wer": 0.36793986184477856,
"step": 994
},
{
"epoch": 71.43,
"learning_rate": 1.5757142857142858e-05,
"loss": 0.3302,
"step": 1000
},
{
"epoch": 72.0,
"eval_cer": 0.18562329390354868,
"eval_loss": 0.580510139465332,
"eval_runtime": 52.6419,
"eval_samples_per_second": 10.296,
"eval_steps_per_second": 1.292,
"eval_wer": 0.3685493701747257,
"step": 1008
},
{
"epoch": 73.0,
"eval_cer": 0.1862056414922657,
"eval_loss": 0.586155354976654,
"eval_runtime": 52.6421,
"eval_samples_per_second": 10.296,
"eval_steps_per_second": 1.292,
"eval_wer": 0.37139374238114586,
"step": 1022
},
{
"epoch": 74.0,
"eval_cer": 0.18656960873521383,
"eval_loss": 0.5920763611793518,
"eval_runtime": 52.6765,
"eval_samples_per_second": 10.289,
"eval_steps_per_second": 1.291,
"eval_wer": 0.372003250711093,
"step": 1036
},
{
"epoch": 75.0,
"eval_cer": 0.185368516833485,
"eval_loss": 0.5692393779754639,
"eval_runtime": 52.7333,
"eval_samples_per_second": 10.278,
"eval_steps_per_second": 1.29,
"eval_wer": 0.36834620073141,
"step": 1050
},
{
"epoch": 76.0,
"eval_cer": 0.18777070063694268,
"eval_loss": 0.5922245979309082,
"eval_runtime": 52.7512,
"eval_samples_per_second": 10.275,
"eval_steps_per_second": 1.289,
"eval_wer": 0.37017472572125154,
"step": 1064
},
{
"epoch": 77.0,
"eval_cer": 0.18828025477707006,
"eval_loss": 0.6105178594589233,
"eval_runtime": 52.65,
"eval_samples_per_second": 10.294,
"eval_steps_per_second": 1.292,
"eval_wer": 0.3709874034945144,
"step": 1078
},
{
"epoch": 78.0,
"eval_cer": 0.18558689717925386,
"eval_loss": 0.5873062014579773,
"eval_runtime": 53.0336,
"eval_samples_per_second": 10.22,
"eval_steps_per_second": 1.282,
"eval_wer": 0.36834620073141,
"step": 1092
},
{
"epoch": 78.57,
"learning_rate": 1.4328571428571428e-05,
"loss": 0.3046,
"step": 1100
},
{
"epoch": 79.0,
"eval_cer": 0.18587807097361236,
"eval_loss": 0.5825892090797424,
"eval_runtime": 52.7458,
"eval_samples_per_second": 10.276,
"eval_steps_per_second": 1.289,
"eval_wer": 0.3681430312880943,
"step": 1106
},
{
"epoch": 80.0,
"eval_cer": 0.18445859872611464,
"eval_loss": 0.5792315006256104,
"eval_runtime": 53.1292,
"eval_samples_per_second": 10.202,
"eval_steps_per_second": 1.28,
"eval_wer": 0.3632669646485169,
"step": 1120
},
{
"epoch": 81.0,
"eval_cer": 0.18347588717015467,
"eval_loss": 0.5737511515617371,
"eval_runtime": 52.6677,
"eval_samples_per_second": 10.291,
"eval_steps_per_second": 1.291,
"eval_wer": 0.3610321007720439,
"step": 1134
},
{
"epoch": 82.0,
"eval_cer": 0.1843130118289354,
"eval_loss": 0.579399585723877,
"eval_runtime": 53.0003,
"eval_samples_per_second": 10.226,
"eval_steps_per_second": 1.283,
"eval_wer": 0.36245428687525394,
"step": 1148
},
{
"epoch": 83.0,
"eval_cer": 0.18289353958143767,
"eval_loss": 0.5766276121139526,
"eval_runtime": 52.6724,
"eval_samples_per_second": 10.29,
"eval_steps_per_second": 1.291,
"eval_wer": 0.3563592035757822,
"step": 1162
},
{
"epoch": 84.0,
"eval_cer": 0.1830027297543221,
"eval_loss": 0.5745117664337158,
"eval_runtime": 52.7431,
"eval_samples_per_second": 10.276,
"eval_steps_per_second": 1.289,
"eval_wer": 0.35778138967899226,
"step": 1176
},
{
"epoch": 85.0,
"eval_cer": 0.18140127388535032,
"eval_loss": 0.561495840549469,
"eval_runtime": 52.6016,
"eval_samples_per_second": 10.304,
"eval_steps_per_second": 1.293,
"eval_wer": 0.3555465258025193,
"step": 1190
},
{
"epoch": 85.71,
"learning_rate": 1.29e-05,
"loss": 0.2927,
"step": 1200
},
{
"epoch": 86.0,
"eval_cer": 0.18282074613284804,
"eval_loss": 0.5853651762008667,
"eval_runtime": 52.6345,
"eval_samples_per_second": 10.297,
"eval_steps_per_second": 1.292,
"eval_wer": 0.36143843965867534,
"step": 1204
},
{
"epoch": 87.0,
"eval_cer": 0.1835122838944495,
"eval_loss": 0.5817971229553223,
"eval_runtime": 52.7194,
"eval_samples_per_second": 10.281,
"eval_steps_per_second": 1.29,
"eval_wer": 0.36245428687525394,
"step": 1218
},
{
"epoch": 88.0,
"eval_cer": 0.18154686078252957,
"eval_loss": 0.5613023638725281,
"eval_runtime": 52.6918,
"eval_samples_per_second": 10.286,
"eval_steps_per_second": 1.291,
"eval_wer": 0.35778138967899226,
"step": 1232
},
{
"epoch": 89.0,
"eval_cer": 0.18125568698817107,
"eval_loss": 0.5661023259162903,
"eval_runtime": 52.6276,
"eval_samples_per_second": 10.299,
"eval_steps_per_second": 1.292,
"eval_wer": 0.3549370174725721,
"step": 1246
},
{
"epoch": 90.0,
"eval_cer": 0.18202001819836214,
"eval_loss": 0.5794751048088074,
"eval_runtime": 52.7536,
"eval_samples_per_second": 10.274,
"eval_steps_per_second": 1.289,
"eval_wer": 0.36042259244209673,
"step": 1260
},
{
"epoch": 91.0,
"eval_cer": 0.18020018198362148,
"eval_loss": 0.5604133605957031,
"eval_runtime": 52.6351,
"eval_samples_per_second": 10.297,
"eval_steps_per_second": 1.292,
"eval_wer": 0.35209264526615197,
"step": 1274
},
{
"epoch": 92.0,
"eval_cer": 0.1821656050955414,
"eval_loss": 0.5738141536712646,
"eval_runtime": 52.6638,
"eval_samples_per_second": 10.292,
"eval_steps_per_second": 1.291,
"eval_wer": 0.35900040633888664,
"step": 1288
},
{
"epoch": 92.86,
"learning_rate": 1.1471428571428572e-05,
"loss": 0.2576,
"step": 1300
},
{
"epoch": 93.0,
"eval_cer": 0.18140127388535032,
"eval_loss": 0.5658465623855591,
"eval_runtime": 52.9846,
"eval_samples_per_second": 10.229,
"eval_steps_per_second": 1.283,
"eval_wer": 0.3573750507923608,
"step": 1302
},
{
"epoch": 94.0,
"eval_cer": 0.1808189262966333,
"eval_loss": 0.5620054006576538,
"eval_runtime": 52.617,
"eval_samples_per_second": 10.301,
"eval_steps_per_second": 1.292,
"eval_wer": 0.35107679804957337,
"step": 1316
},
{
"epoch": 95.0,
"eval_cer": 0.18100090991810738,
"eval_loss": 0.5709471106529236,
"eval_runtime": 52.6962,
"eval_samples_per_second": 10.285,
"eval_steps_per_second": 1.29,
"eval_wer": 0.35412433969930923,
"step": 1330
},
{
"epoch": 96.0,
"eval_cer": 0.1799454049135578,
"eval_loss": 0.5674740076065063,
"eval_runtime": 52.6892,
"eval_samples_per_second": 10.287,
"eval_steps_per_second": 1.291,
"eval_wer": 0.35026412027631043,
"step": 1344
},
{
"epoch": 97.0,
"eval_cer": 0.18151046405823476,
"eval_loss": 0.5788221955299377,
"eval_runtime": 53.0799,
"eval_samples_per_second": 10.211,
"eval_steps_per_second": 1.281,
"eval_wer": 0.3549370174725721,
"step": 1358
},
{
"epoch": 98.0,
"eval_cer": 0.18096451319381257,
"eval_loss": 0.5730317234992981,
"eval_runtime": 52.5988,
"eval_samples_per_second": 10.304,
"eval_steps_per_second": 1.293,
"eval_wer": 0.3524989841527834,
"step": 1372
},
{
"epoch": 99.0,
"eval_cer": 0.1802729754322111,
"eval_loss": 0.5693602561950684,
"eval_runtime": 52.6503,
"eval_samples_per_second": 10.294,
"eval_steps_per_second": 1.292,
"eval_wer": 0.35107679804957337,
"step": 1386
},
{
"epoch": 100.0,
"learning_rate": 1.0042857142857144e-05,
"loss": 0.2273,
"step": 1400
},
{
"epoch": 100.0,
"eval_cer": 0.18070973612374885,
"eval_loss": 0.5747684240341187,
"eval_runtime": 52.7106,
"eval_samples_per_second": 10.283,
"eval_steps_per_second": 1.29,
"eval_wer": 0.35270215359609913,
"step": 1400
},
{
"epoch": 101.0,
"eval_cer": 0.17965423111919926,
"eval_loss": 0.5688263773918152,
"eval_runtime": 52.691,
"eval_samples_per_second": 10.286,
"eval_steps_per_second": 1.291,
"eval_wer": 0.3512799674928891,
"step": 1414
},
{
"epoch": 102.0,
"eval_cer": 0.18045495905368517,
"eval_loss": 0.5767450332641602,
"eval_runtime": 52.6967,
"eval_samples_per_second": 10.285,
"eval_steps_per_second": 1.29,
"eval_wer": 0.35534335635920355,
"step": 1428
},
{
"epoch": 103.0,
"eval_cer": 0.18118289353958145,
"eval_loss": 0.5758454203605652,
"eval_runtime": 52.6575,
"eval_samples_per_second": 10.293,
"eval_steps_per_second": 1.291,
"eval_wer": 0.35290532303941485,
"step": 1442
},
{
"epoch": 104.0,
"eval_cer": 0.17929026387625113,
"eval_loss": 0.5641180872917175,
"eval_runtime": 52.7234,
"eval_samples_per_second": 10.28,
"eval_steps_per_second": 1.29,
"eval_wer": 0.35067045916294187,
"step": 1456
},
{
"epoch": 105.0,
"eval_cer": 0.178926296633303,
"eval_loss": 0.5628452897071838,
"eval_runtime": 52.9721,
"eval_samples_per_second": 10.232,
"eval_steps_per_second": 1.284,
"eval_wer": 0.34945144250304755,
"step": 1470
},
{
"epoch": 106.0,
"eval_cer": 0.1788898999090082,
"eval_loss": 0.5728613138198853,
"eval_runtime": 52.6612,
"eval_samples_per_second": 10.292,
"eval_steps_per_second": 1.291,
"eval_wer": 0.3466070702966274,
"step": 1484
},
{
"epoch": 107.0,
"eval_cer": 0.17983621474067335,
"eval_loss": 0.5722076892852783,
"eval_runtime": 52.7987,
"eval_samples_per_second": 10.265,
"eval_steps_per_second": 1.288,
"eval_wer": 0.34965461194636327,
"step": 1498
},
{
"epoch": 107.14,
"learning_rate": 8.614285714285714e-06,
"loss": 0.2181,
"step": 1500
},
{
"epoch": 108.0,
"eval_cer": 0.17881710646041857,
"eval_loss": 0.5552828907966614,
"eval_runtime": 52.6793,
"eval_samples_per_second": 10.289,
"eval_steps_per_second": 1.291,
"eval_wer": 0.3466070702966274,
"step": 1512
},
{
"epoch": 109.0,
"eval_cer": 0.1792174704276615,
"eval_loss": 0.5581598877906799,
"eval_runtime": 52.8837,
"eval_samples_per_second": 10.249,
"eval_steps_per_second": 1.286,
"eval_wer": 0.3484355952864689,
"step": 1526
},
{
"epoch": 110.0,
"eval_cer": 0.18020018198362148,
"eval_loss": 0.5701535940170288,
"eval_runtime": 52.7198,
"eval_samples_per_second": 10.281,
"eval_steps_per_second": 1.29,
"eval_wer": 0.35209264526615197,
"step": 1540
},
{
"epoch": 111.0,
"eval_cer": 0.17976342129208372,
"eval_loss": 0.5691486597061157,
"eval_runtime": 52.7934,
"eval_samples_per_second": 10.266,
"eval_steps_per_second": 1.288,
"eval_wer": 0.35046728971962615,
"step": 1554
},
{
"epoch": 112.0,
"eval_cer": 0.17856232939035488,
"eval_loss": 0.560352087020874,
"eval_runtime": 52.6568,
"eval_samples_per_second": 10.293,
"eval_steps_per_second": 1.291,
"eval_wer": 0.34701340918325885,
"step": 1568
},
{
"epoch": 113.0,
"eval_cer": 0.17950864422202,
"eval_loss": 0.5661062002182007,
"eval_runtime": 52.8124,
"eval_samples_per_second": 10.263,
"eval_steps_per_second": 1.288,
"eval_wer": 0.34823242584315317,
"step": 1582
},
{
"epoch": 114.0,
"eval_cer": 0.17961783439490445,
"eval_loss": 0.5682941675186157,
"eval_runtime": 52.7057,
"eval_samples_per_second": 10.284,
"eval_steps_per_second": 1.29,
"eval_wer": 0.35107679804957337,
"step": 1596
},
{
"epoch": 114.29,
"learning_rate": 7.185714285714286e-06,
"loss": 0.2171,
"step": 1600
},
{
"epoch": 115.0,
"eval_cer": 0.17979981801637854,
"eval_loss": 0.573845624923706,
"eval_runtime": 52.7754,
"eval_samples_per_second": 10.27,
"eval_steps_per_second": 1.288,
"eval_wer": 0.3508736286062576,
"step": 1610
},
{
"epoch": 116.0,
"eval_cer": 0.17932666060054595,
"eval_loss": 0.5730240941047668,
"eval_runtime": 52.7098,
"eval_samples_per_second": 10.283,
"eval_steps_per_second": 1.29,
"eval_wer": 0.34579439252336447,
"step": 1624
},
{
"epoch": 117.0,
"eval_cer": 0.178926296633303,
"eval_loss": 0.5704598426818848,
"eval_runtime": 52.6695,
"eval_samples_per_second": 10.291,
"eval_steps_per_second": 1.291,
"eval_wer": 0.34559122308004875,
"step": 1638
},
{
"epoch": 118.0,
"eval_cer": 0.17961783439490445,
"eval_loss": 0.5813525319099426,
"eval_runtime": 53.1651,
"eval_samples_per_second": 10.195,
"eval_steps_per_second": 1.279,
"eval_wer": 0.3466070702966274,
"step": 1652
},
{
"epoch": 119.0,
"eval_cer": 0.17907188353048226,
"eval_loss": 0.5714964866638184,
"eval_runtime": 52.764,
"eval_samples_per_second": 10.272,
"eval_steps_per_second": 1.289,
"eval_wer": 0.3441690369768387,
"step": 1666
},
{
"epoch": 120.0,
"eval_cer": 0.17976342129208372,
"eval_loss": 0.5720311403274536,
"eval_runtime": 53.0408,
"eval_samples_per_second": 10.219,
"eval_steps_per_second": 1.282,
"eval_wer": 0.34701340918325885,
"step": 1680
},
{
"epoch": 121.0,
"eval_cer": 0.17969062784349407,
"eval_loss": 0.5768777132034302,
"eval_runtime": 52.7851,
"eval_samples_per_second": 10.268,
"eval_steps_per_second": 1.288,
"eval_wer": 0.34701340918325885,
"step": 1694
},
{
"epoch": 121.43,
"learning_rate": 5.7571428571428574e-06,
"loss": 0.1986,
"step": 1700
},
{
"epoch": 122.0,
"eval_cer": 0.1791810737033667,
"eval_loss": 0.571117639541626,
"eval_runtime": 52.9656,
"eval_samples_per_second": 10.233,
"eval_steps_per_second": 1.284,
"eval_wer": 0.3464039008533117,
"step": 1708
},
{
"epoch": 123.0,
"eval_cer": 0.17903548680618744,
"eval_loss": 0.5728168487548828,
"eval_runtime": 52.927,
"eval_samples_per_second": 10.241,
"eval_steps_per_second": 1.285,
"eval_wer": 0.3441690369768387,
"step": 1722
},
{
"epoch": 124.0,
"eval_cer": 0.17830755232029116,
"eval_loss": 0.5667761564254761,
"eval_runtime": 52.78,
"eval_samples_per_second": 10.269,
"eval_steps_per_second": 1.288,
"eval_wer": 0.3449817147501016,
"step": 1736
},
{
"epoch": 125.0,
"eval_cer": 0.17969062784349407,
"eval_loss": 0.5855135321617126,
"eval_runtime": 52.7911,
"eval_samples_per_second": 10.267,
"eval_steps_per_second": 1.288,
"eval_wer": 0.3484355952864689,
"step": 1750
},
{
"epoch": 126.0,
"eval_cer": 0.17827115559599635,
"eval_loss": 0.5667468905448914,
"eval_runtime": 52.8968,
"eval_samples_per_second": 10.246,
"eval_steps_per_second": 1.286,
"eval_wer": 0.3427468508736286,
"step": 1764
},
{
"epoch": 127.0,
"eval_cer": 0.1788898999090082,
"eval_loss": 0.5710840821266174,
"eval_runtime": 52.7705,
"eval_samples_per_second": 10.271,
"eval_steps_per_second": 1.289,
"eval_wer": 0.3459975619666802,
"step": 1778
},
{
"epoch": 128.0,
"eval_cer": 0.1781255686988171,
"eval_loss": 0.5681577920913696,
"eval_runtime": 52.7919,
"eval_samples_per_second": 10.267,
"eval_steps_per_second": 1.288,
"eval_wer": 0.3443722064201544,
"step": 1792
},
{
"epoch": 128.0,
"step": 1792,
"total_flos": 1.5995217836155625e+19,
"train_loss": 1.3990157055003303,
"train_runtime": 26333.2616,
"train_samples_per_second": 2.552,
"train_steps_per_second": 0.08
}
],
"max_steps": 2100,
"num_train_epochs": 150,
"total_flos": 1.5995217836155625e+19,
"trial_name": null,
"trial_params": null
}