wav2vec2-large-xlsr-coraa-exp-17 / trainer_state.json
alinerodrigues's picture
End of training
31fac2e
{
"best_metric": 0.5485906004905701,
"best_model_checkpoint": "wav2vec2-large-xlsr-coraa-exp-17/checkpoint-1358",
"epoch": 117.0,
"global_step": 1638,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.07,
"learning_rate": 0.0,
"loss": 38.4208,
"step": 1
},
{
"epoch": 1.0,
"eval_cer": 1.2145950864422201,
"eval_loss": 41.80952453613281,
"eval_per": 1.0056887444128404,
"eval_runtime": 16.4211,
"eval_samples_per_second": 33.006,
"eval_steps_per_second": 4.141,
"eval_wer": 1.0056887444128404,
"step": 14
},
{
"epoch": 2.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 12.287281036376953,
"eval_per": 1.0,
"eval_runtime": 16.3942,
"eval_samples_per_second": 33.06,
"eval_steps_per_second": 4.148,
"eval_wer": 1.0,
"step": 28
},
{
"epoch": 3.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 4.809342861175537,
"eval_per": 1.0,
"eval_runtime": 17.8009,
"eval_samples_per_second": 30.448,
"eval_steps_per_second": 3.82,
"eval_wer": 1.0,
"step": 42
},
{
"epoch": 4.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 3.9737813472747803,
"eval_per": 1.0,
"eval_runtime": 16.1587,
"eval_samples_per_second": 33.542,
"eval_steps_per_second": 4.208,
"eval_wer": 1.0,
"step": 56
},
{
"epoch": 5.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 3.6683900356292725,
"eval_per": 1.0,
"eval_runtime": 17.3608,
"eval_samples_per_second": 31.22,
"eval_steps_per_second": 3.917,
"eval_wer": 1.0,
"step": 70
},
{
"epoch": 6.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 3.5007262229919434,
"eval_per": 1.0,
"eval_runtime": 16.8377,
"eval_samples_per_second": 32.19,
"eval_steps_per_second": 4.039,
"eval_wer": 1.0,
"step": 84
},
{
"epoch": 7.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 3.3854148387908936,
"eval_per": 1.0,
"eval_runtime": 15.8896,
"eval_samples_per_second": 34.11,
"eval_steps_per_second": 4.28,
"eval_wer": 1.0,
"step": 98
},
{
"epoch": 7.14,
"learning_rate": 3.853775853775854e-05,
"loss": 11.8009,
"step": 100
},
{
"epoch": 8.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 3.450645923614502,
"eval_per": 1.0,
"eval_runtime": 16.3597,
"eval_samples_per_second": 33.13,
"eval_steps_per_second": 4.157,
"eval_wer": 1.0,
"step": 112
},
{
"epoch": 9.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 3.178906202316284,
"eval_per": 1.0,
"eval_runtime": 16.1702,
"eval_samples_per_second": 33.519,
"eval_steps_per_second": 4.205,
"eval_wer": 1.0,
"step": 126
},
{
"epoch": 10.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 3.1274373531341553,
"eval_per": 1.0,
"eval_runtime": 16.9804,
"eval_samples_per_second": 31.919,
"eval_steps_per_second": 4.005,
"eval_wer": 1.0,
"step": 140
},
{
"epoch": 11.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 3.1624248027801514,
"eval_per": 1.0,
"eval_runtime": 16.0626,
"eval_samples_per_second": 33.743,
"eval_steps_per_second": 4.233,
"eval_wer": 1.0,
"step": 154
},
{
"epoch": 12.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 3.1065869331359863,
"eval_per": 1.0,
"eval_runtime": 15.7377,
"eval_samples_per_second": 34.44,
"eval_steps_per_second": 4.321,
"eval_wer": 1.0,
"step": 168
},
{
"epoch": 13.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 3.0579798221588135,
"eval_per": 1.0,
"eval_runtime": 16.1086,
"eval_samples_per_second": 33.647,
"eval_steps_per_second": 4.221,
"eval_wer": 1.0,
"step": 182
},
{
"epoch": 14.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 3.0477194786071777,
"eval_per": 1.0,
"eval_runtime": 17.7392,
"eval_samples_per_second": 30.554,
"eval_steps_per_second": 3.833,
"eval_wer": 1.0,
"step": 196
},
{
"epoch": 14.29,
"learning_rate": 3.6613756613756616e-05,
"loss": 3.0395,
"step": 200
},
{
"epoch": 15.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 3.051933526992798,
"eval_per": 1.0,
"eval_runtime": 16.5102,
"eval_samples_per_second": 32.828,
"eval_steps_per_second": 4.119,
"eval_wer": 1.0,
"step": 210
},
{
"epoch": 16.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 3.0363881587982178,
"eval_per": 1.0,
"eval_runtime": 16.6774,
"eval_samples_per_second": 32.499,
"eval_steps_per_second": 4.077,
"eval_wer": 1.0,
"step": 224
},
{
"epoch": 17.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 3.015160083770752,
"eval_per": 1.0,
"eval_runtime": 17.0522,
"eval_samples_per_second": 31.785,
"eval_steps_per_second": 3.988,
"eval_wer": 1.0,
"step": 238
},
{
"epoch": 18.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 3.0166876316070557,
"eval_per": 1.0,
"eval_runtime": 16.1958,
"eval_samples_per_second": 33.465,
"eval_steps_per_second": 4.199,
"eval_wer": 1.0,
"step": 252
},
{
"epoch": 19.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 3.0129683017730713,
"eval_per": 1.0,
"eval_runtime": 17.0594,
"eval_samples_per_second": 31.771,
"eval_steps_per_second": 3.986,
"eval_wer": 1.0,
"step": 266
},
{
"epoch": 20.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 3.0103399753570557,
"eval_per": 1.0,
"eval_runtime": 16.6483,
"eval_samples_per_second": 32.556,
"eval_steps_per_second": 4.084,
"eval_wer": 1.0,
"step": 280
},
{
"epoch": 21.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 2.9993834495544434,
"eval_per": 1.0,
"eval_runtime": 16.1419,
"eval_samples_per_second": 33.577,
"eval_steps_per_second": 4.213,
"eval_wer": 1.0,
"step": 294
},
{
"epoch": 21.43,
"learning_rate": 3.468975468975469e-05,
"loss": 2.9424,
"step": 300
},
{
"epoch": 22.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 2.999858856201172,
"eval_per": 1.0,
"eval_runtime": 16.4633,
"eval_samples_per_second": 32.922,
"eval_steps_per_second": 4.13,
"eval_wer": 1.0,
"step": 308
},
{
"epoch": 23.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 3.000885486602783,
"eval_per": 1.0,
"eval_runtime": 16.4157,
"eval_samples_per_second": 33.017,
"eval_steps_per_second": 4.142,
"eval_wer": 1.0,
"step": 322
},
{
"epoch": 24.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 3.002438545227051,
"eval_per": 1.0,
"eval_runtime": 16.3396,
"eval_samples_per_second": 33.171,
"eval_steps_per_second": 4.162,
"eval_wer": 1.0,
"step": 336
},
{
"epoch": 25.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 3.000091552734375,
"eval_per": 1.0,
"eval_runtime": 16.2524,
"eval_samples_per_second": 33.349,
"eval_steps_per_second": 4.184,
"eval_wer": 1.0,
"step": 350
},
{
"epoch": 26.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 2.989057779312134,
"eval_per": 1.0,
"eval_runtime": 16.9129,
"eval_samples_per_second": 32.047,
"eval_steps_per_second": 4.021,
"eval_wer": 1.0,
"step": 364
},
{
"epoch": 27.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 2.988072633743286,
"eval_per": 1.0,
"eval_runtime": 16.8979,
"eval_samples_per_second": 32.075,
"eval_steps_per_second": 4.024,
"eval_wer": 1.0,
"step": 378
},
{
"epoch": 28.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 2.97031569480896,
"eval_per": 1.0,
"eval_runtime": 16.5706,
"eval_samples_per_second": 32.708,
"eval_steps_per_second": 4.104,
"eval_wer": 1.0,
"step": 392
},
{
"epoch": 28.57,
"learning_rate": 3.276575276575277e-05,
"loss": 2.9154,
"step": 400
},
{
"epoch": 29.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 2.9531471729278564,
"eval_per": 1.0,
"eval_runtime": 16.0162,
"eval_samples_per_second": 33.841,
"eval_steps_per_second": 4.246,
"eval_wer": 1.0,
"step": 406
},
{
"epoch": 30.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 2.920755624771118,
"eval_per": 1.0,
"eval_runtime": 16.2922,
"eval_samples_per_second": 33.267,
"eval_steps_per_second": 4.174,
"eval_wer": 1.0,
"step": 420
},
{
"epoch": 31.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 2.898137331008911,
"eval_per": 1.0,
"eval_runtime": 16.1037,
"eval_samples_per_second": 33.657,
"eval_steps_per_second": 4.223,
"eval_wer": 1.0,
"step": 434
},
{
"epoch": 32.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 2.8320581912994385,
"eval_per": 1.0,
"eval_runtime": 16.1007,
"eval_samples_per_second": 33.663,
"eval_steps_per_second": 4.223,
"eval_wer": 1.0,
"step": 448
},
{
"epoch": 33.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 2.7583184242248535,
"eval_per": 1.0,
"eval_runtime": 16.3232,
"eval_samples_per_second": 33.204,
"eval_steps_per_second": 4.166,
"eval_wer": 1.0,
"step": 462
},
{
"epoch": 34.0,
"eval_cer": 0.9616014558689718,
"eval_loss": 2.6405322551727295,
"eval_per": 1.0,
"eval_runtime": 16.4064,
"eval_samples_per_second": 33.036,
"eval_steps_per_second": 4.145,
"eval_wer": 1.0,
"step": 476
},
{
"epoch": 35.0,
"eval_cer": 0.8832029117379436,
"eval_loss": 2.5071756839752197,
"eval_per": 1.0,
"eval_runtime": 16.3137,
"eval_samples_per_second": 33.224,
"eval_steps_per_second": 4.168,
"eval_wer": 1.0,
"step": 490
},
{
"epoch": 35.71,
"learning_rate": 3.0841750841750846e-05,
"loss": 2.7552,
"step": 500
},
{
"epoch": 36.0,
"eval_cer": 0.6144131028207461,
"eval_loss": 2.1546847820281982,
"eval_per": 1.0,
"eval_runtime": 16.1444,
"eval_samples_per_second": 33.572,
"eval_steps_per_second": 4.212,
"eval_wer": 1.0,
"step": 504
},
{
"epoch": 37.0,
"eval_cer": 0.49958143767060964,
"eval_loss": 1.7564772367477417,
"eval_per": 1.0,
"eval_runtime": 16.6494,
"eval_samples_per_second": 32.554,
"eval_steps_per_second": 4.084,
"eval_wer": 1.0,
"step": 518
},
{
"epoch": 38.0,
"eval_cer": 0.40651501364877163,
"eval_loss": 1.460233211517334,
"eval_per": 1.0,
"eval_runtime": 16.6864,
"eval_samples_per_second": 32.482,
"eval_steps_per_second": 4.075,
"eval_wer": 1.0,
"step": 532
},
{
"epoch": 39.0,
"eval_cer": 0.36578707916287534,
"eval_loss": 1.2268937826156616,
"eval_per": 0.9892320195042665,
"eval_runtime": 16.8505,
"eval_samples_per_second": 32.165,
"eval_steps_per_second": 4.035,
"eval_wer": 0.989638358390898,
"step": 546
},
{
"epoch": 40.0,
"eval_cer": 0.3204731574158326,
"eval_loss": 1.0905884504318237,
"eval_per": 0.8833807395367737,
"eval_runtime": 16.8204,
"eval_samples_per_second": 32.223,
"eval_steps_per_second": 4.043,
"eval_wer": 0.8880536367330354,
"step": 560
},
{
"epoch": 41.0,
"eval_cer": 0.26314831665150135,
"eval_loss": 0.9941390752792358,
"eval_per": 0.6603006907761073,
"eval_runtime": 16.4361,
"eval_samples_per_second": 32.976,
"eval_steps_per_second": 4.137,
"eval_wer": 0.6771637545713125,
"step": 574
},
{
"epoch": 42.0,
"eval_cer": 0.23221110100090991,
"eval_loss": 0.9132717847824097,
"eval_per": 0.5154408776919951,
"eval_runtime": 16.9668,
"eval_samples_per_second": 31.945,
"eval_steps_per_second": 4.008,
"eval_wer": 0.5422592442096709,
"step": 588
},
{
"epoch": 42.86,
"learning_rate": 2.8917748917748916e-05,
"loss": 1.4599,
"step": 600
},
{
"epoch": 43.0,
"eval_cer": 0.22413102820746134,
"eval_loss": 0.8487069010734558,
"eval_per": 0.48821617228768793,
"eval_runtime": 16.6557,
"eval_samples_per_second": 32.541,
"eval_steps_per_second": 4.083,
"eval_wer": 0.5142218610321008,
"step": 602
},
{
"epoch": 44.0,
"eval_cer": 0.22074613284804367,
"eval_loss": 0.8211185336112976,
"eval_per": 0.46261682242990654,
"eval_runtime": 16.0355,
"eval_samples_per_second": 33.8,
"eval_steps_per_second": 4.241,
"eval_wer": 0.48984152783421375,
"step": 616
},
{
"epoch": 45.0,
"eval_cer": 0.214049135577798,
"eval_loss": 0.7671909332275391,
"eval_per": 0.4518488419341731,
"eval_runtime": 16.1929,
"eval_samples_per_second": 33.471,
"eval_steps_per_second": 4.199,
"eval_wer": 0.48029256399837467,
"step": 630
},
{
"epoch": 46.0,
"eval_cer": 0.2092083712465878,
"eval_loss": 0.7431579828262329,
"eval_per": 0.44453474197480697,
"eval_runtime": 16.359,
"eval_samples_per_second": 33.132,
"eval_steps_per_second": 4.157,
"eval_wer": 0.4707436001625356,
"step": 644
},
{
"epoch": 47.0,
"eval_cer": 0.2059326660600546,
"eval_loss": 0.7389556765556335,
"eval_per": 0.42624949207639173,
"eval_runtime": 16.6785,
"eval_samples_per_second": 32.497,
"eval_steps_per_second": 4.077,
"eval_wer": 0.44920763917106865,
"step": 658
},
{
"epoch": 48.0,
"eval_cer": 0.2011282984531392,
"eval_loss": 0.699397087097168,
"eval_per": 0.41060544494108087,
"eval_runtime": 16.5887,
"eval_samples_per_second": 32.673,
"eval_steps_per_second": 4.099,
"eval_wer": 0.43478260869565216,
"step": 672
},
{
"epoch": 49.0,
"eval_cer": 0.19909008189262967,
"eval_loss": 0.6998735070228577,
"eval_per": 0.3998374644453474,
"eval_runtime": 16.3728,
"eval_samples_per_second": 33.104,
"eval_steps_per_second": 4.153,
"eval_wer": 0.4229987809833401,
"step": 686
},
{
"epoch": 50.0,
"learning_rate": 2.6993746993746993e-05,
"loss": 0.7585,
"step": 700
},
{
"epoch": 50.0,
"eval_cer": 0.19588717015468607,
"eval_loss": 0.6737520098686218,
"eval_per": 0.38825680617635105,
"eval_runtime": 16.7385,
"eval_samples_per_second": 32.38,
"eval_steps_per_second": 4.062,
"eval_wer": 0.4122308004876067,
"step": 700
},
{
"epoch": 51.0,
"eval_cer": 0.19628753412192904,
"eval_loss": 0.6696569919586182,
"eval_per": 0.38581877285656235,
"eval_runtime": 16.5913,
"eval_samples_per_second": 32.668,
"eval_steps_per_second": 4.099,
"eval_wer": 0.4093864282811865,
"step": 714
},
{
"epoch": 52.0,
"eval_cer": 0.19963603275705186,
"eval_loss": 0.6706883907318115,
"eval_per": 0.39536773669240144,
"eval_runtime": 18.473,
"eval_samples_per_second": 29.34,
"eval_steps_per_second": 3.681,
"eval_wer": 0.41629418935392115,
"step": 728
},
{
"epoch": 53.0,
"eval_cer": 0.19417652411282985,
"eval_loss": 0.6397454738616943,
"eval_per": 0.38317757009345793,
"eval_runtime": 16.3057,
"eval_samples_per_second": 33.24,
"eval_steps_per_second": 4.17,
"eval_wer": 0.40308817553839904,
"step": 742
},
{
"epoch": 54.0,
"eval_cer": 0.19388535031847134,
"eval_loss": 0.6293218731880188,
"eval_per": 0.38358390898008937,
"eval_runtime": 16.6245,
"eval_samples_per_second": 32.603,
"eval_steps_per_second": 4.09,
"eval_wer": 0.4039008533116619,
"step": 756
},
{
"epoch": 55.0,
"eval_cer": 0.19457688808007279,
"eval_loss": 0.6479354500770569,
"eval_per": 0.3852092645266152,
"eval_runtime": 17.0356,
"eval_samples_per_second": 31.816,
"eval_steps_per_second": 3.992,
"eval_wer": 0.4026818366517676,
"step": 770
},
{
"epoch": 56.0,
"eval_cer": 0.19344858962693356,
"eval_loss": 0.6307466626167297,
"eval_per": 0.38216172287687933,
"eval_runtime": 15.9943,
"eval_samples_per_second": 33.887,
"eval_steps_per_second": 4.252,
"eval_wer": 0.39821210889882164,
"step": 784
},
{
"epoch": 57.0,
"eval_cer": 0.190828025477707,
"eval_loss": 0.6166068911552429,
"eval_per": 0.36733035351483134,
"eval_runtime": 18.3763,
"eval_samples_per_second": 29.495,
"eval_steps_per_second": 3.7,
"eval_wer": 0.3843965867533523,
"step": 798
},
{
"epoch": 57.14,
"learning_rate": 2.506974506974507e-05,
"loss": 0.5473,
"step": 800
},
{
"epoch": 58.0,
"eval_cer": 0.19064604185623293,
"eval_loss": 0.6098698377609253,
"eval_per": 0.3707842340511987,
"eval_runtime": 17.7821,
"eval_samples_per_second": 30.48,
"eval_steps_per_second": 3.824,
"eval_wer": 0.3860219422998781,
"step": 812
},
{
"epoch": 59.0,
"eval_cer": 0.19039126478616925,
"eval_loss": 0.6007358431816101,
"eval_per": 0.3730190979276717,
"eval_runtime": 17.0728,
"eval_samples_per_second": 31.746,
"eval_steps_per_second": 3.983,
"eval_wer": 0.386834620073141,
"step": 826
},
{
"epoch": 60.0,
"eval_cer": 0.19275705186533212,
"eval_loss": 0.6191249489784241,
"eval_per": 0.3744412840308818,
"eval_runtime": 16.4977,
"eval_samples_per_second": 32.853,
"eval_steps_per_second": 4.122,
"eval_wer": 0.3884599756196668,
"step": 840
},
{
"epoch": 61.0,
"eval_cer": 0.1891901728844404,
"eval_loss": 0.6014622449874878,
"eval_per": 0.3732222673709874,
"eval_runtime": 16.6101,
"eval_samples_per_second": 32.631,
"eval_steps_per_second": 4.094,
"eval_wer": 0.3884599756196668,
"step": 854
},
{
"epoch": 62.0,
"eval_cer": 0.19017288444040037,
"eval_loss": 0.5964884757995605,
"eval_per": 0.36875253961804144,
"eval_runtime": 17.8493,
"eval_samples_per_second": 30.365,
"eval_steps_per_second": 3.81,
"eval_wer": 0.3837870784234051,
"step": 868
},
{
"epoch": 63.0,
"eval_cer": 0.19042766151046406,
"eval_loss": 0.5926450490951538,
"eval_per": 0.3667208451848842,
"eval_runtime": 17.884,
"eval_samples_per_second": 30.306,
"eval_steps_per_second": 3.802,
"eval_wer": 0.38256806176351077,
"step": 882
},
{
"epoch": 64.0,
"eval_cer": 0.19210191082802547,
"eval_loss": 0.6187658905982971,
"eval_per": 0.376472978464039,
"eval_runtime": 17.0859,
"eval_samples_per_second": 31.722,
"eval_steps_per_second": 3.98,
"eval_wer": 0.39211702559934986,
"step": 896
},
{
"epoch": 64.29,
"learning_rate": 2.3145743145743147e-05,
"loss": 0.443,
"step": 900
},
{
"epoch": 65.0,
"eval_cer": 0.1891537761601456,
"eval_loss": 0.5834715366363525,
"eval_per": 0.36895570906135716,
"eval_runtime": 16.6058,
"eval_samples_per_second": 32.639,
"eval_steps_per_second": 4.095,
"eval_wer": 0.3829744006501422,
"step": 910
},
{
"epoch": 66.0,
"eval_cer": 0.1902820746132848,
"eval_loss": 0.5914222598075867,
"eval_per": 0.3722064201544088,
"eval_runtime": 17.2325,
"eval_samples_per_second": 31.452,
"eval_steps_per_second": 3.946,
"eval_wer": 0.38703778951645673,
"step": 924
},
{
"epoch": 67.0,
"eval_cer": 0.1875523202911738,
"eval_loss": 0.582801878452301,
"eval_per": 0.36265745631856966,
"eval_runtime": 16.3441,
"eval_samples_per_second": 33.162,
"eval_steps_per_second": 4.161,
"eval_wer": 0.3778951645672491,
"step": 938
},
{
"epoch": 68.0,
"eval_cer": 0.1857324840764331,
"eval_loss": 0.5744664072990417,
"eval_per": 0.35757822023567654,
"eval_runtime": 17.4764,
"eval_samples_per_second": 31.013,
"eval_steps_per_second": 3.891,
"eval_wer": 0.3722064201544088,
"step": 952
},
{
"epoch": 69.0,
"eval_cer": 0.18817106460418562,
"eval_loss": 0.5785911083221436,
"eval_per": 0.3632669646485169,
"eval_runtime": 16.8602,
"eval_samples_per_second": 32.147,
"eval_steps_per_second": 4.033,
"eval_wer": 0.3795205201137749,
"step": 966
},
{
"epoch": 70.0,
"eval_cer": 0.1884258416742493,
"eval_loss": 0.5868948698043823,
"eval_per": 0.36042259244209673,
"eval_runtime": 16.384,
"eval_samples_per_second": 33.081,
"eval_steps_per_second": 4.15,
"eval_wer": 0.37505079236082894,
"step": 980
},
{
"epoch": 71.0,
"eval_cer": 0.18878980891719746,
"eval_loss": 0.592288076877594,
"eval_per": 0.3596099146688338,
"eval_runtime": 16.4263,
"eval_samples_per_second": 32.996,
"eval_steps_per_second": 4.14,
"eval_wer": 0.37525396180414466,
"step": 994
},
{
"epoch": 71.43,
"learning_rate": 2.1221741221741224e-05,
"loss": 0.3564,
"step": 1000
},
{
"epoch": 72.0,
"eval_cer": 0.18587807097361236,
"eval_loss": 0.5706638097763062,
"eval_per": 0.35778138967899226,
"eval_runtime": 16.3727,
"eval_samples_per_second": 33.104,
"eval_steps_per_second": 4.153,
"eval_wer": 0.37139374238114586,
"step": 1008
},
{
"epoch": 73.0,
"eval_cer": 0.1856960873521383,
"eval_loss": 0.5733203887939453,
"eval_per": 0.35514018691588783,
"eval_runtime": 16.1456,
"eval_samples_per_second": 33.569,
"eval_steps_per_second": 4.212,
"eval_wer": 0.3699715562779358,
"step": 1022
},
{
"epoch": 74.0,
"eval_cer": 0.1854413102820746,
"eval_loss": 0.5731407403945923,
"eval_per": 0.35656237301909793,
"eval_runtime": 16.2817,
"eval_samples_per_second": 33.289,
"eval_steps_per_second": 4.176,
"eval_wer": 0.370581064607883,
"step": 1036
},
{
"epoch": 75.0,
"eval_cer": 0.18467697907188352,
"eval_loss": 0.5643908381462097,
"eval_per": 0.3531084924827306,
"eval_runtime": 16.6661,
"eval_samples_per_second": 32.521,
"eval_steps_per_second": 4.08,
"eval_wer": 0.3669240146281999,
"step": 1050
},
{
"epoch": 76.0,
"eval_cer": 0.18522292993630574,
"eval_loss": 0.5660921335220337,
"eval_per": 0.3555465258025193,
"eval_runtime": 16.5118,
"eval_samples_per_second": 32.825,
"eval_steps_per_second": 4.118,
"eval_wer": 0.37017472572125154,
"step": 1064
},
{
"epoch": 77.0,
"eval_cer": 0.18474977252047317,
"eval_loss": 0.5705360174179077,
"eval_per": 0.3512799674928891,
"eval_runtime": 17.1186,
"eval_samples_per_second": 31.661,
"eval_steps_per_second": 3.972,
"eval_wer": 0.3675335229581471,
"step": 1078
},
{
"epoch": 78.0,
"eval_cer": 0.1835122838944495,
"eval_loss": 0.5630640983581543,
"eval_per": 0.35270215359609913,
"eval_runtime": 17.2728,
"eval_samples_per_second": 31.379,
"eval_steps_per_second": 3.937,
"eval_wer": 0.3671271840715156,
"step": 1092
},
{
"epoch": 78.57,
"learning_rate": 1.92977392977393e-05,
"loss": 0.3456,
"step": 1100
},
{
"epoch": 79.0,
"eval_cer": 0.18311191992720655,
"eval_loss": 0.5674863457679749,
"eval_per": 0.35026412027631043,
"eval_runtime": 16.31,
"eval_samples_per_second": 33.231,
"eval_steps_per_second": 4.169,
"eval_wer": 0.3650954896383584,
"step": 1106
},
{
"epoch": 80.0,
"eval_cer": 0.1846041856232939,
"eval_loss": 0.5696778297424316,
"eval_per": 0.35067045916294187,
"eval_runtime": 16.3755,
"eval_samples_per_second": 33.098,
"eval_steps_per_second": 4.153,
"eval_wer": 0.3644859813084112,
"step": 1120
},
{
"epoch": 81.0,
"eval_cer": 0.18409463148316652,
"eval_loss": 0.5643677711486816,
"eval_per": 0.34924827305973183,
"eval_runtime": 16.3983,
"eval_samples_per_second": 33.052,
"eval_steps_per_second": 4.147,
"eval_wer": 0.36306379520520116,
"step": 1134
},
{
"epoch": 82.0,
"eval_cer": 0.1843494085532302,
"eval_loss": 0.56571364402771,
"eval_per": 0.34802925639983745,
"eval_runtime": 16.5291,
"eval_samples_per_second": 32.791,
"eval_steps_per_second": 4.114,
"eval_wer": 0.36265745631856966,
"step": 1148
},
{
"epoch": 83.0,
"eval_cer": 0.1875523202911738,
"eval_loss": 0.5830783247947693,
"eval_per": 0.3522958147094677,
"eval_runtime": 16.4238,
"eval_samples_per_second": 33.001,
"eval_steps_per_second": 4.14,
"eval_wer": 0.36793986184477856,
"step": 1162
},
{
"epoch": 84.0,
"eval_cer": 0.1861692447679709,
"eval_loss": 0.5823647975921631,
"eval_per": 0.3522958147094677,
"eval_runtime": 17.5122,
"eval_samples_per_second": 30.95,
"eval_steps_per_second": 3.883,
"eval_wer": 0.3659081674116213,
"step": 1176
},
{
"epoch": 85.0,
"eval_cer": 0.18333030027297542,
"eval_loss": 0.5567490458488464,
"eval_per": 0.3508736286062576,
"eval_runtime": 16.4517,
"eval_samples_per_second": 32.945,
"eval_steps_per_second": 4.133,
"eval_wer": 0.36529865908167414,
"step": 1190
},
{
"epoch": 85.71,
"learning_rate": 1.7373737373737375e-05,
"loss": 0.3073,
"step": 1200
},
{
"epoch": 86.0,
"eval_cer": 0.1851501364877161,
"eval_loss": 0.5755050778388977,
"eval_per": 0.35067045916294187,
"eval_runtime": 17.6602,
"eval_samples_per_second": 30.691,
"eval_steps_per_second": 3.85,
"eval_wer": 0.36489232019504264,
"step": 1204
},
{
"epoch": 87.0,
"eval_cer": 0.18289353958143767,
"eval_loss": 0.5590367913246155,
"eval_per": 0.3449817147501016,
"eval_runtime": 16.7556,
"eval_samples_per_second": 32.347,
"eval_steps_per_second": 4.058,
"eval_wer": 0.3585940674522552,
"step": 1218
},
{
"epoch": 88.0,
"eval_cer": 0.18347588717015467,
"eval_loss": 0.5662943720817566,
"eval_per": 0.34802925639983745,
"eval_runtime": 16.6011,
"eval_samples_per_second": 32.649,
"eval_steps_per_second": 4.096,
"eval_wer": 0.3610321007720439,
"step": 1232
},
{
"epoch": 89.0,
"eval_cer": 0.18507734303912649,
"eval_loss": 0.5733785629272461,
"eval_per": 0.3468102397399431,
"eval_runtime": 16.1986,
"eval_samples_per_second": 33.46,
"eval_steps_per_second": 4.198,
"eval_wer": 0.3618447785453068,
"step": 1246
},
{
"epoch": 90.0,
"eval_cer": 0.18303912647861692,
"eval_loss": 0.5656831860542297,
"eval_per": 0.34579439252336447,
"eval_runtime": 16.3772,
"eval_samples_per_second": 33.095,
"eval_steps_per_second": 4.152,
"eval_wer": 0.36021942299878096,
"step": 1260
},
{
"epoch": 91.0,
"eval_cer": 0.18278434940855323,
"eval_loss": 0.5650802850723267,
"eval_per": 0.3441690369768387,
"eval_runtime": 17.4779,
"eval_samples_per_second": 31.011,
"eval_steps_per_second": 3.891,
"eval_wer": 0.35778138967899226,
"step": 1274
},
{
"epoch": 92.0,
"eval_cer": 0.18202001819836214,
"eval_loss": 0.5608470439910889,
"eval_per": 0.3415278342137342,
"eval_runtime": 16.5014,
"eval_samples_per_second": 32.846,
"eval_steps_per_second": 4.121,
"eval_wer": 0.35574969524583505,
"step": 1288
},
{
"epoch": 92.86,
"learning_rate": 1.544973544973545e-05,
"loss": 0.2836,
"step": 1300
},
{
"epoch": 93.0,
"eval_cer": 0.18067333939945404,
"eval_loss": 0.5504541993141174,
"eval_per": 0.3388866314506298,
"eval_runtime": 16.701,
"eval_samples_per_second": 32.453,
"eval_steps_per_second": 4.072,
"eval_wer": 0.3524989841527834,
"step": 1302
},
{
"epoch": 94.0,
"eval_cer": 0.17979981801637854,
"eval_loss": 0.5494620203971863,
"eval_per": 0.33746444534741976,
"eval_runtime": 17.2521,
"eval_samples_per_second": 31.416,
"eval_steps_per_second": 3.942,
"eval_wer": 0.3500609508329947,
"step": 1316
},
{
"epoch": 95.0,
"eval_cer": 0.1816196542311192,
"eval_loss": 0.5693331360816956,
"eval_per": 0.34315318976026005,
"eval_runtime": 16.3033,
"eval_samples_per_second": 33.245,
"eval_steps_per_second": 4.171,
"eval_wer": 0.35574969524583505,
"step": 1330
},
{
"epoch": 96.0,
"eval_cer": 0.1822020018198362,
"eval_loss": 0.5638025999069214,
"eval_per": 0.34173100365705,
"eval_runtime": 16.8945,
"eval_samples_per_second": 32.081,
"eval_steps_per_second": 4.025,
"eval_wer": 0.3563592035757822,
"step": 1344
},
{
"epoch": 97.0,
"eval_cer": 0.17969062784349407,
"eval_loss": 0.5485906004905701,
"eval_per": 0.3386834620073141,
"eval_runtime": 16.6823,
"eval_samples_per_second": 32.489,
"eval_steps_per_second": 4.076,
"eval_wer": 0.35107679804957337,
"step": 1358
},
{
"epoch": 98.0,
"eval_cer": 0.18096451319381257,
"eval_loss": 0.5618489980697632,
"eval_per": 0.3415278342137342,
"eval_runtime": 16.6547,
"eval_samples_per_second": 32.543,
"eval_steps_per_second": 4.083,
"eval_wer": 0.3545306785859407,
"step": 1372
},
{
"epoch": 99.0,
"eval_cer": 0.1799818016378526,
"eval_loss": 0.5637105703353882,
"eval_per": 0.33990247866720846,
"eval_runtime": 16.8199,
"eval_samples_per_second": 32.224,
"eval_steps_per_second": 4.043,
"eval_wer": 0.3514831369362048,
"step": 1386
},
{
"epoch": 100.0,
"learning_rate": 1.3525733525733527e-05,
"loss": 0.2502,
"step": 1400
},
{
"epoch": 100.0,
"eval_cer": 0.1810373066424022,
"eval_loss": 0.5658114552497864,
"eval_per": 0.3437626980902072,
"eval_runtime": 16.859,
"eval_samples_per_second": 32.149,
"eval_steps_per_second": 4.033,
"eval_wer": 0.3555465258025193,
"step": 1400
},
{
"epoch": 101.0,
"eval_cer": 0.17954504094631482,
"eval_loss": 0.552661657333374,
"eval_per": 0.3411214953271028,
"eval_runtime": 17.0552,
"eval_samples_per_second": 31.779,
"eval_steps_per_second": 3.987,
"eval_wer": 0.3524989841527834,
"step": 1414
},
{
"epoch": 102.0,
"eval_cer": 0.18067333939945404,
"eval_loss": 0.5701059699058533,
"eval_per": 0.343965867533523,
"eval_runtime": 17.649,
"eval_samples_per_second": 30.71,
"eval_steps_per_second": 3.853,
"eval_wer": 0.3561560341324665,
"step": 1428
},
{
"epoch": 103.0,
"eval_cer": 0.17936305732484076,
"eval_loss": 0.554296612739563,
"eval_per": 0.3388866314506298,
"eval_runtime": 16.2178,
"eval_samples_per_second": 33.42,
"eval_steps_per_second": 4.193,
"eval_wer": 0.34965461194636327,
"step": 1442
},
{
"epoch": 104.0,
"eval_cer": 0.18034576888080073,
"eval_loss": 0.5659683346748352,
"eval_per": 0.33990247866720846,
"eval_runtime": 16.8247,
"eval_samples_per_second": 32.214,
"eval_steps_per_second": 4.042,
"eval_wer": 0.3508736286062576,
"step": 1456
},
{
"epoch": 105.0,
"eval_cer": 0.17950864422202,
"eval_loss": 0.5542871952056885,
"eval_per": 0.33990247866720846,
"eval_runtime": 16.8641,
"eval_samples_per_second": 32.139,
"eval_steps_per_second": 4.032,
"eval_wer": 0.3500609508329947,
"step": 1470
},
{
"epoch": 106.0,
"eval_cer": 0.181656050955414,
"eval_loss": 0.5742031931877136,
"eval_per": 0.34315318976026005,
"eval_runtime": 16.2772,
"eval_samples_per_second": 33.298,
"eval_steps_per_second": 4.178,
"eval_wer": 0.3547338480292564,
"step": 1484
},
{
"epoch": 107.0,
"eval_cer": 0.178926296633303,
"eval_loss": 0.5526788830757141,
"eval_per": 0.33502641202763106,
"eval_runtime": 16.3123,
"eval_samples_per_second": 33.227,
"eval_steps_per_second": 4.169,
"eval_wer": 0.34538805363673303,
"step": 1498
},
{
"epoch": 107.14,
"learning_rate": 1.1601731601731604e-05,
"loss": 0.2368,
"step": 1500
},
{
"epoch": 108.0,
"eval_cer": 0.178926296633303,
"eval_loss": 0.5576502084732056,
"eval_per": 0.3378707842340512,
"eval_runtime": 16.2769,
"eval_samples_per_second": 33.299,
"eval_steps_per_second": 4.178,
"eval_wer": 0.34965461194636327,
"step": 1512
},
{
"epoch": 109.0,
"eval_cer": 0.1788898999090082,
"eval_loss": 0.5539444088935852,
"eval_per": 0.3356359203575782,
"eval_runtime": 17.6723,
"eval_samples_per_second": 30.669,
"eval_steps_per_second": 3.848,
"eval_wer": 0.3451848841934173,
"step": 1526
},
{
"epoch": 110.0,
"eval_cer": 0.18020018198362148,
"eval_loss": 0.5699580311775208,
"eval_per": 0.34173100365705,
"eval_runtime": 16.5072,
"eval_samples_per_second": 32.834,
"eval_steps_per_second": 4.119,
"eval_wer": 0.35168630637952053,
"step": 1540
},
{
"epoch": 111.0,
"eval_cer": 0.17939945404913557,
"eval_loss": 0.5626676678657532,
"eval_per": 0.33969930922389274,
"eval_runtime": 16.5149,
"eval_samples_per_second": 32.819,
"eval_steps_per_second": 4.117,
"eval_wer": 0.3500609508329947,
"step": 1554
},
{
"epoch": 112.0,
"eval_cer": 0.17965423111919926,
"eval_loss": 0.5622020363807678,
"eval_per": 0.3405119869971556,
"eval_runtime": 18.514,
"eval_samples_per_second": 29.275,
"eval_steps_per_second": 3.673,
"eval_wer": 0.34965461194636327,
"step": 1568
},
{
"epoch": 113.0,
"eval_cer": 0.18005459508644223,
"eval_loss": 0.570824146270752,
"eval_per": 0.3403088175538399,
"eval_runtime": 16.7958,
"eval_samples_per_second": 32.27,
"eval_steps_per_second": 4.049,
"eval_wer": 0.34945144250304755,
"step": 1582
},
{
"epoch": 114.0,
"eval_cer": 0.18045495905368517,
"eval_loss": 0.5732950568199158,
"eval_per": 0.3401056481105242,
"eval_runtime": 17.5602,
"eval_samples_per_second": 30.865,
"eval_steps_per_second": 3.872,
"eval_wer": 0.35107679804957337,
"step": 1596
},
{
"epoch": 114.29,
"learning_rate": 9.677729677729679e-06,
"loss": 0.2288,
"step": 1600
},
{
"epoch": 115.0,
"eval_cer": 0.17950864422202,
"eval_loss": 0.5614627599716187,
"eval_per": 0.3386834620073141,
"eval_runtime": 18.0091,
"eval_samples_per_second": 30.096,
"eval_steps_per_second": 3.776,
"eval_wer": 0.34863876472978467,
"step": 1610
},
{
"epoch": 116.0,
"eval_cer": 0.1808553230209281,
"eval_loss": 0.5741183757781982,
"eval_per": 0.33969930922389274,
"eval_runtime": 16.588,
"eval_samples_per_second": 32.674,
"eval_steps_per_second": 4.099,
"eval_wer": 0.34965461194636327,
"step": 1624
},
{
"epoch": 117.0,
"eval_cer": 0.17958143767060963,
"eval_loss": 0.5609710812568665,
"eval_per": 0.33726127590410404,
"eval_runtime": 16.4333,
"eval_samples_per_second": 32.982,
"eval_steps_per_second": 4.138,
"eval_wer": 0.3459975619666802,
"step": 1638
},
{
"epoch": 117.0,
"step": 1638,
"total_flos": 1.462030946643386e+19,
"train_loss": 1.771814914558979,
"train_runtime": 12938.9921,
"train_samples_per_second": 5.194,
"train_steps_per_second": 0.162
}
],
"max_steps": 2100,
"num_train_epochs": 150,
"total_flos": 1.462030946643386e+19,
"trial_name": null,
"trial_params": null
}