wav2vec2-large-xlsr-coraa-exp-13 / trainer_state.json
alinerodrigues's picture
End of training
2af4b25
{
"best_metric": 0.556138277053833,
"best_model_checkpoint": "wav2vec2-large-xlsr-coraa-exp-13/checkpoint-1736",
"epoch": 144.0,
"global_step": 2016,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.07,
"learning_rate": 3e-05,
"loss": 38.268,
"step": 1
},
{
"epoch": 1.0,
"eval_cer": 0.9430027297543221,
"eval_loss": 32.05844497680664,
"eval_runtime": 53.1315,
"eval_samples_per_second": 10.201,
"eval_steps_per_second": 1.28,
"eval_wer": 1.0,
"step": 14
},
{
"epoch": 2.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 10.376302719116211,
"eval_runtime": 52.6044,
"eval_samples_per_second": 10.303,
"eval_steps_per_second": 1.293,
"eval_wer": 1.0,
"step": 28
},
{
"epoch": 3.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 4.8976359367370605,
"eval_runtime": 52.7604,
"eval_samples_per_second": 10.273,
"eval_steps_per_second": 1.289,
"eval_wer": 1.0,
"step": 42
},
{
"epoch": 4.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 4.040638446807861,
"eval_runtime": 53.2305,
"eval_samples_per_second": 10.182,
"eval_steps_per_second": 1.277,
"eval_wer": 1.0,
"step": 56
},
{
"epoch": 5.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 3.7469818592071533,
"eval_runtime": 52.5947,
"eval_samples_per_second": 10.305,
"eval_steps_per_second": 1.293,
"eval_wer": 1.0,
"step": 70
},
{
"epoch": 6.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 3.5903122425079346,
"eval_runtime": 52.8025,
"eval_samples_per_second": 10.265,
"eval_steps_per_second": 1.288,
"eval_wer": 1.0,
"step": 84
},
{
"epoch": 7.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 3.474977493286133,
"eval_runtime": 52.6757,
"eval_samples_per_second": 10.289,
"eval_steps_per_second": 1.291,
"eval_wer": 1.0,
"step": 98
},
{
"epoch": 7.14,
"learning_rate": 2.862857142857143e-05,
"loss": 10.1654,
"step": 100
},
{
"epoch": 8.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 3.3405568599700928,
"eval_runtime": 52.6172,
"eval_samples_per_second": 10.301,
"eval_steps_per_second": 1.292,
"eval_wer": 1.0,
"step": 112
},
{
"epoch": 9.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 3.226734161376953,
"eval_runtime": 52.664,
"eval_samples_per_second": 10.292,
"eval_steps_per_second": 1.291,
"eval_wer": 1.0,
"step": 126
},
{
"epoch": 10.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 3.1887271404266357,
"eval_runtime": 52.6591,
"eval_samples_per_second": 10.293,
"eval_steps_per_second": 1.291,
"eval_wer": 1.0,
"step": 140
},
{
"epoch": 11.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 3.130089521408081,
"eval_runtime": 53.0211,
"eval_samples_per_second": 10.222,
"eval_steps_per_second": 1.283,
"eval_wer": 1.0,
"step": 154
},
{
"epoch": 12.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 3.1045610904693604,
"eval_runtime": 52.5606,
"eval_samples_per_second": 10.312,
"eval_steps_per_second": 1.294,
"eval_wer": 1.0,
"step": 168
},
{
"epoch": 13.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 3.090874433517456,
"eval_runtime": 52.5759,
"eval_samples_per_second": 10.309,
"eval_steps_per_second": 1.293,
"eval_wer": 1.0,
"step": 182
},
{
"epoch": 14.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 3.0602762699127197,
"eval_runtime": 52.7319,
"eval_samples_per_second": 10.278,
"eval_steps_per_second": 1.29,
"eval_wer": 1.0,
"step": 196
},
{
"epoch": 14.29,
"learning_rate": 2.72e-05,
"loss": 3.0823,
"step": 200
},
{
"epoch": 15.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 3.0584146976470947,
"eval_runtime": 52.6179,
"eval_samples_per_second": 10.301,
"eval_steps_per_second": 1.292,
"eval_wer": 1.0,
"step": 210
},
{
"epoch": 16.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 3.0485479831695557,
"eval_runtime": 52.7143,
"eval_samples_per_second": 10.282,
"eval_steps_per_second": 1.29,
"eval_wer": 1.0,
"step": 224
},
{
"epoch": 17.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 3.046433925628662,
"eval_runtime": 52.6205,
"eval_samples_per_second": 10.3,
"eval_steps_per_second": 1.292,
"eval_wer": 1.0,
"step": 238
},
{
"epoch": 18.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 3.024200916290283,
"eval_runtime": 52.7522,
"eval_samples_per_second": 10.274,
"eval_steps_per_second": 1.289,
"eval_wer": 1.0,
"step": 252
},
{
"epoch": 19.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 3.0237276554107666,
"eval_runtime": 52.648,
"eval_samples_per_second": 10.295,
"eval_steps_per_second": 1.292,
"eval_wer": 1.0,
"step": 266
},
{
"epoch": 20.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 3.0304243564605713,
"eval_runtime": 52.7771,
"eval_samples_per_second": 10.27,
"eval_steps_per_second": 1.288,
"eval_wer": 1.0,
"step": 280
},
{
"epoch": 21.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 3.0118603706359863,
"eval_runtime": 52.6742,
"eval_samples_per_second": 10.29,
"eval_steps_per_second": 1.291,
"eval_wer": 1.0,
"step": 294
},
{
"epoch": 21.43,
"learning_rate": 2.5771428571428574e-05,
"loss": 2.9562,
"step": 300
},
{
"epoch": 22.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 3.014829158782959,
"eval_runtime": 52.6427,
"eval_samples_per_second": 10.296,
"eval_steps_per_second": 1.292,
"eval_wer": 1.0,
"step": 308
},
{
"epoch": 23.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 3.0060625076293945,
"eval_runtime": 52.7555,
"eval_samples_per_second": 10.274,
"eval_steps_per_second": 1.289,
"eval_wer": 1.0,
"step": 322
},
{
"epoch": 24.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 3.0041589736938477,
"eval_runtime": 52.7518,
"eval_samples_per_second": 10.275,
"eval_steps_per_second": 1.289,
"eval_wer": 1.0,
"step": 336
},
{
"epoch": 25.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 3.003258228302002,
"eval_runtime": 52.9828,
"eval_samples_per_second": 10.23,
"eval_steps_per_second": 1.283,
"eval_wer": 1.0,
"step": 350
},
{
"epoch": 26.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 3.0028507709503174,
"eval_runtime": 52.639,
"eval_samples_per_second": 10.297,
"eval_steps_per_second": 1.292,
"eval_wer": 1.0,
"step": 364
},
{
"epoch": 27.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 3.008204460144043,
"eval_runtime": 52.7037,
"eval_samples_per_second": 10.284,
"eval_steps_per_second": 1.29,
"eval_wer": 1.0,
"step": 378
},
{
"epoch": 28.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 2.9955995082855225,
"eval_runtime": 52.6334,
"eval_samples_per_second": 10.298,
"eval_steps_per_second": 1.292,
"eval_wer": 1.0,
"step": 392
},
{
"epoch": 28.57,
"learning_rate": 2.434285714285714e-05,
"loss": 2.9262,
"step": 400
},
{
"epoch": 29.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 2.994765043258667,
"eval_runtime": 52.6138,
"eval_samples_per_second": 10.301,
"eval_steps_per_second": 1.292,
"eval_wer": 1.0,
"step": 406
},
{
"epoch": 30.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 2.998243808746338,
"eval_runtime": 52.831,
"eval_samples_per_second": 10.259,
"eval_steps_per_second": 1.287,
"eval_wer": 1.0,
"step": 420
},
{
"epoch": 31.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 2.996180295944214,
"eval_runtime": 52.6837,
"eval_samples_per_second": 10.288,
"eval_steps_per_second": 1.291,
"eval_wer": 1.0,
"step": 434
},
{
"epoch": 32.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 2.9930543899536133,
"eval_runtime": 53.1611,
"eval_samples_per_second": 10.195,
"eval_steps_per_second": 1.279,
"eval_wer": 1.0,
"step": 448
},
{
"epoch": 33.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 2.9809184074401855,
"eval_runtime": 52.778,
"eval_samples_per_second": 10.269,
"eval_steps_per_second": 1.288,
"eval_wer": 1.0,
"step": 462
},
{
"epoch": 34.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 2.980422019958496,
"eval_runtime": 52.6744,
"eval_samples_per_second": 10.29,
"eval_steps_per_second": 1.291,
"eval_wer": 1.0,
"step": 476
},
{
"epoch": 35.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 2.9742188453674316,
"eval_runtime": 52.6886,
"eval_samples_per_second": 10.287,
"eval_steps_per_second": 1.291,
"eval_wer": 1.0,
"step": 490
},
{
"epoch": 35.71,
"learning_rate": 2.2914285714285714e-05,
"loss": 2.9125,
"step": 500
},
{
"epoch": 36.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 2.95219349861145,
"eval_runtime": 52.7664,
"eval_samples_per_second": 10.272,
"eval_steps_per_second": 1.289,
"eval_wer": 1.0,
"step": 504
},
{
"epoch": 37.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 2.9014649391174316,
"eval_runtime": 52.6811,
"eval_samples_per_second": 10.288,
"eval_steps_per_second": 1.291,
"eval_wer": 1.0,
"step": 518
},
{
"epoch": 38.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 2.852219581604004,
"eval_runtime": 52.7271,
"eval_samples_per_second": 10.279,
"eval_steps_per_second": 1.29,
"eval_wer": 1.0,
"step": 532
},
{
"epoch": 39.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 2.828482151031494,
"eval_runtime": 52.6182,
"eval_samples_per_second": 10.301,
"eval_steps_per_second": 1.292,
"eval_wer": 1.0,
"step": 546
},
{
"epoch": 40.0,
"eval_cer": 0.9614558689717926,
"eval_loss": 2.729363441467285,
"eval_runtime": 52.6938,
"eval_samples_per_second": 10.286,
"eval_steps_per_second": 1.29,
"eval_wer": 1.0,
"step": 560
},
{
"epoch": 41.0,
"eval_cer": 0.9605095541401274,
"eval_loss": 2.6491127014160156,
"eval_runtime": 53.1167,
"eval_samples_per_second": 10.204,
"eval_steps_per_second": 1.28,
"eval_wer": 1.0,
"step": 574
},
{
"epoch": 42.0,
"eval_cer": 0.8949590536851684,
"eval_loss": 2.4882705211639404,
"eval_runtime": 52.7981,
"eval_samples_per_second": 10.266,
"eval_steps_per_second": 1.288,
"eval_wer": 1.0,
"step": 588
},
{
"epoch": 42.86,
"learning_rate": 2.1485714285714284e-05,
"loss": 2.7205,
"step": 600
},
{
"epoch": 43.0,
"eval_cer": 0.836505914467698,
"eval_loss": 2.3630661964416504,
"eval_runtime": 52.7032,
"eval_samples_per_second": 10.284,
"eval_steps_per_second": 1.29,
"eval_wer": 1.0,
"step": 602
},
{
"epoch": 44.0,
"eval_cer": 0.607424931756142,
"eval_loss": 2.054628610610962,
"eval_runtime": 52.7506,
"eval_samples_per_second": 10.275,
"eval_steps_per_second": 1.289,
"eval_wer": 1.0,
"step": 616
},
{
"epoch": 45.0,
"eval_cer": 0.5147952684258417,
"eval_loss": 1.7867237329483032,
"eval_runtime": 53.2436,
"eval_samples_per_second": 10.18,
"eval_steps_per_second": 1.277,
"eval_wer": 1.0,
"step": 630
},
{
"epoch": 46.0,
"eval_cer": 0.4532120109190173,
"eval_loss": 1.5452687740325928,
"eval_runtime": 52.8784,
"eval_samples_per_second": 10.25,
"eval_steps_per_second": 1.286,
"eval_wer": 1.0,
"step": 644
},
{
"epoch": 47.0,
"eval_cer": 0.40640582347588716,
"eval_loss": 1.3553940057754517,
"eval_runtime": 52.7768,
"eval_samples_per_second": 10.27,
"eval_steps_per_second": 1.288,
"eval_wer": 0.9989841527834213,
"step": 658
},
{
"epoch": 48.0,
"eval_cer": 0.3669881710646042,
"eval_loss": 1.201612114906311,
"eval_runtime": 52.8752,
"eval_samples_per_second": 10.251,
"eval_steps_per_second": 1.286,
"eval_wer": 0.982933766761479,
"step": 672
},
{
"epoch": 49.0,
"eval_cer": 0.3167242948134668,
"eval_loss": 1.0777251720428467,
"eval_runtime": 52.8059,
"eval_samples_per_second": 10.264,
"eval_steps_per_second": 1.288,
"eval_wer": 0.8805363673303536,
"step": 686
},
{
"epoch": 50.0,
"learning_rate": 2.0057142857142858e-05,
"loss": 1.6469,
"step": 700
},
{
"epoch": 50.0,
"eval_cer": 0.2594358507734304,
"eval_loss": 0.978954017162323,
"eval_runtime": 52.919,
"eval_samples_per_second": 10.242,
"eval_steps_per_second": 1.285,
"eval_wer": 0.7029662738724096,
"step": 700
},
{
"epoch": 51.0,
"eval_cer": 0.22238398544131027,
"eval_loss": 0.8961830735206604,
"eval_runtime": 52.8398,
"eval_samples_per_second": 10.257,
"eval_steps_per_second": 1.287,
"eval_wer": 0.5270215359609914,
"step": 714
},
{
"epoch": 52.0,
"eval_cer": 0.21757961783439492,
"eval_loss": 0.8428747653961182,
"eval_runtime": 52.8781,
"eval_samples_per_second": 10.25,
"eval_steps_per_second": 1.286,
"eval_wer": 0.4973587972368956,
"step": 728
},
{
"epoch": 53.0,
"eval_cer": 0.2089171974522293,
"eval_loss": 0.8158747553825378,
"eval_runtime": 53.3812,
"eval_samples_per_second": 10.153,
"eval_steps_per_second": 1.274,
"eval_wer": 0.4658675335229581,
"step": 742
},
{
"epoch": 54.0,
"eval_cer": 0.20658780709736124,
"eval_loss": 0.7980368137359619,
"eval_runtime": 52.8695,
"eval_samples_per_second": 10.252,
"eval_steps_per_second": 1.286,
"eval_wer": 0.4512393336042259,
"step": 756
},
{
"epoch": 55.0,
"eval_cer": 0.20440400363967243,
"eval_loss": 0.7540920376777649,
"eval_runtime": 52.8272,
"eval_samples_per_second": 10.26,
"eval_steps_per_second": 1.287,
"eval_wer": 0.4441284030881755,
"step": 770
},
{
"epoch": 56.0,
"eval_cer": 0.20152866242038217,
"eval_loss": 0.7299144864082336,
"eval_runtime": 52.846,
"eval_samples_per_second": 10.256,
"eval_steps_per_second": 1.287,
"eval_wer": 0.42726533929297034,
"step": 784
},
{
"epoch": 57.0,
"eval_cer": 0.1964331210191083,
"eval_loss": 0.7077798843383789,
"eval_runtime": 52.7856,
"eval_samples_per_second": 10.268,
"eval_steps_per_second": 1.288,
"eval_wer": 0.40918325883787077,
"step": 798
},
{
"epoch": 57.14,
"learning_rate": 1.8628571428571428e-05,
"loss": 0.7997,
"step": 800
},
{
"epoch": 58.0,
"eval_cer": 0.1973430391264786,
"eval_loss": 0.7078654170036316,
"eval_runtime": 52.7848,
"eval_samples_per_second": 10.268,
"eval_steps_per_second": 1.288,
"eval_wer": 0.4110117838277123,
"step": 812
},
{
"epoch": 59.0,
"eval_cer": 0.19832575068243857,
"eval_loss": 0.6861252784729004,
"eval_runtime": 52.8203,
"eval_samples_per_second": 10.261,
"eval_steps_per_second": 1.287,
"eval_wer": 0.41365298659081673,
"step": 826
},
{
"epoch": 60.0,
"eval_cer": 0.1975250227479527,
"eval_loss": 0.7035004496574402,
"eval_runtime": 53.0259,
"eval_samples_per_second": 10.221,
"eval_steps_per_second": 1.282,
"eval_wer": 0.4010564811052418,
"step": 840
},
{
"epoch": 61.0,
"eval_cer": 0.19417652411282985,
"eval_loss": 0.6675873398780823,
"eval_runtime": 52.839,
"eval_samples_per_second": 10.258,
"eval_steps_per_second": 1.287,
"eval_wer": 0.4000406338886631,
"step": 854
},
{
"epoch": 62.0,
"eval_cer": 0.19366696997270247,
"eval_loss": 0.6562079787254333,
"eval_runtime": 52.8072,
"eval_samples_per_second": 10.264,
"eval_steps_per_second": 1.288,
"eval_wer": 0.3980089394555059,
"step": 868
},
{
"epoch": 63.0,
"eval_cer": 0.1910828025477707,
"eval_loss": 0.6579793691635132,
"eval_runtime": 52.8351,
"eval_samples_per_second": 10.258,
"eval_steps_per_second": 1.287,
"eval_wer": 0.38500609508329947,
"step": 882
},
{
"epoch": 64.0,
"eval_cer": 0.19253867151956325,
"eval_loss": 0.6642553806304932,
"eval_runtime": 52.8162,
"eval_samples_per_second": 10.262,
"eval_steps_per_second": 1.287,
"eval_wer": 0.39110117838277125,
"step": 896
},
{
"epoch": 64.29,
"learning_rate": 1.72e-05,
"loss": 0.5379,
"step": 900
},
{
"epoch": 65.0,
"eval_cer": 0.19282984531392175,
"eval_loss": 0.6532391309738159,
"eval_runtime": 52.87,
"eval_samples_per_second": 10.252,
"eval_steps_per_second": 1.286,
"eval_wer": 0.39292970337261274,
"step": 910
},
{
"epoch": 66.0,
"eval_cer": 0.19064604185623293,
"eval_loss": 0.6483404040336609,
"eval_runtime": 52.7892,
"eval_samples_per_second": 10.267,
"eval_steps_per_second": 1.288,
"eval_wer": 0.3866314506298253,
"step": 924
},
{
"epoch": 67.0,
"eval_cer": 0.18696997270245677,
"eval_loss": 0.6266820430755615,
"eval_runtime": 53.3837,
"eval_samples_per_second": 10.153,
"eval_steps_per_second": 1.274,
"eval_wer": 0.3756603006907761,
"step": 938
},
{
"epoch": 68.0,
"eval_cer": 0.18798908098271155,
"eval_loss": 0.6296297907829285,
"eval_runtime": 52.8207,
"eval_samples_per_second": 10.261,
"eval_steps_per_second": 1.287,
"eval_wer": 0.3793173506704592,
"step": 952
},
{
"epoch": 69.0,
"eval_cer": 0.19020928116469518,
"eval_loss": 0.6414676904678345,
"eval_runtime": 52.8153,
"eval_samples_per_second": 10.262,
"eval_steps_per_second": 1.288,
"eval_wer": 0.37850467289719625,
"step": 966
},
{
"epoch": 70.0,
"eval_cer": 0.18846223839854412,
"eval_loss": 0.6227236986160278,
"eval_runtime": 52.8625,
"eval_samples_per_second": 10.253,
"eval_steps_per_second": 1.286,
"eval_wer": 0.3746444534741975,
"step": 980
},
{
"epoch": 71.0,
"eval_cer": 0.1878434940855323,
"eval_loss": 0.6213016510009766,
"eval_runtime": 52.7591,
"eval_samples_per_second": 10.273,
"eval_steps_per_second": 1.289,
"eval_wer": 0.37383177570093457,
"step": 994
},
{
"epoch": 71.43,
"learning_rate": 1.577142857142857e-05,
"loss": 0.4372,
"step": 1000
},
{
"epoch": 72.0,
"eval_cer": 0.18718835304822565,
"eval_loss": 0.6110479831695557,
"eval_runtime": 52.7876,
"eval_samples_per_second": 10.268,
"eval_steps_per_second": 1.288,
"eval_wer": 0.37261275904104024,
"step": 1008
},
{
"epoch": 73.0,
"eval_cer": 0.1861692447679709,
"eval_loss": 0.6018897294998169,
"eval_runtime": 52.8613,
"eval_samples_per_second": 10.253,
"eval_steps_per_second": 1.286,
"eval_wer": 0.3695652173913043,
"step": 1022
},
{
"epoch": 74.0,
"eval_cer": 0.18671519563239308,
"eval_loss": 0.6036959290504456,
"eval_runtime": 53.2023,
"eval_samples_per_second": 10.188,
"eval_steps_per_second": 1.278,
"eval_wer": 0.3722064201544088,
"step": 1036
},
{
"epoch": 75.0,
"eval_cer": 0.188098271155596,
"eval_loss": 0.5993600487709045,
"eval_runtime": 52.8215,
"eval_samples_per_second": 10.261,
"eval_steps_per_second": 1.287,
"eval_wer": 0.3657049979683056,
"step": 1050
},
{
"epoch": 76.0,
"eval_cer": 0.18806187443130118,
"eval_loss": 0.6083250641822815,
"eval_runtime": 52.971,
"eval_samples_per_second": 10.232,
"eval_steps_per_second": 1.284,
"eval_wer": 0.37037789516456726,
"step": 1064
},
{
"epoch": 77.0,
"eval_cer": 0.1864968152866242,
"eval_loss": 0.5837586522102356,
"eval_runtime": 53.4695,
"eval_samples_per_second": 10.137,
"eval_steps_per_second": 1.272,
"eval_wer": 0.3695652173913043,
"step": 1078
},
{
"epoch": 78.0,
"eval_cer": 0.18547770700636942,
"eval_loss": 0.5794845819473267,
"eval_runtime": 52.8335,
"eval_samples_per_second": 10.259,
"eval_steps_per_second": 1.287,
"eval_wer": 0.3718000812677773,
"step": 1092
},
{
"epoch": 78.57,
"learning_rate": 1.4342857142857143e-05,
"loss": 0.3912,
"step": 1100
},
{
"epoch": 79.0,
"eval_cer": 0.18773430391264787,
"eval_loss": 0.6201197504997253,
"eval_runtime": 52.909,
"eval_samples_per_second": 10.244,
"eval_steps_per_second": 1.285,
"eval_wer": 0.37139374238114586,
"step": 1106
},
{
"epoch": 80.0,
"eval_cer": 0.1854413102820746,
"eval_loss": 0.5914958715438843,
"eval_runtime": 52.8551,
"eval_samples_per_second": 10.254,
"eval_steps_per_second": 1.287,
"eval_wer": 0.366111336854937,
"step": 1120
},
{
"epoch": 81.0,
"eval_cer": 0.18427661510464058,
"eval_loss": 0.5893952250480652,
"eval_runtime": 52.9037,
"eval_samples_per_second": 10.245,
"eval_steps_per_second": 1.285,
"eval_wer": 0.3650954896383584,
"step": 1134
},
{
"epoch": 82.0,
"eval_cer": 0.18591446769790718,
"eval_loss": 0.5993715524673462,
"eval_runtime": 52.7967,
"eval_samples_per_second": 10.266,
"eval_steps_per_second": 1.288,
"eval_wer": 0.3681430312880943,
"step": 1148
},
{
"epoch": 83.0,
"eval_cer": 0.18642402183803458,
"eval_loss": 0.6001280546188354,
"eval_runtime": 52.869,
"eval_samples_per_second": 10.252,
"eval_steps_per_second": 1.286,
"eval_wer": 0.36550182852498986,
"step": 1162
},
{
"epoch": 84.0,
"eval_cer": 0.1864968152866242,
"eval_loss": 0.6007617115974426,
"eval_runtime": 52.8415,
"eval_samples_per_second": 10.257,
"eval_steps_per_second": 1.287,
"eval_wer": 0.36529865908167414,
"step": 1176
},
{
"epoch": 85.0,
"eval_cer": 0.18322111010009098,
"eval_loss": 0.5769873857498169,
"eval_runtime": 52.8264,
"eval_samples_per_second": 10.26,
"eval_steps_per_second": 1.287,
"eval_wer": 0.36021942299878096,
"step": 1190
},
{
"epoch": 85.71,
"learning_rate": 1.2914285714285713e-05,
"loss": 0.3485,
"step": 1200
},
{
"epoch": 86.0,
"eval_cer": 0.18358507734303914,
"eval_loss": 0.5905404686927795,
"eval_runtime": 52.731,
"eval_samples_per_second": 10.279,
"eval_steps_per_second": 1.29,
"eval_wer": 0.35656237301909793,
"step": 1204
},
{
"epoch": 87.0,
"eval_cer": 0.18278434940855323,
"eval_loss": 0.5810394287109375,
"eval_runtime": 52.802,
"eval_samples_per_second": 10.265,
"eval_steps_per_second": 1.288,
"eval_wer": 0.35798455912230803,
"step": 1218
},
{
"epoch": 88.0,
"eval_cer": 0.1829663330300273,
"eval_loss": 0.5765053033828735,
"eval_runtime": 53.0488,
"eval_samples_per_second": 10.217,
"eval_steps_per_second": 1.282,
"eval_wer": 0.3583908980089395,
"step": 1232
},
{
"epoch": 89.0,
"eval_cer": 0.18453139217470427,
"eval_loss": 0.5901545286178589,
"eval_runtime": 52.796,
"eval_samples_per_second": 10.266,
"eval_steps_per_second": 1.288,
"eval_wer": 0.36407964242177976,
"step": 1246
},
{
"epoch": 90.0,
"eval_cer": 0.18307552320291173,
"eval_loss": 0.581239640712738,
"eval_runtime": 52.8224,
"eval_samples_per_second": 10.261,
"eval_steps_per_second": 1.287,
"eval_wer": 0.36143843965867534,
"step": 1260
},
{
"epoch": 91.0,
"eval_cer": 0.18438580527752502,
"eval_loss": 0.5965577960014343,
"eval_runtime": 52.9107,
"eval_samples_per_second": 10.244,
"eval_steps_per_second": 1.285,
"eval_wer": 0.3585940674522552,
"step": 1274
},
{
"epoch": 92.0,
"eval_cer": 0.18223839854413104,
"eval_loss": 0.5686241388320923,
"eval_runtime": 53.3712,
"eval_samples_per_second": 10.155,
"eval_steps_per_second": 1.274,
"eval_wer": 0.35574969524583505,
"step": 1288
},
{
"epoch": 92.86,
"learning_rate": 1.1485714285714285e-05,
"loss": 0.3234,
"step": 1300
},
{
"epoch": 93.0,
"eval_cer": 0.18282074613284804,
"eval_loss": 0.5839269161224365,
"eval_runtime": 52.8855,
"eval_samples_per_second": 10.249,
"eval_steps_per_second": 1.286,
"eval_wer": 0.35534335635920355,
"step": 1302
},
{
"epoch": 94.0,
"eval_cer": 0.18198362147406733,
"eval_loss": 0.5765420198440552,
"eval_runtime": 52.892,
"eval_samples_per_second": 10.247,
"eval_steps_per_second": 1.286,
"eval_wer": 0.35534335635920355,
"step": 1316
},
{
"epoch": 95.0,
"eval_cer": 0.18202001819836214,
"eval_loss": 0.5779678225517273,
"eval_runtime": 52.8619,
"eval_samples_per_second": 10.253,
"eval_steps_per_second": 1.286,
"eval_wer": 0.35656237301909793,
"step": 1330
},
{
"epoch": 96.0,
"eval_cer": 0.18343949044585986,
"eval_loss": 0.5862200260162354,
"eval_runtime": 52.9527,
"eval_samples_per_second": 10.236,
"eval_steps_per_second": 1.284,
"eval_wer": 0.3596099146688338,
"step": 1344
},
{
"epoch": 97.0,
"eval_cer": 0.18209281164695176,
"eval_loss": 0.5701762437820435,
"eval_runtime": 52.8493,
"eval_samples_per_second": 10.256,
"eval_steps_per_second": 1.287,
"eval_wer": 0.3555465258025193,
"step": 1358
},
{
"epoch": 98.0,
"eval_cer": 0.18205641492265695,
"eval_loss": 0.5787171721458435,
"eval_runtime": 52.8738,
"eval_samples_per_second": 10.251,
"eval_steps_per_second": 1.286,
"eval_wer": 0.3547338480292564,
"step": 1372
},
{
"epoch": 99.0,
"eval_cer": 0.1823839854413103,
"eval_loss": 0.5766745209693909,
"eval_runtime": 52.9499,
"eval_samples_per_second": 10.236,
"eval_steps_per_second": 1.284,
"eval_wer": 0.3531084924827306,
"step": 1386
},
{
"epoch": 100.0,
"learning_rate": 1.0057142857142857e-05,
"loss": 0.2803,
"step": 1400
},
{
"epoch": 100.0,
"eval_cer": 0.18183803457688807,
"eval_loss": 0.5778467655181885,
"eval_runtime": 53.096,
"eval_samples_per_second": 10.208,
"eval_steps_per_second": 1.281,
"eval_wer": 0.3569687119057294,
"step": 1400
},
{
"epoch": 101.0,
"eval_cer": 0.18172884440400364,
"eval_loss": 0.5759402513504028,
"eval_runtime": 53.4646,
"eval_samples_per_second": 10.138,
"eval_steps_per_second": 1.272,
"eval_wer": 0.35432750914262495,
"step": 1414
},
{
"epoch": 102.0,
"eval_cer": 0.1823839854413103,
"eval_loss": 0.5838054418563843,
"eval_runtime": 53.0092,
"eval_samples_per_second": 10.225,
"eval_steps_per_second": 1.283,
"eval_wer": 0.3571718813490451,
"step": 1428
},
{
"epoch": 103.0,
"eval_cer": 0.18154686078252957,
"eval_loss": 0.569597065448761,
"eval_runtime": 53.1914,
"eval_samples_per_second": 10.19,
"eval_steps_per_second": 1.278,
"eval_wer": 0.35412433969930923,
"step": 1442
},
{
"epoch": 104.0,
"eval_cer": 0.18202001819836214,
"eval_loss": 0.5723647475242615,
"eval_runtime": 52.9421,
"eval_samples_per_second": 10.238,
"eval_steps_per_second": 1.284,
"eval_wer": 0.35412433969930923,
"step": 1456
},
{
"epoch": 105.0,
"eval_cer": 0.18202001819836214,
"eval_loss": 0.5698366165161133,
"eval_runtime": 53.0166,
"eval_samples_per_second": 10.223,
"eval_steps_per_second": 1.283,
"eval_wer": 0.35432750914262495,
"step": 1470
},
{
"epoch": 106.0,
"eval_cer": 0.1816196542311192,
"eval_loss": 0.5727118253707886,
"eval_runtime": 52.9397,
"eval_samples_per_second": 10.238,
"eval_steps_per_second": 1.284,
"eval_wer": 0.3522958147094677,
"step": 1484
},
{
"epoch": 107.0,
"eval_cer": 0.1808553230209281,
"eval_loss": 0.5609294176101685,
"eval_runtime": 53.3257,
"eval_samples_per_second": 10.164,
"eval_steps_per_second": 1.275,
"eval_wer": 0.35107679804957337,
"step": 1498
},
{
"epoch": 107.14,
"learning_rate": 8.628571428571429e-06,
"loss": 0.2718,
"step": 1500
},
{
"epoch": 108.0,
"eval_cer": 0.18070973612374885,
"eval_loss": 0.5654597282409668,
"eval_runtime": 52.8748,
"eval_samples_per_second": 10.251,
"eval_steps_per_second": 1.286,
"eval_wer": 0.34965461194636327,
"step": 1512
},
{
"epoch": 109.0,
"eval_cer": 0.18158325750682439,
"eval_loss": 0.5761396884918213,
"eval_runtime": 52.7804,
"eval_samples_per_second": 10.269,
"eval_steps_per_second": 1.288,
"eval_wer": 0.35351483136936207,
"step": 1526
},
{
"epoch": 110.0,
"eval_cer": 0.18147406733393995,
"eval_loss": 0.5753419995307922,
"eval_runtime": 52.7887,
"eval_samples_per_second": 10.267,
"eval_steps_per_second": 1.288,
"eval_wer": 0.3522958147094677,
"step": 1540
},
{
"epoch": 111.0,
"eval_cer": 0.18049135577797998,
"eval_loss": 0.5703160762786865,
"eval_runtime": 52.7573,
"eval_samples_per_second": 10.273,
"eval_steps_per_second": 1.289,
"eval_wer": 0.35026412027631043,
"step": 1554
},
{
"epoch": 112.0,
"eval_cer": 0.18020018198362148,
"eval_loss": 0.5622747540473938,
"eval_runtime": 52.7621,
"eval_samples_per_second": 10.273,
"eval_steps_per_second": 1.289,
"eval_wer": 0.34701340918325885,
"step": 1568
},
{
"epoch": 113.0,
"eval_cer": 0.18129208371246588,
"eval_loss": 0.5722905993461609,
"eval_runtime": 52.84,
"eval_samples_per_second": 10.257,
"eval_steps_per_second": 1.287,
"eval_wer": 0.35107679804957337,
"step": 1582
},
{
"epoch": 114.0,
"eval_cer": 0.18030937215650591,
"eval_loss": 0.5607832670211792,
"eval_runtime": 52.8599,
"eval_samples_per_second": 10.254,
"eval_steps_per_second": 1.286,
"eval_wer": 0.34863876472978467,
"step": 1596
},
{
"epoch": 114.29,
"learning_rate": 7.2e-06,
"loss": 0.2614,
"step": 1600
},
{
"epoch": 115.0,
"eval_cer": 0.18089171974522292,
"eval_loss": 0.5612644553184509,
"eval_runtime": 52.8176,
"eval_samples_per_second": 10.262,
"eval_steps_per_second": 1.287,
"eval_wer": 0.35107679804957337,
"step": 1610
},
{
"epoch": 116.0,
"eval_cer": 0.18172884440400364,
"eval_loss": 0.5742478370666504,
"eval_runtime": 52.8139,
"eval_samples_per_second": 10.262,
"eval_steps_per_second": 1.288,
"eval_wer": 0.35331166192604635,
"step": 1624
},
{
"epoch": 117.0,
"eval_cer": 0.18172884440400364,
"eval_loss": 0.5715382695198059,
"eval_runtime": 52.8096,
"eval_samples_per_second": 10.263,
"eval_steps_per_second": 1.288,
"eval_wer": 0.3522958147094677,
"step": 1638
},
{
"epoch": 118.0,
"eval_cer": 0.18169244767970882,
"eval_loss": 0.5695165395736694,
"eval_runtime": 52.7498,
"eval_samples_per_second": 10.275,
"eval_steps_per_second": 1.289,
"eval_wer": 0.35331166192604635,
"step": 1652
},
{
"epoch": 119.0,
"eval_cer": 0.18245677888989992,
"eval_loss": 0.571264386177063,
"eval_runtime": 52.7339,
"eval_samples_per_second": 10.278,
"eval_steps_per_second": 1.289,
"eval_wer": 0.3531084924827306,
"step": 1666
},
{
"epoch": 120.0,
"eval_cer": 0.18205641492265695,
"eval_loss": 0.5664474368095398,
"eval_runtime": 52.8509,
"eval_samples_per_second": 10.255,
"eval_steps_per_second": 1.287,
"eval_wer": 0.35331166192604635,
"step": 1680
},
{
"epoch": 121.0,
"eval_cer": 0.1821656050955414,
"eval_loss": 0.5716355443000793,
"eval_runtime": 52.7551,
"eval_samples_per_second": 10.274,
"eval_steps_per_second": 1.289,
"eval_wer": 0.3531084924827306,
"step": 1694
},
{
"epoch": 121.43,
"learning_rate": 5.7714285714285715e-06,
"loss": 0.2463,
"step": 1700
},
{
"epoch": 122.0,
"eval_cer": 0.18100090991810738,
"eval_loss": 0.568006694316864,
"eval_runtime": 52.7861,
"eval_samples_per_second": 10.268,
"eval_steps_per_second": 1.288,
"eval_wer": 0.347622917513206,
"step": 1708
},
{
"epoch": 123.0,
"eval_cer": 0.18169244767970882,
"eval_loss": 0.5760354399681091,
"eval_runtime": 52.8132,
"eval_samples_per_second": 10.263,
"eval_steps_per_second": 1.288,
"eval_wer": 0.35270215359609913,
"step": 1722
},
{
"epoch": 124.0,
"eval_cer": 0.1802729754322111,
"eval_loss": 0.556138277053833,
"eval_runtime": 52.7767,
"eval_samples_per_second": 10.27,
"eval_steps_per_second": 1.288,
"eval_wer": 0.34559122308004875,
"step": 1736
},
{
"epoch": 125.0,
"eval_cer": 0.18118289353958145,
"eval_loss": 0.5698420405387878,
"eval_runtime": 52.7433,
"eval_samples_per_second": 10.276,
"eval_steps_per_second": 1.289,
"eval_wer": 0.34782608695652173,
"step": 1750
},
{
"epoch": 126.0,
"eval_cer": 0.18111010009099182,
"eval_loss": 0.5667452216148376,
"eval_runtime": 52.7698,
"eval_samples_per_second": 10.271,
"eval_steps_per_second": 1.289,
"eval_wer": 0.34823242584315317,
"step": 1764
},
{
"epoch": 127.0,
"eval_cer": 0.1813284804367607,
"eval_loss": 0.5677050948143005,
"eval_runtime": 52.7873,
"eval_samples_per_second": 10.268,
"eval_steps_per_second": 1.288,
"eval_wer": 0.34782608695652173,
"step": 1778
},
{
"epoch": 128.0,
"eval_cer": 0.18045495905368517,
"eval_loss": 0.5681147575378418,
"eval_runtime": 53.1709,
"eval_samples_per_second": 10.194,
"eval_steps_per_second": 1.279,
"eval_wer": 0.34457537586347015,
"step": 1792
},
{
"epoch": 128.57,
"learning_rate": 4.342857142857143e-06,
"loss": 0.2477,
"step": 1800
},
{
"epoch": 129.0,
"eval_cer": 0.18089171974522292,
"eval_loss": 0.5665947794914246,
"eval_runtime": 52.9379,
"eval_samples_per_second": 10.238,
"eval_steps_per_second": 1.285,
"eval_wer": 0.34701340918325885,
"step": 1806
},
{
"epoch": 130.0,
"eval_cer": 0.18041856232939035,
"eval_loss": 0.5696049928665161,
"eval_runtime": 52.7984,
"eval_samples_per_second": 10.265,
"eval_steps_per_second": 1.288,
"eval_wer": 0.34579439252336447,
"step": 1820
},
{
"epoch": 131.0,
"eval_cer": 0.1810373066424022,
"eval_loss": 0.5704218149185181,
"eval_runtime": 52.8548,
"eval_samples_per_second": 10.255,
"eval_steps_per_second": 1.287,
"eval_wer": 0.34782608695652173,
"step": 1834
},
{
"epoch": 132.0,
"eval_cer": 0.18078252957233848,
"eval_loss": 0.5655524134635925,
"eval_runtime": 52.9545,
"eval_samples_per_second": 10.235,
"eval_steps_per_second": 1.284,
"eval_wer": 0.34701340918325885,
"step": 1848
},
{
"epoch": 133.0,
"eval_cer": 0.18070973612374885,
"eval_loss": 0.5696657299995422,
"eval_runtime": 52.865,
"eval_samples_per_second": 10.253,
"eval_steps_per_second": 1.286,
"eval_wer": 0.34721657862657457,
"step": 1862
},
{
"epoch": 134.0,
"eval_cer": 0.18096451319381257,
"eval_loss": 0.5716409683227539,
"eval_runtime": 52.8035,
"eval_samples_per_second": 10.264,
"eval_steps_per_second": 1.288,
"eval_wer": 0.34721657862657457,
"step": 1876
},
{
"epoch": 135.0,
"eval_cer": 0.18096451319381257,
"eval_loss": 0.5742436647415161,
"eval_runtime": 52.961,
"eval_samples_per_second": 10.234,
"eval_steps_per_second": 1.284,
"eval_wer": 0.3484355952864689,
"step": 1890
},
{
"epoch": 135.71,
"learning_rate": 2.9142857142857142e-06,
"loss": 0.221,
"step": 1900
},
{
"epoch": 136.0,
"eval_cer": 0.18074613284804367,
"eval_loss": 0.567115306854248,
"eval_runtime": 52.8477,
"eval_samples_per_second": 10.256,
"eval_steps_per_second": 1.287,
"eval_wer": 0.34721657862657457,
"step": 1904
},
{
"epoch": 137.0,
"eval_cer": 0.18096451319381257,
"eval_loss": 0.5669675469398499,
"eval_runtime": 52.9196,
"eval_samples_per_second": 10.242,
"eval_steps_per_second": 1.285,
"eval_wer": 0.3462007314099959,
"step": 1918
},
{
"epoch": 138.0,
"eval_cer": 0.18100090991810738,
"eval_loss": 0.5674601793289185,
"eval_runtime": 53.2148,
"eval_samples_per_second": 10.185,
"eval_steps_per_second": 1.278,
"eval_wer": 0.3459975619666802,
"step": 1932
},
{
"epoch": 139.0,
"eval_cer": 0.18100090991810738,
"eval_loss": 0.5703522562980652,
"eval_runtime": 53.4902,
"eval_samples_per_second": 10.133,
"eval_steps_per_second": 1.271,
"eval_wer": 0.3462007314099959,
"step": 1946
},
{
"epoch": 140.0,
"eval_cer": 0.1808189262966333,
"eval_loss": 0.5675067901611328,
"eval_runtime": 53.2601,
"eval_samples_per_second": 10.176,
"eval_steps_per_second": 1.277,
"eval_wer": 0.34579439252336447,
"step": 1960
},
{
"epoch": 141.0,
"eval_cer": 0.1800181983621474,
"eval_loss": 0.5617998838424683,
"eval_runtime": 53.8381,
"eval_samples_per_second": 10.067,
"eval_steps_per_second": 1.263,
"eval_wer": 0.3443722064201544,
"step": 1974
},
{
"epoch": 142.0,
"eval_cer": 0.1799818016378526,
"eval_loss": 0.563258171081543,
"eval_runtime": 53.4467,
"eval_samples_per_second": 10.141,
"eval_steps_per_second": 1.272,
"eval_wer": 0.34538805363673303,
"step": 1988
},
{
"epoch": 142.86,
"learning_rate": 1.4857142857142858e-06,
"loss": 0.2217,
"step": 2000
},
{
"epoch": 143.0,
"eval_cer": 0.18067333939945404,
"eval_loss": 0.5663711428642273,
"eval_runtime": 53.0769,
"eval_samples_per_second": 10.212,
"eval_steps_per_second": 1.281,
"eval_wer": 0.34559122308004875,
"step": 2002
},
{
"epoch": 144.0,
"eval_cer": 0.18100090991810738,
"eval_loss": 0.5682144165039062,
"eval_runtime": 53.3453,
"eval_samples_per_second": 10.16,
"eval_steps_per_second": 1.275,
"eval_wer": 0.3462007314099959,
"step": 2016
},
{
"epoch": 144.0,
"step": 2016,
"total_flos": 1.799432351021922e+19,
"train_loss": 1.5532687327691488,
"train_runtime": 29581.7912,
"train_samples_per_second": 2.272,
"train_steps_per_second": 0.071
}
],
"max_steps": 2100,
"num_train_epochs": 150,
"total_flos": 1.799432351021922e+19,
"trial_name": null,
"trial_params": null
}