wav2vec2-large-xlsr-coraa-exp-11 / trainer_state.json
alinerodrigues's picture
End of training
52af36e
{
"best_metric": 8.99256706237793,
"best_model_checkpoint": "wav2vec2-large-xlsr-coraa-exp-11/checkpoint-168",
"epoch": 32.0,
"global_step": 448,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.07,
"learning_rate": 3e-05,
"loss": 38.5161,
"step": 1
},
{
"epoch": 1.0,
"eval_cer": 0.9510100090991811,
"eval_loss": 34.24892807006836,
"eval_runtime": 52.8709,
"eval_samples_per_second": 10.251,
"eval_steps_per_second": 1.286,
"eval_wer": 1.0,
"step": 14
},
{
"epoch": 2.0,
"eval_cer": 0.9510464058234759,
"eval_loss": 23.386924743652344,
"eval_runtime": 52.734,
"eval_samples_per_second": 10.278,
"eval_steps_per_second": 1.289,
"eval_wer": 1.0,
"step": 28
},
{
"epoch": 3.0,
"eval_cer": 0.9510464058234759,
"eval_loss": 19.672130584716797,
"eval_runtime": 53.3907,
"eval_samples_per_second": 10.152,
"eval_steps_per_second": 1.274,
"eval_wer": 1.0,
"step": 42
},
{
"epoch": 4.0,
"eval_cer": 0.9510464058234759,
"eval_loss": 18.373493194580078,
"eval_runtime": 52.736,
"eval_samples_per_second": 10.278,
"eval_steps_per_second": 1.289,
"eval_wer": 1.0,
"step": 56
},
{
"epoch": 5.0,
"eval_cer": 0.9495905368516834,
"eval_loss": 17.55065155029297,
"eval_runtime": 52.7319,
"eval_samples_per_second": 10.278,
"eval_steps_per_second": 1.29,
"eval_wer": 1.0026412027631044,
"step": 70
},
{
"epoch": 6.0,
"eval_cer": 0.9688080072793449,
"eval_loss": 16.934043884277344,
"eval_runtime": 52.6762,
"eval_samples_per_second": 10.289,
"eval_steps_per_second": 1.291,
"eval_wer": 1.0737505079236083,
"step": 84
},
{
"epoch": 7.0,
"eval_cer": 0.9511191992720656,
"eval_loss": 17.322906494140625,
"eval_runtime": 52.7337,
"eval_samples_per_second": 10.278,
"eval_steps_per_second": 1.289,
"eval_wer": 1.0004063388866316,
"step": 98
},
{
"epoch": 7.14,
"learning_rate": 2.8614285714285714e-05,
"loss": 17.5323,
"step": 100
},
{
"epoch": 8.0,
"eval_cer": 0.9313921747042766,
"eval_loss": 16.459413528442383,
"eval_runtime": 52.7143,
"eval_samples_per_second": 10.282,
"eval_steps_per_second": 1.29,
"eval_wer": 1.0156440471353108,
"step": 112
},
{
"epoch": 9.0,
"eval_cer": 0.935213830755232,
"eval_loss": 12.445086479187012,
"eval_runtime": 52.7004,
"eval_samples_per_second": 10.285,
"eval_steps_per_second": 1.29,
"eval_wer": 1.0298659081674115,
"step": 126
},
{
"epoch": 10.0,
"eval_cer": 0.9618562329390354,
"eval_loss": 10.092220306396484,
"eval_runtime": 52.7354,
"eval_samples_per_second": 10.278,
"eval_steps_per_second": 1.289,
"eval_wer": 1.0,
"step": 140
},
{
"epoch": 11.0,
"eval_cer": 0.9617834394904459,
"eval_loss": 9.518609046936035,
"eval_runtime": 53.2311,
"eval_samples_per_second": 10.182,
"eval_steps_per_second": 1.277,
"eval_wer": 0.9997968305566842,
"step": 154
},
{
"epoch": 12.0,
"eval_cer": 0.932302092811647,
"eval_loss": 8.99256706237793,
"eval_runtime": 52.6632,
"eval_samples_per_second": 10.292,
"eval_steps_per_second": 1.291,
"eval_wer": 0.9865908167411621,
"step": 168
},
{
"epoch": 13.0,
"eval_cer": 0.9166515013648772,
"eval_loss": 9.018474578857422,
"eval_runtime": 52.7545,
"eval_samples_per_second": 10.274,
"eval_steps_per_second": 1.289,
"eval_wer": 0.9839496139780577,
"step": 182
},
{
"epoch": 14.0,
"eval_cer": 0.9216378525932666,
"eval_loss": 9.124226570129395,
"eval_runtime": 53.3159,
"eval_samples_per_second": 10.166,
"eval_steps_per_second": 1.275,
"eval_wer": 0.983746444534742,
"step": 196
},
{
"epoch": 14.29,
"learning_rate": 2.7185714285714287e-05,
"loss": 6.6506,
"step": 200
},
{
"epoch": 15.0,
"eval_cer": 0.8844404003639672,
"eval_loss": 9.050068855285645,
"eval_runtime": 52.6837,
"eval_samples_per_second": 10.288,
"eval_steps_per_second": 1.291,
"eval_wer": 0.9880130028443722,
"step": 210
},
{
"epoch": 16.0,
"eval_cer": 0.902238398544131,
"eval_loss": 9.189239501953125,
"eval_runtime": 52.7185,
"eval_samples_per_second": 10.281,
"eval_steps_per_second": 1.29,
"eval_wer": 0.9776513612352702,
"step": 224
},
{
"epoch": 17.0,
"eval_cer": 0.8847315741583257,
"eval_loss": 9.173331260681152,
"eval_runtime": 52.733,
"eval_samples_per_second": 10.278,
"eval_steps_per_second": 1.29,
"eval_wer": 0.9798862251117432,
"step": 238
},
{
"epoch": 18.0,
"eval_cer": 0.8733393994540491,
"eval_loss": 9.303343772888184,
"eval_runtime": 52.7609,
"eval_samples_per_second": 10.273,
"eval_steps_per_second": 1.289,
"eval_wer": 0.9798862251117432,
"step": 252
},
{
"epoch": 19.0,
"eval_cer": 0.8989626933575978,
"eval_loss": 9.28529167175293,
"eval_runtime": 52.7177,
"eval_samples_per_second": 10.281,
"eval_steps_per_second": 1.29,
"eval_wer": 0.9746038195855343,
"step": 266
},
{
"epoch": 20.0,
"eval_cer": 0.9086442220200182,
"eval_loss": 9.438006401062012,
"eval_runtime": 52.8014,
"eval_samples_per_second": 10.265,
"eval_steps_per_second": 1.288,
"eval_wer": 0.9748069890288501,
"step": 280
},
{
"epoch": 21.0,
"eval_cer": 0.8900090991810737,
"eval_loss": 9.513178825378418,
"eval_runtime": 52.7023,
"eval_samples_per_second": 10.284,
"eval_steps_per_second": 1.29,
"eval_wer": 0.9750101584721658,
"step": 294
},
{
"epoch": 21.43,
"learning_rate": 2.5757142857142857e-05,
"loss": 3.6568,
"step": 300
},
{
"epoch": 22.0,
"eval_cer": 0.8811282984531392,
"eval_loss": 9.6267728805542,
"eval_runtime": 53.0646,
"eval_samples_per_second": 10.214,
"eval_steps_per_second": 1.281,
"eval_wer": 0.9817147501015847,
"step": 308
},
{
"epoch": 23.0,
"eval_cer": 0.8846587807097361,
"eval_loss": 9.698858261108398,
"eval_runtime": 52.7263,
"eval_samples_per_second": 10.28,
"eval_steps_per_second": 1.29,
"eval_wer": 1.0042665583096302,
"step": 322
},
{
"epoch": 24.0,
"eval_cer": 0.8963057324840764,
"eval_loss": 9.611275672912598,
"eval_runtime": 52.7167,
"eval_samples_per_second": 10.281,
"eval_steps_per_second": 1.29,
"eval_wer": 0.9788703778951645,
"step": 336
},
{
"epoch": 25.0,
"eval_cer": 0.8923748862602365,
"eval_loss": 9.794692039489746,
"eval_runtime": 52.8702,
"eval_samples_per_second": 10.252,
"eval_steps_per_second": 1.286,
"eval_wer": 0.980698902885006,
"step": 350
},
{
"epoch": 26.0,
"eval_cer": 0.8979435850773431,
"eval_loss": 9.83806324005127,
"eval_runtime": 52.7321,
"eval_samples_per_second": 10.278,
"eval_steps_per_second": 1.29,
"eval_wer": 0.9794798862251117,
"step": 364
},
{
"epoch": 27.0,
"eval_cer": 0.8951774340309372,
"eval_loss": 10.03061580657959,
"eval_runtime": 52.6816,
"eval_samples_per_second": 10.288,
"eval_steps_per_second": 1.291,
"eval_wer": 0.9788703778951645,
"step": 378
},
{
"epoch": 28.0,
"eval_cer": 0.8947042766151047,
"eval_loss": 9.994989395141602,
"eval_runtime": 53.3774,
"eval_samples_per_second": 10.154,
"eval_steps_per_second": 1.274,
"eval_wer": 0.9792767167817961,
"step": 392
},
{
"epoch": 28.57,
"learning_rate": 2.432857142857143e-05,
"loss": 3.316,
"step": 400
},
{
"epoch": 29.0,
"eval_cer": 0.8978707916287534,
"eval_loss": 10.14880084991455,
"eval_runtime": 52.6791,
"eval_samples_per_second": 10.289,
"eval_steps_per_second": 1.291,
"eval_wer": 0.9780577001219016,
"step": 406
},
{
"epoch": 30.0,
"eval_cer": 0.9092265696087353,
"eval_loss": 10.193445205688477,
"eval_runtime": 52.6484,
"eval_samples_per_second": 10.295,
"eval_steps_per_second": 1.292,
"eval_wer": 0.9809020723283218,
"step": 420
},
{
"epoch": 31.0,
"eval_cer": 0.9298999090081893,
"eval_loss": 10.21463680267334,
"eval_runtime": 52.7062,
"eval_samples_per_second": 10.283,
"eval_steps_per_second": 1.29,
"eval_wer": 0.9880130028443722,
"step": 434
},
{
"epoch": 32.0,
"eval_cer": 0.9593084622383985,
"eval_loss": 10.298548698425293,
"eval_runtime": 52.7136,
"eval_samples_per_second": 10.282,
"eval_steps_per_second": 1.29,
"eval_wer": 0.9997968305566842,
"step": 448
},
{
"epoch": 32.0,
"step": 448,
"total_flos": 3.9986309695731635e+18,
"train_loss": 7.336955785751343,
"train_runtime": 6516.6943,
"train_samples_per_second": 10.312,
"train_steps_per_second": 0.322
}
],
"max_steps": 2100,
"num_train_epochs": 150,
"total_flos": 3.9986309695731635e+18,
"trial_name": null,
"trial_params": null
}