alinerodrigues's picture
End of training
6312117
{
"best_metric": 0.17724749445915222,
"best_model_checkpoint": "wav2vec2-xlsr-1b-mecita-portuguese-all-text-protecao_aos_pandas/checkpoint-225",
"epoch": 50.0,
"global_step": 375,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.13,
"learning_rate": 2.9957142857142858e-05,
"loss": 13.7229,
"step": 1
},
{
"epoch": 0.93,
"eval_cer": 0.9995906672124437,
"eval_loss": 4.859188556671143,
"eval_runtime": 1.8002,
"eval_samples_per_second": 16.109,
"eval_steps_per_second": 2.222,
"eval_wer": 1.0,
"step": 7
},
{
"epoch": 2.0,
"eval_cer": 1.0,
"eval_loss": 3.002265691757202,
"eval_runtime": 1.7603,
"eval_samples_per_second": 16.475,
"eval_steps_per_second": 2.272,
"eval_wer": 1.0,
"step": 15
},
{
"epoch": 2.93,
"eval_cer": 1.0,
"eval_loss": 2.929029941558838,
"eval_runtime": 1.7878,
"eval_samples_per_second": 16.221,
"eval_steps_per_second": 2.237,
"eval_wer": 1.0,
"step": 22
},
{
"epoch": 4.0,
"eval_cer": 1.0,
"eval_loss": 2.98417067527771,
"eval_runtime": 1.7731,
"eval_samples_per_second": 16.355,
"eval_steps_per_second": 2.256,
"eval_wer": 1.0,
"step": 30
},
{
"epoch": 4.93,
"eval_cer": 1.0,
"eval_loss": 2.845335006713867,
"eval_runtime": 1.7685,
"eval_samples_per_second": 16.398,
"eval_steps_per_second": 2.262,
"eval_wer": 1.0,
"step": 37
},
{
"epoch": 6.0,
"eval_cer": 1.0,
"eval_loss": 2.8119678497314453,
"eval_runtime": 1.8211,
"eval_samples_per_second": 15.924,
"eval_steps_per_second": 2.196,
"eval_wer": 1.0,
"step": 45
},
{
"epoch": 6.93,
"eval_cer": 1.0,
"eval_loss": 2.816225528717041,
"eval_runtime": 1.805,
"eval_samples_per_second": 16.067,
"eval_steps_per_second": 2.216,
"eval_wer": 1.0,
"step": 52
},
{
"epoch": 8.0,
"eval_cer": 1.0,
"eval_loss": 2.7843384742736816,
"eval_runtime": 1.7945,
"eval_samples_per_second": 16.161,
"eval_steps_per_second": 2.229,
"eval_wer": 1.0,
"step": 60
},
{
"epoch": 8.93,
"eval_cer": 1.0,
"eval_loss": 2.782341957092285,
"eval_runtime": 1.7839,
"eval_samples_per_second": 16.256,
"eval_steps_per_second": 2.242,
"eval_wer": 1.0,
"step": 67
},
{
"epoch": 10.0,
"eval_cer": 1.0,
"eval_loss": 2.743428945541382,
"eval_runtime": 1.77,
"eval_samples_per_second": 16.384,
"eval_steps_per_second": 2.26,
"eval_wer": 1.0,
"step": 75
},
{
"epoch": 10.93,
"eval_cer": 1.0,
"eval_loss": 2.636403799057007,
"eval_runtime": 1.7839,
"eval_samples_per_second": 16.256,
"eval_steps_per_second": 2.242,
"eval_wer": 1.0,
"step": 82
},
{
"epoch": 12.0,
"eval_cer": 0.9860826852230864,
"eval_loss": 2.3797059059143066,
"eval_runtime": 1.7797,
"eval_samples_per_second": 16.295,
"eval_steps_per_second": 2.248,
"eval_wer": 0.9876237623762376,
"step": 90
},
{
"epoch": 12.93,
"eval_cer": 0.9770773638968482,
"eval_loss": 1.9516112804412842,
"eval_runtime": 1.7769,
"eval_samples_per_second": 16.32,
"eval_steps_per_second": 2.251,
"eval_wer": 0.995049504950495,
"step": 97
},
{
"epoch": 13.33,
"learning_rate": 2.58e-05,
"loss": 3.3197,
"step": 100
},
{
"epoch": 14.0,
"eval_cer": 0.7474416700777732,
"eval_loss": 1.5396052598953247,
"eval_runtime": 1.8171,
"eval_samples_per_second": 15.96,
"eval_steps_per_second": 2.201,
"eval_wer": 1.0,
"step": 105
},
{
"epoch": 14.93,
"eval_cer": 0.4273434302087597,
"eval_loss": 1.103837251663208,
"eval_runtime": 1.7792,
"eval_samples_per_second": 16.3,
"eval_steps_per_second": 2.248,
"eval_wer": 0.995049504950495,
"step": 112
},
{
"epoch": 16.0,
"eval_cer": 0.16905444126074498,
"eval_loss": 0.6535802483558655,
"eval_runtime": 1.7778,
"eval_samples_per_second": 16.313,
"eval_steps_per_second": 2.25,
"eval_wer": 0.6732673267326733,
"step": 120
},
{
"epoch": 16.93,
"eval_cer": 0.07286123618501841,
"eval_loss": 0.40873047709465027,
"eval_runtime": 1.7934,
"eval_samples_per_second": 16.171,
"eval_steps_per_second": 2.23,
"eval_wer": 0.3217821782178218,
"step": 127
},
{
"epoch": 18.0,
"eval_cer": 0.056078591895210805,
"eval_loss": 0.31188902258872986,
"eval_runtime": 1.7728,
"eval_samples_per_second": 16.358,
"eval_steps_per_second": 2.256,
"eval_wer": 0.22524752475247525,
"step": 135
},
{
"epoch": 18.93,
"eval_cer": 0.04789193614408514,
"eval_loss": 0.2720329761505127,
"eval_runtime": 1.785,
"eval_samples_per_second": 16.247,
"eval_steps_per_second": 2.241,
"eval_wer": 0.17574257425742573,
"step": 142
},
{
"epoch": 20.0,
"eval_cer": 0.04134261154318461,
"eval_loss": 0.24048186838626862,
"eval_runtime": 1.7775,
"eval_samples_per_second": 16.315,
"eval_steps_per_second": 2.25,
"eval_wer": 0.15841584158415842,
"step": 150
},
{
"epoch": 20.93,
"eval_cer": 0.04093327875562833,
"eval_loss": 0.23653259873390198,
"eval_runtime": 1.8549,
"eval_samples_per_second": 15.634,
"eval_steps_per_second": 2.156,
"eval_wer": 0.15841584158415842,
"step": 157
},
{
"epoch": 22.0,
"eval_cer": 0.03970528039295947,
"eval_loss": 0.22812487185001373,
"eval_runtime": 1.7767,
"eval_samples_per_second": 16.323,
"eval_steps_per_second": 2.251,
"eval_wer": 0.15099009900990099,
"step": 165
},
{
"epoch": 22.93,
"eval_cer": 0.036021285304952924,
"eval_loss": 0.19893357157707214,
"eval_runtime": 1.7827,
"eval_samples_per_second": 16.267,
"eval_steps_per_second": 2.244,
"eval_wer": 0.13613861386138615,
"step": 172
},
{
"epoch": 24.0,
"eval_cer": 0.036021285304952924,
"eval_loss": 0.2050793319940567,
"eval_runtime": 1.7818,
"eval_samples_per_second": 16.275,
"eval_steps_per_second": 2.245,
"eval_wer": 0.12871287128712872,
"step": 180
},
{
"epoch": 24.93,
"eval_cer": 0.03561195251739664,
"eval_loss": 0.22654221951961517,
"eval_runtime": 1.7854,
"eval_samples_per_second": 16.243,
"eval_steps_per_second": 2.24,
"eval_wer": 0.12871287128712872,
"step": 187
},
{
"epoch": 26.0,
"eval_cer": 0.03765861645517806,
"eval_loss": 0.22025753557682037,
"eval_runtime": 1.7733,
"eval_samples_per_second": 16.354,
"eval_steps_per_second": 2.256,
"eval_wer": 0.12871287128712872,
"step": 195
},
{
"epoch": 26.67,
"learning_rate": 2.1514285714285717e-05,
"loss": 0.5589,
"step": 200
},
{
"epoch": 26.93,
"eval_cer": 0.03397462136717151,
"eval_loss": 0.2180820107460022,
"eval_runtime": 1.787,
"eval_samples_per_second": 16.228,
"eval_steps_per_second": 2.238,
"eval_wer": 0.12128712871287128,
"step": 202
},
{
"epoch": 28.0,
"eval_cer": 0.03356528857961523,
"eval_loss": 0.20063219964504242,
"eval_runtime": 1.7961,
"eval_samples_per_second": 16.146,
"eval_steps_per_second": 2.227,
"eval_wer": 0.12376237623762376,
"step": 210
},
{
"epoch": 28.93,
"eval_cer": 0.03315595579205895,
"eval_loss": 0.18598036468029022,
"eval_runtime": 1.7925,
"eval_samples_per_second": 16.178,
"eval_steps_per_second": 2.231,
"eval_wer": 0.12128712871287128,
"step": 217
},
{
"epoch": 30.0,
"eval_cer": 0.03029062627916496,
"eval_loss": 0.17724749445915222,
"eval_runtime": 1.7802,
"eval_samples_per_second": 16.29,
"eval_steps_per_second": 2.247,
"eval_wer": 0.11138613861386139,
"step": 225
},
{
"epoch": 30.93,
"eval_cer": 0.032337290216946375,
"eval_loss": 0.19143883883953094,
"eval_runtime": 1.7768,
"eval_samples_per_second": 16.322,
"eval_steps_per_second": 2.251,
"eval_wer": 0.12376237623762376,
"step": 232
},
{
"epoch": 32.0,
"eval_cer": 0.032337290216946375,
"eval_loss": 0.19965380430221558,
"eval_runtime": 1.8097,
"eval_samples_per_second": 16.025,
"eval_steps_per_second": 2.21,
"eval_wer": 0.12376237623762376,
"step": 240
},
{
"epoch": 32.93,
"eval_cer": 0.03397462136717151,
"eval_loss": 0.19473285973072052,
"eval_runtime": 1.8384,
"eval_samples_per_second": 15.775,
"eval_steps_per_second": 2.176,
"eval_wer": 0.12623762376237624,
"step": 247
},
{
"epoch": 34.0,
"eval_cer": 0.03274662300450266,
"eval_loss": 0.20558013021945953,
"eval_runtime": 1.7938,
"eval_samples_per_second": 16.167,
"eval_steps_per_second": 2.23,
"eval_wer": 0.12128712871287128,
"step": 255
},
{
"epoch": 34.93,
"eval_cer": 0.03315595579205895,
"eval_loss": 0.1984556019306183,
"eval_runtime": 1.7744,
"eval_samples_per_second": 16.343,
"eval_steps_per_second": 2.254,
"eval_wer": 0.12128712871287128,
"step": 262
},
{
"epoch": 36.0,
"eval_cer": 0.03274662300450266,
"eval_loss": 0.20163008570671082,
"eval_runtime": 1.8047,
"eval_samples_per_second": 16.069,
"eval_steps_per_second": 2.216,
"eval_wer": 0.12128712871287128,
"step": 270
},
{
"epoch": 36.93,
"eval_cer": 0.031109291854277528,
"eval_loss": 0.19409456849098206,
"eval_runtime": 1.7987,
"eval_samples_per_second": 16.123,
"eval_steps_per_second": 2.224,
"eval_wer": 0.11386138613861387,
"step": 277
},
{
"epoch": 38.0,
"eval_cer": 0.03192795742939009,
"eval_loss": 0.18242661654949188,
"eval_runtime": 1.806,
"eval_samples_per_second": 16.058,
"eval_steps_per_second": 2.215,
"eval_wer": 0.12376237623762376,
"step": 285
},
{
"epoch": 38.93,
"eval_cer": 0.029471960704052395,
"eval_loss": 0.18223299086093903,
"eval_runtime": 1.8045,
"eval_samples_per_second": 16.071,
"eval_steps_per_second": 2.217,
"eval_wer": 0.10891089108910891,
"step": 292
},
{
"epoch": 40.0,
"learning_rate": 1.7271428571428574e-05,
"loss": 0.1503,
"step": 300
},
{
"epoch": 40.0,
"eval_cer": 0.031109291854277528,
"eval_loss": 0.19688135385513306,
"eval_runtime": 1.8319,
"eval_samples_per_second": 15.83,
"eval_steps_per_second": 2.184,
"eval_wer": 0.11633663366336634,
"step": 300
},
{
"epoch": 40.93,
"eval_cer": 0.029471960704052395,
"eval_loss": 0.19957467913627625,
"eval_runtime": 1.8232,
"eval_samples_per_second": 15.906,
"eval_steps_per_second": 2.194,
"eval_wer": 0.11633663366336634,
"step": 307
},
{
"epoch": 42.0,
"eval_cer": 0.029471960704052395,
"eval_loss": 0.18802578747272491,
"eval_runtime": 1.7999,
"eval_samples_per_second": 16.112,
"eval_steps_per_second": 2.222,
"eval_wer": 0.10891089108910891,
"step": 315
},
{
"epoch": 42.93,
"eval_cer": 0.034383954154727794,
"eval_loss": 0.20173507928848267,
"eval_runtime": 1.7941,
"eval_samples_per_second": 16.164,
"eval_steps_per_second": 2.23,
"eval_wer": 0.1311881188118812,
"step": 322
},
{
"epoch": 44.0,
"eval_cer": 0.03274662300450266,
"eval_loss": 0.19139862060546875,
"eval_runtime": 1.8064,
"eval_samples_per_second": 16.054,
"eval_steps_per_second": 2.214,
"eval_wer": 0.11633663366336634,
"step": 330
},
{
"epoch": 44.93,
"eval_cer": 0.03315595579205895,
"eval_loss": 0.19346125423908234,
"eval_runtime": 1.8407,
"eval_samples_per_second": 15.755,
"eval_steps_per_second": 2.173,
"eval_wer": 0.11633663366336634,
"step": 337
},
{
"epoch": 46.0,
"eval_cer": 0.03192795742939009,
"eval_loss": 0.19668900966644287,
"eval_runtime": 1.8343,
"eval_samples_per_second": 15.81,
"eval_steps_per_second": 2.181,
"eval_wer": 0.11386138613861387,
"step": 345
},
{
"epoch": 46.93,
"eval_cer": 0.029881293491608677,
"eval_loss": 0.19127391278743744,
"eval_runtime": 1.7943,
"eval_samples_per_second": 16.162,
"eval_steps_per_second": 2.229,
"eval_wer": 0.10643564356435643,
"step": 352
},
{
"epoch": 48.0,
"eval_cer": 0.03029062627916496,
"eval_loss": 0.1993999034166336,
"eval_runtime": 1.8021,
"eval_samples_per_second": 16.092,
"eval_steps_per_second": 2.22,
"eval_wer": 0.11138613861386139,
"step": 360
},
{
"epoch": 48.93,
"eval_cer": 0.029062627916496112,
"eval_loss": 0.18826055526733398,
"eval_runtime": 1.81,
"eval_samples_per_second": 16.022,
"eval_steps_per_second": 2.21,
"eval_wer": 0.10891089108910891,
"step": 367
},
{
"epoch": 50.0,
"eval_cer": 0.03029062627916496,
"eval_loss": 0.18807141482830048,
"eval_runtime": 1.8146,
"eval_samples_per_second": 15.982,
"eval_steps_per_second": 2.204,
"eval_wer": 0.11386138613861387,
"step": 375
},
{
"epoch": 50.0,
"step": 375,
"total_flos": 9.822732861444276e+18,
"train_loss": 1.1235487569173177,
"train_runtime": 3285.5807,
"train_samples_per_second": 6.879,
"train_steps_per_second": 0.213
}
],
"max_steps": 700,
"num_train_epochs": 100,
"total_flos": 9.822732861444276e+18,
"trial_name": null,
"trial_params": null
}