|
{ |
|
"best_metric": 0.17724749445915222, |
|
"best_model_checkpoint": "wav2vec2-xlsr-1b-mecita-portuguese-all-text-protecao_aos_pandas/checkpoint-225", |
|
"epoch": 50.0, |
|
"global_step": 375, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.13, |
|
"learning_rate": 2.9957142857142858e-05, |
|
"loss": 13.7229, |
|
"step": 1 |
|
}, |
|
{ |
|
"epoch": 0.93, |
|
"eval_cer": 0.9995906672124437, |
|
"eval_loss": 4.859188556671143, |
|
"eval_runtime": 1.8002, |
|
"eval_samples_per_second": 16.109, |
|
"eval_steps_per_second": 2.222, |
|
"eval_wer": 1.0, |
|
"step": 7 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_cer": 1.0, |
|
"eval_loss": 3.002265691757202, |
|
"eval_runtime": 1.7603, |
|
"eval_samples_per_second": 16.475, |
|
"eval_steps_per_second": 2.272, |
|
"eval_wer": 1.0, |
|
"step": 15 |
|
}, |
|
{ |
|
"epoch": 2.93, |
|
"eval_cer": 1.0, |
|
"eval_loss": 2.929029941558838, |
|
"eval_runtime": 1.7878, |
|
"eval_samples_per_second": 16.221, |
|
"eval_steps_per_second": 2.237, |
|
"eval_wer": 1.0, |
|
"step": 22 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_cer": 1.0, |
|
"eval_loss": 2.98417067527771, |
|
"eval_runtime": 1.7731, |
|
"eval_samples_per_second": 16.355, |
|
"eval_steps_per_second": 2.256, |
|
"eval_wer": 1.0, |
|
"step": 30 |
|
}, |
|
{ |
|
"epoch": 4.93, |
|
"eval_cer": 1.0, |
|
"eval_loss": 2.845335006713867, |
|
"eval_runtime": 1.7685, |
|
"eval_samples_per_second": 16.398, |
|
"eval_steps_per_second": 2.262, |
|
"eval_wer": 1.0, |
|
"step": 37 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"eval_cer": 1.0, |
|
"eval_loss": 2.8119678497314453, |
|
"eval_runtime": 1.8211, |
|
"eval_samples_per_second": 15.924, |
|
"eval_steps_per_second": 2.196, |
|
"eval_wer": 1.0, |
|
"step": 45 |
|
}, |
|
{ |
|
"epoch": 6.93, |
|
"eval_cer": 1.0, |
|
"eval_loss": 2.816225528717041, |
|
"eval_runtime": 1.805, |
|
"eval_samples_per_second": 16.067, |
|
"eval_steps_per_second": 2.216, |
|
"eval_wer": 1.0, |
|
"step": 52 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_cer": 1.0, |
|
"eval_loss": 2.7843384742736816, |
|
"eval_runtime": 1.7945, |
|
"eval_samples_per_second": 16.161, |
|
"eval_steps_per_second": 2.229, |
|
"eval_wer": 1.0, |
|
"step": 60 |
|
}, |
|
{ |
|
"epoch": 8.93, |
|
"eval_cer": 1.0, |
|
"eval_loss": 2.782341957092285, |
|
"eval_runtime": 1.7839, |
|
"eval_samples_per_second": 16.256, |
|
"eval_steps_per_second": 2.242, |
|
"eval_wer": 1.0, |
|
"step": 67 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"eval_cer": 1.0, |
|
"eval_loss": 2.743428945541382, |
|
"eval_runtime": 1.77, |
|
"eval_samples_per_second": 16.384, |
|
"eval_steps_per_second": 2.26, |
|
"eval_wer": 1.0, |
|
"step": 75 |
|
}, |
|
{ |
|
"epoch": 10.93, |
|
"eval_cer": 1.0, |
|
"eval_loss": 2.636403799057007, |
|
"eval_runtime": 1.7839, |
|
"eval_samples_per_second": 16.256, |
|
"eval_steps_per_second": 2.242, |
|
"eval_wer": 1.0, |
|
"step": 82 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"eval_cer": 0.9860826852230864, |
|
"eval_loss": 2.3797059059143066, |
|
"eval_runtime": 1.7797, |
|
"eval_samples_per_second": 16.295, |
|
"eval_steps_per_second": 2.248, |
|
"eval_wer": 0.9876237623762376, |
|
"step": 90 |
|
}, |
|
{ |
|
"epoch": 12.93, |
|
"eval_cer": 0.9770773638968482, |
|
"eval_loss": 1.9516112804412842, |
|
"eval_runtime": 1.7769, |
|
"eval_samples_per_second": 16.32, |
|
"eval_steps_per_second": 2.251, |
|
"eval_wer": 0.995049504950495, |
|
"step": 97 |
|
}, |
|
{ |
|
"epoch": 13.33, |
|
"learning_rate": 2.58e-05, |
|
"loss": 3.3197, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 14.0, |
|
"eval_cer": 0.7474416700777732, |
|
"eval_loss": 1.5396052598953247, |
|
"eval_runtime": 1.8171, |
|
"eval_samples_per_second": 15.96, |
|
"eval_steps_per_second": 2.201, |
|
"eval_wer": 1.0, |
|
"step": 105 |
|
}, |
|
{ |
|
"epoch": 14.93, |
|
"eval_cer": 0.4273434302087597, |
|
"eval_loss": 1.103837251663208, |
|
"eval_runtime": 1.7792, |
|
"eval_samples_per_second": 16.3, |
|
"eval_steps_per_second": 2.248, |
|
"eval_wer": 0.995049504950495, |
|
"step": 112 |
|
}, |
|
{ |
|
"epoch": 16.0, |
|
"eval_cer": 0.16905444126074498, |
|
"eval_loss": 0.6535802483558655, |
|
"eval_runtime": 1.7778, |
|
"eval_samples_per_second": 16.313, |
|
"eval_steps_per_second": 2.25, |
|
"eval_wer": 0.6732673267326733, |
|
"step": 120 |
|
}, |
|
{ |
|
"epoch": 16.93, |
|
"eval_cer": 0.07286123618501841, |
|
"eval_loss": 0.40873047709465027, |
|
"eval_runtime": 1.7934, |
|
"eval_samples_per_second": 16.171, |
|
"eval_steps_per_second": 2.23, |
|
"eval_wer": 0.3217821782178218, |
|
"step": 127 |
|
}, |
|
{ |
|
"epoch": 18.0, |
|
"eval_cer": 0.056078591895210805, |
|
"eval_loss": 0.31188902258872986, |
|
"eval_runtime": 1.7728, |
|
"eval_samples_per_second": 16.358, |
|
"eval_steps_per_second": 2.256, |
|
"eval_wer": 0.22524752475247525, |
|
"step": 135 |
|
}, |
|
{ |
|
"epoch": 18.93, |
|
"eval_cer": 0.04789193614408514, |
|
"eval_loss": 0.2720329761505127, |
|
"eval_runtime": 1.785, |
|
"eval_samples_per_second": 16.247, |
|
"eval_steps_per_second": 2.241, |
|
"eval_wer": 0.17574257425742573, |
|
"step": 142 |
|
}, |
|
{ |
|
"epoch": 20.0, |
|
"eval_cer": 0.04134261154318461, |
|
"eval_loss": 0.24048186838626862, |
|
"eval_runtime": 1.7775, |
|
"eval_samples_per_second": 16.315, |
|
"eval_steps_per_second": 2.25, |
|
"eval_wer": 0.15841584158415842, |
|
"step": 150 |
|
}, |
|
{ |
|
"epoch": 20.93, |
|
"eval_cer": 0.04093327875562833, |
|
"eval_loss": 0.23653259873390198, |
|
"eval_runtime": 1.8549, |
|
"eval_samples_per_second": 15.634, |
|
"eval_steps_per_second": 2.156, |
|
"eval_wer": 0.15841584158415842, |
|
"step": 157 |
|
}, |
|
{ |
|
"epoch": 22.0, |
|
"eval_cer": 0.03970528039295947, |
|
"eval_loss": 0.22812487185001373, |
|
"eval_runtime": 1.7767, |
|
"eval_samples_per_second": 16.323, |
|
"eval_steps_per_second": 2.251, |
|
"eval_wer": 0.15099009900990099, |
|
"step": 165 |
|
}, |
|
{ |
|
"epoch": 22.93, |
|
"eval_cer": 0.036021285304952924, |
|
"eval_loss": 0.19893357157707214, |
|
"eval_runtime": 1.7827, |
|
"eval_samples_per_second": 16.267, |
|
"eval_steps_per_second": 2.244, |
|
"eval_wer": 0.13613861386138615, |
|
"step": 172 |
|
}, |
|
{ |
|
"epoch": 24.0, |
|
"eval_cer": 0.036021285304952924, |
|
"eval_loss": 0.2050793319940567, |
|
"eval_runtime": 1.7818, |
|
"eval_samples_per_second": 16.275, |
|
"eval_steps_per_second": 2.245, |
|
"eval_wer": 0.12871287128712872, |
|
"step": 180 |
|
}, |
|
{ |
|
"epoch": 24.93, |
|
"eval_cer": 0.03561195251739664, |
|
"eval_loss": 0.22654221951961517, |
|
"eval_runtime": 1.7854, |
|
"eval_samples_per_second": 16.243, |
|
"eval_steps_per_second": 2.24, |
|
"eval_wer": 0.12871287128712872, |
|
"step": 187 |
|
}, |
|
{ |
|
"epoch": 26.0, |
|
"eval_cer": 0.03765861645517806, |
|
"eval_loss": 0.22025753557682037, |
|
"eval_runtime": 1.7733, |
|
"eval_samples_per_second": 16.354, |
|
"eval_steps_per_second": 2.256, |
|
"eval_wer": 0.12871287128712872, |
|
"step": 195 |
|
}, |
|
{ |
|
"epoch": 26.67, |
|
"learning_rate": 2.1514285714285717e-05, |
|
"loss": 0.5589, |
|
"step": 200 |
|
}, |
|
{ |
|
"epoch": 26.93, |
|
"eval_cer": 0.03397462136717151, |
|
"eval_loss": 0.2180820107460022, |
|
"eval_runtime": 1.787, |
|
"eval_samples_per_second": 16.228, |
|
"eval_steps_per_second": 2.238, |
|
"eval_wer": 0.12128712871287128, |
|
"step": 202 |
|
}, |
|
{ |
|
"epoch": 28.0, |
|
"eval_cer": 0.03356528857961523, |
|
"eval_loss": 0.20063219964504242, |
|
"eval_runtime": 1.7961, |
|
"eval_samples_per_second": 16.146, |
|
"eval_steps_per_second": 2.227, |
|
"eval_wer": 0.12376237623762376, |
|
"step": 210 |
|
}, |
|
{ |
|
"epoch": 28.93, |
|
"eval_cer": 0.03315595579205895, |
|
"eval_loss": 0.18598036468029022, |
|
"eval_runtime": 1.7925, |
|
"eval_samples_per_second": 16.178, |
|
"eval_steps_per_second": 2.231, |
|
"eval_wer": 0.12128712871287128, |
|
"step": 217 |
|
}, |
|
{ |
|
"epoch": 30.0, |
|
"eval_cer": 0.03029062627916496, |
|
"eval_loss": 0.17724749445915222, |
|
"eval_runtime": 1.7802, |
|
"eval_samples_per_second": 16.29, |
|
"eval_steps_per_second": 2.247, |
|
"eval_wer": 0.11138613861386139, |
|
"step": 225 |
|
}, |
|
{ |
|
"epoch": 30.93, |
|
"eval_cer": 0.032337290216946375, |
|
"eval_loss": 0.19143883883953094, |
|
"eval_runtime": 1.7768, |
|
"eval_samples_per_second": 16.322, |
|
"eval_steps_per_second": 2.251, |
|
"eval_wer": 0.12376237623762376, |
|
"step": 232 |
|
}, |
|
{ |
|
"epoch": 32.0, |
|
"eval_cer": 0.032337290216946375, |
|
"eval_loss": 0.19965380430221558, |
|
"eval_runtime": 1.8097, |
|
"eval_samples_per_second": 16.025, |
|
"eval_steps_per_second": 2.21, |
|
"eval_wer": 0.12376237623762376, |
|
"step": 240 |
|
}, |
|
{ |
|
"epoch": 32.93, |
|
"eval_cer": 0.03397462136717151, |
|
"eval_loss": 0.19473285973072052, |
|
"eval_runtime": 1.8384, |
|
"eval_samples_per_second": 15.775, |
|
"eval_steps_per_second": 2.176, |
|
"eval_wer": 0.12623762376237624, |
|
"step": 247 |
|
}, |
|
{ |
|
"epoch": 34.0, |
|
"eval_cer": 0.03274662300450266, |
|
"eval_loss": 0.20558013021945953, |
|
"eval_runtime": 1.7938, |
|
"eval_samples_per_second": 16.167, |
|
"eval_steps_per_second": 2.23, |
|
"eval_wer": 0.12128712871287128, |
|
"step": 255 |
|
}, |
|
{ |
|
"epoch": 34.93, |
|
"eval_cer": 0.03315595579205895, |
|
"eval_loss": 0.1984556019306183, |
|
"eval_runtime": 1.7744, |
|
"eval_samples_per_second": 16.343, |
|
"eval_steps_per_second": 2.254, |
|
"eval_wer": 0.12128712871287128, |
|
"step": 262 |
|
}, |
|
{ |
|
"epoch": 36.0, |
|
"eval_cer": 0.03274662300450266, |
|
"eval_loss": 0.20163008570671082, |
|
"eval_runtime": 1.8047, |
|
"eval_samples_per_second": 16.069, |
|
"eval_steps_per_second": 2.216, |
|
"eval_wer": 0.12128712871287128, |
|
"step": 270 |
|
}, |
|
{ |
|
"epoch": 36.93, |
|
"eval_cer": 0.031109291854277528, |
|
"eval_loss": 0.19409456849098206, |
|
"eval_runtime": 1.7987, |
|
"eval_samples_per_second": 16.123, |
|
"eval_steps_per_second": 2.224, |
|
"eval_wer": 0.11386138613861387, |
|
"step": 277 |
|
}, |
|
{ |
|
"epoch": 38.0, |
|
"eval_cer": 0.03192795742939009, |
|
"eval_loss": 0.18242661654949188, |
|
"eval_runtime": 1.806, |
|
"eval_samples_per_second": 16.058, |
|
"eval_steps_per_second": 2.215, |
|
"eval_wer": 0.12376237623762376, |
|
"step": 285 |
|
}, |
|
{ |
|
"epoch": 38.93, |
|
"eval_cer": 0.029471960704052395, |
|
"eval_loss": 0.18223299086093903, |
|
"eval_runtime": 1.8045, |
|
"eval_samples_per_second": 16.071, |
|
"eval_steps_per_second": 2.217, |
|
"eval_wer": 0.10891089108910891, |
|
"step": 292 |
|
}, |
|
{ |
|
"epoch": 40.0, |
|
"learning_rate": 1.7271428571428574e-05, |
|
"loss": 0.1503, |
|
"step": 300 |
|
}, |
|
{ |
|
"epoch": 40.0, |
|
"eval_cer": 0.031109291854277528, |
|
"eval_loss": 0.19688135385513306, |
|
"eval_runtime": 1.8319, |
|
"eval_samples_per_second": 15.83, |
|
"eval_steps_per_second": 2.184, |
|
"eval_wer": 0.11633663366336634, |
|
"step": 300 |
|
}, |
|
{ |
|
"epoch": 40.93, |
|
"eval_cer": 0.029471960704052395, |
|
"eval_loss": 0.19957467913627625, |
|
"eval_runtime": 1.8232, |
|
"eval_samples_per_second": 15.906, |
|
"eval_steps_per_second": 2.194, |
|
"eval_wer": 0.11633663366336634, |
|
"step": 307 |
|
}, |
|
{ |
|
"epoch": 42.0, |
|
"eval_cer": 0.029471960704052395, |
|
"eval_loss": 0.18802578747272491, |
|
"eval_runtime": 1.7999, |
|
"eval_samples_per_second": 16.112, |
|
"eval_steps_per_second": 2.222, |
|
"eval_wer": 0.10891089108910891, |
|
"step": 315 |
|
}, |
|
{ |
|
"epoch": 42.93, |
|
"eval_cer": 0.034383954154727794, |
|
"eval_loss": 0.20173507928848267, |
|
"eval_runtime": 1.7941, |
|
"eval_samples_per_second": 16.164, |
|
"eval_steps_per_second": 2.23, |
|
"eval_wer": 0.1311881188118812, |
|
"step": 322 |
|
}, |
|
{ |
|
"epoch": 44.0, |
|
"eval_cer": 0.03274662300450266, |
|
"eval_loss": 0.19139862060546875, |
|
"eval_runtime": 1.8064, |
|
"eval_samples_per_second": 16.054, |
|
"eval_steps_per_second": 2.214, |
|
"eval_wer": 0.11633663366336634, |
|
"step": 330 |
|
}, |
|
{ |
|
"epoch": 44.93, |
|
"eval_cer": 0.03315595579205895, |
|
"eval_loss": 0.19346125423908234, |
|
"eval_runtime": 1.8407, |
|
"eval_samples_per_second": 15.755, |
|
"eval_steps_per_second": 2.173, |
|
"eval_wer": 0.11633663366336634, |
|
"step": 337 |
|
}, |
|
{ |
|
"epoch": 46.0, |
|
"eval_cer": 0.03192795742939009, |
|
"eval_loss": 0.19668900966644287, |
|
"eval_runtime": 1.8343, |
|
"eval_samples_per_second": 15.81, |
|
"eval_steps_per_second": 2.181, |
|
"eval_wer": 0.11386138613861387, |
|
"step": 345 |
|
}, |
|
{ |
|
"epoch": 46.93, |
|
"eval_cer": 0.029881293491608677, |
|
"eval_loss": 0.19127391278743744, |
|
"eval_runtime": 1.7943, |
|
"eval_samples_per_second": 16.162, |
|
"eval_steps_per_second": 2.229, |
|
"eval_wer": 0.10643564356435643, |
|
"step": 352 |
|
}, |
|
{ |
|
"epoch": 48.0, |
|
"eval_cer": 0.03029062627916496, |
|
"eval_loss": 0.1993999034166336, |
|
"eval_runtime": 1.8021, |
|
"eval_samples_per_second": 16.092, |
|
"eval_steps_per_second": 2.22, |
|
"eval_wer": 0.11138613861386139, |
|
"step": 360 |
|
}, |
|
{ |
|
"epoch": 48.93, |
|
"eval_cer": 0.029062627916496112, |
|
"eval_loss": 0.18826055526733398, |
|
"eval_runtime": 1.81, |
|
"eval_samples_per_second": 16.022, |
|
"eval_steps_per_second": 2.21, |
|
"eval_wer": 0.10891089108910891, |
|
"step": 367 |
|
}, |
|
{ |
|
"epoch": 50.0, |
|
"eval_cer": 0.03029062627916496, |
|
"eval_loss": 0.18807141482830048, |
|
"eval_runtime": 1.8146, |
|
"eval_samples_per_second": 15.982, |
|
"eval_steps_per_second": 2.204, |
|
"eval_wer": 0.11386138613861387, |
|
"step": 375 |
|
}, |
|
{ |
|
"epoch": 50.0, |
|
"step": 375, |
|
"total_flos": 9.822732861444276e+18, |
|
"train_loss": 1.1235487569173177, |
|
"train_runtime": 3285.5807, |
|
"train_samples_per_second": 6.879, |
|
"train_steps_per_second": 0.213 |
|
} |
|
], |
|
"max_steps": 700, |
|
"num_train_epochs": 100, |
|
"total_flos": 9.822732861444276e+18, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|