|
{ |
|
"best_metric": 8.99256706237793, |
|
"best_model_checkpoint": "wav2vec2-large-xlsr-coraa-exp-11/checkpoint-168", |
|
"epoch": 32.0, |
|
"global_step": 448, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.07, |
|
"learning_rate": 3e-05, |
|
"loss": 38.5161, |
|
"step": 1 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"eval_cer": 0.9510100090991811, |
|
"eval_loss": 34.24892807006836, |
|
"eval_runtime": 52.8709, |
|
"eval_samples_per_second": 10.251, |
|
"eval_steps_per_second": 1.286, |
|
"eval_wer": 1.0, |
|
"step": 14 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_cer": 0.9510464058234759, |
|
"eval_loss": 23.386924743652344, |
|
"eval_runtime": 52.734, |
|
"eval_samples_per_second": 10.278, |
|
"eval_steps_per_second": 1.289, |
|
"eval_wer": 1.0, |
|
"step": 28 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_cer": 0.9510464058234759, |
|
"eval_loss": 19.672130584716797, |
|
"eval_runtime": 53.3907, |
|
"eval_samples_per_second": 10.152, |
|
"eval_steps_per_second": 1.274, |
|
"eval_wer": 1.0, |
|
"step": 42 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_cer": 0.9510464058234759, |
|
"eval_loss": 18.373493194580078, |
|
"eval_runtime": 52.736, |
|
"eval_samples_per_second": 10.278, |
|
"eval_steps_per_second": 1.289, |
|
"eval_wer": 1.0, |
|
"step": 56 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_cer": 0.9495905368516834, |
|
"eval_loss": 17.55065155029297, |
|
"eval_runtime": 52.7319, |
|
"eval_samples_per_second": 10.278, |
|
"eval_steps_per_second": 1.29, |
|
"eval_wer": 1.0026412027631044, |
|
"step": 70 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"eval_cer": 0.9688080072793449, |
|
"eval_loss": 16.934043884277344, |
|
"eval_runtime": 52.6762, |
|
"eval_samples_per_second": 10.289, |
|
"eval_steps_per_second": 1.291, |
|
"eval_wer": 1.0737505079236083, |
|
"step": 84 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"eval_cer": 0.9511191992720656, |
|
"eval_loss": 17.322906494140625, |
|
"eval_runtime": 52.7337, |
|
"eval_samples_per_second": 10.278, |
|
"eval_steps_per_second": 1.289, |
|
"eval_wer": 1.0004063388866316, |
|
"step": 98 |
|
}, |
|
{ |
|
"epoch": 7.14, |
|
"learning_rate": 2.8614285714285714e-05, |
|
"loss": 17.5323, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_cer": 0.9313921747042766, |
|
"eval_loss": 16.459413528442383, |
|
"eval_runtime": 52.7143, |
|
"eval_samples_per_second": 10.282, |
|
"eval_steps_per_second": 1.29, |
|
"eval_wer": 1.0156440471353108, |
|
"step": 112 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"eval_cer": 0.935213830755232, |
|
"eval_loss": 12.445086479187012, |
|
"eval_runtime": 52.7004, |
|
"eval_samples_per_second": 10.285, |
|
"eval_steps_per_second": 1.29, |
|
"eval_wer": 1.0298659081674115, |
|
"step": 126 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"eval_cer": 0.9618562329390354, |
|
"eval_loss": 10.092220306396484, |
|
"eval_runtime": 52.7354, |
|
"eval_samples_per_second": 10.278, |
|
"eval_steps_per_second": 1.289, |
|
"eval_wer": 1.0, |
|
"step": 140 |
|
}, |
|
{ |
|
"epoch": 11.0, |
|
"eval_cer": 0.9617834394904459, |
|
"eval_loss": 9.518609046936035, |
|
"eval_runtime": 53.2311, |
|
"eval_samples_per_second": 10.182, |
|
"eval_steps_per_second": 1.277, |
|
"eval_wer": 0.9997968305566842, |
|
"step": 154 |
|
}, |
|
{ |
|
"epoch": 12.0, |
|
"eval_cer": 0.932302092811647, |
|
"eval_loss": 8.99256706237793, |
|
"eval_runtime": 52.6632, |
|
"eval_samples_per_second": 10.292, |
|
"eval_steps_per_second": 1.291, |
|
"eval_wer": 0.9865908167411621, |
|
"step": 168 |
|
}, |
|
{ |
|
"epoch": 13.0, |
|
"eval_cer": 0.9166515013648772, |
|
"eval_loss": 9.018474578857422, |
|
"eval_runtime": 52.7545, |
|
"eval_samples_per_second": 10.274, |
|
"eval_steps_per_second": 1.289, |
|
"eval_wer": 0.9839496139780577, |
|
"step": 182 |
|
}, |
|
{ |
|
"epoch": 14.0, |
|
"eval_cer": 0.9216378525932666, |
|
"eval_loss": 9.124226570129395, |
|
"eval_runtime": 53.3159, |
|
"eval_samples_per_second": 10.166, |
|
"eval_steps_per_second": 1.275, |
|
"eval_wer": 0.983746444534742, |
|
"step": 196 |
|
}, |
|
{ |
|
"epoch": 14.29, |
|
"learning_rate": 2.7185714285714287e-05, |
|
"loss": 6.6506, |
|
"step": 200 |
|
}, |
|
{ |
|
"epoch": 15.0, |
|
"eval_cer": 0.8844404003639672, |
|
"eval_loss": 9.050068855285645, |
|
"eval_runtime": 52.6837, |
|
"eval_samples_per_second": 10.288, |
|
"eval_steps_per_second": 1.291, |
|
"eval_wer": 0.9880130028443722, |
|
"step": 210 |
|
}, |
|
{ |
|
"epoch": 16.0, |
|
"eval_cer": 0.902238398544131, |
|
"eval_loss": 9.189239501953125, |
|
"eval_runtime": 52.7185, |
|
"eval_samples_per_second": 10.281, |
|
"eval_steps_per_second": 1.29, |
|
"eval_wer": 0.9776513612352702, |
|
"step": 224 |
|
}, |
|
{ |
|
"epoch": 17.0, |
|
"eval_cer": 0.8847315741583257, |
|
"eval_loss": 9.173331260681152, |
|
"eval_runtime": 52.733, |
|
"eval_samples_per_second": 10.278, |
|
"eval_steps_per_second": 1.29, |
|
"eval_wer": 0.9798862251117432, |
|
"step": 238 |
|
}, |
|
{ |
|
"epoch": 18.0, |
|
"eval_cer": 0.8733393994540491, |
|
"eval_loss": 9.303343772888184, |
|
"eval_runtime": 52.7609, |
|
"eval_samples_per_second": 10.273, |
|
"eval_steps_per_second": 1.289, |
|
"eval_wer": 0.9798862251117432, |
|
"step": 252 |
|
}, |
|
{ |
|
"epoch": 19.0, |
|
"eval_cer": 0.8989626933575978, |
|
"eval_loss": 9.28529167175293, |
|
"eval_runtime": 52.7177, |
|
"eval_samples_per_second": 10.281, |
|
"eval_steps_per_second": 1.29, |
|
"eval_wer": 0.9746038195855343, |
|
"step": 266 |
|
}, |
|
{ |
|
"epoch": 20.0, |
|
"eval_cer": 0.9086442220200182, |
|
"eval_loss": 9.438006401062012, |
|
"eval_runtime": 52.8014, |
|
"eval_samples_per_second": 10.265, |
|
"eval_steps_per_second": 1.288, |
|
"eval_wer": 0.9748069890288501, |
|
"step": 280 |
|
}, |
|
{ |
|
"epoch": 21.0, |
|
"eval_cer": 0.8900090991810737, |
|
"eval_loss": 9.513178825378418, |
|
"eval_runtime": 52.7023, |
|
"eval_samples_per_second": 10.284, |
|
"eval_steps_per_second": 1.29, |
|
"eval_wer": 0.9750101584721658, |
|
"step": 294 |
|
}, |
|
{ |
|
"epoch": 21.43, |
|
"learning_rate": 2.5757142857142857e-05, |
|
"loss": 3.6568, |
|
"step": 300 |
|
}, |
|
{ |
|
"epoch": 22.0, |
|
"eval_cer": 0.8811282984531392, |
|
"eval_loss": 9.6267728805542, |
|
"eval_runtime": 53.0646, |
|
"eval_samples_per_second": 10.214, |
|
"eval_steps_per_second": 1.281, |
|
"eval_wer": 0.9817147501015847, |
|
"step": 308 |
|
}, |
|
{ |
|
"epoch": 23.0, |
|
"eval_cer": 0.8846587807097361, |
|
"eval_loss": 9.698858261108398, |
|
"eval_runtime": 52.7263, |
|
"eval_samples_per_second": 10.28, |
|
"eval_steps_per_second": 1.29, |
|
"eval_wer": 1.0042665583096302, |
|
"step": 322 |
|
}, |
|
{ |
|
"epoch": 24.0, |
|
"eval_cer": 0.8963057324840764, |
|
"eval_loss": 9.611275672912598, |
|
"eval_runtime": 52.7167, |
|
"eval_samples_per_second": 10.281, |
|
"eval_steps_per_second": 1.29, |
|
"eval_wer": 0.9788703778951645, |
|
"step": 336 |
|
}, |
|
{ |
|
"epoch": 25.0, |
|
"eval_cer": 0.8923748862602365, |
|
"eval_loss": 9.794692039489746, |
|
"eval_runtime": 52.8702, |
|
"eval_samples_per_second": 10.252, |
|
"eval_steps_per_second": 1.286, |
|
"eval_wer": 0.980698902885006, |
|
"step": 350 |
|
}, |
|
{ |
|
"epoch": 26.0, |
|
"eval_cer": 0.8979435850773431, |
|
"eval_loss": 9.83806324005127, |
|
"eval_runtime": 52.7321, |
|
"eval_samples_per_second": 10.278, |
|
"eval_steps_per_second": 1.29, |
|
"eval_wer": 0.9794798862251117, |
|
"step": 364 |
|
}, |
|
{ |
|
"epoch": 27.0, |
|
"eval_cer": 0.8951774340309372, |
|
"eval_loss": 10.03061580657959, |
|
"eval_runtime": 52.6816, |
|
"eval_samples_per_second": 10.288, |
|
"eval_steps_per_second": 1.291, |
|
"eval_wer": 0.9788703778951645, |
|
"step": 378 |
|
}, |
|
{ |
|
"epoch": 28.0, |
|
"eval_cer": 0.8947042766151047, |
|
"eval_loss": 9.994989395141602, |
|
"eval_runtime": 53.3774, |
|
"eval_samples_per_second": 10.154, |
|
"eval_steps_per_second": 1.274, |
|
"eval_wer": 0.9792767167817961, |
|
"step": 392 |
|
}, |
|
{ |
|
"epoch": 28.57, |
|
"learning_rate": 2.432857142857143e-05, |
|
"loss": 3.316, |
|
"step": 400 |
|
}, |
|
{ |
|
"epoch": 29.0, |
|
"eval_cer": 0.8978707916287534, |
|
"eval_loss": 10.14880084991455, |
|
"eval_runtime": 52.6791, |
|
"eval_samples_per_second": 10.289, |
|
"eval_steps_per_second": 1.291, |
|
"eval_wer": 0.9780577001219016, |
|
"step": 406 |
|
}, |
|
{ |
|
"epoch": 30.0, |
|
"eval_cer": 0.9092265696087353, |
|
"eval_loss": 10.193445205688477, |
|
"eval_runtime": 52.6484, |
|
"eval_samples_per_second": 10.295, |
|
"eval_steps_per_second": 1.292, |
|
"eval_wer": 0.9809020723283218, |
|
"step": 420 |
|
}, |
|
{ |
|
"epoch": 31.0, |
|
"eval_cer": 0.9298999090081893, |
|
"eval_loss": 10.21463680267334, |
|
"eval_runtime": 52.7062, |
|
"eval_samples_per_second": 10.283, |
|
"eval_steps_per_second": 1.29, |
|
"eval_wer": 0.9880130028443722, |
|
"step": 434 |
|
}, |
|
{ |
|
"epoch": 32.0, |
|
"eval_cer": 0.9593084622383985, |
|
"eval_loss": 10.298548698425293, |
|
"eval_runtime": 52.7136, |
|
"eval_samples_per_second": 10.282, |
|
"eval_steps_per_second": 1.29, |
|
"eval_wer": 0.9997968305566842, |
|
"step": 448 |
|
}, |
|
{ |
|
"epoch": 32.0, |
|
"step": 448, |
|
"total_flos": 3.9986309695731635e+18, |
|
"train_loss": 7.336955785751343, |
|
"train_runtime": 6516.6943, |
|
"train_samples_per_second": 10.312, |
|
"train_steps_per_second": 0.322 |
|
} |
|
], |
|
"max_steps": 2100, |
|
"num_train_epochs": 150, |
|
"total_flos": 3.9986309695731635e+18, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|