{ "best_metric": 0.5470190644264221, "best_model_checkpoint": "wav2vec2-large-xlsr-coraa-exp-10/checkpoint-1764", "epoch": 146.0, "global_step": 2044, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.07, "learning_rate": 3e-05, "loss": 37.9224, "step": 1 }, { "epoch": 1.0, "eval_cer": 0.9618198362147407, "eval_loss": 24.657764434814453, "eval_runtime": 53.8844, "eval_samples_per_second": 10.059, "eval_steps_per_second": 1.262, "eval_wer": 1.0, "step": 14 }, { "epoch": 2.0, "eval_cer": 0.9618562329390354, "eval_loss": 7.14532470703125, "eval_runtime": 53.624, "eval_samples_per_second": 10.107, "eval_steps_per_second": 1.268, "eval_wer": 1.0, "step": 28 }, { "epoch": 3.0, "eval_cer": 0.9618562329390354, "eval_loss": 4.43905782699585, "eval_runtime": 53.4498, "eval_samples_per_second": 10.14, "eval_steps_per_second": 1.272, "eval_wer": 1.0, "step": 42 }, { "epoch": 4.0, "eval_cer": 0.9618562329390354, "eval_loss": 3.90922474861145, "eval_runtime": 53.742, "eval_samples_per_second": 10.085, "eval_steps_per_second": 1.265, "eval_wer": 1.0, "step": 56 }, { "epoch": 5.0, "eval_cer": 0.9618562329390354, "eval_loss": 3.6834604740142822, "eval_runtime": 53.6572, "eval_samples_per_second": 10.101, "eval_steps_per_second": 1.267, "eval_wer": 1.0, "step": 70 }, { "epoch": 6.0, "eval_cer": 0.9618562329390354, "eval_loss": 3.522313117980957, "eval_runtime": 53.7448, "eval_samples_per_second": 10.085, "eval_steps_per_second": 1.265, "eval_wer": 1.0, "step": 84 }, { "epoch": 7.0, "eval_cer": 0.9618562329390354, "eval_loss": 3.3716423511505127, "eval_runtime": 53.5358, "eval_samples_per_second": 10.124, "eval_steps_per_second": 1.27, "eval_wer": 1.0, "step": 98 }, { "epoch": 7.14, "learning_rate": 2.8614285714285714e-05, "loss": 9.0651, "step": 100 }, { "epoch": 8.0, "eval_cer": 0.9618562329390354, "eval_loss": 3.2723329067230225, "eval_runtime": 53.6095, "eval_samples_per_second": 10.11, "eval_steps_per_second": 1.268, "eval_wer": 1.0, "step": 112 }, { "epoch": 9.0, "eval_cer": 0.9618562329390354, "eval_loss": 3.1859705448150635, "eval_runtime": 53.5878, "eval_samples_per_second": 10.114, "eval_steps_per_second": 1.269, "eval_wer": 1.0, "step": 126 }, { "epoch": 10.0, "eval_cer": 0.9618562329390354, "eval_loss": 3.146104574203491, "eval_runtime": 53.491, "eval_samples_per_second": 10.133, "eval_steps_per_second": 1.271, "eval_wer": 1.0, "step": 140 }, { "epoch": 11.0, "eval_cer": 0.9618562329390354, "eval_loss": 3.1367859840393066, "eval_runtime": 53.9341, "eval_samples_per_second": 10.049, "eval_steps_per_second": 1.261, "eval_wer": 1.0, "step": 154 }, { "epoch": 12.0, "eval_cer": 0.9618562329390354, "eval_loss": 3.0960755348205566, "eval_runtime": 53.5674, "eval_samples_per_second": 10.118, "eval_steps_per_second": 1.269, "eval_wer": 1.0, "step": 168 }, { "epoch": 13.0, "eval_cer": 0.9618562329390354, "eval_loss": 3.0767099857330322, "eval_runtime": 53.6269, "eval_samples_per_second": 10.107, "eval_steps_per_second": 1.268, "eval_wer": 1.0, "step": 182 }, { "epoch": 14.0, "eval_cer": 0.9618562329390354, "eval_loss": 3.0509135723114014, "eval_runtime": 53.9364, "eval_samples_per_second": 10.049, "eval_steps_per_second": 1.261, "eval_wer": 1.0, "step": 196 }, { "epoch": 14.29, "learning_rate": 2.7185714285714287e-05, "loss": 3.0601, "step": 200 }, { "epoch": 15.0, "eval_cer": 0.9618562329390354, "eval_loss": 3.087069511413574, "eval_runtime": 53.3522, "eval_samples_per_second": 10.159, "eval_steps_per_second": 1.275, "eval_wer": 1.0, "step": 210 }, { "epoch": 16.0, "eval_cer": 0.9618562329390354, "eval_loss": 3.041494131088257, "eval_runtime": 53.2391, "eval_samples_per_second": 10.18, "eval_steps_per_second": 1.277, "eval_wer": 1.0, "step": 224 }, { "epoch": 17.0, "eval_cer": 0.9618562329390354, "eval_loss": 3.0329771041870117, "eval_runtime": 53.3109, "eval_samples_per_second": 10.167, "eval_steps_per_second": 1.276, "eval_wer": 1.0, "step": 238 }, { "epoch": 18.0, "eval_cer": 0.9618562329390354, "eval_loss": 3.019200086593628, "eval_runtime": 53.38, "eval_samples_per_second": 10.154, "eval_steps_per_second": 1.274, "eval_wer": 1.0, "step": 252 }, { "epoch": 19.0, "eval_cer": 0.9618562329390354, "eval_loss": 3.026556968688965, "eval_runtime": 53.4357, "eval_samples_per_second": 10.143, "eval_steps_per_second": 1.273, "eval_wer": 1.0, "step": 266 }, { "epoch": 20.0, "eval_cer": 0.9618562329390354, "eval_loss": 3.024301528930664, "eval_runtime": 53.5352, "eval_samples_per_second": 10.124, "eval_steps_per_second": 1.27, "eval_wer": 1.0, "step": 280 }, { "epoch": 21.0, "eval_cer": 0.9618562329390354, "eval_loss": 3.0105724334716797, "eval_runtime": 53.4874, "eval_samples_per_second": 10.133, "eval_steps_per_second": 1.271, "eval_wer": 1.0, "step": 294 }, { "epoch": 21.43, "learning_rate": 2.5757142857142857e-05, "loss": 2.9552, "step": 300 }, { "epoch": 22.0, "eval_cer": 0.9618562329390354, "eval_loss": 3.0053164958953857, "eval_runtime": 53.5107, "eval_samples_per_second": 10.129, "eval_steps_per_second": 1.271, "eval_wer": 1.0, "step": 308 }, { "epoch": 23.0, "eval_cer": 0.9618562329390354, "eval_loss": 2.9986302852630615, "eval_runtime": 53.679, "eval_samples_per_second": 10.097, "eval_steps_per_second": 1.267, "eval_wer": 1.0, "step": 322 }, { "epoch": 24.0, "eval_cer": 0.9618562329390354, "eval_loss": 3.0029869079589844, "eval_runtime": 54.0064, "eval_samples_per_second": 10.036, "eval_steps_per_second": 1.259, "eval_wer": 1.0, "step": 336 }, { "epoch": 25.0, "eval_cer": 0.9618562329390354, "eval_loss": 2.99497389793396, "eval_runtime": 53.5494, "eval_samples_per_second": 10.122, "eval_steps_per_second": 1.27, "eval_wer": 1.0, "step": 350 }, { "epoch": 26.0, "eval_cer": 0.9618562329390354, "eval_loss": 3.0058376789093018, "eval_runtime": 53.3418, "eval_samples_per_second": 10.161, "eval_steps_per_second": 1.275, "eval_wer": 1.0, "step": 364 }, { "epoch": 27.0, "eval_cer": 0.9618562329390354, "eval_loss": 2.9943442344665527, "eval_runtime": 53.5262, "eval_samples_per_second": 10.126, "eval_steps_per_second": 1.27, "eval_wer": 1.0, "step": 378 }, { "epoch": 28.0, "eval_cer": 0.9618562329390354, "eval_loss": 2.9845216274261475, "eval_runtime": 53.6167, "eval_samples_per_second": 10.109, "eval_steps_per_second": 1.268, "eval_wer": 1.0, "step": 392 }, { "epoch": 28.57, "learning_rate": 2.432857142857143e-05, "loss": 2.9213, "step": 400 }, { "epoch": 29.0, "eval_cer": 0.9618562329390354, "eval_loss": 2.971311330795288, "eval_runtime": 53.7132, "eval_samples_per_second": 10.091, "eval_steps_per_second": 1.266, "eval_wer": 1.0, "step": 406 }, { "epoch": 30.0, "eval_cer": 0.9618562329390354, "eval_loss": 2.9484527111053467, "eval_runtime": 53.7813, "eval_samples_per_second": 10.078, "eval_steps_per_second": 1.264, "eval_wer": 1.0, "step": 420 }, { "epoch": 31.0, "eval_cer": 0.9618562329390354, "eval_loss": 2.941479206085205, "eval_runtime": 53.6932, "eval_samples_per_second": 10.094, "eval_steps_per_second": 1.266, "eval_wer": 1.0, "step": 434 }, { "epoch": 32.0, "eval_cer": 0.9618562329390354, "eval_loss": 2.8912880420684814, "eval_runtime": 53.8504, "eval_samples_per_second": 10.065, "eval_steps_per_second": 1.263, "eval_wer": 1.0, "step": 448 }, { "epoch": 33.0, "eval_cer": 0.9612010919017289, "eval_loss": 2.8057382106781006, "eval_runtime": 54.0302, "eval_samples_per_second": 10.031, "eval_steps_per_second": 1.259, "eval_wer": 1.0, "step": 462 }, { "epoch": 34.0, "eval_cer": 0.9598908098271156, "eval_loss": 2.698427438735962, "eval_runtime": 53.7576, "eval_samples_per_second": 10.082, "eval_steps_per_second": 1.265, "eval_wer": 1.0, "step": 476 }, { "epoch": 35.0, "eval_cer": 0.9066787989080982, "eval_loss": 2.57851243019104, "eval_runtime": 53.7653, "eval_samples_per_second": 10.081, "eval_steps_per_second": 1.265, "eval_wer": 1.0, "step": 490 }, { "epoch": 35.71, "learning_rate": 2.29e-05, "loss": 2.7804, "step": 500 }, { "epoch": 36.0, "eval_cer": 0.7928662420382165, "eval_loss": 2.3545000553131104, "eval_runtime": 53.7523, "eval_samples_per_second": 10.083, "eval_steps_per_second": 1.265, "eval_wer": 1.0, "step": 504 }, { "epoch": 37.0, "eval_cer": 0.5933030027297543, "eval_loss": 2.0432868003845215, "eval_runtime": 53.6932, "eval_samples_per_second": 10.094, "eval_steps_per_second": 1.266, "eval_wer": 1.0, "step": 518 }, { "epoch": 38.0, "eval_cer": 0.4701000909918107, "eval_loss": 1.7438023090362549, "eval_runtime": 53.7889, "eval_samples_per_second": 10.076, "eval_steps_per_second": 1.264, "eval_wer": 1.0, "step": 532 }, { "epoch": 39.0, "eval_cer": 0.4139399454049136, "eval_loss": 1.4659055471420288, "eval_runtime": 53.7237, "eval_samples_per_second": 10.089, "eval_steps_per_second": 1.266, "eval_wer": 1.0, "step": 546 }, { "epoch": 40.0, "eval_cer": 0.3840218380345769, "eval_loss": 1.2873483896255493, "eval_runtime": 53.8213, "eval_samples_per_second": 10.07, "eval_steps_per_second": 1.263, "eval_wer": 0.9928890694839496, "step": 560 }, { "epoch": 41.0, "eval_cer": 0.3386715195632393, "eval_loss": 1.1587954759597778, "eval_runtime": 53.6935, "eval_samples_per_second": 10.094, "eval_steps_per_second": 1.266, "eval_wer": 0.9315318976026006, "step": 574 }, { "epoch": 42.0, "eval_cer": 0.2705732484076433, "eval_loss": 1.016275405883789, "eval_runtime": 53.8774, "eval_samples_per_second": 10.06, "eval_steps_per_second": 1.262, "eval_wer": 0.7395367736692402, "step": 588 }, { "epoch": 42.86, "learning_rate": 2.1471428571428574e-05, "loss": 1.6517, "step": 600 }, { "epoch": 43.0, "eval_cer": 0.22584167424931756, "eval_loss": 0.9398883581161499, "eval_runtime": 53.8756, "eval_samples_per_second": 10.06, "eval_steps_per_second": 1.262, "eval_wer": 0.5331166192604633, "step": 602 }, { "epoch": 44.0, "eval_cer": 0.21670609645131939, "eval_loss": 0.91312175989151, "eval_runtime": 53.9097, "eval_samples_per_second": 10.054, "eval_steps_per_second": 1.261, "eval_wer": 0.4928890694839496, "step": 616 }, { "epoch": 45.0, "eval_cer": 0.2113557779799818, "eval_loss": 0.8351526856422424, "eval_runtime": 54.2652, "eval_samples_per_second": 9.988, "eval_steps_per_second": 1.253, "eval_wer": 0.477041852905323, "step": 630 }, { "epoch": 46.0, "eval_cer": 0.2083712465878071, "eval_loss": 0.8114636540412903, "eval_runtime": 53.8109, "eval_samples_per_second": 10.072, "eval_steps_per_second": 1.264, "eval_wer": 0.45550589191385615, "step": 644 }, { "epoch": 47.0, "eval_cer": 0.2037852593266606, "eval_loss": 0.78495192527771, "eval_runtime": 53.8458, "eval_samples_per_second": 10.066, "eval_steps_per_second": 1.263, "eval_wer": 0.4402681836651768, "step": 658 }, { "epoch": 48.0, "eval_cer": 0.2018926296633303, "eval_loss": 0.757414698600769, "eval_runtime": 53.866, "eval_samples_per_second": 10.062, "eval_steps_per_second": 1.262, "eval_wer": 0.4355952864689151, "step": 672 }, { "epoch": 49.0, "eval_cer": 0.1989080982711556, "eval_loss": 0.723770022392273, "eval_runtime": 54.4837, "eval_samples_per_second": 9.948, "eval_steps_per_second": 1.248, "eval_wer": 0.42482730597318163, "step": 686 }, { "epoch": 50.0, "learning_rate": 2.004285714285714e-05, "loss": 0.7966, "step": 700 }, { "epoch": 50.0, "eval_cer": 0.19603275705186532, "eval_loss": 0.7132200002670288, "eval_runtime": 53.8591, "eval_samples_per_second": 10.063, "eval_steps_per_second": 1.263, "eval_wer": 0.41304347826086957, "step": 700 }, { "epoch": 51.0, "eval_cer": 0.19628753412192904, "eval_loss": 0.7053857445716858, "eval_runtime": 53.8356, "eval_samples_per_second": 10.068, "eval_steps_per_second": 1.263, "eval_wer": 0.41284030881755385, "step": 714 }, { "epoch": 52.0, "eval_cer": 0.19898089171974523, "eval_loss": 0.7119351029396057, "eval_runtime": 53.6949, "eval_samples_per_second": 10.094, "eval_steps_per_second": 1.266, "eval_wer": 0.413449817147501, "step": 728 }, { "epoch": 53.0, "eval_cer": 0.19450409463148316, "eval_loss": 0.6792961955070496, "eval_runtime": 53.7823, "eval_samples_per_second": 10.078, "eval_steps_per_second": 1.264, "eval_wer": 0.3990247866720845, "step": 742 }, { "epoch": 54.0, "eval_cer": 0.19319381255686988, "eval_loss": 0.6717870235443115, "eval_runtime": 53.6919, "eval_samples_per_second": 10.095, "eval_steps_per_second": 1.266, "eval_wer": 0.39435188947582284, "step": 756 }, { "epoch": 55.0, "eval_cer": 0.19494085532302094, "eval_loss": 0.6717579960823059, "eval_runtime": 53.8881, "eval_samples_per_second": 10.058, "eval_steps_per_second": 1.262, "eval_wer": 0.4012596505485575, "step": 770 }, { "epoch": 56.0, "eval_cer": 0.19654231119199272, "eval_loss": 0.6830848455429077, "eval_runtime": 54.2951, "eval_samples_per_second": 9.982, "eval_steps_per_second": 1.252, "eval_wer": 0.3976026005688744, "step": 784 }, { "epoch": 57.0, "eval_cer": 0.1916287534121929, "eval_loss": 0.6400262117385864, "eval_runtime": 53.8725, "eval_samples_per_second": 10.061, "eval_steps_per_second": 1.262, "eval_wer": 0.38703778951645673, "step": 798 }, { "epoch": 57.14, "learning_rate": 1.8614285714285715e-05, "loss": 0.5799, "step": 800 }, { "epoch": 58.0, "eval_cer": 0.19060964513193812, "eval_loss": 0.642275869846344, "eval_runtime": 53.5527, "eval_samples_per_second": 10.121, "eval_steps_per_second": 1.27, "eval_wer": 0.3843965867533523, "step": 812 }, { "epoch": 59.0, "eval_cer": 0.19075523202911737, "eval_loss": 0.6394357681274414, "eval_runtime": 54.0972, "eval_samples_per_second": 10.019, "eval_steps_per_second": 1.257, "eval_wer": 0.38338073953677365, "step": 826 }, { "epoch": 60.0, "eval_cer": 0.1924294813466788, "eval_loss": 0.6573936939239502, "eval_runtime": 53.9836, "eval_samples_per_second": 10.04, "eval_steps_per_second": 1.26, "eval_wer": 0.37850467289719625, "step": 840 }, { "epoch": 61.0, "eval_cer": 0.19181073703366697, "eval_loss": 0.6321007013320923, "eval_runtime": 53.881, "eval_samples_per_second": 10.059, "eval_steps_per_second": 1.262, "eval_wer": 0.38155221454693217, "step": 854 }, { "epoch": 62.0, "eval_cer": 0.19126478616924478, "eval_loss": 0.63057541847229, "eval_runtime": 53.9032, "eval_samples_per_second": 10.055, "eval_steps_per_second": 1.262, "eval_wer": 0.38013002844372207, "step": 868 }, { "epoch": 63.0, "eval_cer": 0.1915923566878981, "eval_loss": 0.6432803869247437, "eval_runtime": 53.9619, "eval_samples_per_second": 10.044, "eval_steps_per_second": 1.26, "eval_wer": 0.37992685900040635, "step": 882 }, { "epoch": 64.0, "eval_cer": 0.18955414012738853, "eval_loss": 0.6342417001724243, "eval_runtime": 53.7595, "eval_samples_per_second": 10.082, "eval_steps_per_second": 1.265, "eval_wer": 0.38114587566030067, "step": 896 }, { "epoch": 64.29, "learning_rate": 1.7185714285714285e-05, "loss": 0.445, "step": 900 }, { "epoch": 65.0, "eval_cer": 0.19042766151046406, "eval_loss": 0.6211907267570496, "eval_runtime": 53.9351, "eval_samples_per_second": 10.049, "eval_steps_per_second": 1.261, "eval_wer": 0.38114587566030067, "step": 910 }, { "epoch": 66.0, "eval_cer": 0.1894813466787989, "eval_loss": 0.6164088249206543, "eval_runtime": 53.6257, "eval_samples_per_second": 10.107, "eval_steps_per_second": 1.268, "eval_wer": 0.3789110117838277, "step": 924 }, { "epoch": 67.0, "eval_cer": 0.18715195632393083, "eval_loss": 0.6005796194076538, "eval_runtime": 53.6712, "eval_samples_per_second": 10.099, "eval_steps_per_second": 1.267, "eval_wer": 0.3732222673709874, "step": 938 }, { "epoch": 68.0, "eval_cer": 0.18911737943585077, "eval_loss": 0.6054388880729675, "eval_runtime": 53.6435, "eval_samples_per_second": 10.104, "eval_steps_per_second": 1.268, "eval_wer": 0.3746444534741975, "step": 952 }, { "epoch": 69.0, "eval_cer": 0.18940855323020928, "eval_loss": 0.6244754791259766, "eval_runtime": 53.8541, "eval_samples_per_second": 10.064, "eval_steps_per_second": 1.263, "eval_wer": 0.3722064201544088, "step": 966 }, { "epoch": 70.0, "eval_cer": 0.1878070973612375, "eval_loss": 0.6090296506881714, "eval_runtime": 53.9168, "eval_samples_per_second": 10.053, "eval_steps_per_second": 1.261, "eval_wer": 0.36875253961804144, "step": 980 }, { "epoch": 71.0, "eval_cer": 0.18758871701546861, "eval_loss": 0.6072561144828796, "eval_runtime": 53.6209, "eval_samples_per_second": 10.108, "eval_steps_per_second": 1.268, "eval_wer": 0.3669240146281999, "step": 994 }, { "epoch": 71.43, "learning_rate": 1.5757142857142858e-05, "loss": 0.3746, "step": 1000 }, { "epoch": 72.0, "eval_cer": 0.18886260236578709, "eval_loss": 0.5989311337471008, "eval_runtime": 53.765, "eval_samples_per_second": 10.081, "eval_steps_per_second": 1.265, "eval_wer": 0.3707842340511987, "step": 1008 }, { "epoch": 73.0, "eval_cer": 0.18744313011828936, "eval_loss": 0.5967620611190796, "eval_runtime": 53.6159, "eval_samples_per_second": 10.109, "eval_steps_per_second": 1.268, "eval_wer": 0.3681430312880943, "step": 1022 }, { "epoch": 74.0, "eval_cer": 0.1870427661510464, "eval_loss": 0.5945658683776855, "eval_runtime": 53.8501, "eval_samples_per_second": 10.065, "eval_steps_per_second": 1.263, "eval_wer": 0.3659081674116213, "step": 1036 }, { "epoch": 75.0, "eval_cer": 0.18638762511373977, "eval_loss": 0.5873651504516602, "eval_runtime": 53.5608, "eval_samples_per_second": 10.119, "eval_steps_per_second": 1.27, "eval_wer": 0.3622511174319382, "step": 1050 }, { "epoch": 76.0, "eval_cer": 0.1870427661510464, "eval_loss": 0.5927525758743286, "eval_runtime": 53.7753, "eval_samples_per_second": 10.079, "eval_steps_per_second": 1.265, "eval_wer": 0.36387647297846404, "step": 1064 }, { "epoch": 77.0, "eval_cer": 0.18824385805277524, "eval_loss": 0.5889000296592712, "eval_runtime": 53.8481, "eval_samples_per_second": 10.065, "eval_steps_per_second": 1.263, "eval_wer": 0.3681430312880943, "step": 1078 }, { "epoch": 78.0, "eval_cer": 0.18635122838944496, "eval_loss": 0.5722672343254089, "eval_runtime": 53.9948, "eval_samples_per_second": 10.038, "eval_steps_per_second": 1.259, "eval_wer": 0.36834620073141, "step": 1092 }, { "epoch": 78.57, "learning_rate": 1.4328571428571428e-05, "loss": 0.3543, "step": 1100 }, { "epoch": 79.0, "eval_cer": 0.18627843494085533, "eval_loss": 0.5927807688713074, "eval_runtime": 53.7175, "eval_samples_per_second": 10.09, "eval_steps_per_second": 1.266, "eval_wer": 0.3657049979683056, "step": 1106 }, { "epoch": 80.0, "eval_cer": 0.18547770700636942, "eval_loss": 0.583193838596344, "eval_runtime": 53.7886, "eval_samples_per_second": 10.076, "eval_steps_per_second": 1.264, "eval_wer": 0.36489232019504264, "step": 1120 }, { "epoch": 81.0, "eval_cer": 0.18493175614194723, "eval_loss": 0.5785495638847351, "eval_runtime": 53.8447, "eval_samples_per_second": 10.066, "eval_steps_per_second": 1.263, "eval_wer": 0.3644859813084112, "step": 1134 }, { "epoch": 82.0, "eval_cer": 0.18424021838034577, "eval_loss": 0.5877463817596436, "eval_runtime": 53.7471, "eval_samples_per_second": 10.084, "eval_steps_per_second": 1.265, "eval_wer": 0.35798455912230803, "step": 1148 }, { "epoch": 83.0, "eval_cer": 0.18525932666060055, "eval_loss": 0.5869647860527039, "eval_runtime": 53.8204, "eval_samples_per_second": 10.071, "eval_steps_per_second": 1.263, "eval_wer": 0.36265745631856966, "step": 1162 }, { "epoch": 84.0, "eval_cer": 0.18456778889899908, "eval_loss": 0.5738150477409363, "eval_runtime": 53.9516, "eval_samples_per_second": 10.046, "eval_steps_per_second": 1.26, "eval_wer": 0.3618447785453068, "step": 1176 }, { "epoch": 85.0, "eval_cer": 0.18158325750682439, "eval_loss": 0.5640825033187866, "eval_runtime": 53.9077, "eval_samples_per_second": 10.054, "eval_steps_per_second": 1.261, "eval_wer": 0.35757822023567654, "step": 1190 }, { "epoch": 85.71, "learning_rate": 1.29e-05, "loss": 0.3207, "step": 1200 }, { "epoch": 86.0, "eval_cer": 0.18209281164695176, "eval_loss": 0.5727854371070862, "eval_runtime": 54.0413, "eval_samples_per_second": 10.029, "eval_steps_per_second": 1.258, "eval_wer": 0.35656237301909793, "step": 1204 }, { "epoch": 87.0, "eval_cer": 0.18169244767970882, "eval_loss": 0.5706486105918884, "eval_runtime": 54.0703, "eval_samples_per_second": 10.024, "eval_steps_per_second": 1.258, "eval_wer": 0.35595286468915077, "step": 1218 }, { "epoch": 88.0, "eval_cer": 0.1813284804367607, "eval_loss": 0.5607408881187439, "eval_runtime": 54.3555, "eval_samples_per_second": 9.971, "eval_steps_per_second": 1.251, "eval_wer": 0.3569687119057294, "step": 1232 }, { "epoch": 89.0, "eval_cer": 0.181656050955414, "eval_loss": 0.56435227394104, "eval_runtime": 53.7806, "eval_samples_per_second": 10.078, "eval_steps_per_second": 1.264, "eval_wer": 0.35574969524583505, "step": 1246 }, { "epoch": 90.0, "eval_cer": 0.1824203821656051, "eval_loss": 0.5659990310668945, "eval_runtime": 54.3449, "eval_samples_per_second": 9.973, "eval_steps_per_second": 1.251, "eval_wer": 0.35818772856562375, "step": 1260 }, { "epoch": 91.0, "eval_cer": 0.18285714285714286, "eval_loss": 0.5688397884368896, "eval_runtime": 53.7699, "eval_samples_per_second": 10.08, "eval_steps_per_second": 1.265, "eval_wer": 0.35656237301909793, "step": 1274 }, { "epoch": 92.0, "eval_cer": 0.18074613284804367, "eval_loss": 0.563470184803009, "eval_runtime": 54.0176, "eval_samples_per_second": 10.034, "eval_steps_per_second": 1.259, "eval_wer": 0.35412433969930923, "step": 1288 }, { "epoch": 92.86, "learning_rate": 1.1471428571428572e-05, "loss": 0.2984, "step": 1300 }, { "epoch": 93.0, "eval_cer": 0.1813648771610555, "eval_loss": 0.5662950277328491, "eval_runtime": 54.0264, "eval_samples_per_second": 10.032, "eval_steps_per_second": 1.259, "eval_wer": 0.35026412027631043, "step": 1302 }, { "epoch": 94.0, "eval_cer": 0.18074613284804367, "eval_loss": 0.5514569282531738, "eval_runtime": 53.9373, "eval_samples_per_second": 10.049, "eval_steps_per_second": 1.261, "eval_wer": 0.35432750914262495, "step": 1316 }, { "epoch": 95.0, "eval_cer": 0.1802729754322111, "eval_loss": 0.5563488602638245, "eval_runtime": 54.0134, "eval_samples_per_second": 10.035, "eval_steps_per_second": 1.259, "eval_wer": 0.35168630637952053, "step": 1330 }, { "epoch": 96.0, "eval_cer": 0.18089171974522292, "eval_loss": 0.5617594122886658, "eval_runtime": 54.0211, "eval_samples_per_second": 10.033, "eval_steps_per_second": 1.259, "eval_wer": 0.3508736286062576, "step": 1344 }, { "epoch": 97.0, "eval_cer": 0.18074613284804367, "eval_loss": 0.5554497838020325, "eval_runtime": 54.2071, "eval_samples_per_second": 9.999, "eval_steps_per_second": 1.254, "eval_wer": 0.35168630637952053, "step": 1358 }, { "epoch": 98.0, "eval_cer": 0.18092811646951773, "eval_loss": 0.5605758428573608, "eval_runtime": 53.9801, "eval_samples_per_second": 10.041, "eval_steps_per_second": 1.26, "eval_wer": 0.35290532303941485, "step": 1372 }, { "epoch": 99.0, "eval_cer": 0.1813284804367607, "eval_loss": 0.5596539974212646, "eval_runtime": 53.7711, "eval_samples_per_second": 10.08, "eval_steps_per_second": 1.265, "eval_wer": 0.35107679804957337, "step": 1386 }, { "epoch": 100.0, "learning_rate": 1.0042857142857144e-05, "loss": 0.2622, "step": 1400 }, { "epoch": 100.0, "eval_cer": 0.18121929026387626, "eval_loss": 0.5628100037574768, "eval_runtime": 53.9102, "eval_samples_per_second": 10.054, "eval_steps_per_second": 1.261, "eval_wer": 0.35046728971962615, "step": 1400 }, { "epoch": 101.0, "eval_cer": 0.17990900818926298, "eval_loss": 0.5564116835594177, "eval_runtime": 54.03, "eval_samples_per_second": 10.031, "eval_steps_per_second": 1.259, "eval_wer": 0.34945144250304755, "step": 1414 }, { "epoch": 102.0, "eval_cer": 0.18114649681528663, "eval_loss": 0.5625892877578735, "eval_runtime": 53.8963, "eval_samples_per_second": 10.056, "eval_steps_per_second": 1.262, "eval_wer": 0.3484355952864689, "step": 1428 }, { "epoch": 103.0, "eval_cer": 0.1799818016378526, "eval_loss": 0.5555956959724426, "eval_runtime": 54.0019, "eval_samples_per_second": 10.037, "eval_steps_per_second": 1.259, "eval_wer": 0.34701340918325885, "step": 1442 }, { "epoch": 104.0, "eval_cer": 0.1799454049135578, "eval_loss": 0.5602657198905945, "eval_runtime": 53.864, "eval_samples_per_second": 10.062, "eval_steps_per_second": 1.262, "eval_wer": 0.3464039008533117, "step": 1456 }, { "epoch": 105.0, "eval_cer": 0.17987261146496816, "eval_loss": 0.5570572018623352, "eval_runtime": 53.8761, "eval_samples_per_second": 10.06, "eval_steps_per_second": 1.262, "eval_wer": 0.34538805363673303, "step": 1470 }, { "epoch": 106.0, "eval_cer": 0.17990900818926298, "eval_loss": 0.5618259310722351, "eval_runtime": 53.8537, "eval_samples_per_second": 10.064, "eval_steps_per_second": 1.263, "eval_wer": 0.3466070702966274, "step": 1484 }, { "epoch": 107.0, "eval_cer": 0.17867151956323932, "eval_loss": 0.5518925786018372, "eval_runtime": 54.2003, "eval_samples_per_second": 10.0, "eval_steps_per_second": 1.255, "eval_wer": 0.343965867533523, "step": 1498 }, { "epoch": 107.14, "learning_rate": 8.614285714285714e-06, "loss": 0.2519, "step": 1500 }, { "epoch": 108.0, "eval_cer": 0.17903548680618744, "eval_loss": 0.5540814399719238, "eval_runtime": 53.903, "eval_samples_per_second": 10.055, "eval_steps_per_second": 1.262, "eval_wer": 0.343965867533523, "step": 1512 }, { "epoch": 109.0, "eval_cer": 0.17939945404913557, "eval_loss": 0.557438850402832, "eval_runtime": 54.7258, "eval_samples_per_second": 9.904, "eval_steps_per_second": 1.243, "eval_wer": 0.3464039008533117, "step": 1526 }, { "epoch": 110.0, "eval_cer": 0.18009099181073704, "eval_loss": 0.5590262413024902, "eval_runtime": 54.0902, "eval_samples_per_second": 10.02, "eval_steps_per_second": 1.257, "eval_wer": 0.34538805363673303, "step": 1540 }, { "epoch": 111.0, "eval_cer": 0.17958143767060963, "eval_loss": 0.5529592633247375, "eval_runtime": 53.9289, "eval_samples_per_second": 10.05, "eval_steps_per_second": 1.261, "eval_wer": 0.34477854530678587, "step": 1554 }, { "epoch": 112.0, "eval_cer": 0.1791810737033667, "eval_loss": 0.5500696301460266, "eval_runtime": 53.992, "eval_samples_per_second": 10.039, "eval_steps_per_second": 1.259, "eval_wer": 0.3437626980902072, "step": 1568 }, { "epoch": 113.0, "eval_cer": 0.17990900818926298, "eval_loss": 0.5595071911811829, "eval_runtime": 54.515, "eval_samples_per_second": 9.942, "eval_steps_per_second": 1.247, "eval_wer": 0.34477854530678587, "step": 1582 }, { "epoch": 114.0, "eval_cer": 0.18005459508644223, "eval_loss": 0.5535922646522522, "eval_runtime": 53.9067, "eval_samples_per_second": 10.054, "eval_steps_per_second": 1.261, "eval_wer": 0.34457537586347015, "step": 1596 }, { "epoch": 114.29, "learning_rate": 7.185714285714286e-06, "loss": 0.245, "step": 1600 }, { "epoch": 115.0, "eval_cer": 0.1788898999090082, "eval_loss": 0.5480047464370728, "eval_runtime": 53.9861, "eval_samples_per_second": 10.04, "eval_steps_per_second": 1.26, "eval_wer": 0.34315318976026005, "step": 1610 }, { "epoch": 116.0, "eval_cer": 0.17979981801637854, "eval_loss": 0.562286913394928, "eval_runtime": 53.656, "eval_samples_per_second": 10.101, "eval_steps_per_second": 1.267, "eval_wer": 0.34863876472978467, "step": 1624 }, { "epoch": 117.0, "eval_cer": 0.17903548680618744, "eval_loss": 0.549622118473053, "eval_runtime": 53.5772, "eval_samples_per_second": 10.116, "eval_steps_per_second": 1.269, "eval_wer": 0.3427468508736286, "step": 1638 }, { "epoch": 118.0, "eval_cer": 0.17885350318471338, "eval_loss": 0.5551720857620239, "eval_runtime": 53.9431, "eval_samples_per_second": 10.048, "eval_steps_per_second": 1.261, "eval_wer": 0.34213734254368144, "step": 1652 }, { "epoch": 119.0, "eval_cer": 0.17867151956323932, "eval_loss": 0.5557767152786255, "eval_runtime": 54.2974, "eval_samples_per_second": 9.982, "eval_steps_per_second": 1.252, "eval_wer": 0.3437626980902072, "step": 1666 }, { "epoch": 120.0, "eval_cer": 0.17834394904458598, "eval_loss": 0.552444338798523, "eval_runtime": 53.9105, "eval_samples_per_second": 10.054, "eval_steps_per_second": 1.261, "eval_wer": 0.3425436814303129, "step": 1680 }, { "epoch": 121.0, "eval_cer": 0.1785987261146497, "eval_loss": 0.5581905841827393, "eval_runtime": 53.9834, "eval_samples_per_second": 10.04, "eval_steps_per_second": 1.26, "eval_wer": 0.34213734254368144, "step": 1694 }, { "epoch": 121.43, "learning_rate": 5.7571428571428574e-06, "loss": 0.2322, "step": 1700 }, { "epoch": 122.0, "eval_cer": 0.17856232939035488, "eval_loss": 0.5533866286277771, "eval_runtime": 54.0755, "eval_samples_per_second": 10.023, "eval_steps_per_second": 1.258, "eval_wer": 0.3425436814303129, "step": 1708 }, { "epoch": 123.0, "eval_cer": 0.18012738853503185, "eval_loss": 0.5595676302909851, "eval_runtime": 53.7843, "eval_samples_per_second": 10.077, "eval_steps_per_second": 1.264, "eval_wer": 0.3464039008533117, "step": 1722 }, { "epoch": 124.0, "eval_cer": 0.17899909008189263, "eval_loss": 0.5486122369766235, "eval_runtime": 53.9909, "eval_samples_per_second": 10.039, "eval_steps_per_second": 1.259, "eval_wer": 0.34315318976026005, "step": 1736 }, { "epoch": 125.0, "eval_cer": 0.1792174704276615, "eval_loss": 0.5580961108207703, "eval_runtime": 53.9973, "eval_samples_per_second": 10.038, "eval_steps_per_second": 1.259, "eval_wer": 0.3425436814303129, "step": 1750 }, { "epoch": 126.0, "eval_cer": 0.17852593266606007, "eval_loss": 0.5470190644264221, "eval_runtime": 53.6657, "eval_samples_per_second": 10.1, "eval_steps_per_second": 1.267, "eval_wer": 0.34173100365705, "step": 1764 }, { "epoch": 127.0, "eval_cer": 0.17805277525022747, "eval_loss": 0.5543853640556335, "eval_runtime": 53.9507, "eval_samples_per_second": 10.046, "eval_steps_per_second": 1.26, "eval_wer": 0.3413246647704185, "step": 1778 }, { "epoch": 128.0, "eval_cer": 0.1780891719745223, "eval_loss": 0.5500943660736084, "eval_runtime": 53.7085, "eval_samples_per_second": 10.092, "eval_steps_per_second": 1.266, "eval_wer": 0.3435595286468915, "step": 1792 }, { "epoch": 128.57, "learning_rate": 4.328571428571429e-06, "loss": 0.2324, "step": 1800 }, { "epoch": 129.0, "eval_cer": 0.1781619654231119, "eval_loss": 0.5517907738685608, "eval_runtime": 54.1553, "eval_samples_per_second": 10.008, "eval_steps_per_second": 1.256, "eval_wer": 0.343965867533523, "step": 1806 }, { "epoch": 130.0, "eval_cer": 0.1775432211101001, "eval_loss": 0.551121711730957, "eval_runtime": 54.0869, "eval_samples_per_second": 10.021, "eval_steps_per_second": 1.257, "eval_wer": 0.3388866314506298, "step": 1820 }, { "epoch": 131.0, "eval_cer": 0.17823475887170154, "eval_loss": 0.5584121942520142, "eval_runtime": 54.0126, "eval_samples_per_second": 10.035, "eval_steps_per_second": 1.259, "eval_wer": 0.34173100365705, "step": 1834 }, { "epoch": 132.0, "eval_cer": 0.17747042766151047, "eval_loss": 0.549301028251648, "eval_runtime": 54.1977, "eval_samples_per_second": 10.0, "eval_steps_per_second": 1.255, "eval_wer": 0.33726127590410404, "step": 1848 }, { "epoch": 133.0, "eval_cer": 0.17768880800727935, "eval_loss": 0.5506242513656616, "eval_runtime": 54.3838, "eval_samples_per_second": 9.966, "eval_steps_per_second": 1.25, "eval_wer": 0.339496139780577, "step": 1862 }, { "epoch": 134.0, "eval_cer": 0.1781619654231119, "eval_loss": 0.5543136596679688, "eval_runtime": 53.8876, "eval_samples_per_second": 10.058, "eval_steps_per_second": 1.262, "eval_wer": 0.34091832588378707, "step": 1876 }, { "epoch": 135.0, "eval_cer": 0.17805277525022747, "eval_loss": 0.5588898062705994, "eval_runtime": 53.8452, "eval_samples_per_second": 10.066, "eval_steps_per_second": 1.263, "eval_wer": 0.33990247866720846, "step": 1890 }, { "epoch": 135.71, "learning_rate": 2.9e-06, "loss": 0.2077, "step": 1900 }, { "epoch": 136.0, "eval_cer": 0.17776160145586897, "eval_loss": 0.5555850267410278, "eval_runtime": 54.3429, "eval_samples_per_second": 9.974, "eval_steps_per_second": 1.251, "eval_wer": 0.3390898008939455, "step": 1904 }, { "epoch": 137.0, "eval_cer": 0.17779799818016379, "eval_loss": 0.5555258393287659, "eval_runtime": 53.6523, "eval_samples_per_second": 10.102, "eval_steps_per_second": 1.267, "eval_wer": 0.34071515644047135, "step": 1918 }, { "epoch": 138.0, "eval_cer": 0.17739763421292085, "eval_loss": 0.5501488447189331, "eval_runtime": 53.6556, "eval_samples_per_second": 10.101, "eval_steps_per_second": 1.267, "eval_wer": 0.3390898008939455, "step": 1932 }, { "epoch": 139.0, "eval_cer": 0.17721565059144678, "eval_loss": 0.5544245839118958, "eval_runtime": 54.0174, "eval_samples_per_second": 10.034, "eval_steps_per_second": 1.259, "eval_wer": 0.33746444534741976, "step": 1946 }, { "epoch": 140.0, "eval_cer": 0.17732484076433122, "eval_loss": 0.5553618669509888, "eval_runtime": 54.2475, "eval_samples_per_second": 9.991, "eval_steps_per_second": 1.254, "eval_wer": 0.3386834620073141, "step": 1960 }, { "epoch": 141.0, "eval_cer": 0.17721565059144678, "eval_loss": 0.5504088401794434, "eval_runtime": 54.07, "eval_samples_per_second": 10.024, "eval_steps_per_second": 1.258, "eval_wer": 0.3380739536773669, "step": 1974 }, { "epoch": 142.0, "eval_cer": 0.17699727024567788, "eval_loss": 0.5484427809715271, "eval_runtime": 54.0621, "eval_samples_per_second": 10.026, "eval_steps_per_second": 1.258, "eval_wer": 0.33827712312068264, "step": 1988 }, { "epoch": 142.86, "learning_rate": 1.4714285714285716e-06, "loss": 0.2089, "step": 2000 }, { "epoch": 143.0, "eval_cer": 0.17721565059144678, "eval_loss": 0.5519289374351501, "eval_runtime": 54.2165, "eval_samples_per_second": 9.997, "eval_steps_per_second": 1.254, "eval_wer": 0.33848029256399836, "step": 2002 }, { "epoch": 144.0, "eval_cer": 0.17721565059144678, "eval_loss": 0.5531746745109558, "eval_runtime": 54.0827, "eval_samples_per_second": 10.022, "eval_steps_per_second": 1.257, "eval_wer": 0.3390898008939455, "step": 2016 }, { "epoch": 145.0, "eval_cer": 0.17747042766151047, "eval_loss": 0.5529664158821106, "eval_runtime": 54.0306, "eval_samples_per_second": 10.031, "eval_steps_per_second": 1.259, "eval_wer": 0.33969930922389274, "step": 2030 }, { "epoch": 146.0, "eval_cer": 0.1775432211101001, "eval_loss": 0.5551361441612244, "eval_runtime": 54.0882, "eval_samples_per_second": 10.021, "eval_steps_per_second": 1.257, "eval_wer": 0.33969930922389274, "step": 2044 }, { "epoch": 146.0, "step": 2044, "total_flos": 1.8244410804942518e+19, "train_loss": 1.3513914437676595, "train_runtime": 31402.8433, "train_samples_per_second": 2.14, "train_steps_per_second": 0.067 } ], "max_steps": 2100, "num_train_epochs": 150, "total_flos": 1.8244410804942518e+19, "trial_name": null, "trial_params": null }