{ "best_metric": 0.564974844455719, "best_model_checkpoint": "wav2vec2-large-xlsr-coraa-exp-12/checkpoint-1498", "epoch": 127.0, "global_step": 1778, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.07, "learning_rate": 3e-05, "loss": 37.6216, "step": 1 }, { "epoch": 1.0, "eval_cer": 0.9618562329390354, "eval_loss": 23.20707130432129, "eval_runtime": 53.2412, "eval_samples_per_second": 10.18, "eval_steps_per_second": 1.277, "eval_wer": 1.0, "step": 14 }, { "epoch": 2.0, "eval_cer": 0.9618562329390354, "eval_loss": 6.9366374015808105, "eval_runtime": 52.8966, "eval_samples_per_second": 10.246, "eval_steps_per_second": 1.286, "eval_wer": 1.0, "step": 28 }, { "epoch": 3.0, "eval_cer": 0.9618562329390354, "eval_loss": 4.42495059967041, "eval_runtime": 53.0892, "eval_samples_per_second": 10.209, "eval_steps_per_second": 1.281, "eval_wer": 1.0, "step": 42 }, { "epoch": 4.0, "eval_cer": 0.9618562329390354, "eval_loss": 3.915421962738037, "eval_runtime": 52.9638, "eval_samples_per_second": 10.233, "eval_steps_per_second": 1.284, "eval_wer": 1.0, "step": 56 }, { "epoch": 5.0, "eval_cer": 0.9618562329390354, "eval_loss": 3.684857130050659, "eval_runtime": 53.3885, "eval_samples_per_second": 10.152, "eval_steps_per_second": 1.274, "eval_wer": 1.0, "step": 70 }, { "epoch": 6.0, "eval_cer": 0.9618562329390354, "eval_loss": 3.52828049659729, "eval_runtime": 52.9774, "eval_samples_per_second": 10.231, "eval_steps_per_second": 1.284, "eval_wer": 1.0, "step": 84 }, { "epoch": 7.0, "eval_cer": 0.9618562329390354, "eval_loss": 3.371574640274048, "eval_runtime": 53.0413, "eval_samples_per_second": 10.218, "eval_steps_per_second": 1.282, "eval_wer": 1.0, "step": 98 }, { "epoch": 7.14, "learning_rate": 2.862857142857143e-05, "loss": 8.823, "step": 100 }, { "epoch": 8.0, "eval_cer": 0.9618562329390354, "eval_loss": 3.265662670135498, "eval_runtime": 52.9677, "eval_samples_per_second": 10.233, "eval_steps_per_second": 1.284, "eval_wer": 1.0, "step": 112 }, { "epoch": 9.0, "eval_cer": 0.9618562329390354, "eval_loss": 3.1796252727508545, "eval_runtime": 53.0173, "eval_samples_per_second": 10.223, "eval_steps_per_second": 1.283, "eval_wer": 1.0, "step": 126 }, { "epoch": 10.0, "eval_cer": 0.9618562329390354, "eval_loss": 3.156822919845581, "eval_runtime": 52.9813, "eval_samples_per_second": 10.23, "eval_steps_per_second": 1.283, "eval_wer": 1.0, "step": 140 }, { "epoch": 11.0, "eval_cer": 0.9618562329390354, "eval_loss": 3.1071083545684814, "eval_runtime": 52.9255, "eval_samples_per_second": 10.241, "eval_steps_per_second": 1.285, "eval_wer": 1.0, "step": 154 }, { "epoch": 12.0, "eval_cer": 0.9618562329390354, "eval_loss": 3.0891101360321045, "eval_runtime": 53.0174, "eval_samples_per_second": 10.223, "eval_steps_per_second": 1.283, "eval_wer": 1.0, "step": 168 }, { "epoch": 13.0, "eval_cer": 0.9618562329390354, "eval_loss": 3.058786153793335, "eval_runtime": 53.0158, "eval_samples_per_second": 10.223, "eval_steps_per_second": 1.283, "eval_wer": 1.0, "step": 182 }, { "epoch": 14.0, "eval_cer": 0.9618562329390354, "eval_loss": 3.042229175567627, "eval_runtime": 53.05, "eval_samples_per_second": 10.217, "eval_steps_per_second": 1.282, "eval_wer": 1.0, "step": 196 }, { "epoch": 14.29, "learning_rate": 2.72e-05, "loss": 3.0574, "step": 200 }, { "epoch": 15.0, "eval_cer": 0.9618562329390354, "eval_loss": 3.038764238357544, "eval_runtime": 52.9184, "eval_samples_per_second": 10.242, "eval_steps_per_second": 1.285, "eval_wer": 1.0, "step": 210 }, { "epoch": 16.0, "eval_cer": 0.9618562329390354, "eval_loss": 3.0324084758758545, "eval_runtime": 53.3043, "eval_samples_per_second": 10.168, "eval_steps_per_second": 1.276, "eval_wer": 1.0, "step": 224 }, { "epoch": 17.0, "eval_cer": 0.9618562329390354, "eval_loss": 3.025251865386963, "eval_runtime": 52.9716, "eval_samples_per_second": 10.232, "eval_steps_per_second": 1.284, "eval_wer": 1.0, "step": 238 }, { "epoch": 18.0, "eval_cer": 0.9618562329390354, "eval_loss": 3.010026454925537, "eval_runtime": 52.9941, "eval_samples_per_second": 10.228, "eval_steps_per_second": 1.283, "eval_wer": 1.0, "step": 252 }, { "epoch": 19.0, "eval_cer": 0.9618562329390354, "eval_loss": 3.0079331398010254, "eval_runtime": 52.9545, "eval_samples_per_second": 10.235, "eval_steps_per_second": 1.284, "eval_wer": 1.0, "step": 266 }, { "epoch": 20.0, "eval_cer": 0.9618562329390354, "eval_loss": 3.0150105953216553, "eval_runtime": 52.9312, "eval_samples_per_second": 10.24, "eval_steps_per_second": 1.285, "eval_wer": 1.0, "step": 280 }, { "epoch": 21.0, "eval_cer": 0.9618562329390354, "eval_loss": 3.0032567977905273, "eval_runtime": 52.9575, "eval_samples_per_second": 10.235, "eval_steps_per_second": 1.284, "eval_wer": 1.0, "step": 294 }, { "epoch": 21.43, "learning_rate": 2.5771428571428574e-05, "loss": 2.95, "step": 300 }, { "epoch": 22.0, "eval_cer": 0.9618562329390354, "eval_loss": 2.999887466430664, "eval_runtime": 52.9429, "eval_samples_per_second": 10.237, "eval_steps_per_second": 1.284, "eval_wer": 1.0, "step": 308 }, { "epoch": 23.0, "eval_cer": 0.9618562329390354, "eval_loss": 2.9940125942230225, "eval_runtime": 52.9557, "eval_samples_per_second": 10.235, "eval_steps_per_second": 1.284, "eval_wer": 1.0, "step": 322 }, { "epoch": 24.0, "eval_cer": 0.9618562329390354, "eval_loss": 2.9982004165649414, "eval_runtime": 53.3517, "eval_samples_per_second": 10.159, "eval_steps_per_second": 1.275, "eval_wer": 1.0, "step": 336 }, { "epoch": 25.0, "eval_cer": 0.9618562329390354, "eval_loss": 3.0212087631225586, "eval_runtime": 52.917, "eval_samples_per_second": 10.242, "eval_steps_per_second": 1.285, "eval_wer": 1.0, "step": 350 }, { "epoch": 26.0, "eval_cer": 0.9618562329390354, "eval_loss": 2.995063543319702, "eval_runtime": 52.9179, "eval_samples_per_second": 10.242, "eval_steps_per_second": 1.285, "eval_wer": 1.0, "step": 364 }, { "epoch": 27.0, "eval_cer": 0.9618562329390354, "eval_loss": 2.989276885986328, "eval_runtime": 52.9648, "eval_samples_per_second": 10.233, "eval_steps_per_second": 1.284, "eval_wer": 1.0, "step": 378 }, { "epoch": 28.0, "eval_cer": 0.9618562329390354, "eval_loss": 2.990724802017212, "eval_runtime": 52.9049, "eval_samples_per_second": 10.245, "eval_steps_per_second": 1.285, "eval_wer": 1.0, "step": 392 }, { "epoch": 28.57, "learning_rate": 2.434285714285714e-05, "loss": 2.9233, "step": 400 }, { "epoch": 29.0, "eval_cer": 0.9618562329390354, "eval_loss": 2.9889469146728516, "eval_runtime": 53.0796, "eval_samples_per_second": 10.211, "eval_steps_per_second": 1.281, "eval_wer": 1.0, "step": 406 }, { "epoch": 30.0, "eval_cer": 0.9618562329390354, "eval_loss": 2.9812769889831543, "eval_runtime": 53.0284, "eval_samples_per_second": 10.221, "eval_steps_per_second": 1.282, "eval_wer": 1.0, "step": 420 }, { "epoch": 31.0, "eval_cer": 0.9618562329390354, "eval_loss": 2.9795358180999756, "eval_runtime": 53.6697, "eval_samples_per_second": 10.099, "eval_steps_per_second": 1.267, "eval_wer": 1.0, "step": 434 }, { "epoch": 32.0, "eval_cer": 0.9618562329390354, "eval_loss": 2.9633467197418213, "eval_runtime": 53.1489, "eval_samples_per_second": 10.198, "eval_steps_per_second": 1.279, "eval_wer": 1.0, "step": 448 }, { "epoch": 33.0, "eval_cer": 0.9585441310282075, "eval_loss": 2.9652762413024902, "eval_runtime": 53.0687, "eval_samples_per_second": 10.213, "eval_steps_per_second": 1.281, "eval_wer": 1.0, "step": 462 }, { "epoch": 34.0, "eval_cer": 0.9618562329390354, "eval_loss": 2.9050323963165283, "eval_runtime": 53.1009, "eval_samples_per_second": 10.207, "eval_steps_per_second": 1.281, "eval_wer": 1.0, "step": 476 }, { "epoch": 35.0, "eval_cer": 0.9618562329390354, "eval_loss": 2.8805932998657227, "eval_runtime": 53.2017, "eval_samples_per_second": 10.188, "eval_steps_per_second": 1.278, "eval_wer": 1.0, "step": 490 }, { "epoch": 35.71, "learning_rate": 2.2914285714285714e-05, "loss": 2.8852, "step": 500 }, { "epoch": 36.0, "eval_cer": 0.9618562329390354, "eval_loss": 2.822971820831299, "eval_runtime": 53.1752, "eval_samples_per_second": 10.193, "eval_steps_per_second": 1.279, "eval_wer": 1.0, "step": 504 }, { "epoch": 37.0, "eval_cer": 0.9618562329390354, "eval_loss": 2.780466318130493, "eval_runtime": 53.2177, "eval_samples_per_second": 10.185, "eval_steps_per_second": 1.278, "eval_wer": 1.0, "step": 518 }, { "epoch": 38.0, "eval_cer": 0.9571974522292994, "eval_loss": 2.70436954498291, "eval_runtime": 53.1033, "eval_samples_per_second": 10.207, "eval_steps_per_second": 1.281, "eval_wer": 1.0, "step": 532 }, { "epoch": 39.0, "eval_cer": 0.9558507734303913, "eval_loss": 2.6560797691345215, "eval_runtime": 53.1469, "eval_samples_per_second": 10.198, "eval_steps_per_second": 1.279, "eval_wer": 1.0, "step": 546 }, { "epoch": 40.0, "eval_cer": 0.9254231119199272, "eval_loss": 2.547485828399658, "eval_runtime": 53.1445, "eval_samples_per_second": 10.199, "eval_steps_per_second": 1.28, "eval_wer": 1.0, "step": 560 }, { "epoch": 41.0, "eval_cer": 0.7458416742493176, "eval_loss": 2.333609104156494, "eval_runtime": 53.2579, "eval_samples_per_second": 10.177, "eval_steps_per_second": 1.277, "eval_wer": 1.0, "step": 574 }, { "epoch": 42.0, "eval_cer": 0.5467879890809827, "eval_loss": 2.069585084915161, "eval_runtime": 53.2259, "eval_samples_per_second": 10.183, "eval_steps_per_second": 1.278, "eval_wer": 1.0, "step": 588 }, { "epoch": 42.86, "learning_rate": 2.1485714285714284e-05, "loss": 2.5339, "step": 600 }, { "epoch": 43.0, "eval_cer": 0.49714285714285716, "eval_loss": 1.7759531736373901, "eval_runtime": 53.69, "eval_samples_per_second": 10.095, "eval_steps_per_second": 1.267, "eval_wer": 1.0, "step": 602 }, { "epoch": 44.0, "eval_cer": 0.4545950864422202, "eval_loss": 1.5432746410369873, "eval_runtime": 53.2888, "eval_samples_per_second": 10.171, "eval_steps_per_second": 1.276, "eval_wer": 1.0, "step": 616 }, { "epoch": 45.0, "eval_cer": 0.4066606005459509, "eval_loss": 1.352888584136963, "eval_runtime": 53.6434, "eval_samples_per_second": 10.104, "eval_steps_per_second": 1.268, "eval_wer": 1.0, "step": 630 }, { "epoch": 46.0, "eval_cer": 0.38340309372156506, "eval_loss": 1.214944839477539, "eval_runtime": 53.2877, "eval_samples_per_second": 10.171, "eval_steps_per_second": 1.276, "eval_wer": 0.9997968305566842, "step": 644 }, { "epoch": 47.0, "eval_cer": 0.35781619654231117, "eval_loss": 1.0925143957138062, "eval_runtime": 53.2174, "eval_samples_per_second": 10.185, "eval_steps_per_second": 1.278, "eval_wer": 0.9943112555871597, "step": 658 }, { "epoch": 48.0, "eval_cer": 0.3129390354868062, "eval_loss": 1.023630976676941, "eval_runtime": 53.2114, "eval_samples_per_second": 10.186, "eval_steps_per_second": 1.278, "eval_wer": 0.8953677366924014, "step": 672 }, { "epoch": 49.0, "eval_cer": 0.26227479526842584, "eval_loss": 0.9525313377380371, "eval_runtime": 53.2409, "eval_samples_per_second": 10.18, "eval_steps_per_second": 1.277, "eval_wer": 0.7062169849654611, "step": 686 }, { "epoch": 50.0, "learning_rate": 2.0057142857142858e-05, "loss": 1.3395, "step": 700 }, { "epoch": 50.0, "eval_cer": 0.22009099181073705, "eval_loss": 0.8921615481376648, "eval_runtime": 53.2916, "eval_samples_per_second": 10.17, "eval_steps_per_second": 1.276, "eval_wer": 0.5062982527427875, "step": 700 }, { "epoch": 51.0, "eval_cer": 0.21150136487716106, "eval_loss": 0.8068466782569885, "eval_runtime": 53.2081, "eval_samples_per_second": 10.186, "eval_steps_per_second": 1.278, "eval_wer": 0.47744819179195447, "step": 714 }, { "epoch": 52.0, "eval_cer": 0.20764331210191084, "eval_loss": 0.7931560277938843, "eval_runtime": 53.422, "eval_samples_per_second": 10.146, "eval_steps_per_second": 1.273, "eval_wer": 0.45530272247054043, "step": 728 }, { "epoch": 53.0, "eval_cer": 0.20658780709736124, "eval_loss": 0.7725641131401062, "eval_runtime": 53.3035, "eval_samples_per_second": 10.168, "eval_steps_per_second": 1.276, "eval_wer": 0.4453474197480699, "step": 742 }, { "epoch": 54.0, "eval_cer": 0.2026569608735214, "eval_loss": 0.755141019821167, "eval_runtime": 53.6653, "eval_samples_per_second": 10.1, "eval_steps_per_second": 1.267, "eval_wer": 0.4339699309223893, "step": 756 }, { "epoch": 55.0, "eval_cer": 0.20385805277525024, "eval_loss": 0.7420439720153809, "eval_runtime": 53.1999, "eval_samples_per_second": 10.188, "eval_steps_per_second": 1.278, "eval_wer": 0.4305160503860219, "step": 770 }, { "epoch": 56.0, "eval_cer": 0.2008371246587807, "eval_loss": 0.7146174311637878, "eval_runtime": 53.5808, "eval_samples_per_second": 10.116, "eval_steps_per_second": 1.269, "eval_wer": 0.42117025599349855, "step": 784 }, { "epoch": 57.0, "eval_cer": 0.195705186533212, "eval_loss": 0.6767785549163818, "eval_runtime": 53.1793, "eval_samples_per_second": 10.192, "eval_steps_per_second": 1.279, "eval_wer": 0.4095895977245022, "step": 798 }, { "epoch": 57.14, "learning_rate": 1.8628571428571428e-05, "loss": 0.7419, "step": 800 }, { "epoch": 58.0, "eval_cer": 0.1961783439490446, "eval_loss": 0.6767465472221375, "eval_runtime": 53.2804, "eval_samples_per_second": 10.173, "eval_steps_per_second": 1.276, "eval_wer": 0.40796424217797644, "step": 812 }, { "epoch": 59.0, "eval_cer": 0.19712465878070973, "eval_loss": 0.6708809733390808, "eval_runtime": 53.3292, "eval_samples_per_second": 10.163, "eval_steps_per_second": 1.275, "eval_wer": 0.4069483949613978, "step": 826 }, { "epoch": 60.0, "eval_cer": 0.19665150136487716, "eval_loss": 0.6790570020675659, "eval_runtime": 53.2448, "eval_samples_per_second": 10.179, "eval_steps_per_second": 1.277, "eval_wer": 0.4024786672084518, "step": 840 }, { "epoch": 61.0, "eval_cer": 0.19381255686988172, "eval_loss": 0.6560342311859131, "eval_runtime": 53.279, "eval_samples_per_second": 10.173, "eval_steps_per_second": 1.276, "eval_wer": 0.4028850060950833, "step": 854 }, { "epoch": 62.0, "eval_cer": 0.19392174704276616, "eval_loss": 0.6473817229270935, "eval_runtime": 53.2557, "eval_samples_per_second": 10.177, "eval_steps_per_second": 1.277, "eval_wer": 0.3976026005688744, "step": 868 }, { "epoch": 63.0, "eval_cer": 0.19414012738853503, "eval_loss": 0.6583911180496216, "eval_runtime": 53.2562, "eval_samples_per_second": 10.177, "eval_steps_per_second": 1.277, "eval_wer": 0.39821210889882164, "step": 882 }, { "epoch": 64.0, "eval_cer": 0.19381255686988172, "eval_loss": 0.6618856191635132, "eval_runtime": 53.4299, "eval_samples_per_second": 10.144, "eval_steps_per_second": 1.273, "eval_wer": 0.39597724502234866, "step": 896 }, { "epoch": 64.29, "learning_rate": 1.72e-05, "loss": 0.5254, "step": 900 }, { "epoch": 65.0, "eval_cer": 0.19363057324840766, "eval_loss": 0.6513723134994507, "eval_runtime": 53.2194, "eval_samples_per_second": 10.184, "eval_steps_per_second": 1.278, "eval_wer": 0.3923201950426656, "step": 910 }, { "epoch": 66.0, "eval_cer": 0.19148316651501365, "eval_loss": 0.6362853050231934, "eval_runtime": 53.25, "eval_samples_per_second": 10.178, "eval_steps_per_second": 1.277, "eval_wer": 0.3874441284030882, "step": 924 }, { "epoch": 67.0, "eval_cer": 0.19002729754322112, "eval_loss": 0.6173312067985535, "eval_runtime": 53.2465, "eval_samples_per_second": 10.179, "eval_steps_per_second": 1.277, "eval_wer": 0.3797236895570906, "step": 938 }, { "epoch": 68.0, "eval_cer": 0.19177434030937215, "eval_loss": 0.6283513307571411, "eval_runtime": 53.1947, "eval_samples_per_second": 10.189, "eval_steps_per_second": 1.278, "eval_wer": 0.38866314506298255, "step": 952 }, { "epoch": 69.0, "eval_cer": 0.18966333030027296, "eval_loss": 0.6152955293655396, "eval_runtime": 53.1902, "eval_samples_per_second": 10.19, "eval_steps_per_second": 1.278, "eval_wer": 0.3766761479073547, "step": 966 }, { "epoch": 70.0, "eval_cer": 0.18787989080982712, "eval_loss": 0.6083645820617676, "eval_runtime": 53.1965, "eval_samples_per_second": 10.189, "eval_steps_per_second": 1.278, "eval_wer": 0.37362860625761884, "step": 980 }, { "epoch": 71.0, "eval_cer": 0.1899909008189263, "eval_loss": 0.6196299195289612, "eval_runtime": 53.1375, "eval_samples_per_second": 10.2, "eval_steps_per_second": 1.28, "eval_wer": 0.3772856562373019, "step": 994 }, { "epoch": 71.43, "learning_rate": 1.577142857142857e-05, "loss": 0.4219, "step": 1000 }, { "epoch": 72.0, "eval_cer": 0.18988171064604187, "eval_loss": 0.6074672341346741, "eval_runtime": 53.2378, "eval_samples_per_second": 10.181, "eval_steps_per_second": 1.277, "eval_wer": 0.3730190979276717, "step": 1008 }, { "epoch": 73.0, "eval_cer": 0.1883894449499545, "eval_loss": 0.6016885042190552, "eval_runtime": 53.2097, "eval_samples_per_second": 10.186, "eval_steps_per_second": 1.278, "eval_wer": 0.37119057293783014, "step": 1022 }, { "epoch": 74.0, "eval_cer": 0.18722474977252046, "eval_loss": 0.5947157740592957, "eval_runtime": 53.1687, "eval_samples_per_second": 10.194, "eval_steps_per_second": 1.279, "eval_wer": 0.3693620479479886, "step": 1036 }, { "epoch": 75.0, "eval_cer": 0.1889353958143767, "eval_loss": 0.5974624752998352, "eval_runtime": 53.2006, "eval_samples_per_second": 10.188, "eval_steps_per_second": 1.278, "eval_wer": 0.3695652173913043, "step": 1050 }, { "epoch": 76.0, "eval_cer": 0.18868061874431302, "eval_loss": 0.6020309925079346, "eval_runtime": 53.2351, "eval_samples_per_second": 10.181, "eval_steps_per_second": 1.277, "eval_wer": 0.37281592848435596, "step": 1064 }, { "epoch": 77.0, "eval_cer": 0.1891537761601456, "eval_loss": 0.5994043946266174, "eval_runtime": 53.1703, "eval_samples_per_second": 10.194, "eval_steps_per_second": 1.279, "eval_wer": 0.37037789516456726, "step": 1078 }, { "epoch": 78.0, "eval_cer": 0.18773430391264787, "eval_loss": 0.5821866393089294, "eval_runtime": 53.6598, "eval_samples_per_second": 10.101, "eval_steps_per_second": 1.267, "eval_wer": 0.3715969118244616, "step": 1092 }, { "epoch": 78.57, "learning_rate": 1.4342857142857143e-05, "loss": 0.385, "step": 1100 }, { "epoch": 79.0, "eval_cer": 0.18929936305732484, "eval_loss": 0.6073063015937805, "eval_runtime": 53.2561, "eval_samples_per_second": 10.177, "eval_steps_per_second": 1.277, "eval_wer": 0.374238114587566, "step": 1106 }, { "epoch": 80.0, "eval_cer": 0.18740673339399455, "eval_loss": 0.6028934121131897, "eval_runtime": 53.1886, "eval_samples_per_second": 10.19, "eval_steps_per_second": 1.278, "eval_wer": 0.37281592848435596, "step": 1120 }, { "epoch": 81.0, "eval_cer": 0.18682438580527752, "eval_loss": 0.5961212515830994, "eval_runtime": 53.2244, "eval_samples_per_second": 10.183, "eval_steps_per_second": 1.278, "eval_wer": 0.3699715562779358, "step": 1134 }, { "epoch": 82.0, "eval_cer": 0.1870427661510464, "eval_loss": 0.6032407283782959, "eval_runtime": 53.2843, "eval_samples_per_second": 10.172, "eval_steps_per_second": 1.276, "eval_wer": 0.37017472572125154, "step": 1148 }, { "epoch": 83.0, "eval_cer": 0.1889353958143767, "eval_loss": 0.611492395401001, "eval_runtime": 53.1834, "eval_samples_per_second": 10.191, "eval_steps_per_second": 1.279, "eval_wer": 0.3722064201544088, "step": 1162 }, { "epoch": 84.0, "eval_cer": 0.18831665150136487, "eval_loss": 0.6018120646476746, "eval_runtime": 53.2232, "eval_samples_per_second": 10.184, "eval_steps_per_second": 1.278, "eval_wer": 0.36895570906135716, "step": 1176 }, { "epoch": 85.0, "eval_cer": 0.18547770700636942, "eval_loss": 0.5824325084686279, "eval_runtime": 53.2981, "eval_samples_per_second": 10.169, "eval_steps_per_second": 1.276, "eval_wer": 0.36651767574156846, "step": 1190 }, { "epoch": 85.71, "learning_rate": 1.2914285714285713e-05, "loss": 0.3463, "step": 1200 }, { "epoch": 86.0, "eval_cer": 0.18660600545950864, "eval_loss": 0.5985358953475952, "eval_runtime": 53.1709, "eval_samples_per_second": 10.194, "eval_steps_per_second": 1.279, "eval_wer": 0.3669240146281999, "step": 1204 }, { "epoch": 87.0, "eval_cer": 0.18609645131938127, "eval_loss": 0.5833200812339783, "eval_runtime": 53.1104, "eval_samples_per_second": 10.205, "eval_steps_per_second": 1.28, "eval_wer": 0.3669240146281999, "step": 1218 }, { "epoch": 88.0, "eval_cer": 0.1861692447679709, "eval_loss": 0.5775151252746582, "eval_runtime": 53.1027, "eval_samples_per_second": 10.207, "eval_steps_per_second": 1.281, "eval_wer": 0.3636733035351483, "step": 1232 }, { "epoch": 89.0, "eval_cer": 0.18496815286624205, "eval_loss": 0.5746987462043762, "eval_runtime": 53.0756, "eval_samples_per_second": 10.212, "eval_steps_per_second": 1.281, "eval_wer": 0.36062576188541245, "step": 1246 }, { "epoch": 90.0, "eval_cer": 0.18507734303912649, "eval_loss": 0.5784278512001038, "eval_runtime": 53.0821, "eval_samples_per_second": 10.211, "eval_steps_per_second": 1.281, "eval_wer": 0.36387647297846404, "step": 1260 }, { "epoch": 91.0, "eval_cer": 0.18580527752502274, "eval_loss": 0.5841168165206909, "eval_runtime": 53.1168, "eval_samples_per_second": 10.204, "eval_steps_per_second": 1.28, "eval_wer": 0.36042259244209673, "step": 1274 }, { "epoch": 92.0, "eval_cer": 0.18496815286624205, "eval_loss": 0.5761845707893372, "eval_runtime": 53.1679, "eval_samples_per_second": 10.194, "eval_steps_per_second": 1.279, "eval_wer": 0.36550182852498986, "step": 1288 }, { "epoch": 92.86, "learning_rate": 1.1485714285714285e-05, "loss": 0.3237, "step": 1300 }, { "epoch": 93.0, "eval_cer": 0.1854049135577798, "eval_loss": 0.5835999846458435, "eval_runtime": 53.1013, "eval_samples_per_second": 10.207, "eval_steps_per_second": 1.281, "eval_wer": 0.3598130841121495, "step": 1302 }, { "epoch": 94.0, "eval_cer": 0.18409463148316652, "eval_loss": 0.576073408126831, "eval_runtime": 53.509, "eval_samples_per_second": 10.129, "eval_steps_per_second": 1.271, "eval_wer": 0.3587972368955709, "step": 1316 }, { "epoch": 95.0, "eval_cer": 0.1848225659690628, "eval_loss": 0.5822096467018127, "eval_runtime": 53.2494, "eval_samples_per_second": 10.179, "eval_steps_per_second": 1.277, "eval_wer": 0.3596099146688338, "step": 1330 }, { "epoch": 96.0, "eval_cer": 0.18496815286624205, "eval_loss": 0.5886383652687073, "eval_runtime": 53.1468, "eval_samples_per_second": 10.198, "eval_steps_per_second": 1.279, "eval_wer": 0.35920357578220236, "step": 1344 }, { "epoch": 97.0, "eval_cer": 0.1830027297543221, "eval_loss": 0.5695921182632446, "eval_runtime": 53.2532, "eval_samples_per_second": 10.178, "eval_steps_per_second": 1.277, "eval_wer": 0.3573750507923608, "step": 1358 }, { "epoch": 98.0, "eval_cer": 0.18358507734303914, "eval_loss": 0.5794330835342407, "eval_runtime": 53.1395, "eval_samples_per_second": 10.2, "eval_steps_per_second": 1.28, "eval_wer": 0.3587972368955709, "step": 1372 }, { "epoch": 99.0, "eval_cer": 0.18365787079162876, "eval_loss": 0.5768290758132935, "eval_runtime": 53.1965, "eval_samples_per_second": 10.189, "eval_steps_per_second": 1.278, "eval_wer": 0.3569687119057294, "step": 1386 }, { "epoch": 100.0, "learning_rate": 1.0057142857142857e-05, "loss": 0.2799, "step": 1400 }, { "epoch": 100.0, "eval_cer": 0.18442220200181983, "eval_loss": 0.5836793184280396, "eval_runtime": 53.2358, "eval_samples_per_second": 10.181, "eval_steps_per_second": 1.277, "eval_wer": 0.35778138967899226, "step": 1400 }, { "epoch": 101.0, "eval_cer": 0.18263876251137398, "eval_loss": 0.5696985721588135, "eval_runtime": 53.2164, "eval_samples_per_second": 10.185, "eval_steps_per_second": 1.278, "eval_wer": 0.3524989841527834, "step": 1414 }, { "epoch": 102.0, "eval_cer": 0.18336669699727023, "eval_loss": 0.5795508027076721, "eval_runtime": 53.1474, "eval_samples_per_second": 10.198, "eval_steps_per_second": 1.279, "eval_wer": 0.35656237301909793, "step": 1428 }, { "epoch": 103.0, "eval_cer": 0.18249317561419473, "eval_loss": 0.571198046207428, "eval_runtime": 53.193, "eval_samples_per_second": 10.189, "eval_steps_per_second": 1.278, "eval_wer": 0.3549370174725721, "step": 1442 }, { "epoch": 104.0, "eval_cer": 0.18289353958143767, "eval_loss": 0.5795718431472778, "eval_runtime": 53.0944, "eval_samples_per_second": 10.208, "eval_steps_per_second": 1.281, "eval_wer": 0.3555465258025193, "step": 1456 }, { "epoch": 105.0, "eval_cer": 0.1835122838944495, "eval_loss": 0.5758859515190125, "eval_runtime": 53.062, "eval_samples_per_second": 10.214, "eval_steps_per_second": 1.282, "eval_wer": 0.35534335635920355, "step": 1470 }, { "epoch": 106.0, "eval_cer": 0.18307552320291173, "eval_loss": 0.5749973058700562, "eval_runtime": 53.2134, "eval_samples_per_second": 10.185, "eval_steps_per_second": 1.278, "eval_wer": 0.3561560341324665, "step": 1484 }, { "epoch": 107.0, "eval_cer": 0.18231119199272067, "eval_loss": 0.564974844455719, "eval_runtime": 53.1418, "eval_samples_per_second": 10.199, "eval_steps_per_second": 1.28, "eval_wer": 0.35270215359609913, "step": 1498 }, { "epoch": 107.14, "learning_rate": 8.628571428571429e-06, "loss": 0.2674, "step": 1500 }, { "epoch": 108.0, "eval_cer": 0.18231119199272067, "eval_loss": 0.5676841139793396, "eval_runtime": 53.12, "eval_samples_per_second": 10.203, "eval_steps_per_second": 1.28, "eval_wer": 0.349857781389679, "step": 1512 }, { "epoch": 109.0, "eval_cer": 0.18263876251137398, "eval_loss": 0.5698859691619873, "eval_runtime": 53.173, "eval_samples_per_second": 10.193, "eval_steps_per_second": 1.279, "eval_wer": 0.35412433969930923, "step": 1526 }, { "epoch": 110.0, "eval_cer": 0.1837306642402184, "eval_loss": 0.5779122710227966, "eval_runtime": 53.1485, "eval_samples_per_second": 10.198, "eval_steps_per_second": 1.279, "eval_wer": 0.3555465258025193, "step": 1540 }, { "epoch": 111.0, "eval_cer": 0.18336669699727023, "eval_loss": 0.5792039036750793, "eval_runtime": 53.5286, "eval_samples_per_second": 10.125, "eval_steps_per_second": 1.27, "eval_wer": 0.35514018691588783, "step": 1554 }, { "epoch": 112.0, "eval_cer": 0.18289353958143767, "eval_loss": 0.5696908831596375, "eval_runtime": 53.1508, "eval_samples_per_second": 10.197, "eval_steps_per_second": 1.279, "eval_wer": 0.3573750507923608, "step": 1568 }, { "epoch": 113.0, "eval_cer": 0.18394904458598726, "eval_loss": 0.5852411389350891, "eval_runtime": 53.0856, "eval_samples_per_second": 10.21, "eval_steps_per_second": 1.281, "eval_wer": 0.35900040633888664, "step": 1582 }, { "epoch": 114.0, "eval_cer": 0.18289353958143767, "eval_loss": 0.5735089778900146, "eval_runtime": 53.149, "eval_samples_per_second": 10.198, "eval_steps_per_second": 1.279, "eval_wer": 0.3537180008126778, "step": 1596 }, { "epoch": 114.29, "learning_rate": 7.2e-06, "loss": 0.2611, "step": 1600 }, { "epoch": 115.0, "eval_cer": 0.18318471337579617, "eval_loss": 0.577383279800415, "eval_runtime": 53.1629, "eval_samples_per_second": 10.195, "eval_steps_per_second": 1.279, "eval_wer": 0.3545306785859407, "step": 1610 }, { "epoch": 116.0, "eval_cer": 0.1840582347588717, "eval_loss": 0.5835606455802917, "eval_runtime": 53.1573, "eval_samples_per_second": 10.196, "eval_steps_per_second": 1.279, "eval_wer": 0.3555465258025193, "step": 1624 }, { "epoch": 117.0, "eval_cer": 0.18322111010009098, "eval_loss": 0.5749671459197998, "eval_runtime": 53.1768, "eval_samples_per_second": 10.192, "eval_steps_per_second": 1.279, "eval_wer": 0.35168630637952053, "step": 1638 }, { "epoch": 118.0, "eval_cer": 0.18245677888989992, "eval_loss": 0.5771631598472595, "eval_runtime": 53.195, "eval_samples_per_second": 10.189, "eval_steps_per_second": 1.278, "eval_wer": 0.35209264526615197, "step": 1652 }, { "epoch": 119.0, "eval_cer": 0.18307552320291173, "eval_loss": 0.5793441534042358, "eval_runtime": 53.2698, "eval_samples_per_second": 10.175, "eval_steps_per_second": 1.277, "eval_wer": 0.35209264526615197, "step": 1666 }, { "epoch": 120.0, "eval_cer": 0.18282074613284804, "eval_loss": 0.575577974319458, "eval_runtime": 53.2251, "eval_samples_per_second": 10.183, "eval_steps_per_second": 1.278, "eval_wer": 0.35168630637952053, "step": 1680 }, { "epoch": 121.0, "eval_cer": 0.1830027297543221, "eval_loss": 0.5794119834899902, "eval_runtime": 53.1856, "eval_samples_per_second": 10.191, "eval_steps_per_second": 1.279, "eval_wer": 0.35168630637952053, "step": 1694 }, { "epoch": 121.43, "learning_rate": 5.7714285714285715e-06, "loss": 0.2476, "step": 1700 }, { "epoch": 122.0, "eval_cer": 0.18274795268425842, "eval_loss": 0.5718653202056885, "eval_runtime": 53.2426, "eval_samples_per_second": 10.18, "eval_steps_per_second": 1.277, "eval_wer": 0.35209264526615197, "step": 1708 }, { "epoch": 123.0, "eval_cer": 0.1830027297543221, "eval_loss": 0.5803536772727966, "eval_runtime": 53.2083, "eval_samples_per_second": 10.186, "eval_steps_per_second": 1.278, "eval_wer": 0.35432750914262495, "step": 1722 }, { "epoch": 124.0, "eval_cer": 0.18249317561419473, "eval_loss": 0.5728517174720764, "eval_runtime": 53.1988, "eval_samples_per_second": 10.188, "eval_steps_per_second": 1.278, "eval_wer": 0.3539211702559935, "step": 1736 }, { "epoch": 125.0, "eval_cer": 0.18318471337579617, "eval_loss": 0.5873575806617737, "eval_runtime": 53.0805, "eval_samples_per_second": 10.211, "eval_steps_per_second": 1.281, "eval_wer": 0.35188947582283625, "step": 1750 }, { "epoch": 126.0, "eval_cer": 0.18260236578707917, "eval_loss": 0.5776769518852234, "eval_runtime": 53.1869, "eval_samples_per_second": 10.19, "eval_steps_per_second": 1.279, "eval_wer": 0.35331166192604635, "step": 1764 }, { "epoch": 127.0, "eval_cer": 0.18223839854413104, "eval_loss": 0.5761721730232239, "eval_runtime": 53.4852, "eval_samples_per_second": 10.134, "eval_steps_per_second": 1.271, "eval_wer": 0.3531084924827306, "step": 1778 }, { "epoch": 127.0, "step": 1778, "total_flos": 1.5870191391607497e+19, "train_loss": 1.6193932103091606, "train_runtime": 26266.2725, "train_samples_per_second": 2.558, "train_steps_per_second": 0.08 } ], "max_steps": 2100, "num_train_epochs": 150, "total_flos": 1.5870191391607497e+19, "trial_name": null, "trial_params": null }