|
[ |
|
{ |
|
"language_name": "English", |
|
"bcp_47": "en", |
|
"speakers": 1636485840, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.4351349353198866, |
|
"chrf": 54.9504915580248 |
|
} |
|
], |
|
"bleu": 0.4351349353198866, |
|
"chrf": 54.9504915580248, |
|
"commonvoice_hours": 2649.0, |
|
"commonvoice_locale": "en", |
|
"population": { |
|
"AC": 931, |
|
"AE": 4996040, |
|
"AG": 84434, |
|
"AI": 17186, |
|
"AQ": 300, |
|
"AR": 3183537, |
|
"AS": 47954, |
|
"AT": 6467398, |
|
"AU": 24447840, |
|
"AW": 2986, |
|
"BA": 1726016, |
|
"BB": 294560, |
|
"BD": 29277180, |
|
"BE": 6915213, |
|
"BG": 1741725, |
|
"BI": 6289, |
|
"BM": 66010, |
|
"BN": 7896, |
|
"BR": 16937280, |
|
"BS": 337721, |
|
"BT": 86055, |
|
"BV": 1, |
|
"BW": 1876956, |
|
"BZ": 399598, |
|
"CA": 32416926, |
|
"CC": 101, |
|
"CH": 5126434, |
|
"CK": 8574, |
|
"CL": 1727746, |
|
"CM": 10543100, |
|
"CN": 62731, |
|
"CP": 1, |
|
"CQ": 482, |
|
"CX": 1389, |
|
"CY": 924676, |
|
"CZ": 2889675, |
|
"DE": 51302208, |
|
"DG": 495, |
|
"DK": 5047693, |
|
"DM": 69788, |
|
"DO": 7980, |
|
"DZ": 3008103, |
|
"EE": 614310, |
|
"EG": 36443400, |
|
"ER": 3587908, |
|
"ES": 12003792, |
|
"ET": 46488590, |
|
"FI": 3900169, |
|
"FJ": 879816, |
|
"FK": 2814, |
|
"FM": 58389, |
|
"FR": 26460798, |
|
"GB": 64445878, |
|
"GD": 108570, |
|
"GG": 67052, |
|
"GH": 6161442, |
|
"GI": 23665, |
|
"GM": 869600, |
|
"GR": 5409621, |
|
"GS": 20, |
|
"GU": 153321, |
|
"GY": 750204, |
|
"HK": 3697454, |
|
"HM": 1, |
|
"HN": 40635, |
|
"HR": 2071598, |
|
"HU": 1954366, |
|
"IE": 5073039, |
|
"IL": 7374158, |
|
"IM": 90499, |
|
"IN": 251957100, |
|
"IO": 3500, |
|
"IQ": 13605445, |
|
"IT": 21216918, |
|
"JE": 96019, |
|
"JM": 2752399, |
|
"JO": 4869270, |
|
"KE": 10170301, |
|
"KI": 111796, |
|
"KN": 52745, |
|
"KY": 60705, |
|
"KZ": 2863785, |
|
"LB": 2187844, |
|
"LC": 149838, |
|
"LK": 2288920, |
|
"LR": 4210839, |
|
"LS": 531719, |
|
"LT": 1037955, |
|
"LU": 351893, |
|
"LV": 865366, |
|
"MA": 4978638, |
|
"MG": 4852026, |
|
"MH": 72463, |
|
"MO": 14133, |
|
"MP": 49890, |
|
"MS": 3492, |
|
"MT": 402395, |
|
"MU": 993146, |
|
"MV": 293928, |
|
"MW": 13353858, |
|
"MX": 16724500, |
|
"MY": 6856941, |
|
"NA": 184105, |
|
"NF": 1678, |
|
"NG": 113434840, |
|
"NL": 15552360, |
|
"NP": 909837, |
|
"NR": 9350, |
|
"NU": 1120, |
|
"NZ": 4826970, |
|
"PA": 545171, |
|
"PG": 3629730, |
|
"PH": 69875840, |
|
"PK": 116750500, |
|
"PL": 12633159, |
|
"PM": 187, |
|
"PN": 46, |
|
"PR": 1562644, |
|
"PT": 2781729, |
|
"PW": 1887, |
|
"RO": 6603899, |
|
"RW": 1906860, |
|
"SB": 685097, |
|
"SC": 36473, |
|
"SD": 27792576, |
|
"SE": 8774150, |
|
"SG": 5774984, |
|
"SH": 5425, |
|
"SI": 1240581, |
|
"SK": 1414556, |
|
"SL": 2318726, |
|
"SS": 2851524, |
|
"SX": 29816, |
|
"SZ": 883584, |
|
"TA": 272, |
|
"TC": 54807, |
|
"TH": 18623898, |
|
"TK": 1285, |
|
"TO": 29707, |
|
"TR": 13942975, |
|
"TT": 1063735, |
|
"TV": 1066, |
|
"TZ": 40401432, |
|
"UG": 1686867, |
|
"UM": 316, |
|
"US": 319333440, |
|
"VC": 97334, |
|
"VG": 36633, |
|
"VI": 79676, |
|
"VU": 247616, |
|
"WS": 4279, |
|
"YE": 2689596, |
|
"ZA": 17503716, |
|
"ZM": 2788256, |
|
"ZW": 6109446 |
|
} |
|
}, |
|
{ |
|
"language_name": "Chinese", |
|
"bcp_47": "zh", |
|
"speakers": 1304678914, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.3977775857451761, |
|
"chrf": 57.672913792439125 |
|
} |
|
], |
|
"bleu": 0.3977775857451761, |
|
"chrf": 57.672913792439125, |
|
"commonvoice_hours": 422.0, |
|
"commonvoice_locale": "zh-TW", |
|
"population": { |
|
"AU": 534796, |
|
"BN": 51093, |
|
"CA": 678494, |
|
"CN": 1254618000, |
|
"GB": 197283, |
|
"GF": 4988, |
|
"HK": 7249910, |
|
"ID": 2456639, |
|
"MN": 44352, |
|
"MO": 632892, |
|
"MY": 5550857, |
|
"PA": 5841, |
|
"PF": 23019, |
|
"PH": 797021, |
|
"SG": 4781438, |
|
"SR": 6705, |
|
"TH": 1241593, |
|
"TW": 22422850, |
|
"US": 2295209, |
|
"VN": 1085934 |
|
} |
|
}, |
|
{ |
|
"language_name": "Hindi", |
|
"bcp_47": "hi", |
|
"speakers": 546882144, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.333521621016373, |
|
"chrf": 50.48364584189306 |
|
} |
|
], |
|
"bleu": 0.333521621016373, |
|
"chrf": 50.48364584189306, |
|
"commonvoice_hours": 16.0, |
|
"commonvoice_locale": "hi-IN", |
|
"population": { |
|
"CA": 188470, |
|
"FJ": 411829, |
|
"IN": 545022990, |
|
"NP": 127377, |
|
"UG": 2206, |
|
"ZA": 1129272 |
|
} |
|
}, |
|
{ |
|
"language_name": "Spanish", |
|
"bcp_47": "es", |
|
"speakers": 493528077, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.29160032861883095, |
|
"chrf": 47.668399832701844 |
|
} |
|
], |
|
"bleu": 0.29160032861883095, |
|
"chrf": 47.668399832701844, |
|
"commonvoice_hours": 446.0, |
|
"commonvoice_locale": "es", |
|
"population": { |
|
"AD": 33110, |
|
"AR": 45479100, |
|
"BO": 7100339, |
|
"BR": 76218, |
|
"BZ": 111887, |
|
"CA": 603106, |
|
"CL": 17823064, |
|
"CO": 45648864, |
|
"CR": 4843090, |
|
"CU": 11059100, |
|
"CW": 5751, |
|
"DE": 4809582, |
|
"DO": 8189766, |
|
"EA": 147000, |
|
"EC": 16228704, |
|
"ES": 49515642, |
|
"FR": 8820266, |
|
"GB": 5260888, |
|
"GI": 14790, |
|
"GQ": 727475, |
|
"GT": 15952569, |
|
"HN": 7203565, |
|
"IC": 2056618, |
|
"MA": 23115, |
|
"MX": 106779500, |
|
"NI": 4838683, |
|
"PA": 2686915, |
|
"PE": 23297950, |
|
"PH": 33846110, |
|
"PR": 2774491, |
|
"PT": 1030270, |
|
"PY": 230134, |
|
"RO": 2130290, |
|
"SV": 5768179, |
|
"SX": 4823, |
|
"TT": 4110, |
|
"US": 31933344, |
|
"UY": 2981097, |
|
"VE": 23488572 |
|
} |
|
}, |
|
{ |
|
"language_name": "Arabic", |
|
"bcp_47": "ar", |
|
"speakers": 351664197, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.277257629790728, |
|
"chrf": 46.62779335380641 |
|
} |
|
], |
|
"bleu": 0.277257629790728, |
|
"chrf": 46.62779335380641, |
|
"commonvoice_hours": 91.0, |
|
"commonvoice_locale": "ar", |
|
"population": { |
|
"AE": 7793822, |
|
"BH": 1309350, |
|
"CA": 565412, |
|
"CM": 108206, |
|
"CY": 1267, |
|
"DJ": 67292, |
|
"DZ": 31799946, |
|
"EG": 97876560, |
|
"EH": 652271, |
|
"ER": 297979, |
|
"GB": 197283, |
|
"IL": 1735096, |
|
"IQ": 26433436, |
|
"IR": 1698466, |
|
"JO": 10820600, |
|
"KE": 24623, |
|
"KM": 558545, |
|
"KW": 2993710, |
|
"LB": 4703865, |
|
"LY": 5099000, |
|
"MA": 22048254, |
|
"ML": 175981, |
|
"MR": 3404658, |
|
"NE": 47822, |
|
"NG": 151960, |
|
"OM": 3778520, |
|
"PS": 4818260, |
|
"QA": 2175311, |
|
"SA": 34173500, |
|
"SD": 27792576, |
|
"SO": 3997414, |
|
"SS": 2851524, |
|
"SY": 15518720, |
|
"TD": 2869158, |
|
"TJ": 976, |
|
"TN": 10549080, |
|
"TR": 459298, |
|
"YE": 22114456 |
|
} |
|
}, |
|
{ |
|
"language_name": "Urdu", |
|
"bcp_47": "ur", |
|
"speakers": 290790290, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.2659144372728079, |
|
"chrf": 44.14831240898717 |
|
} |
|
], |
|
"bleu": 0.2659144372728079, |
|
"chrf": 44.14831240898717, |
|
"commonvoice_hours": 76.0, |
|
"commonvoice_locale": "ur", |
|
"population": { |
|
"CA": 286475, |
|
"GB": 2301638, |
|
"IN": 66304500, |
|
"MU": 71727, |
|
"PK": 221825950 |
|
} |
|
}, |
|
{ |
|
"language_name": "French", |
|
"bcp_47": "fr", |
|
"speakers": 278611507, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.315663773358301, |
|
"chrf": 49.253978669350964 |
|
} |
|
], |
|
"bleu": 0.315663773358301, |
|
"chrf": 49.253978669350964, |
|
"commonvoice_hours": 1052.0, |
|
"commonvoice_locale": "fr", |
|
"population": { |
|
"AD": 5775, |
|
"AT": 974540, |
|
"BE": 4453866, |
|
"BF": 4583788, |
|
"BI": 7000822, |
|
"BJ": 4502610, |
|
"BL": 6837, |
|
"CA": 11308230, |
|
"CD": 3867640, |
|
"CF": 2935521, |
|
"CG": 4446179, |
|
"CH": 1764838, |
|
"CI": 13465739, |
|
"CM": 18866600, |
|
"CY": 88668, |
|
"DE": 14428746, |
|
"DJ": 19358, |
|
"DZ": 8594580, |
|
"FR": 67169718, |
|
"GA": 1405473, |
|
"GB": 15125053, |
|
"GF": 153622, |
|
"GN": 3632946, |
|
"GP": 407498, |
|
"GQ": 73584, |
|
"GR": 954639, |
|
"HT": 520187, |
|
"HU": 293155, |
|
"IE": 880017, |
|
"IT": 3931370, |
|
"KM": 473917, |
|
"LB": 20238, |
|
"LU": 546691, |
|
"MA": 7112340, |
|
"MC": 38610, |
|
"MF": 32556, |
|
"MG": 18599433, |
|
"ML": 8994564, |
|
"MQ": 427408, |
|
"MR": 680932, |
|
"MT": 50299, |
|
"MU": 41381, |
|
"NC": 278409, |
|
"NE": 6603996, |
|
"NL": 5011316, |
|
"PF": 180024, |
|
"PM": 5133, |
|
"PT": 1545405, |
|
"RE": 700950, |
|
"RO": 3621493, |
|
"RW": 2288, |
|
"SC": 57589, |
|
"SN": 6137196, |
|
"SY": 1144506, |
|
"TD": 4388124, |
|
"TF": 140, |
|
"TG": 5251148, |
|
"TN": 8673688, |
|
"US": 1862778, |
|
"VU": 149166, |
|
"WF": 7610, |
|
"YT": 110580 |
|
} |
|
}, |
|
{ |
|
"language_name": "Bangla", |
|
"bcp_47": "bn", |
|
"speakers": 267193288, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.21265887286151353, |
|
"chrf": 41.501657722373686 |
|
} |
|
], |
|
"bleu": 0.21265887286151353, |
|
"chrf": 41.501657722373686, |
|
"commonvoice_hours": 49.0, |
|
"commonvoice_locale": "bn", |
|
"population": { |
|
"BD": 159397980, |
|
"CA": 90466, |
|
"GB": 263044, |
|
"IN": 107413290, |
|
"NP": 28508 |
|
} |
|
}, |
|
{ |
|
"language_name": "Portuguese", |
|
"bcp_47": "pt", |
|
"speakers": 237496885, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.27514792195783394, |
|
"chrf": 45.901248962808694 |
|
} |
|
], |
|
"bleu": 0.27514792195783394, |
|
"chrf": 45.901248962808694, |
|
"commonvoice_hours": 176.0, |
|
"commonvoice_locale": "pt", |
|
"population": { |
|
"AG": 1571, |
|
"AO": 21789941, |
|
"BR": 192661560, |
|
"CA": 229934, |
|
"CH": 285736, |
|
"CV": 443274, |
|
"FR": 882027, |
|
"GB": 131522, |
|
"GQ": 1, |
|
"GW": 1927100, |
|
"LU": 100541, |
|
"MO": 30723, |
|
"MZ": 8126514, |
|
"PT": 9890592, |
|
"ST": 179454, |
|
"TL": 816395 |
|
} |
|
}, |
|
{ |
|
"language_name": "Punjabi", |
|
"bcp_47": "pa", |
|
"speakers": 203571210, |
|
"scores": [ |
|
{ |
|
"model": "openai/gpt-4o-mini", |
|
"bleu": 0.32250608979374484, |
|
"chrf": 48.43043110055342 |
|
}, |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.3048037308116852, |
|
"chrf": 48.4304965568793 |
|
}, |
|
{ |
|
"model": "mistralai/mistral-small-24b-instruct-2501", |
|
"bleu": 0.2314793285308931, |
|
"chrf": 37.53667069805556 |
|
}, |
|
{ |
|
"model": "google/gemini-2.0-flash-001", |
|
"bleu": 0.37468960333154994, |
|
"chrf": 53.381398796420086 |
|
}, |
|
{ |
|
"model": "deepseek/deepseek-chat", |
|
"bleu": 0.359056244961623, |
|
"chrf": 52.278269268214366 |
|
}, |
|
{ |
|
"model": "microsoft/phi-4", |
|
"bleu": 0.27331521881795146, |
|
"chrf": 45.15087304059057 |
|
} |
|
], |
|
"bleu": 0.31097503604124127, |
|
"chrf": 47.53468991011888, |
|
"commonvoice_hours": 2.3, |
|
"commonvoice_locale": "pa-IN", |
|
"population": { |
|
"CA": 603106, |
|
"GB": 2367400, |
|
"IN": 37130520, |
|
"KE": 10170, |
|
"PK": 163450700, |
|
"SG": 9314 |
|
} |
|
}, |
|
{ |
|
"language_name": "Russian", |
|
"bcp_47": "ru", |
|
"speakers": 195841151, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.26108507692625094, |
|
"chrf": 45.063308940468154 |
|
} |
|
], |
|
"bleu": 0.26108507692625094, |
|
"chrf": 45.063308940468154, |
|
"commonvoice_hours": 241.0, |
|
"commonvoice_locale": "ru", |
|
"population": { |
|
"BG": 1602387, |
|
"BY": 1137350, |
|
"CA": 211087, |
|
"CN": 13940, |
|
"DE": 4809582, |
|
"EE": 688027, |
|
"FI": 45131, |
|
"GE": 359730, |
|
"IL": 954303, |
|
"KG": 2147364, |
|
"KZ": 13746168, |
|
"LT": 2185168, |
|
"LV": 714867, |
|
"MD": 100935, |
|
"MN": 4118, |
|
"PL": 6890814, |
|
"RU": 133218680, |
|
"SJ": 1200, |
|
"TJ": 1064840, |
|
"TM": 663436, |
|
"UA": 20204534, |
|
"US": 798334, |
|
"UZ": 4279156 |
|
} |
|
}, |
|
{ |
|
"language_name": "Swahili", |
|
"bcp_47": "sw", |
|
"speakers": 171610296, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.2709203338132304, |
|
"chrf": 44.36399636969686 |
|
} |
|
], |
|
"bleu": 0.2709203338132304, |
|
"chrf": 44.36399636969686, |
|
"commonvoice_hours": 411.0, |
|
"commonvoice_locale": "sw", |
|
"population": { |
|
"BI": 6408, |
|
"CD": 50890000, |
|
"KE": 35328414, |
|
"MZ": 9330, |
|
"SO": 235142, |
|
"TZ": 52697520, |
|
"UG": 32439750, |
|
"YT": 2716, |
|
"ZA": 1016 |
|
} |
|
}, |
|
{ |
|
"language_name": "Indonesian", |
|
"bcp_47": "id", |
|
"speakers": 171207687, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.27441353638286026, |
|
"chrf": 46.025445629112156 |
|
} |
|
], |
|
"bleu": 0.27441353638286026, |
|
"chrf": 46.025445629112156, |
|
"commonvoice_hours": 33.0, |
|
"commonvoice_locale": "id", |
|
"population": { |
|
"ID": 170896640, |
|
"NL": 311047 |
|
} |
|
}, |
|
{ |
|
"language_name": "German", |
|
"bcp_47": "de", |
|
"speakers": 136350226, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.3338682761061998, |
|
"chrf": 50.216731068308064 |
|
} |
|
], |
|
"bleu": 0.3338682761061998, |
|
"chrf": 50.216731068308064, |
|
"commonvoice_hours": 1357.0, |
|
"commonvoice_locale": "de", |
|
"population": { |
|
"AT": 8593666, |
|
"BE": 2578554, |
|
"BG": 557352, |
|
"BR": 1778414, |
|
"CA": 294014, |
|
"CH": 6134913, |
|
"CZ": 1605375, |
|
"DE": 72945327, |
|
"DK": 2758623, |
|
"FI": 1002901, |
|
"FR": 3392410, |
|
"GB": 5918499, |
|
"GR": 530355, |
|
"HU": 1758929, |
|
"IT": 998443, |
|
"KZ": 1221882, |
|
"LI": 39137, |
|
"LT": 382404, |
|
"LU": 395880, |
|
"NA": 23671, |
|
"NL": 12269084, |
|
"PL": 7273637, |
|
"PY": 208559, |
|
"RO": 44736, |
|
"SI": 883126, |
|
"SK": 1196932, |
|
"US": 1563403 |
|
} |
|
}, |
|
{ |
|
"language_name": "Japanese", |
|
"bcp_47": "ja", |
|
"speakers": 119729026, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.2940100667664714, |
|
"chrf": 46.403097021492236 |
|
} |
|
], |
|
"bleu": 0.2940100667664714, |
|
"chrf": 46.403097021492236, |
|
"commonvoice_hours": 222.0, |
|
"commonvoice_locale": "ja", |
|
"population": { |
|
"BR": 444604, |
|
"CA": 52772, |
|
"JP": 119231650 |
|
} |
|
}, |
|
{ |
|
"language_name": "Telugu", |
|
"bcp_47": "te", |
|
"speakers": 95478480, |
|
"scores": [ |
|
{ |
|
"model": "openai/gpt-4o-mini", |
|
"bleu": 0.28964452051612244, |
|
"chrf": 45.75290973782886 |
|
}, |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.2750887189010237, |
|
"chrf": 46.31463752811596 |
|
}, |
|
{ |
|
"model": "mistralai/mistral-small-24b-instruct-2501", |
|
"bleu": 0.1314237858560668, |
|
"chrf": 27.750433857144273 |
|
}, |
|
{ |
|
"model": "google/gemini-2.0-flash-001", |
|
"bleu": 0.35187073123584545, |
|
"chrf": 52.04190885735586 |
|
}, |
|
{ |
|
"model": "deepseek/deepseek-chat", |
|
"bleu": 0.2808664068178743, |
|
"chrf": 48.221979700718 |
|
}, |
|
{ |
|
"model": "microsoft/phi-4", |
|
"bleu": 0.16468103557770178, |
|
"chrf": 36.43981433605732 |
|
} |
|
], |
|
"bleu": 0.24892919981743908, |
|
"chrf": 42.75361400287005, |
|
"commonvoice_hours": 0.3, |
|
"commonvoice_locale": "te", |
|
"population": { |
|
"IN": 95478480 |
|
} |
|
}, |
|
{ |
|
"language_name": "Marathi", |
|
"bcp_47": "mr", |
|
"speakers": 92826300, |
|
"scores": [ |
|
{ |
|
"model": "openai/gpt-4o-mini", |
|
"bleu": 0.235200323237626, |
|
"chrf": 39.43789667749676 |
|
}, |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.2584800238292114, |
|
"chrf": 44.69889855306244 |
|
}, |
|
{ |
|
"model": "mistralai/mistral-small-24b-instruct-2501", |
|
"bleu": 0.1158656438579424, |
|
"chrf": 27.118712681006436 |
|
}, |
|
{ |
|
"model": "google/gemini-2.0-flash-001", |
|
"bleu": 0.3039098126596327, |
|
"chrf": 48.26657289026638 |
|
}, |
|
{ |
|
"model": "deepseek/deepseek-chat", |
|
"bleu": 0.23702154369195902, |
|
"chrf": 43.039588362590955 |
|
}, |
|
{ |
|
"model": "microsoft/phi-4", |
|
"bleu": 0.14770612974379574, |
|
"chrf": 35.63558588907277 |
|
} |
|
], |
|
"bleu": 0.21636391283669454, |
|
"chrf": 39.69954250891596, |
|
"commonvoice_hours": 20.0, |
|
"commonvoice_locale": "mr", |
|
"population": { |
|
"IN": 92826300 |
|
} |
|
}, |
|
{ |
|
"language_name": "Javanese", |
|
"bcp_47": "jv", |
|
"speakers": 91180665, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.23082586428104943, |
|
"chrf": 41.42591471734489 |
|
} |
|
], |
|
"bleu": 0.23082586428104943, |
|
"chrf": 41.42591471734489, |
|
"commonvoice_hours": 0.0, |
|
"commonvoice_locale": "jv", |
|
"population": { |
|
"ID": 90788840, |
|
"MY": 391825 |
|
} |
|
}, |
|
{ |
|
"language_name": "Vietnamese", |
|
"bcp_47": "vi", |
|
"speakers": 86222962, |
|
"scores": [ |
|
{ |
|
"model": "openai/gpt-4o-mini", |
|
"bleu": 0.2790022403255029, |
|
"chrf": 44.76577365559692 |
|
}, |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.252552287345529, |
|
"chrf": 43.351007120897606 |
|
}, |
|
{ |
|
"model": "mistralai/mistral-small-24b-instruct-2501", |
|
"bleu": 0.17142561681893811, |
|
"chrf": 34.23876708175754 |
|
}, |
|
{ |
|
"model": "google/gemini-2.0-flash-001", |
|
"bleu": 0.32076560886563743, |
|
"chrf": 49.46269756420099 |
|
}, |
|
{ |
|
"model": "deepseek/deepseek-chat", |
|
"bleu": 0.269842412561934, |
|
"chrf": 44.17252674642975 |
|
}, |
|
{ |
|
"model": "microsoft/phi-4", |
|
"bleu": 0.19118351096728373, |
|
"chrf": 37.642090247027234 |
|
} |
|
], |
|
"bleu": 0.24746194614747083, |
|
"chrf": 42.272143735985004, |
|
"commonvoice_hours": 5.9, |
|
"commonvoice_locale": "vi", |
|
"population": { |
|
"CA": 184701, |
|
"CN": 6970, |
|
"US": 1130973, |
|
"VN": 84900318 |
|
} |
|
}, |
|
{ |
|
"language_name": "Tamil", |
|
"bcp_47": "ta", |
|
"speakers": 85616159, |
|
"scores": [ |
|
{ |
|
"model": "openai/gpt-4o-mini", |
|
"bleu": 0.2159676106476219, |
|
"chrf": 38.592451568525966 |
|
}, |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.24147470924504938, |
|
"chrf": 41.98664320436057 |
|
}, |
|
{ |
|
"model": "mistralai/mistral-small-24b-instruct-2501", |
|
"bleu": 0.11055269618146167, |
|
"chrf": 26.929660798631293 |
|
}, |
|
{ |
|
"model": "google/gemini-2.0-flash-001", |
|
"bleu": 0.2993653070835946, |
|
"chrf": 46.760725728832945 |
|
}, |
|
{ |
|
"model": "deepseek/deepseek-chat", |
|
"bleu": 0.22772498517043588, |
|
"chrf": 40.963440857462984 |
|
}, |
|
{ |
|
"model": "microsoft/phi-4", |
|
"bleu": 0.14949134449145374, |
|
"chrf": 33.188135588116566 |
|
} |
|
], |
|
"bleu": 0.2074294421366029, |
|
"chrf": 38.07017629098839, |
|
"commonvoice_hours": 234.0, |
|
"commonvoice_locale": "ta", |
|
"population": { |
|
"CA": 184701, |
|
"GB": 2104355, |
|
"IN": 78239310, |
|
"LK": 3433380, |
|
"MU": 34484, |
|
"MY": 1371388, |
|
"RE": 118138, |
|
"SG": 130403 |
|
} |
|
}, |
|
{ |
|
"language_name": "Persian", |
|
"bcp_47": "fa", |
|
"speakers": 84710459, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.2543274430452483, |
|
"chrf": 44.798186786819564 |
|
} |
|
], |
|
"bleu": 0.2543274430452483, |
|
"chrf": 44.798186786819564, |
|
"commonvoice_hours": 370.0, |
|
"commonvoice_locale": "fa", |
|
"population": { |
|
"AE": 189850, |
|
"AF": 18321900, |
|
"CA": 245012, |
|
"IQ": 338192, |
|
"IR": 63692475, |
|
"OM": 43849, |
|
"PK": 1541107, |
|
"QA": 268859, |
|
"TJ": 69215 |
|
} |
|
}, |
|
{ |
|
"language_name": "Turkish", |
|
"bcp_47": "tr", |
|
"speakers": 80360704, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.2848412390293461, |
|
"chrf": 45.023438128876236 |
|
} |
|
], |
|
"bleu": 0.2848412390293461, |
|
"chrf": 45.023438128876236, |
|
"commonvoice_hours": 127.0, |
|
"commonvoice_locale": "tr", |
|
"population": { |
|
"BG": 766359, |
|
"CA": 37694, |
|
"CY": 291336, |
|
"DE": 2003992, |
|
"GB": 131522, |
|
"GR": 127285, |
|
"MK": 74409, |
|
"NL": 207365, |
|
"RO": 27694, |
|
"TR": 76276275, |
|
"UA": 184476, |
|
"UZ": 232297 |
|
} |
|
}, |
|
{ |
|
"language_name": "Cantonese", |
|
"bcp_47": "yue", |
|
"speakers": 79654759, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.2745324223697869, |
|
"chrf": 46.18505717482203 |
|
} |
|
], |
|
"bleu": 0.2745324223697869, |
|
"chrf": 46.18505717482203, |
|
"commonvoice_hours": 203.0, |
|
"commonvoice_locale": "yue", |
|
"population": { |
|
"CA": 640800, |
|
"CN": 72489040, |
|
"HK": 6524919 |
|
} |
|
}, |
|
{ |
|
"language_name": "Korean", |
|
"bcp_47": "ko", |
|
"speakers": 78357046, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.21423807187509414, |
|
"chrf": 42.31955622695572 |
|
} |
|
], |
|
"bleu": 0.21423807187509414, |
|
"chrf": 42.31955622695572, |
|
"commonvoice_hours": 1.7, |
|
"commonvoice_locale": "ko", |
|
"population": { |
|
"BR": 44460, |
|
"CA": 169623, |
|
"CN": 2091030, |
|
"JP": 652636, |
|
"KP": 22566280, |
|
"KR": 51835100, |
|
"US": 997917 |
|
} |
|
}, |
|
{ |
|
"language_name": "Italian", |
|
"bcp_47": "it", |
|
"speakers": 70247060, |
|
"scores": [ |
|
{ |
|
"model": "openai/gpt-4o-mini", |
|
"bleu": 0.29744196180619636, |
|
"chrf": 46.58884190721562 |
|
}, |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.2947459489130278, |
|
"chrf": 48.23578446556176 |
|
}, |
|
{ |
|
"model": "mistralai/mistral-small-24b-instruct-2501", |
|
"bleu": 0.26709213193768344, |
|
"chrf": 43.42719841351614 |
|
}, |
|
{ |
|
"model": "google/gemini-2.0-flash-001", |
|
"bleu": 0.34518602347709243, |
|
"chrf": 51.45922256128821 |
|
}, |
|
{ |
|
"model": "deepseek/deepseek-chat", |
|
"bleu": 0.3136120219290237, |
|
"chrf": 49.456527591725454 |
|
}, |
|
{ |
|
"model": "microsoft/phi-4", |
|
"bleu": 0.26629405288011837, |
|
"chrf": 44.95821657057411 |
|
} |
|
], |
|
"bleu": 0.29739535682385704, |
|
"chrf": 47.35429858498022, |
|
"commonvoice_hours": 362.0, |
|
"commonvoice_locale": "it", |
|
"population": { |
|
"AT": 797350, |
|
"AU": 483864, |
|
"BR": 592805, |
|
"CA": 343016, |
|
"CH": 361372, |
|
"DE": 5611179, |
|
"FR": 1153419, |
|
"GB": 131522, |
|
"HR": 67644, |
|
"IT": 59282565, |
|
"MT": 256070, |
|
"SI": 3995, |
|
"SM": 30466, |
|
"US": 1130973, |
|
"VA": 820 |
|
} |
|
}, |
|
{ |
|
"language_name": "Filipino", |
|
"bcp_47": "fil", |
|
"speakers": 67471096, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.3020075248846111, |
|
"chrf": 45.148692233744825 |
|
} |
|
], |
|
"bleu": 0.3020075248846111, |
|
"chrf": 45.148692233744825, |
|
"commonvoice_hours": 0.0, |
|
"commonvoice_locale": "tl", |
|
"population": { |
|
"CA": 565412, |
|
"PH": 65508600, |
|
"US": 1397084 |
|
} |
|
}, |
|
{ |
|
"language_name": "Egyptian Arabic", |
|
"bcp_47": "arz", |
|
"speakers": 66639360, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.18353324091064518, |
|
"chrf": 37.67362087042454 |
|
} |
|
], |
|
"bleu": 0.18353324091064518, |
|
"chrf": 37.67362087042454, |
|
"commonvoice_hours": null, |
|
"commonvoice_locale": null, |
|
"population": { |
|
"EG": 66639360 |
|
} |
|
}, |
|
{ |
|
"language_name": "Gujarati", |
|
"bcp_47": "gu", |
|
"speakers": 61721799, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.27618486571036477, |
|
"chrf": 45.30697533607047 |
|
} |
|
], |
|
"bleu": 0.27618486571036477, |
|
"chrf": 45.30697533607047, |
|
"commonvoice_hours": 0.0, |
|
"commonvoice_locale": "gu-IN", |
|
"population": { |
|
"CA": 135699, |
|
"GB": 1907072, |
|
"IN": 59674050, |
|
"KE": 4978 |
|
} |
|
}, |
|
{ |
|
"language_name": "Thai", |
|
"bcp_47": "th", |
|
"speakers": 55181920, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.2461561900137243, |
|
"chrf": 43.886996888191135 |
|
} |
|
], |
|
"bleu": 0.2461561900137243, |
|
"chrf": 43.886996888191135, |
|
"commonvoice_hours": 172.0, |
|
"commonvoice_locale": "th", |
|
"population": { |
|
"TH": 55181920 |
|
} |
|
}, |
|
{ |
|
"language_name": "Kannada", |
|
"bcp_47": "kn", |
|
"speakers": 49065330, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.25650866519447973, |
|
"chrf": 43.53706086839864 |
|
} |
|
], |
|
"bleu": 0.25650866519447973, |
|
"chrf": 43.53706086839864, |
|
"commonvoice_hours": 0.0, |
|
"commonvoice_locale": "kn", |
|
"population": { |
|
"IN": 49065330 |
|
} |
|
}, |
|
{ |
|
"language_name": "Malayalam", |
|
"bcp_47": "ml", |
|
"speakers": 43257484, |
|
"scores": [ |
|
{ |
|
"model": "openai/gpt-4o-mini", |
|
"bleu": 0.23073727076678055, |
|
"chrf": 41.53402359471923 |
|
}, |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.21782657144614825, |
|
"chrf": 41.630569782738704 |
|
}, |
|
{ |
|
"model": "mistralai/mistral-small-24b-instruct-2501", |
|
"bleu": 0.1695641998407403, |
|
"chrf": 33.20242503336964 |
|
}, |
|
{ |
|
"model": "google/gemini-2.0-flash-001", |
|
"bleu": 0.3195014249623395, |
|
"chrf": 50.399254960139395 |
|
}, |
|
{ |
|
"model": "deepseek/deepseek-chat", |
|
"bleu": 0.2633223158501049, |
|
"chrf": 45.473592535604965 |
|
}, |
|
{ |
|
"model": "microsoft/phi-4", |
|
"bleu": 0.19162873119255258, |
|
"chrf": 38.21485785002488 |
|
} |
|
], |
|
"bleu": 0.23209675234311103, |
|
"chrf": 41.7424539594328, |
|
"commonvoice_hours": 2.8, |
|
"commonvoice_locale": "ml", |
|
"population": { |
|
"AE": 699446, |
|
"BH": 49665, |
|
"IL": 7981, |
|
"IN": 42434880, |
|
"MY": 48978, |
|
"QA": 6599, |
|
"SG": 9935 |
|
} |
|
}, |
|
{ |
|
"language_name": "Odia", |
|
"bcp_47": "or", |
|
"speakers": 42434880, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.2616054244059909, |
|
"chrf": 44.81898318236423 |
|
} |
|
], |
|
"bleu": 0.2616054244059909, |
|
"chrf": 44.81898318236423, |
|
"commonvoice_hours": 2.8, |
|
"commonvoice_locale": "or", |
|
"population": { |
|
"IN": 42434880 |
|
} |
|
}, |
|
{ |
|
"language_name": "Polish", |
|
"bcp_47": "pl", |
|
"speakers": 41077399, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.24382878885531348, |
|
"chrf": 43.88802125000008 |
|
} |
|
], |
|
"bleu": 0.24382878885531348, |
|
"chrf": 43.88802125000008, |
|
"commonvoice_hours": 174.0, |
|
"commonvoice_locale": "pl", |
|
"population": { |
|
"CA": 173393, |
|
"CZ": 52442, |
|
"DE": 232463, |
|
"GB": 2630444, |
|
"IL": 130132, |
|
"PL": 36751008, |
|
"RO": 2769, |
|
"SK": 50598, |
|
"UA": 1054150 |
|
} |
|
}, |
|
{ |
|
"language_name": "Hausa", |
|
"bcp_47": "ha", |
|
"speakers": 40411882, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.1493358875548207, |
|
"chrf": 31.734228520521885 |
|
} |
|
], |
|
"bleu": 0.1493358875548207, |
|
"chrf": 31.734228520521885, |
|
"commonvoice_hours": 4.1, |
|
"commonvoice_locale": "ha", |
|
"population": { |
|
"CM": 38843, |
|
"GH": 252326, |
|
"NE": 9336684, |
|
"NG": 29963920, |
|
"SD": 820109 |
|
} |
|
}, |
|
{ |
|
"language_name": "Sindhi", |
|
"bcp_47": "sd", |
|
"speakers": 40329510, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.22524971121549384, |
|
"chrf": 41.35718488130492 |
|
} |
|
], |
|
"bleu": 0.22524971121549384, |
|
"chrf": 41.35718488130492, |
|
"commonvoice_hours": 0.4, |
|
"commonvoice_locale": "sd", |
|
"population": { |
|
"IN": 5304360, |
|
"PK": 35025150 |
|
} |
|
}, |
|
{ |
|
"language_name": "Malay", |
|
"bcp_47": "ms", |
|
"speakers": 38097307, |
|
"scores": [ |
|
{ |
|
"model": "openai/gpt-4o-mini", |
|
"bleu": 0.27545115634664297, |
|
"chrf": 46.5366529956061 |
|
}, |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.2445459295400275, |
|
"chrf": 43.683725288188164 |
|
}, |
|
{ |
|
"model": "mistralai/mistral-small-24b-instruct-2501", |
|
"bleu": 0.23380594556884363, |
|
"chrf": 38.09288562825641 |
|
}, |
|
{ |
|
"model": "google/gemini-2.0-flash-001", |
|
"bleu": 0.3521510571182875, |
|
"chrf": 51.6107732437805 |
|
}, |
|
{ |
|
"model": "deepseek/deepseek-chat", |
|
"bleu": 0.2984537737499322, |
|
"chrf": 47.07139912930323 |
|
}, |
|
{ |
|
"model": "microsoft/phi-4", |
|
"bleu": 0.20974647653543713, |
|
"chrf": 40.94603982712764 |
|
} |
|
], |
|
"bleu": 0.2690257231431951, |
|
"chrf": 44.656912685377016, |
|
"commonvoice_hours": 0.0, |
|
"commonvoice_locale": "ms", |
|
"population": { |
|
"BN": 455189, |
|
"CC": 495, |
|
"ID": 12283196, |
|
"MY": 24489075, |
|
"SG": 869352 |
|
} |
|
}, |
|
{ |
|
"language_name": "Burmese", |
|
"bcp_47": "my", |
|
"speakers": 36559231, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.17529594258449108, |
|
"chrf": 38.09396067803311 |
|
} |
|
], |
|
"bleu": 0.17529594258449108, |
|
"chrf": 38.09396067803311, |
|
"commonvoice_hours": 0.0, |
|
"commonvoice_locale": "my", |
|
"population": { |
|
"BD": 341567, |
|
"MM": 36217664 |
|
} |
|
}, |
|
{ |
|
"language_name": "Amharic", |
|
"bcp_47": "am", |
|
"speakers": 35728475, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.16453710162389373, |
|
"chrf": 34.89886094698235 |
|
} |
|
], |
|
"bleu": 0.16453710162389373, |
|
"chrf": 34.89886094698235, |
|
"commonvoice_hours": 1.8, |
|
"commonvoice_locale": "am", |
|
"population": { |
|
"ET": 35677290, |
|
"IL": 51185 |
|
} |
|
}, |
|
{ |
|
"language_name": "Oromo", |
|
"bcp_47": "om", |
|
"speakers": 34897121, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.0691897827221633, |
|
"chrf": 22.166735299684706 |
|
} |
|
], |
|
"bleu": 0.0691897827221633, |
|
"chrf": 22.166735299684706, |
|
"commonvoice_hours": 0.0, |
|
"commonvoice_locale": "om", |
|
"population": { |
|
"ET": 34596160, |
|
"KE": 251581, |
|
"SO": 49380 |
|
} |
|
}, |
|
{ |
|
"language_name": "Bhojpuri", |
|
"bcp_47": "bho", |
|
"speakers": 32934797, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.23176648838308359, |
|
"chrf": 42.06617216025931 |
|
} |
|
], |
|
"bleu": 0.23176648838308359, |
|
"chrf": 42.06617216025931, |
|
"commonvoice_hours": null, |
|
"commonvoice_locale": null, |
|
"population": { |
|
"IN": 30500070, |
|
"MU": 372430, |
|
"NP": 2062297 |
|
} |
|
}, |
|
{ |
|
"language_name": "Uzbek", |
|
"bcp_47": "uz", |
|
"speakers": 32792780, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.2038544554531401, |
|
"chrf": 39.8364082393657 |
|
} |
|
], |
|
"bleu": 0.2038544554531401, |
|
"chrf": 39.8364082393657, |
|
"commonvoice_hours": 100.0, |
|
"commonvoice_locale": "uz", |
|
"population": { |
|
"AF": 1722259, |
|
"CN": 5576, |
|
"TM": 497577, |
|
"TR": 1968, |
|
"UZ": 30565400 |
|
} |
|
}, |
|
{ |
|
"language_name": "Azerbaijani", |
|
"bcp_47": "az", |
|
"speakers": 32446682, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.1911853993562902, |
|
"chrf": 38.284553121320506 |
|
} |
|
], |
|
"bleu": 0.1911853993562902, |
|
"chrf": 38.284553121320506, |
|
"commonvoice_hours": 0.5, |
|
"commonvoice_locale": "az", |
|
"population": { |
|
"AM": 0, |
|
"AZ": 10093536, |
|
"IQ": 699709, |
|
"IR": 20381592, |
|
"RU": 131801, |
|
"TR": 1140044 |
|
} |
|
}, |
|
{ |
|
"language_name": "Sundanese", |
|
"bcp_47": "su", |
|
"speakers": 32043120, |
|
"scores": [ |
|
{ |
|
"model": "openai/gpt-4o-mini", |
|
"bleu": 0.18638464691782505, |
|
"chrf": 36.390067106438586 |
|
}, |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.22413489641063433, |
|
"chrf": 39.08607675576149 |
|
}, |
|
{ |
|
"model": "mistralai/mistral-small-24b-instruct-2501", |
|
"bleu": 0.12396443500389862, |
|
"chrf": 27.44605100630464 |
|
}, |
|
{ |
|
"model": "google/gemini-2.0-flash-001", |
|
"bleu": 0.31100961611618916, |
|
"chrf": 48.684591434160616 |
|
}, |
|
{ |
|
"model": "deepseek/deepseek-chat", |
|
"bleu": 0.23467068441612768, |
|
"chrf": 40.54860164135514 |
|
}, |
|
{ |
|
"model": "microsoft/phi-4", |
|
"bleu": 0.1315217916431994, |
|
"chrf": 32.71394871178255 |
|
} |
|
], |
|
"bleu": 0.20194767841797903, |
|
"chrf": 37.47822277596717, |
|
"commonvoice_hours": null, |
|
"commonvoice_locale": null, |
|
"population": { |
|
"ID": 32043120 |
|
} |
|
}, |
|
{ |
|
"language_name": "Dutch", |
|
"bcp_47": "nl", |
|
"speakers": 31765645, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.2592795402705898, |
|
"chrf": 44.356739380497835 |
|
} |
|
], |
|
"bleu": 0.2592795402705898, |
|
"chrf": 44.356739380497835, |
|
"commonvoice_hours": 114.0, |
|
"commonvoice_locale": "nl", |
|
"population": { |
|
"AW": 115845, |
|
"BE": 6446385, |
|
"BQ": 1600, |
|
"CA": 56541, |
|
"CW": 12108, |
|
"DE": 7214373, |
|
"FR": 88203, |
|
"NL": 17280400, |
|
"SR": 548612, |
|
"SX": 1578 |
|
} |
|
}, |
|
{ |
|
"language_name": "Moroccan Arabic", |
|
"bcp_47": "ary", |
|
"speakers": 30938679, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.1795140543637709, |
|
"chrf": 37.426822543484725 |
|
} |
|
], |
|
"bleu": 0.1795140543637709, |
|
"chrf": 37.426822543484725, |
|
"commonvoice_hours": null, |
|
"commonvoice_locale": null, |
|
"population": { |
|
"MA": 30938679 |
|
} |
|
}, |
|
{ |
|
"language_name": "Ukrainian", |
|
"bcp_47": "uk", |
|
"speakers": 29348975, |
|
"scores": [ |
|
{ |
|
"model": "openai/gpt-4o-mini", |
|
"bleu": 0.2564463888571809, |
|
"chrf": 41.5181715644979 |
|
}, |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.2922812040972885, |
|
"chrf": 46.82127627710616 |
|
}, |
|
{ |
|
"model": "mistralai/mistral-small-24b-instruct-2501", |
|
"bleu": 0.24225796102393954, |
|
"chrf": 39.42058485499366 |
|
}, |
|
{ |
|
"model": "google/gemini-2.0-flash-001", |
|
"bleu": 0.3452563778145038, |
|
"chrf": 50.96771482708702 |
|
}, |
|
{ |
|
"model": "deepseek/deepseek-chat", |
|
"bleu": 0.3292127494173498, |
|
"chrf": 48.580427643849056 |
|
}, |
|
{ |
|
"model": "microsoft/phi-4", |
|
"bleu": 0.2452825737163755, |
|
"chrf": 42.05493360532406 |
|
} |
|
], |
|
"bleu": 0.28512287582110635, |
|
"chrf": 44.893851462142976, |
|
"commonvoice_hours": 98.0, |
|
"commonvoice_locale": "uk", |
|
"population": { |
|
"CA": 75388, |
|
"MD": 471030, |
|
"PL": 149301, |
|
"RS": 0, |
|
"SK": 103371, |
|
"UA": 28549885 |
|
} |
|
}, |
|
{ |
|
"language_name": "Yoruba", |
|
"bcp_47": "yo", |
|
"speakers": 28685568, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.09852676389614487, |
|
"chrf": 25.656950226425916 |
|
} |
|
], |
|
"bleu": 0.09852676389614487, |
|
"chrf": 25.656950226425916, |
|
"commonvoice_hours": 5.9, |
|
"commonvoice_locale": "yo", |
|
"population": { |
|
"BJ": 861928, |
|
"NG": 27823640 |
|
} |
|
}, |
|
{ |
|
"language_name": "Igbo", |
|
"bcp_47": "ig", |
|
"speakers": 27823640, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.1549827013842116, |
|
"chrf": 35.431035675871804 |
|
} |
|
], |
|
"bleu": 0.1549827013842116, |
|
"chrf": 35.431035675871804, |
|
"commonvoice_hours": 0.0, |
|
"commonvoice_locale": "ig", |
|
"population": { |
|
"NG": 27823640 |
|
} |
|
}, |
|
{ |
|
"language_name": "Cebuano", |
|
"bcp_47": "ceb", |
|
"speakers": 26203440, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.27783470672988303, |
|
"chrf": 43.53549785827671 |
|
} |
|
], |
|
"bleu": 0.27783470672988303, |
|
"chrf": 43.53549785827671, |
|
"commonvoice_hours": null, |
|
"commonvoice_locale": null, |
|
"population": { |
|
"PH": 26203440 |
|
} |
|
}, |
|
{ |
|
"language_name": "Awadhi", |
|
"bcp_47": "awa", |
|
"speakers": 25862924, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.2554810263222905, |
|
"chrf": 42.35795046006446 |
|
} |
|
], |
|
"bleu": 0.2554810263222905, |
|
"chrf": 42.35795046006446, |
|
"commonvoice_hours": null, |
|
"commonvoice_locale": null, |
|
"population": { |
|
"IN": 25195710, |
|
"NP": 667214 |
|
} |
|
}, |
|
{ |
|
"language_name": "Malagasy", |
|
"bcp_47": "mg", |
|
"speakers": 24260130, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.15163299980391426, |
|
"chrf": 32.41299083831688 |
|
} |
|
], |
|
"bleu": 0.15163299980391426, |
|
"chrf": 32.41299083831688, |
|
"commonvoice_hours": 0.0, |
|
"commonvoice_locale": "mg", |
|
"population": { |
|
"MG": 24260130 |
|
} |
|
}, |
|
{ |
|
"language_name": "Romanian", |
|
"bcp_47": "ro", |
|
"speakers": 22187408, |
|
"scores": [ |
|
{ |
|
"model": "openai/gpt-4o-mini", |
|
"bleu": 0.33899025568959984, |
|
"chrf": 49.419389839471826 |
|
}, |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.26666997541189236, |
|
"chrf": 44.76525386460237 |
|
}, |
|
{ |
|
"model": "mistralai/mistral-small-24b-instruct-2501", |
|
"bleu": 0.24172488724041316, |
|
"chrf": 37.98045602918644 |
|
}, |
|
{ |
|
"model": "google/gemini-2.0-flash-001", |
|
"bleu": 0.37365302832845815, |
|
"chrf": 52.777299654432 |
|
}, |
|
{ |
|
"model": "deepseek/deepseek-chat", |
|
"bleu": 0.332600965807992, |
|
"chrf": 49.14582652136321 |
|
}, |
|
{ |
|
"model": "microsoft/phi-4", |
|
"bleu": 0.2510789925018768, |
|
"chrf": 42.27877315264307 |
|
} |
|
], |
|
"bleu": 0.30078635083003874, |
|
"chrf": 46.06116651028316, |
|
"commonvoice_hours": 21.0, |
|
"commonvoice_locale": "ro", |
|
"population": { |
|
"CA": 101774, |
|
"HU": 96741, |
|
"IL": 320993, |
|
"MD": 2119635, |
|
"RO": 19172610, |
|
"RS": 147256, |
|
"UA": 228399 |
|
} |
|
}, |
|
{ |
|
"language_name": "Nepali", |
|
"bcp_47": "ne", |
|
"speakers": 20903374, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.26199282928489126, |
|
"chrf": 44.7560662712792 |
|
} |
|
], |
|
"bleu": 0.26199282928489126, |
|
"chrf": 44.7560662712792, |
|
"commonvoice_hours": 1.3, |
|
"commonvoice_locale": "ne-NP", |
|
"population": { |
|
"BT": 132994, |
|
"IN": 7426104, |
|
"NP": 13344276 |
|
} |
|
}, |
|
{ |
|
"language_name": "Maithili", |
|
"bcp_47": "mai", |
|
"speakers": 19249149, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.23975507119180453, |
|
"chrf": 41.8894484718934 |
|
} |
|
], |
|
"bleu": 0.23975507119180453, |
|
"chrf": 41.8894484718934, |
|
"commonvoice_hours": 0.0, |
|
"commonvoice_locale": "mai", |
|
"population": { |
|
"IN": 15913080, |
|
"NP": 3336069 |
|
} |
|
}, |
|
{ |
|
"language_name": "Assamese", |
|
"bcp_47": "as", |
|
"speakers": 17239170, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.19363225565136952, |
|
"chrf": 38.96237165376663 |
|
} |
|
], |
|
"bleu": 0.19363225565136952, |
|
"chrf": 38.96237165376663, |
|
"commonvoice_hours": 2.8, |
|
"commonvoice_locale": "as", |
|
"population": { |
|
"IN": 17239170 |
|
} |
|
}, |
|
{ |
|
"language_name": "Nyanja", |
|
"bcp_47": "ny", |
|
"speakers": 17026781, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.09504458945778768, |
|
"chrf": 27.576030002164906 |
|
} |
|
], |
|
"bleu": 0.09504458945778768, |
|
"chrf": 27.576030002164906, |
|
"commonvoice_hours": 0.0, |
|
"commonvoice_locale": "ny", |
|
"population": { |
|
"MW": 13353858, |
|
"MZ": 782553, |
|
"ZM": 2613990, |
|
"ZW": 276380 |
|
} |
|
}, |
|
{ |
|
"language_name": "Somali", |
|
"bcp_47": "so", |
|
"speakers": 16911645, |
|
"scores": [ |
|
{ |
|
"model": "openai/gpt-4o-mini", |
|
"bleu": 0.2024994684991584, |
|
"chrf": 37.37281822856629 |
|
}, |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.1532133716194419, |
|
"chrf": 32.05620028647162 |
|
}, |
|
{ |
|
"model": "mistralai/mistral-small-24b-instruct-2501", |
|
"bleu": 0.043408496427191995, |
|
"chrf": 15.267715935014895 |
|
}, |
|
{ |
|
"model": "google/gemini-2.0-flash-001", |
|
"bleu": 0.3048371831537258, |
|
"chrf": 46.24092673305936 |
|
}, |
|
{ |
|
"model": "deepseek/deepseek-chat", |
|
"bleu": 0.21360545410615966, |
|
"chrf": 38.32357547187653 |
|
}, |
|
{ |
|
"model": "microsoft/phi-4", |
|
"bleu": 0.06484340154849859, |
|
"chrf": 22.781181465233722 |
|
} |
|
], |
|
"bleu": 0.16373456255902938, |
|
"chrf": 32.00706968670374, |
|
"commonvoice_hours": 0.0, |
|
"commonvoice_locale": "so", |
|
"population": { |
|
"CA": 49002, |
|
"DJ": 377940, |
|
"ET": 6486780, |
|
"GB": 131522, |
|
"KE": 695863, |
|
"SO": 9170538 |
|
} |
|
}, |
|
{ |
|
"language_name": "Magahi", |
|
"bcp_47": "mag", |
|
"speakers": 15913080, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.29925558767802407, |
|
"chrf": 47.539870710677974 |
|
} |
|
], |
|
"bleu": 0.29925558767802407, |
|
"chrf": 47.539870710677974, |
|
"commonvoice_hours": null, |
|
"commonvoice_locale": null, |
|
"population": { |
|
"IN": 15913080 |
|
} |
|
}, |
|
{ |
|
"language_name": "Serbian", |
|
"bcp_47": "sr", |
|
"speakers": 15602410, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.26029402164210574, |
|
"chrf": 44.75391848259974 |
|
} |
|
], |
|
"bleu": 0.26029402164210574, |
|
"chrf": 44.75391848259974, |
|
"commonvoice_hours": 7.4, |
|
"commonvoice_locale": "sr", |
|
"population": { |
|
"BA": 767118, |
|
"CA": 64080, |
|
"ME": 640352, |
|
"RO": 25563, |
|
"RS": 13884096, |
|
"RU": 4960, |
|
"TR": 22965, |
|
"XK": 193276 |
|
} |
|
}, |
|
{ |
|
"language_name": "Sinhala", |
|
"bcp_47": "si", |
|
"speakers": 15564656, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.20259734060180434, |
|
"chrf": 39.00188422851495 |
|
} |
|
], |
|
"bleu": 0.20259734060180434, |
|
"chrf": 39.00188422851495, |
|
"commonvoice_hours": 0.0, |
|
"commonvoice_locale": "si", |
|
"population": { |
|
"LK": 15564656 |
|
} |
|
}, |
|
{ |
|
"language_name": "Khmer", |
|
"bcp_47": "km", |
|
"speakers": 15065030, |
|
"scores": [ |
|
{ |
|
"model": "openai/gpt-4o-mini", |
|
"bleu": 0.21699232146684352, |
|
"chrf": 41.99979148031644 |
|
}, |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.21417349432612984, |
|
"chrf": 41.35771196976409 |
|
}, |
|
{ |
|
"model": "mistralai/mistral-small-24b-instruct-2501", |
|
"bleu": 0.03287369352293625, |
|
"chrf": 14.140423341647319 |
|
}, |
|
{ |
|
"model": "google/gemini-2.0-flash-001", |
|
"bleu": 0.34264229339556035, |
|
"chrf": 51.55826045210756 |
|
}, |
|
{ |
|
"model": "deepseek/deepseek-chat", |
|
"bleu": 0.24630515818736093, |
|
"chrf": 44.60963216433486 |
|
}, |
|
{ |
|
"model": "microsoft/phi-4", |
|
"bleu": 0.11830648687368288, |
|
"chrf": 31.534012306448343 |
|
} |
|
], |
|
"bleu": 0.1952155746287523, |
|
"chrf": 37.53330528576977, |
|
"commonvoice_hours": 0.0, |
|
"commonvoice_locale": "km", |
|
"population": { |
|
"KH": 15065030 |
|
} |
|
}, |
|
{ |
|
"language_name": "Chhattisgarhi", |
|
"bcp_47": "hne", |
|
"speakers": 14586990, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.2212498883000727, |
|
"chrf": 39.102114067893005 |
|
} |
|
], |
|
"bleu": 0.2212498883000727, |
|
"chrf": 39.102114067893005, |
|
"commonvoice_hours": null, |
|
"commonvoice_locale": null, |
|
"population": { |
|
"IN": 14586990 |
|
} |
|
}, |
|
{ |
|
"language_name": "Nigerian Fulfulde", |
|
"bcp_47": "fuv", |
|
"speakers": 14339876, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.08190470208193343, |
|
"chrf": 23.041107899884107 |
|
} |
|
], |
|
"bleu": 0.08190470208193343, |
|
"chrf": 23.041107899884107, |
|
"commonvoice_hours": null, |
|
"commonvoice_locale": null, |
|
"population": { |
|
"NG": 14339876 |
|
} |
|
}, |
|
{ |
|
"language_name": "Zulu", |
|
"bcp_47": "zu", |
|
"speakers": 13973830, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.15449146502209737, |
|
"chrf": 33.087212745906356 |
|
} |
|
], |
|
"bleu": 0.15449146502209737, |
|
"chrf": 33.087212745906356, |
|
"commonvoice_hours": 0.0, |
|
"commonvoice_locale": "zu", |
|
"population": { |
|
"LS": 275706, |
|
"MW": 69949, |
|
"MZ": 1806, |
|
"SZ": 75105, |
|
"ZA": 13551264 |
|
} |
|
}, |
|
{ |
|
"language_name": "Kazakh", |
|
"bcp_47": "kk", |
|
"speakers": 13637392, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.2392246097188628, |
|
"chrf": 42.67763456362536 |
|
} |
|
], |
|
"bleu": 0.2392246097188628, |
|
"chrf": 42.67763456362536, |
|
"commonvoice_hours": 2.1, |
|
"commonvoice_locale": "kk", |
|
"population": { |
|
"AF": 2015, |
|
"CN": 1184917, |
|
"IR": 2972, |
|
"KZ": 12218816, |
|
"MN": 228098, |
|
"TR": 574 |
|
} |
|
}, |
|
{ |
|
"language_name": "Czech", |
|
"bcp_47": "cs", |
|
"speakers": 13045532, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.2844520855192069, |
|
"chrf": 47.327010269160255 |
|
} |
|
], |
|
"bleu": 0.2844520855192069, |
|
"chrf": 47.327010269160255, |
|
"commonvoice_hours": 74.0, |
|
"commonvoice_locale": "cs", |
|
"population": { |
|
"CZ": 10488450, |
|
"SK": 2557082 |
|
} |
|
}, |
|
{ |
|
"language_name": "Swedish", |
|
"bcp_47": "sv", |
|
"speakers": 12932871, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.31838456223051165, |
|
"chrf": 48.08041424667649 |
|
} |
|
], |
|
"bleu": 0.31838456223051165, |
|
"chrf": 48.08041424667649, |
|
"commonvoice_hours": 47.0, |
|
"commonvoice_locale": "sv-SE", |
|
"population": { |
|
"AX": 25938, |
|
"DK": 763023, |
|
"FI": 2451535, |
|
"SE": 9692375 |
|
} |
|
}, |
|
{ |
|
"language_name": "Hungarian", |
|
"bcp_47": "hu", |
|
"speakers": 12443430, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.2517614908428288, |
|
"chrf": 42.77520440394925 |
|
} |
|
], |
|
"bleu": 0.2517614908428288, |
|
"chrf": 42.77520440394925, |
|
"commonvoice_hours": 92.0, |
|
"commonvoice_locale": "hu", |
|
"population": { |
|
"AT": 23035, |
|
"CA": 49002, |
|
"HU": 9771830, |
|
"IL": 86755, |
|
"RO": 1405991, |
|
"RS": 336584, |
|
"SI": 9252, |
|
"SK": 598466, |
|
"UA": 162515 |
|
} |
|
}, |
|
{ |
|
"language_name": "Greek", |
|
"bcp_47": "el", |
|
"speakers": 12292242, |
|
"scores": [ |
|
{ |
|
"model": "openai/gpt-4o-mini", |
|
"bleu": 0.24888370153898132, |
|
"chrf": 42.743109839531535 |
|
}, |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.27269196827838943, |
|
"chrf": 45.53483489961114 |
|
}, |
|
{ |
|
"model": "mistralai/mistral-small-24b-instruct-2501", |
|
"bleu": 0.21351544070708506, |
|
"chrf": 39.64425368969459 |
|
}, |
|
{ |
|
"model": "google/gemini-2.0-flash-001", |
|
"bleu": 0.3500489758234636, |
|
"chrf": 51.1729677922222 |
|
}, |
|
{ |
|
"model": "deepseek/deepseek-chat", |
|
"bleu": 0.32858632704534785, |
|
"chrf": 49.70348294319061 |
|
}, |
|
{ |
|
"model": "microsoft/phi-4", |
|
"bleu": 0.1903000734693107, |
|
"chrf": 39.41911092527115 |
|
} |
|
], |
|
"bleu": 0.2673377478104297, |
|
"chrf": 44.7029600149202, |
|
"commonvoice_hours": 20.0, |
|
"commonvoice_locale": "el", |
|
"population": { |
|
"AL": 58417, |
|
"CA": 124391, |
|
"CY": 1203346, |
|
"DE": 304607, |
|
"EG": 63516, |
|
"GR": 10501029, |
|
"IT": 21841, |
|
"RO": 4048, |
|
"TR": 4019, |
|
"UA": 7028 |
|
} |
|
}, |
|
{ |
|
"language_name": "Shona", |
|
"bcp_47": "sn", |
|
"speakers": 11782503, |
|
"scores": [ |
|
{ |
|
"model": "openai/gpt-4o-mini", |
|
"bleu": 0.10438047654339373, |
|
"chrf": 28.358507205354343 |
|
}, |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.1054140213254438, |
|
"chrf": 28.275522446025796 |
|
}, |
|
{ |
|
"model": "mistralai/mistral-small-24b-instruct-2501", |
|
"bleu": 0.049580893458705456, |
|
"chrf": 18.458313551880636 |
|
}, |
|
{ |
|
"model": "google/gemini-2.0-flash-001", |
|
"bleu": 0.20979752102494492, |
|
"chrf": 38.7737276002067 |
|
}, |
|
{ |
|
"model": "deepseek/deepseek-chat", |
|
"bleu": 0.14066476436038525, |
|
"chrf": 32.050887533047465 |
|
}, |
|
{ |
|
"model": "microsoft/phi-4", |
|
"bleu": 0.060530921002659346, |
|
"chrf": 22.35054590384825 |
|
} |
|
], |
|
"bleu": 0.11172809961925541, |
|
"chrf": 28.04458404006053, |
|
"commonvoice_hours": null, |
|
"commonvoice_locale": null, |
|
"population": { |
|
"ZW": 11782503 |
|
} |
|
}, |
|
{ |
|
"language_name": "Central Kurdish", |
|
"bcp_47": "ckb", |
|
"speakers": 11086549, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.20654412682006296, |
|
"chrf": 38.66802600490074 |
|
} |
|
], |
|
"bleu": 0.20654412682006296, |
|
"chrf": 38.66802600490074, |
|
"commonvoice_hours": 135.0, |
|
"commonvoice_locale": "ckb", |
|
"population": { |
|
"IQ": 7774540, |
|
"IR": 3312009 |
|
} |
|
}, |
|
{ |
|
"language_name": "Kinyarwanda", |
|
"bcp_47": "rw", |
|
"speakers": 11083625, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.14006909985587948, |
|
"chrf": 31.739340000779823 |
|
} |
|
], |
|
"bleu": 0.14006909985587948, |
|
"chrf": 31.739340000779823, |
|
"commonvoice_hours": 2002.0, |
|
"commonvoice_locale": "rw", |
|
"population": { |
|
"CD": 386764, |
|
"RW": 9788548, |
|
"UG": 908313 |
|
} |
|
}, |
|
{ |
|
"language_name": "Wolof", |
|
"bcp_47": "wo", |
|
"speakers": 11025494, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.08408628490585719, |
|
"chrf": 23.767561072306325 |
|
} |
|
], |
|
"bleu": 0.08408628490585719, |
|
"chrf": 23.767561072306325, |
|
"commonvoice_hours": 0.0, |
|
"commonvoice_locale": "wo", |
|
"population": { |
|
"MR": 10014, |
|
"SN": 11015480 |
|
} |
|
}, |
|
{ |
|
"language_name": "Tunisian Arabic", |
|
"bcp_47": "aeb", |
|
"speakers": 10549080, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.23738824104522893, |
|
"chrf": 42.85642541970995 |
|
} |
|
], |
|
"bleu": 0.23738824104522893, |
|
"chrf": 42.85642541970995, |
|
"commonvoice_hours": null, |
|
"commonvoice_locale": null, |
|
"population": { |
|
"TN": 10549080 |
|
} |
|
}, |
|
{ |
|
"language_name": "Iloko", |
|
"bcp_47": "ilo", |
|
"speakers": 10481376, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.20685666710862224, |
|
"chrf": 37.066073786659494 |
|
} |
|
], |
|
"bleu": 0.20685666710862224, |
|
"chrf": 37.066073786659494, |
|
"commonvoice_hours": null, |
|
"commonvoice_locale": null, |
|
"population": { |
|
"PH": 10481376 |
|
} |
|
}, |
|
{ |
|
"language_name": "Xhosa", |
|
"bcp_47": "xh", |
|
"speakers": 10182944, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.1143143326923908, |
|
"chrf": 28.93119601652647 |
|
} |
|
], |
|
"bleu": 0.1143143326923908, |
|
"chrf": 28.93119601652647, |
|
"commonvoice_hours": 0.0, |
|
"commonvoice_locale": "xh", |
|
"population": { |
|
"LS": 19496, |
|
"ZA": 10163448 |
|
} |
|
}, |
|
{ |
|
"language_name": "Tigrinya", |
|
"bcp_47": "ti", |
|
"speakers": 10145911, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.08532345270447181, |
|
"chrf": 25.148121650983146 |
|
} |
|
], |
|
"bleu": 0.08532345270447181, |
|
"chrf": 25.148121650983146, |
|
"commonvoice_hours": 0.0, |
|
"commonvoice_locale": "ti", |
|
"population": { |
|
"ER": 3648720, |
|
"ET": 6486780, |
|
"IL": 10411 |
|
} |
|
}, |
|
{ |
|
"language_name": "Belarusian", |
|
"bcp_47": "be", |
|
"speakers": 10064517, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.18341973561481445, |
|
"chrf": 39.828398360117035 |
|
} |
|
], |
|
"bleu": 0.18341973561481445, |
|
"chrf": 39.828398360117035, |
|
"commonvoice_hours": 1804.0, |
|
"commonvoice_locale": "be", |
|
"population": { |
|
"BY": 9477920, |
|
"PL": 222037, |
|
"UA": 364560 |
|
} |
|
}, |
|
{ |
|
"language_name": "Luba-Lulua", |
|
"bcp_47": "lua", |
|
"speakers": 9770880, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.11581604983636683, |
|
"chrf": 28.08252510561598 |
|
} |
|
], |
|
"bleu": 0.11581604983636683, |
|
"chrf": 28.08252510561598, |
|
"commonvoice_hours": null, |
|
"commonvoice_locale": null, |
|
"population": { |
|
"CD": 9770880 |
|
} |
|
}, |
|
{ |
|
"language_name": "Tajik", |
|
"bcp_47": "tg", |
|
"speakers": 9644223, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.1846236171638531, |
|
"chrf": 39.50004300248175 |
|
} |
|
], |
|
"bleu": 0.1846236171638531, |
|
"chrf": 39.50004300248175, |
|
"commonvoice_hours": 0.0, |
|
"commonvoice_locale": "tg", |
|
"population": { |
|
"PK": 770553, |
|
"TJ": 8873670 |
|
} |
|
}, |
|
{ |
|
"language_name": "Umbundu", |
|
"bcp_47": "umb", |
|
"speakers": 9431467, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.05520341910203098, |
|
"chrf": 20.443280736080066 |
|
} |
|
], |
|
"bleu": 0.05520341910203098, |
|
"chrf": 20.443280736080066, |
|
"commonvoice_hours": null, |
|
"commonvoice_locale": null, |
|
"population": { |
|
"AO": 9431467 |
|
} |
|
}, |
|
{ |
|
"language_name": "Bambara", |
|
"bcp_47": "bm", |
|
"speakers": 9385632, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.07227674667013836, |
|
"chrf": 22.136582910055218 |
|
} |
|
], |
|
"bleu": 0.07227674667013836, |
|
"chrf": 22.136582910055218, |
|
"commonvoice_hours": 0.0, |
|
"commonvoice_locale": "bm", |
|
"population": { |
|
"ML": 9385632 |
|
} |
|
}, |
|
{ |
|
"language_name": "Afrikaans", |
|
"bcp_47": "af", |
|
"speakers": 9318845, |
|
"scores": [ |
|
{ |
|
"model": "openai/gpt-4o-mini", |
|
"bleu": 0.3277177864074156, |
|
"chrf": 48.61873150516328 |
|
}, |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.31538459755111, |
|
"chrf": 47.75260784921264 |
|
}, |
|
{ |
|
"model": "mistralai/mistral-small-24b-instruct-2501", |
|
"bleu": 0.26710030799119333, |
|
"chrf": 38.869810330084285 |
|
}, |
|
{ |
|
"model": "google/gemini-2.0-flash-001", |
|
"bleu": 0.4361740814378139, |
|
"chrf": 56.524736028951835 |
|
}, |
|
{ |
|
"model": "deepseek/deepseek-chat", |
|
"bleu": 0.37149647257024515, |
|
"chrf": 53.20003536968165 |
|
}, |
|
{ |
|
"model": "microsoft/phi-4", |
|
"bleu": 0.2883662842075808, |
|
"chrf": 45.203083386764426 |
|
} |
|
], |
|
"bleu": 0.3343732550275598, |
|
"chrf": 48.361500744976354, |
|
"commonvoice_hours": 0.5, |
|
"commonvoice_locale": "af", |
|
"population": { |
|
"BW": 6025, |
|
"NA": 1972552, |
|
"ZA": 7340268 |
|
} |
|
}, |
|
{ |
|
"language_name": "Kikuyu", |
|
"bcp_47": "ki", |
|
"speakers": 9099743, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.0883556207236924, |
|
"chrf": 24.868277910094278 |
|
} |
|
], |
|
"bleu": 0.0883556207236924, |
|
"chrf": 24.868277910094278, |
|
"commonvoice_hours": 0.0, |
|
"commonvoice_locale": "ki", |
|
"population": { |
|
"KE": 9099743 |
|
} |
|
}, |
|
{ |
|
"language_name": "Haitian Creole", |
|
"bcp_47": "ht", |
|
"speakers": 8964918, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.1872609836464467, |
|
"chrf": 37.00166091804026 |
|
} |
|
], |
|
"bleu": 0.1872609836464467, |
|
"chrf": 37.00166091804026, |
|
"commonvoice_hours": 0.0, |
|
"commonvoice_locale": "ht", |
|
"population": { |
|
"HT": 8964918 |
|
} |
|
}, |
|
{ |
|
"language_name": "Catalan", |
|
"bcp_47": "ca", |
|
"speakers": 8679139, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.29445274007068095, |
|
"chrf": 47.46074814103581 |
|
} |
|
], |
|
"bleu": 0.29445274007068095, |
|
"chrf": 47.46074814103581, |
|
"commonvoice_hours": 2842.0, |
|
"commonvoice_locale": "ca", |
|
"population": { |
|
"AD": 39270, |
|
"ES": 8502686, |
|
"FR": 115342, |
|
"IT": 21841 |
|
} |
|
}, |
|
{ |
|
"language_name": "Hebrew", |
|
"bcp_47": "he", |
|
"speakers": 8675480, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.2824719214447976, |
|
"chrf": 46.279771845770604 |
|
} |
|
], |
|
"bleu": 0.2824719214447976, |
|
"chrf": 46.279771845770604, |
|
"commonvoice_hours": 1.1, |
|
"commonvoice_locale": "he", |
|
"population": { |
|
"IL": 8675480 |
|
} |
|
}, |
|
{ |
|
"language_name": "Mossi", |
|
"bcp_47": "mos", |
|
"speakers": 8334160, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.08102496244147746, |
|
"chrf": 22.184797797745208 |
|
} |
|
], |
|
"bleu": 0.08102496244147746, |
|
"chrf": 22.184797797745208, |
|
"commonvoice_hours": 0.0, |
|
"commonvoice_locale": "mos", |
|
"population": { |
|
"BF": 8334160 |
|
} |
|
}, |
|
{ |
|
"language_name": "Kimbundu", |
|
"bcp_47": "kmb", |
|
"speakers": 8130575, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.07329500673809967, |
|
"chrf": 22.838222030254723 |
|
} |
|
], |
|
"bleu": 0.07329500673809967, |
|
"chrf": 22.838222030254723, |
|
"commonvoice_hours": null, |
|
"commonvoice_locale": null, |
|
"population": { |
|
"AO": 8130575 |
|
} |
|
}, |
|
{ |
|
"language_name": "Uyghur", |
|
"bcp_47": "ug", |
|
"speakers": 8052967, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.18397910035998616, |
|
"chrf": 35.50154017198535 |
|
} |
|
], |
|
"bleu": 0.18397910035998616, |
|
"chrf": 35.50154017198535, |
|
"commonvoice_hours": 361.0, |
|
"commonvoice_locale": "ug", |
|
"population": { |
|
"AF": 3005, |
|
"CN": 7667110, |
|
"KZ": 381838, |
|
"MN": 1014 |
|
} |
|
}, |
|
{ |
|
"language_name": "Minangkabau", |
|
"bcp_47": "min", |
|
"speakers": 8010780, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.22401269807719826, |
|
"chrf": 40.34678123737912 |
|
} |
|
], |
|
"bleu": 0.22401269807719826, |
|
"chrf": 40.34678123737912, |
|
"commonvoice_hours": null, |
|
"commonvoice_locale": null, |
|
"population": { |
|
"ID": 8010780 |
|
} |
|
}, |
|
{ |
|
"language_name": "Bulgarian", |
|
"bcp_47": "bg", |
|
"speakers": 7878315, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.24723779163445408, |
|
"chrf": 45.55403997487483 |
|
} |
|
], |
|
"bleu": 0.24723779163445408, |
|
"chrf": 45.55403997487483, |
|
"commonvoice_hours": 16.0, |
|
"commonvoice_locale": "bg", |
|
"population": { |
|
"BG": 6966900, |
|
"GR": 28639, |
|
"MD": 316263, |
|
"RO": 6817, |
|
"TR": 344474, |
|
"UA": 215222 |
|
} |
|
}, |
|
{ |
|
"language_name": "Standard Moroccan Tamazight", |
|
"bcp_47": "zgh", |
|
"speakers": 7823574, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.0366272802298245, |
|
"chrf": 15.463910171449278 |
|
} |
|
], |
|
"bleu": 0.0366272802298245, |
|
"chrf": 15.463910171449278, |
|
"commonvoice_hours": 1.3, |
|
"commonvoice_locale": "zgh", |
|
"population": { |
|
"MA": 7823574 |
|
} |
|
}, |
|
{ |
|
"language_name": "Bosnian", |
|
"bcp_47": "bs", |
|
"speakers": 7594468, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.3051247921441283, |
|
"chrf": 48.3731481201238 |
|
} |
|
], |
|
"bleu": 0.3051247921441283, |
|
"chrf": 48.3731481201238, |
|
"commonvoice_hours": 0.0, |
|
"commonvoice_locale": "bs", |
|
"population": { |
|
"BA": 7594468 |
|
} |
|
}, |
|
{ |
|
"language_name": "Rundi", |
|
"bcp_47": "rn", |
|
"speakers": 7475454, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.0957054530624, |
|
"chrf": 28.269164219007447 |
|
} |
|
], |
|
"bleu": 0.0957054530624, |
|
"chrf": 28.269164219007447, |
|
"commonvoice_hours": null, |
|
"commonvoice_locale": null, |
|
"population": { |
|
"BI": 7475454 |
|
} |
|
}, |
|
{ |
|
"language_name": "Santali", |
|
"bcp_47": "sat", |
|
"speakers": 7293495, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.11554870024021023, |
|
"chrf": 29.549934477174254 |
|
} |
|
], |
|
"bleu": 0.11554870024021023, |
|
"chrf": 29.549934477174254, |
|
"commonvoice_hours": 0.5, |
|
"commonvoice_locale": "sat", |
|
"population": { |
|
"IN": 7293495 |
|
} |
|
}, |
|
{ |
|
"language_name": "Danish", |
|
"bcp_47": "da", |
|
"speakers": 7072056, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.3512857581168584, |
|
"chrf": 51.12453594191334 |
|
} |
|
], |
|
"bleu": 0.3512857581168584, |
|
"chrf": 51.12453594191334, |
|
"commonvoice_hours": 13.0, |
|
"commonvoice_locale": "da", |
|
"population": { |
|
"DE": 1603194, |
|
"DK": 5458551, |
|
"GL": 8066, |
|
"IS": 2245 |
|
} |
|
}, |
|
{ |
|
"language_name": "Turkmen", |
|
"bcp_47": "tk", |
|
"speakers": 6870838, |
|
"scores": [ |
|
{ |
|
"model": "openai/gpt-4o-mini", |
|
"bleu": 0.15410064596625964, |
|
"chrf": 36.3602620147462 |
|
}, |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.14820890318014426, |
|
"chrf": 34.78567738931005 |
|
}, |
|
{ |
|
"model": "mistralai/mistral-small-24b-instruct-2501", |
|
"bleu": 0.07938993687949465, |
|
"chrf": 24.385063397578556 |
|
}, |
|
{ |
|
"model": "google/gemini-2.0-flash-001", |
|
"bleu": 0.2761834512123037, |
|
"chrf": 47.41646574422384 |
|
}, |
|
{ |
|
"model": "deepseek/deepseek-chat", |
|
"bleu": 0.1718597543270264, |
|
"chrf": 38.84762953076257 |
|
}, |
|
{ |
|
"model": "microsoft/phi-4", |
|
"bleu": 0.10118596975980092, |
|
"chrf": 28.31840639855478 |
|
} |
|
], |
|
"bleu": 0.15515477688750492, |
|
"chrf": 35.018917412529326, |
|
"commonvoice_hours": 2.8, |
|
"commonvoice_locale": "tk", |
|
"population": { |
|
"AF": 622945, |
|
"IR": 2377852, |
|
"TM": 3870041 |
|
} |
|
}, |
|
{ |
|
"language_name": "Kurdish", |
|
"bcp_47": "ku", |
|
"speakers": 6866757, |
|
"scores": [ |
|
{ |
|
"model": "openai/gpt-4o-mini", |
|
"bleu": 0.14440915289810186, |
|
"chrf": 31.3622869278075 |
|
}, |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.15987085387022903, |
|
"chrf": 35.18523232721762 |
|
}, |
|
{ |
|
"model": "mistralai/mistral-small-24b-instruct-2501", |
|
"bleu": 0.10987778830152085, |
|
"chrf": 25.91454653951599 |
|
}, |
|
{ |
|
"model": "google/gemini-2.0-flash-001", |
|
"bleu": 0.28985769410441137, |
|
"chrf": 46.64309582634758 |
|
}, |
|
{ |
|
"model": "deepseek/deepseek-chat", |
|
"bleu": 0.1865343501300658, |
|
"chrf": 37.28483871763787 |
|
}, |
|
{ |
|
"model": "microsoft/phi-4", |
|
"bleu": 0.10000019378200214, |
|
"chrf": 26.406217887319293 |
|
} |
|
], |
|
"bleu": 0.16509167218105517, |
|
"chrf": 33.79936970430764, |
|
"commonvoice_hours": 69.0, |
|
"commonvoice_locale": "kmr", |
|
"population": { |
|
"AM": 99704, |
|
"AZ": 24494, |
|
"DE": 529054, |
|
"GE": 35573, |
|
"LB": 92983, |
|
"SY": 1551872, |
|
"TM": 22115, |
|
"TR": 4510962 |
|
} |
|
}, |
|
{ |
|
"language_name": "Croatian", |
|
"bcp_47": "hr", |
|
"speakers": 6813164, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.2290484937313612, |
|
"chrf": 41.79307139114272 |
|
} |
|
], |
|
"bleu": 0.2290484937313612, |
|
"chrf": 41.79307139114272, |
|
"commonvoice_hours": 0.0, |
|
"commonvoice_locale": "hr", |
|
"population": { |
|
"AT": 106313, |
|
"BA": 460271, |
|
"CA": 45233, |
|
"DE": 633262, |
|
"HR": 4185472, |
|
"HU": 31270, |
|
"IT": 3495, |
|
"RS": 65213, |
|
"SI": 1282635 |
|
} |
|
}, |
|
{ |
|
"language_name": "Albanian", |
|
"bcp_47": "sq", |
|
"speakers": 6791906, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.26490711574268994, |
|
"chrf": 44.54318851690701 |
|
} |
|
], |
|
"bleu": 0.26490711574268994, |
|
"chrf": 44.54318851690701, |
|
"commonvoice_hours": 8.8, |
|
"commonvoice_locale": "sq", |
|
"population": { |
|
"AL": 3074580, |
|
"GR": 9971, |
|
"ME": 48179, |
|
"MK": 531492, |
|
"RS": 1332312, |
|
"TR": 17224, |
|
"XK": 1778148 |
|
} |
|
}, |
|
{ |
|
"language_name": "Slovak", |
|
"bcp_47": "sk", |
|
"speakers": 6680269, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.2826836020834733, |
|
"chrf": 45.73110764547564 |
|
} |
|
], |
|
"bleu": 0.2826836020834733, |
|
"chrf": 45.73110764547564, |
|
"commonvoice_hours": 40.0, |
|
"commonvoice_locale": "sk", |
|
"population": { |
|
"CZ": 1712400, |
|
"HU": 11726, |
|
"RS": 59603, |
|
"SK": 4896540 |
|
} |
|
}, |
|
{ |
|
"language_name": "Dyula", |
|
"bcp_47": "dyu", |
|
"speakers": 6667328, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.0633017924291756, |
|
"chrf": 21.71247042480193 |
|
} |
|
], |
|
"bleu": 0.0633017924291756, |
|
"chrf": 21.71247042480193, |
|
"commonvoice_hours": 0.3, |
|
"commonvoice_locale": "dyu", |
|
"population": { |
|
"BF": 6667328 |
|
} |
|
}, |
|
{ |
|
"language_name": "Mongolian", |
|
"bcp_47": "mn", |
|
"speakers": 6572846, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.1950781841033538, |
|
"chrf": 41.09779803278993 |
|
} |
|
], |
|
"bleu": 0.1950781841033538, |
|
"chrf": 41.09779803278993, |
|
"commonvoice_hours": 46.0, |
|
"commonvoice_locale": "mn", |
|
"population": { |
|
"CN": 3624452, |
|
"MN": 2946268, |
|
"RU": 2126 |
|
} |
|
}, |
|
{ |
|
"language_name": "Southern Sotho", |
|
"bcp_47": "st", |
|
"speakers": 6390567, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.12381413258013083, |
|
"chrf": 28.651371806370722 |
|
} |
|
], |
|
"bleu": 0.12381413258013083, |
|
"chrf": 28.651371806370722, |
|
"commonvoice_hours": 0.0, |
|
"commonvoice_locale": "st", |
|
"population": { |
|
"LS": 1929943, |
|
"ZA": 4460624 |
|
} |
|
}, |
|
{ |
|
"language_name": "Tswana", |
|
"bcp_47": "tn", |
|
"speakers": 6113428, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.09139131060492443, |
|
"chrf": 25.97258334431281 |
|
} |
|
], |
|
"bleu": 0.09139131060492443, |
|
"chrf": 25.97258334431281, |
|
"commonvoice_hours": 4.2, |
|
"commonvoice_locale": "tn", |
|
"population": { |
|
"BW": 1436683, |
|
"NA": 14728, |
|
"ZA": 4630015, |
|
"ZW": 32002 |
|
} |
|
}, |
|
{ |
|
"language_name": "Guarani", |
|
"bcp_47": "gn", |
|
"speakers": 5827107, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.12296923497272805, |
|
"chrf": 29.040238903610113 |
|
} |
|
], |
|
"bleu": 0.12296923497272805, |
|
"chrf": 29.040238903610113, |
|
"commonvoice_hours": 3.7, |
|
"commonvoice_locale": "gn", |
|
"population": { |
|
"AR": 21375, |
|
"BO": 52380, |
|
"PY": 5753352 |
|
} |
|
}, |
|
{ |
|
"language_name": "Finnish", |
|
"bcp_47": "fi", |
|
"speakers": 5736842, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.2306868672081301, |
|
"chrf": 42.094559446408105 |
|
} |
|
], |
|
"bleu": 0.2306868672081301, |
|
"chrf": 42.094559446408105, |
|
"commonvoice_hours": 15.0, |
|
"commonvoice_locale": "fi", |
|
"population": { |
|
"EE": 258010, |
|
"FI": 5237370, |
|
"RU": 17007, |
|
"SE": 224455 |
|
} |
|
}, |
|
{ |
|
"language_name": "Ganda", |
|
"bcp_47": "lg", |
|
"speakers": 5622890, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.09865217050437662, |
|
"chrf": 25.926064361947446 |
|
} |
|
], |
|
"bleu": 0.09865217050437662, |
|
"chrf": 25.926064361947446, |
|
"commonvoice_hours": 437.0, |
|
"commonvoice_locale": "lg", |
|
"population": { |
|
"UG": 5622890 |
|
} |
|
}, |
|
{ |
|
"language_name": "Kashmiri", |
|
"bcp_47": "ks", |
|
"speakers": 5598085, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.1344939664526747, |
|
"chrf": 32.68903932403509 |
|
} |
|
], |
|
"bleu": 0.1344939664526747, |
|
"chrf": 32.68903932403509, |
|
"commonvoice_hours": null, |
|
"commonvoice_locale": null, |
|
"population": { |
|
"IN": 5436969, |
|
"PK": 161116 |
|
} |
|
}, |
|
{ |
|
"language_name": "Norwegian Bokmål", |
|
"bcp_47": "nb", |
|
"speakers": 5468932, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.3568538739752233, |
|
"chrf": 50.18863565152686 |
|
} |
|
], |
|
"bleu": 0.3568538739752233, |
|
"chrf": 50.18863565152686, |
|
"commonvoice_hours": 0.1, |
|
"commonvoice_locale": "nb-NO", |
|
"population": { |
|
"NO": 5467440, |
|
"SJ": 1492 |
|
} |
|
}, |
|
{ |
|
"language_name": "Bemba", |
|
"bcp_47": "bem", |
|
"speakers": 5402246, |
|
"scores": [ |
|
{ |
|
"model": "openai/gpt-4o-mini", |
|
"bleu": 0.07496563614353445, |
|
"chrf": 23.431580504923282 |
|
}, |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.10425825663987873, |
|
"chrf": 26.156513526794825 |
|
}, |
|
{ |
|
"model": "mistralai/mistral-small-24b-instruct-2501", |
|
"bleu": 0.048552315311727906, |
|
"chrf": 17.052116746764433 |
|
}, |
|
{ |
|
"model": "google/gemini-2.0-flash-001", |
|
"bleu": 0.20820762589055672, |
|
"chrf": 37.899164894105404 |
|
}, |
|
{ |
|
"model": "deepseek/deepseek-chat", |
|
"bleu": 0.13037194233770932, |
|
"chrf": 29.069219847377738 |
|
}, |
|
{ |
|
"model": "microsoft/phi-4", |
|
"bleu": 0.07919429950933718, |
|
"chrf": 22.45526755754465 |
|
} |
|
], |
|
"bleu": 0.10759167930545738, |
|
"chrf": 26.01064384625172, |
|
"commonvoice_hours": null, |
|
"commonvoice_locale": null, |
|
"population": { |
|
"ZM": 5402246 |
|
} |
|
}, |
|
{ |
|
"language_name": "Armenian", |
|
"bcp_47": "hy", |
|
"speakers": 5317273, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.2525113198548088, |
|
"chrf": 44.115149170486895 |
|
} |
|
], |
|
"bleu": 0.2525113198548088, |
|
"chrf": 44.115149170486895, |
|
"commonvoice_hours": 31.0, |
|
"commonvoice_locale": "hy-AM", |
|
"population": { |
|
"AM": 2960894, |
|
"CY": 2787, |
|
"GE": 279790, |
|
"IR": 203816, |
|
"LB": 284420, |
|
"RU": 1190465, |
|
"SY": 349171, |
|
"TR": 45930 |
|
} |
|
}, |
|
{ |
|
"language_name": "Northern Sotho", |
|
"bcp_47": "nso", |
|
"speakers": 5307578, |
|
"scores": [ |
|
{ |
|
"model": "openai/gpt-4o-mini", |
|
"bleu": 0.1287306186367617, |
|
"chrf": 28.538499437787404 |
|
}, |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.11431860079235977, |
|
"chrf": 29.789689541768464 |
|
}, |
|
{ |
|
"model": "mistralai/mistral-small-24b-instruct-2501", |
|
"bleu": 0.048032427671766596, |
|
"chrf": 16.511000736562355 |
|
}, |
|
{ |
|
"model": "google/gemini-2.0-flash-001", |
|
"bleu": 0.277532484522071, |
|
"chrf": 43.725160462861595 |
|
}, |
|
{ |
|
"model": "deepseek/deepseek-chat", |
|
"bleu": 0.1559013863573944, |
|
"chrf": 31.344526297642712 |
|
}, |
|
{ |
|
"model": "microsoft/phi-4", |
|
"bleu": 0.08683694629684643, |
|
"chrf": 24.176752802670837 |
|
} |
|
], |
|
"bleu": 0.13522541071286664, |
|
"chrf": 29.014271546548898, |
|
"commonvoice_hours": 0.0, |
|
"commonvoice_locale": "nso", |
|
"population": { |
|
"ZA": 5307578 |
|
} |
|
}, |
|
{ |
|
"language_name": "Luo (Kenya and Tanzania)", |
|
"bcp_47": "luo", |
|
"speakers": 5245734, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.07123028733548639, |
|
"chrf": 21.84956735049654 |
|
} |
|
], |
|
"bleu": 0.07123028733548639, |
|
"chrf": 21.84956735049654, |
|
"commonvoice_hours": 30.0, |
|
"commonvoice_locale": "luo", |
|
"population": { |
|
"KE": 5245734 |
|
} |
|
}, |
|
{ |
|
"language_name": "Tok Pisin", |
|
"bcp_47": "tpi", |
|
"speakers": 5154217, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.17665711931817996, |
|
"chrf": 35.46692292627831 |
|
} |
|
], |
|
"bleu": 0.17665711931817996, |
|
"chrf": 35.46692292627831, |
|
"commonvoice_hours": null, |
|
"commonvoice_locale": null, |
|
"population": { |
|
"PG": 5154217 |
|
} |
|
}, |
|
{ |
|
"language_name": "Lao", |
|
"bcp_47": "lo", |
|
"speakers": 5138706, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.17291556794348653, |
|
"chrf": 35.37210957380201 |
|
} |
|
], |
|
"bleu": 0.17291556794348653, |
|
"chrf": 35.37210957380201, |
|
"commonvoice_hours": 0.2, |
|
"commonvoice_locale": "lo", |
|
"population": { |
|
"LA": 5138706 |
|
} |
|
}, |
|
{ |
|
"language_name": "Tsonga", |
|
"bcp_47": "ts", |
|
"speakers": 4880932, |
|
"scores": [ |
|
{ |
|
"model": "openai/gpt-4o-mini", |
|
"bleu": 0.1264498146181144, |
|
"chrf": 26.535888048377064 |
|
}, |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.09614725376527729, |
|
"chrf": 26.35974604226704 |
|
}, |
|
{ |
|
"model": "mistralai/mistral-small-24b-instruct-2501", |
|
"bleu": 0.043920591728788254, |
|
"chrf": 15.171343812958735 |
|
}, |
|
{ |
|
"model": "google/gemini-2.0-flash-001", |
|
"bleu": 0.2843690426617385, |
|
"chrf": 43.51952547276378 |
|
}, |
|
{ |
|
"model": "deepseek/deepseek-chat", |
|
"bleu": 0.10072669531344912, |
|
"chrf": 24.778318092682298 |
|
}, |
|
{ |
|
"model": "microsoft/phi-4", |
|
"bleu": 0.0708900783780892, |
|
"chrf": 24.114324582460767 |
|
} |
|
], |
|
"bleu": 0.12041724607757613, |
|
"chrf": 26.746524341918285, |
|
"commonvoice_hours": 0.0, |
|
"commonvoice_locale": "ts", |
|
"population": { |
|
"MZ": 2377758, |
|
"SZ": 18776, |
|
"ZA": 2484398 |
|
} |
|
}, |
|
{ |
|
"language_name": "Balinese", |
|
"bcp_47": "ban", |
|
"speakers": 4806468, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.20937766416587725, |
|
"chrf": 37.802202729584685 |
|
} |
|
], |
|
"bleu": 0.20937766416587725, |
|
"chrf": 37.802202729584685, |
|
"commonvoice_hours": null, |
|
"commonvoice_locale": null, |
|
"population": { |
|
"ID": 4806468 |
|
} |
|
}, |
|
{ |
|
"language_name": "Ewe", |
|
"bcp_47": "ee", |
|
"speakers": 4690857, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.06328122760447334, |
|
"chrf": 21.930232101484705 |
|
} |
|
], |
|
"bleu": 0.06328122760447334, |
|
"chrf": 21.930232101484705, |
|
"commonvoice_hours": 0.0, |
|
"commonvoice_locale": "ee", |
|
"population": { |
|
"GH": 3227422, |
|
"TG": 1463435 |
|
} |
|
}, |
|
{ |
|
"language_name": "Buginese", |
|
"bcp_47": "bug", |
|
"speakers": 4298211, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.11888625287150432, |
|
"chrf": 26.566035803697112 |
|
} |
|
], |
|
"bleu": 0.11888625287150432, |
|
"chrf": 26.566035803697112, |
|
"commonvoice_hours": null, |
|
"commonvoice_locale": null, |
|
"population": { |
|
"ID": 4272416, |
|
"MY": 25795 |
|
} |
|
}, |
|
{ |
|
"language_name": "Goan Konkani", |
|
"bcp_47": "gom", |
|
"speakers": 4243488, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.17517997036818814, |
|
"chrf": 35.662782661637515 |
|
} |
|
], |
|
"bleu": 0.17517997036818814, |
|
"chrf": 35.662782661637515, |
|
"commonvoice_hours": 0.0, |
|
"commonvoice_locale": "gom", |
|
"population": { |
|
"IN": 4243488 |
|
} |
|
}, |
|
{ |
|
"language_name": "Kamba", |
|
"bcp_47": "kam", |
|
"speakers": 4068120, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.09766297423802607, |
|
"chrf": 24.328994687372596 |
|
} |
|
], |
|
"bleu": 0.09766297423802607, |
|
"chrf": 24.328994687372596, |
|
"commonvoice_hours": null, |
|
"commonvoice_locale": null, |
|
"population": { |
|
"KE": 4068120 |
|
} |
|
}, |
|
{ |
|
"language_name": "Banjar", |
|
"bcp_47": "bjn", |
|
"speakers": 4010288, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.21429523594040997, |
|
"chrf": 37.997802850700054 |
|
} |
|
], |
|
"bleu": 0.21429523594040997, |
|
"chrf": 37.997802850700054, |
|
"commonvoice_hours": null, |
|
"commonvoice_locale": null, |
|
"population": { |
|
"ID": 4005390, |
|
"MY": 4898 |
|
} |
|
}, |
|
{ |
|
"language_name": "Lombard", |
|
"bcp_47": "lmo", |
|
"speakers": 3901518, |
|
"scores": [ |
|
{ |
|
"model": "openai/gpt-4o-mini", |
|
"bleu": 0.19986098660959015, |
|
"chrf": 38.27348032712485 |
|
}, |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.21159778572935684, |
|
"chrf": 40.44461475492081 |
|
}, |
|
{ |
|
"model": "mistralai/mistral-small-24b-instruct-2501", |
|
"bleu": 0.1588300738463149, |
|
"chrf": 31.614789846388156 |
|
}, |
|
{ |
|
"model": "google/gemini-2.0-flash-001", |
|
"bleu": 0.30563834118855027, |
|
"chrf": 47.111364119506355 |
|
}, |
|
{ |
|
"model": "deepseek/deepseek-chat", |
|
"bleu": 0.22666325208418955, |
|
"chrf": 42.07703156302399 |
|
}, |
|
{ |
|
"model": "microsoft/phi-4", |
|
"bleu": 0.18882590620933629, |
|
"chrf": 37.12550972377164 |
|
} |
|
], |
|
"bleu": 0.215236057611223, |
|
"chrf": 39.44113172245597, |
|
"commonvoice_hours": null, |
|
"commonvoice_locale": null, |
|
"population": { |
|
"CH": 344564, |
|
"IT": 3556954 |
|
} |
|
}, |
|
{ |
|
"language_name": "Achinese", |
|
"bcp_47": "ace", |
|
"speakers": 3738364, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.16911632683538352, |
|
"chrf": 35.055560798896856 |
|
} |
|
], |
|
"bleu": 0.16911632683538352, |
|
"chrf": 35.055560798896856, |
|
"commonvoice_hours": 0.0, |
|
"commonvoice_locale": "ace", |
|
"population": { |
|
"ID": 3738364 |
|
} |
|
}, |
|
{ |
|
"language_name": "Shan", |
|
"bcp_47": "shn", |
|
"speakers": 3687984, |
|
"scores": [ |
|
{ |
|
"model": "openai/gpt-4o-mini", |
|
"bleu": 0.03567194702202585, |
|
"chrf": 15.061253284595894 |
|
}, |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.14589621017705648, |
|
"chrf": 32.36640913542123 |
|
}, |
|
{ |
|
"model": "mistralai/mistral-small-24b-instruct-2501", |
|
"bleu": 0.011114664716630177, |
|
"chrf": 9.54345606166579 |
|
}, |
|
{ |
|
"model": "google/gemini-2.0-flash-001", |
|
"bleu": 0.24688742301342204, |
|
"chrf": 43.47153430068834 |
|
}, |
|
{ |
|
"model": "deepseek/deepseek-chat", |
|
"bleu": 0.11534595629433392, |
|
"chrf": 32.685789872044445 |
|
}, |
|
{ |
|
"model": "microsoft/phi-4", |
|
"bleu": 0.06564720827517354, |
|
"chrf": 21.409820368208937 |
|
} |
|
], |
|
"bleu": 0.10342723491644035, |
|
"chrf": 25.756377170437435, |
|
"commonvoice_hours": 0.0, |
|
"commonvoice_locale": "shn", |
|
"population": { |
|
"MM": 3621766, |
|
"TH": 66218 |
|
} |
|
}, |
|
{ |
|
"language_name": "Georgian", |
|
"bcp_47": "ka", |
|
"speakers": 3543646, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.22489436376782782, |
|
"chrf": 42.05355918136569 |
|
} |
|
], |
|
"bleu": 0.22489436376782782, |
|
"chrf": 42.05355918136569, |
|
"commonvoice_hours": 158.0, |
|
"commonvoice_locale": "ka", |
|
"population": { |
|
"GE": 3437420, |
|
"IR": 60296, |
|
"TR": 45930 |
|
} |
|
}, |
|
{ |
|
"language_name": "Galician", |
|
"bcp_47": "gl", |
|
"speakers": 3515530, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.2463790593991139, |
|
"chrf": 43.16984633200989 |
|
} |
|
], |
|
"bleu": 0.2463790593991139, |
|
"chrf": 43.16984633200989, |
|
"commonvoice_hours": 109.0, |
|
"commonvoice_locale": "gl", |
|
"population": { |
|
"ES": 3501106, |
|
"PT": 14424 |
|
} |
|
}, |
|
{ |
|
"language_name": "Lingala", |
|
"bcp_47": "ln", |
|
"speakers": 3514491, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.10115588577551943, |
|
"chrf": 26.041173534129616 |
|
} |
|
], |
|
"bleu": 0.10115588577551943, |
|
"chrf": 26.041173534129616, |
|
"commonvoice_hours": 0.0, |
|
"commonvoice_locale": "ln", |
|
"population": { |
|
"AO": 217899, |
|
"CD": 3155180, |
|
"CF": 14378, |
|
"CG": 127034 |
|
} |
|
}, |
|
{ |
|
"language_name": "Kabyle", |
|
"bcp_47": "kab", |
|
"speakers": 3351886, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.03368838568519845, |
|
"chrf": 17.84430440143716 |
|
} |
|
], |
|
"bleu": 0.03368838568519845, |
|
"chrf": 17.84430440143716, |
|
"commonvoice_hours": 571.0, |
|
"commonvoice_locale": "kab", |
|
"population": { |
|
"DZ": 3351886 |
|
} |
|
}, |
|
{ |
|
"language_name": "Kyrgyz", |
|
"bcp_47": "ky", |
|
"speakers": 3338267, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.21002212869070494, |
|
"chrf": 39.3726736717899 |
|
} |
|
], |
|
"bleu": 0.21002212869070494, |
|
"chrf": 39.3726736717899, |
|
"commonvoice_hours": 39.0, |
|
"commonvoice_locale": "ky", |
|
"population": { |
|
"CN": 473967, |
|
"KG": 2863152, |
|
"TR": 1148 |
|
} |
|
}, |
|
{ |
|
"language_name": "Fon", |
|
"bcp_47": "fon", |
|
"speakers": 3216150, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.0832678269022026, |
|
"chrf": 21.627442109362057 |
|
} |
|
], |
|
"bleu": 0.0832678269022026, |
|
"chrf": 21.627442109362057, |
|
"commonvoice_hours": null, |
|
"commonvoice_locale": null, |
|
"population": { |
|
"BJ": 3216150 |
|
} |
|
}, |
|
{ |
|
"language_name": "Waray", |
|
"bcp_47": "war", |
|
"speakers": 3166927, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.2156899984074879, |
|
"chrf": 38.73293471051519 |
|
} |
|
], |
|
"bleu": 0.2156899984074879, |
|
"chrf": 38.73293471051519, |
|
"commonvoice_hours": null, |
|
"commonvoice_locale": null, |
|
"population": { |
|
"CA": 678, |
|
"PH": 3166249 |
|
} |
|
}, |
|
{ |
|
"language_name": "Tibetan", |
|
"bcp_47": "bo", |
|
"speakers": 3006697, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.11883469874802492, |
|
"chrf": 29.188000714511094 |
|
} |
|
], |
|
"bleu": 0.11883469874802492, |
|
"chrf": 29.188000714511094, |
|
"commonvoice_hours": 0.0, |
|
"commonvoice_locale": "bo", |
|
"population": { |
|
"CN": 2788040, |
|
"IN": 145870, |
|
"NP": 72787 |
|
} |
|
}, |
|
{ |
|
"language_name": "Sango", |
|
"bcp_47": "sg", |
|
"speakers": 2935521, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.052708457503892185, |
|
"chrf": 21.077342933150366 |
|
} |
|
], |
|
"bleu": 0.052708457503892185, |
|
"chrf": 21.077342933150366, |
|
"commonvoice_hours": null, |
|
"commonvoice_locale": null, |
|
"population": { |
|
"CF": 2935521 |
|
} |
|
}, |
|
{ |
|
"language_name": "Aymara", |
|
"bcp_47": "ay", |
|
"speakers": 2838620, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.07563412710891973, |
|
"chrf": 23.042901816075858 |
|
} |
|
], |
|
"bleu": 0.07563412710891973, |
|
"chrf": 23.042901816075858, |
|
"commonvoice_hours": null, |
|
"commonvoice_locale": null, |
|
"population": { |
|
"BO": 2327980, |
|
"PE": 510640 |
|
} |
|
}, |
|
{ |
|
"language_name": "Dogri", |
|
"bcp_47": "doi", |
|
"speakers": 2652180, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.18698274115592, |
|
"chrf": 36.17811444987121 |
|
} |
|
], |
|
"bleu": 0.18698274115592, |
|
"chrf": 36.17811444987121, |
|
"commonvoice_hours": null, |
|
"commonvoice_locale": null, |
|
"population": { |
|
"IN": 2652180 |
|
} |
|
}, |
|
{ |
|
"language_name": "Lithuanian", |
|
"bcp_47": "lt", |
|
"speakers": 2488617, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.23629191535308328, |
|
"chrf": 41.457632804056466 |
|
} |
|
], |
|
"bleu": 0.23629191535308328, |
|
"chrf": 41.457632804056466, |
|
"commonvoice_hours": 25.0, |
|
"commonvoice_locale": "lt", |
|
"population": { |
|
"GB": 131522, |
|
"LT": 2349056, |
|
"PL": 8039 |
|
} |
|
}, |
|
{ |
|
"language_name": "Swati", |
|
"bcp_47": "ss", |
|
"speakers": 2212379, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.10571792263190831, |
|
"chrf": 26.72182646364123 |
|
} |
|
], |
|
"bleu": 0.10571792263190831, |
|
"chrf": 26.72182646364123, |
|
"commonvoice_hours": 0.0, |
|
"commonvoice_locale": "ss", |
|
"population": { |
|
"LS": 47264, |
|
"SZ": 640598, |
|
"ZA": 1524517 |
|
} |
|
}, |
|
{ |
|
"language_name": "Occitan", |
|
"bcp_47": "oc", |
|
"speakers": 2040398, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.3116700967049491, |
|
"chrf": 49.33859359679982 |
|
} |
|
], |
|
"bleu": 0.3116700967049491, |
|
"chrf": 49.33859359679982, |
|
"commonvoice_hours": 1.8, |
|
"commonvoice_locale": "oc", |
|
"population": { |
|
"ES": 4952, |
|
"FR": 2035446 |
|
} |
|
}, |
|
{ |
|
"language_name": "Tatar", |
|
"bcp_47": "tt", |
|
"speakers": 1984108, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.20199966692246552, |
|
"chrf": 38.969447814905855 |
|
} |
|
], |
|
"bleu": 0.20199966692246552, |
|
"chrf": 38.969447814905855, |
|
"commonvoice_hours": 32.0, |
|
"commonvoice_locale": "tt", |
|
"population": { |
|
"RU": 1984108 |
|
} |
|
}, |
|
{ |
|
"language_name": "Slovenian", |
|
"bcp_47": "sl", |
|
"speakers": 1973181, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.25710751649810404, |
|
"chrf": 43.97419502631293 |
|
} |
|
], |
|
"bleu": 0.25710751649810404, |
|
"chrf": 43.97419502631293, |
|
"commonvoice_hours": 17.0, |
|
"commonvoice_locale": "sl", |
|
"population": { |
|
"AT": 32780, |
|
"HU": 4984, |
|
"IT": 106085, |
|
"SI": 1829332 |
|
} |
|
}, |
|
{ |
|
"language_name": "Bodo", |
|
"bcp_47": "brx", |
|
"speakers": 1856526, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.07193315161893905, |
|
"chrf": 21.198050861825372 |
|
} |
|
], |
|
"bleu": 0.07193315161893905, |
|
"chrf": 21.198050861825372, |
|
"commonvoice_hours": null, |
|
"commonvoice_locale": null, |
|
"population": { |
|
"IN": 1856526 |
|
} |
|
}, |
|
{ |
|
"language_name": "Chuvash", |
|
"bcp_47": "cv", |
|
"speakers": 1842386, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.16319209573807847, |
|
"chrf": 35.5605244185656 |
|
} |
|
], |
|
"bleu": 0.16319209573807847, |
|
"chrf": 35.5605244185656, |
|
"commonvoice_hours": 27.0, |
|
"commonvoice_locale": "cv", |
|
"population": { |
|
"RU": 1842386 |
|
} |
|
}, |
|
{ |
|
"language_name": "Bashkir", |
|
"bcp_47": "ba", |
|
"speakers": 1842386, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.23494956875272427, |
|
"chrf": 43.58361096793536 |
|
} |
|
], |
|
"bleu": 0.23494956875272427, |
|
"chrf": 43.58361096793536, |
|
"commonvoice_hours": 259.0, |
|
"commonvoice_locale": "ba", |
|
"population": { |
|
"RU": 1842386 |
|
} |
|
}, |
|
{ |
|
"language_name": "Tumbuka", |
|
"bcp_47": "tum", |
|
"speakers": 1780514, |
|
"scores": [ |
|
{ |
|
"model": "openai/gpt-4o-mini", |
|
"bleu": 0.09211959148198216, |
|
"chrf": 25.078974624106454 |
|
}, |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.08953119623294435, |
|
"chrf": 26.60406076382521 |
|
}, |
|
{ |
|
"model": "mistralai/mistral-small-24b-instruct-2501", |
|
"bleu": 0.036353192983993324, |
|
"chrf": 15.247949668242475 |
|
}, |
|
{ |
|
"model": "google/gemini-2.0-flash-001", |
|
"bleu": 0.21852974820220555, |
|
"chrf": 40.790711915222424 |
|
}, |
|
{ |
|
"model": "deepseek/deepseek-chat", |
|
"bleu": 0.13308678184347988, |
|
"chrf": 31.89595169117875 |
|
}, |
|
{ |
|
"model": "microsoft/phi-4", |
|
"bleu": 0.06252197708878435, |
|
"chrf": 23.417269345311365 |
|
} |
|
], |
|
"bleu": 0.10535708130556494, |
|
"chrf": 27.172486334647783, |
|
"commonvoice_hours": null, |
|
"commonvoice_locale": null, |
|
"population": { |
|
"MW": 1780514 |
|
} |
|
}, |
|
{ |
|
"language_name": "Macedonian", |
|
"bcp_47": "mk", |
|
"speakers": 1608565, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.2635416107541368, |
|
"chrf": 46.15461303306508 |
|
} |
|
], |
|
"bleu": 0.2635416107541368, |
|
"chrf": 46.15461303306508, |
|
"commonvoice_hours": 18.0, |
|
"commonvoice_locale": "mk", |
|
"population": { |
|
"AL": 14451, |
|
"GR": 169714, |
|
"MK": 1424400 |
|
} |
|
}, |
|
{ |
|
"language_name": "Pangasinan", |
|
"bcp_47": "pag", |
|
"speakers": 1528534, |
|
"scores": [ |
|
{ |
|
"model": "openai/gpt-4o-mini", |
|
"bleu": 0.14637588345836686, |
|
"chrf": 33.27328635596556 |
|
}, |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.17061619096272593, |
|
"chrf": 35.63408741214199 |
|
}, |
|
{ |
|
"model": "mistralai/mistral-small-24b-instruct-2501", |
|
"bleu": 0.11313843155080379, |
|
"chrf": 26.507505375137484 |
|
}, |
|
{ |
|
"model": "google/gemini-2.0-flash-001", |
|
"bleu": 0.27369890360254523, |
|
"chrf": 44.34141738332121 |
|
}, |
|
{ |
|
"model": "deepseek/deepseek-chat", |
|
"bleu": 0.19116528491340065, |
|
"chrf": 36.672507303893106 |
|
}, |
|
{ |
|
"model": "microsoft/phi-4", |
|
"bleu": 0.11054650956119119, |
|
"chrf": 30.67803234997905 |
|
} |
|
], |
|
"bleu": 0.16759020067483896, |
|
"chrf": 34.51780603007307, |
|
"commonvoice_hours": null, |
|
"commonvoice_locale": null, |
|
"population": { |
|
"PH": 1528534 |
|
} |
|
}, |
|
{ |
|
"language_name": "Manipuri", |
|
"bcp_47": "mni", |
|
"speakers": 1476591, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.061702153982680315, |
|
"chrf": 20.627265799751633 |
|
} |
|
], |
|
"bleu": 0.061702153982680315, |
|
"chrf": 20.627265799751633, |
|
"commonvoice_hours": 0.0, |
|
"commonvoice_locale": "mni", |
|
"population": { |
|
"BD": 17892, |
|
"IN": 1458699 |
|
} |
|
}, |
|
{ |
|
"language_name": "Venetian", |
|
"bcp_47": "vec", |
|
"speakers": 1380829, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.24764447442173138, |
|
"chrf": 41.97335861313842 |
|
} |
|
], |
|
"bleu": 0.24764447442173138, |
|
"chrf": 41.97335861313842, |
|
"commonvoice_hours": 0.0, |
|
"commonvoice_locale": "vec", |
|
"population": { |
|
"BR": 508118, |
|
"HR": 29594, |
|
"IT": 811235, |
|
"MX": 2444, |
|
"SI": 29438 |
|
} |
|
}, |
|
{ |
|
"language_name": "Norwegian Nynorsk", |
|
"bcp_47": "nn", |
|
"speakers": 1366860, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.31661912673403325, |
|
"chrf": 48.792392911852595 |
|
} |
|
], |
|
"bleu": 0.31661912673403325, |
|
"chrf": 48.792392911852595, |
|
"commonvoice_hours": 1.5, |
|
"commonvoice_locale": "nn-NO", |
|
"population": { |
|
"NO": 1366860 |
|
} |
|
}, |
|
{ |
|
"language_name": "Irish", |
|
"bcp_47": "ga", |
|
"speakers": 1237487, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.2768559181644857, |
|
"chrf": 46.47151564403362 |
|
} |
|
], |
|
"bleu": 0.2768559181644857, |
|
"chrf": 46.47151564403362, |
|
"commonvoice_hours": 5.8, |
|
"commonvoice_locale": "ga-IE", |
|
"population": { |
|
"GB": 98642, |
|
"IE": 1138845 |
|
} |
|
}, |
|
{ |
|
"language_name": "Latvian", |
|
"bcp_47": "lv", |
|
"speakers": 1147550, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.23200427142275887, |
|
"chrf": 44.00679383253316 |
|
} |
|
], |
|
"bleu": 0.23200427142275887, |
|
"chrf": 44.00679383253316, |
|
"commonvoice_hours": 260.0, |
|
"commonvoice_locale": "lv", |
|
"population": { |
|
"LV": 1147550 |
|
} |
|
}, |
|
{ |
|
"language_name": "Basque", |
|
"bcp_47": "eu", |
|
"speakers": 1088519, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.1907277513380933, |
|
"chrf": 40.633564870804214 |
|
} |
|
], |
|
"bleu": 0.1907277513380933, |
|
"chrf": 40.633564870804214, |
|
"commonvoice_hours": 335.0, |
|
"commonvoice_locale": "eu", |
|
"population": { |
|
"ES": 1000316, |
|
"FR": 88203 |
|
} |
|
}, |
|
{ |
|
"language_name": "Sardinian", |
|
"bcp_47": "sc", |
|
"speakers": 1060846, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.2003666163856343, |
|
"chrf": 39.97859549386356 |
|
} |
|
], |
|
"bleu": 0.2003666163856343, |
|
"chrf": 39.97859549386356, |
|
"commonvoice_hours": 2.9, |
|
"commonvoice_locale": "sc", |
|
"population": { |
|
"IT": 1060846 |
|
} |
|
}, |
|
{ |
|
"language_name": "Najdi Arabic", |
|
"bcp_47": "ars", |
|
"speakers": 1025205, |
|
"scores": [ |
|
{ |
|
"model": "openai/gpt-4o-mini", |
|
"bleu": 0.26325866988203733, |
|
"chrf": 45.79452460253912 |
|
}, |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.25411630061861235, |
|
"chrf": 45.68081123321704 |
|
}, |
|
{ |
|
"model": "mistralai/mistral-small-24b-instruct-2501", |
|
"bleu": 0.19634428413472024, |
|
"chrf": 37.402576382999925 |
|
}, |
|
{ |
|
"model": "google/gemini-2.0-flash-001", |
|
"bleu": 0.3267312117229826, |
|
"chrf": 50.07524798517934 |
|
}, |
|
{ |
|
"model": "deepseek/deepseek-chat", |
|
"bleu": 0.27947088689796734, |
|
"chrf": 47.70370329275568 |
|
}, |
|
{ |
|
"model": "microsoft/phi-4", |
|
"bleu": 0.23043700347741075, |
|
"chrf": 40.64509062227617 |
|
} |
|
], |
|
"bleu": 0.2583930594556218, |
|
"chrf": 44.550325686494546, |
|
"commonvoice_hours": null, |
|
"commonvoice_locale": null, |
|
"population": { |
|
"SA": 1025205 |
|
} |
|
}, |
|
{ |
|
"language_name": "Yiddish", |
|
"bcp_47": "yi", |
|
"speakers": 997214, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.2748989006328114, |
|
"chrf": 44.151717001541904 |
|
} |
|
], |
|
"bleu": 0.2748989006328114, |
|
"chrf": 44.151717001541904, |
|
"commonvoice_hours": 0.5, |
|
"commonvoice_locale": "yi", |
|
"population": { |
|
"IL": 260264, |
|
"SE": 2959, |
|
"UA": 570998, |
|
"US": 162993 |
|
} |
|
}, |
|
{ |
|
"language_name": "Kachin", |
|
"bcp_47": "kac", |
|
"speakers": 962032, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.06343642810657522, |
|
"chrf": 21.96116119019238 |
|
} |
|
], |
|
"bleu": 0.06343642810657522, |
|
"chrf": 21.96116119019238, |
|
"commonvoice_hours": null, |
|
"commonvoice_locale": null, |
|
"population": { |
|
"MM": 962032 |
|
} |
|
}, |
|
{ |
|
"language_name": "Limburgish", |
|
"bcp_47": "li", |
|
"speakers": 950422, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.28017358847160223, |
|
"chrf": 45.82764538788154 |
|
} |
|
], |
|
"bleu": 0.28017358847160223, |
|
"chrf": 45.82764538788154, |
|
"commonvoice_hours": null, |
|
"commonvoice_locale": null, |
|
"population": { |
|
"NL": 950422 |
|
} |
|
}, |
|
{ |
|
"language_name": "Welsh", |
|
"bcp_47": "cy", |
|
"speakers": 884910, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.31667961925197524, |
|
"chrf": 48.49344578612579 |
|
} |
|
], |
|
"bleu": 0.31667961925197524, |
|
"chrf": 48.49344578612579, |
|
"commonvoice_hours": 124.0, |
|
"commonvoice_locale": "cy", |
|
"population": { |
|
"AR": 30016, |
|
"GB": 854894 |
|
} |
|
}, |
|
{ |
|
"language_name": "Estonian", |
|
"bcp_47": "et", |
|
"speakers": 878449, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.23762161272302187, |
|
"chrf": 42.90409268311042 |
|
} |
|
], |
|
"bleu": 0.23762161272302187, |
|
"chrf": 42.90409268311042, |
|
"commonvoice_hours": 58.0, |
|
"commonvoice_locale": "et", |
|
"population": { |
|
"EE": 872320, |
|
"FI": 6129 |
|
} |
|
}, |
|
{ |
|
"language_name": "Asturian", |
|
"bcp_47": "ast", |
|
"speakers": 650205, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.3066166431048003, |
|
"chrf": 47.792858053998366 |
|
} |
|
], |
|
"bleu": 0.3066166431048003, |
|
"chrf": 47.792858053998366, |
|
"commonvoice_hours": 0.7, |
|
"commonvoice_locale": "ast", |
|
"population": { |
|
"ES": 650205 |
|
} |
|
}, |
|
{ |
|
"language_name": "N’Ko", |
|
"bcp_47": "nqo", |
|
"speakers": 626370, |
|
"scores": [ |
|
{ |
|
"model": "openai/gpt-4o-mini", |
|
"bleu": 0.0026829540009563496, |
|
"chrf": 8.366238228343608 |
|
}, |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.0028810767141941676, |
|
"chrf": 11.711522538883516 |
|
}, |
|
{ |
|
"model": "mistralai/mistral-small-24b-instruct-2501", |
|
"bleu": 0.002244809403558117, |
|
"chrf": 6.87154254960649 |
|
}, |
|
{ |
|
"model": "google/gemini-2.0-flash-001", |
|
"bleu": 0.1373860974763018, |
|
"chrf": 29.63649387292498 |
|
}, |
|
{ |
|
"model": "deepseek/deepseek-chat", |
|
"bleu": 0.005449384832055512, |
|
"chrf": 13.63303465097306 |
|
}, |
|
{ |
|
"model": "microsoft/phi-4", |
|
"bleu": 0.001220306675003964, |
|
"chrf": 11.614232149229839 |
|
} |
|
], |
|
"bleu": 0.02531077151701165, |
|
"chrf": 13.638843998326914, |
|
"commonvoice_hours": 0.0, |
|
"commonvoice_locale": "nqo", |
|
"population": { |
|
"GN": 626370 |
|
} |
|
}, |
|
{ |
|
"language_name": "Nuer", |
|
"bcp_47": "nus", |
|
"speakers": 591427, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.04422064781985695, |
|
"chrf": 18.101658717442856 |
|
} |
|
], |
|
"bleu": 0.04422064781985695, |
|
"chrf": 18.101658717442856, |
|
"commonvoice_hours": null, |
|
"commonvoice_locale": null, |
|
"population": { |
|
"SS": 591427 |
|
} |
|
}, |
|
{ |
|
"language_name": "Ligurian", |
|
"bcp_47": "lij", |
|
"speakers": 536663, |
|
"scores": [ |
|
{ |
|
"model": "openai/gpt-4o-mini", |
|
"bleu": 0.2433180508520944, |
|
"chrf": 42.16628456571689 |
|
}, |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.2730358021257564, |
|
"chrf": 43.59770121161605 |
|
}, |
|
{ |
|
"model": "mistralai/mistral-small-24b-instruct-2501", |
|
"bleu": 0.1659569541464764, |
|
"chrf": 32.04882604989477 |
|
}, |
|
{ |
|
"model": "google/gemini-2.0-flash-001", |
|
"bleu": 0.3868854055493315, |
|
"chrf": 52.982923067584665 |
|
}, |
|
{ |
|
"model": "deepseek/deepseek-chat", |
|
"bleu": 0.30131335750773747, |
|
"chrf": 47.80059076162273 |
|
}, |
|
{ |
|
"model": "microsoft/phi-4", |
|
"bleu": 0.22953082347299453, |
|
"chrf": 39.89195612874355 |
|
} |
|
], |
|
"bleu": 0.26667339894239844, |
|
"chrf": 43.08138029752978, |
|
"commonvoice_hours": 5.1, |
|
"commonvoice_locale": "lij", |
|
"population": { |
|
"IT": 536663 |
|
} |
|
}, |
|
{ |
|
"language_name": "Kabuverdianu", |
|
"bcp_47": "kea", |
|
"speakers": 530762, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.2049568393036302, |
|
"chrf": 39.12735936405683 |
|
} |
|
], |
|
"bleu": 0.2049568393036302, |
|
"chrf": 39.12735936405683, |
|
"commonvoice_hours": null, |
|
"commonvoice_locale": null, |
|
"population": { |
|
"CV": 530762 |
|
} |
|
}, |
|
{ |
|
"language_name": "Mari", |
|
"bcp_47": "chm", |
|
"speakers": 524371, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.1477332953533076, |
|
"chrf": 33.28969144955911 |
|
} |
|
], |
|
"bleu": 0.1477332953533076, |
|
"chrf": 33.28969144955911, |
|
"commonvoice_hours": 282.0, |
|
"commonvoice_locale": "mhr", |
|
"population": { |
|
"RU": 524371 |
|
} |
|
}, |
|
{ |
|
"language_name": "Sicilian", |
|
"bcp_47": "scn", |
|
"speakers": 511702, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.26991391704955275, |
|
"chrf": 44.10988575231252 |
|
} |
|
], |
|
"bleu": 0.26991391704955275, |
|
"chrf": 44.10988575231252, |
|
"commonvoice_hours": 0.0, |
|
"commonvoice_locale": "scn", |
|
"population": { |
|
"IT": 511702 |
|
} |
|
}, |
|
{ |
|
"language_name": "Silesian", |
|
"bcp_47": "szl", |
|
"speakers": 497670, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.2478859256009672, |
|
"chrf": 42.936549641246145 |
|
} |
|
], |
|
"bleu": 0.2478859256009672, |
|
"chrf": 42.936549641246145, |
|
"commonvoice_hours": null, |
|
"commonvoice_locale": null, |
|
"population": { |
|
"PL": 497670 |
|
} |
|
}, |
|
{ |
|
"language_name": "Maltese", |
|
"bcp_47": "mt", |
|
"speakers": 457267, |
|
"scores": [ |
|
{ |
|
"model": "openai/gpt-4o-mini", |
|
"bleu": 0.27335683193570975, |
|
"chrf": 45.920903610737895 |
|
}, |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.28654849898846085, |
|
"chrf": 46.936205424540766 |
|
}, |
|
{ |
|
"model": "mistralai/mistral-small-24b-instruct-2501", |
|
"bleu": 0.15248109554681186, |
|
"chrf": 30.516627088468166 |
|
}, |
|
{ |
|
"model": "google/gemini-2.0-flash-001", |
|
"bleu": 0.38954095833662916, |
|
"chrf": 54.945196672005885 |
|
}, |
|
{ |
|
"model": "deepseek/deepseek-chat", |
|
"bleu": 0.3175303995061197, |
|
"chrf": 51.04064318379729 |
|
}, |
|
{ |
|
"model": "microsoft/phi-4", |
|
"bleu": 0.11179045198515461, |
|
"chrf": 30.191257026189298 |
|
} |
|
], |
|
"bleu": 0.2552080393831477, |
|
"chrf": 43.25847216762322, |
|
"commonvoice_hours": 8.7, |
|
"commonvoice_locale": "mt", |
|
"population": { |
|
"MT": 457267 |
|
} |
|
}, |
|
{ |
|
"language_name": "Luxembourgish", |
|
"bcp_47": "lb", |
|
"speakers": 421015, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.2835765541228824, |
|
"chrf": 44.80618475111259 |
|
} |
|
], |
|
"bleu": 0.2835765541228824, |
|
"chrf": 44.80618475111259, |
|
"commonvoice_hours": 0.0, |
|
"commonvoice_locale": "lb", |
|
"population": { |
|
"LU": 421015 |
|
} |
|
}, |
|
{ |
|
"language_name": "Dzongkha", |
|
"bcp_47": "dz", |
|
"speakers": 370341, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.05723633975042216, |
|
"chrf": 23.461346449303786 |
|
} |
|
], |
|
"bleu": 0.05723633975042216, |
|
"chrf": 23.461346449303786, |
|
"commonvoice_hours": null, |
|
"commonvoice_locale": null, |
|
"population": { |
|
"BT": 367689, |
|
"IN": 2652 |
|
} |
|
}, |
|
{ |
|
"language_name": "Fijian", |
|
"bcp_47": "fj", |
|
"speakers": 365030, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.10451524271139898, |
|
"chrf": 24.713018515709646 |
|
} |
|
], |
|
"bleu": 0.10451524271139898, |
|
"chrf": 24.713018515709646, |
|
"commonvoice_hours": null, |
|
"commonvoice_locale": null, |
|
"population": { |
|
"FJ": 365030 |
|
} |
|
}, |
|
{ |
|
"language_name": "Icelandic", |
|
"bcp_47": "is", |
|
"speakers": 350734, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.2142644347281729, |
|
"chrf": 40.04812999157868 |
|
} |
|
], |
|
"bleu": 0.2142644347281729, |
|
"chrf": 40.04812999157868, |
|
"commonvoice_hours": 0.1, |
|
"commonvoice_locale": "is", |
|
"population": { |
|
"IS": 350734 |
|
} |
|
}, |
|
{ |
|
"language_name": "Samoan", |
|
"bcp_47": "sm", |
|
"speakers": 252717, |
|
"scores": [ |
|
{ |
|
"model": "openai/gpt-4o-mini", |
|
"bleu": 0.13327372905795537, |
|
"chrf": 28.9583532166856 |
|
}, |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.11602460228698847, |
|
"chrf": 29.156949243212015 |
|
}, |
|
{ |
|
"model": "mistralai/mistral-small-24b-instruct-2501", |
|
"bleu": 0.05771585788755527, |
|
"chrf": 16.752178728973906 |
|
}, |
|
{ |
|
"model": "google/gemini-2.0-flash-001", |
|
"bleu": 0.2585259997356889, |
|
"chrf": 45.18784342425295 |
|
}, |
|
{ |
|
"model": "deepseek/deepseek-chat", |
|
"bleu": 0.22221137013078898, |
|
"chrf": 39.7496231353589 |
|
}, |
|
{ |
|
"model": "microsoft/phi-4", |
|
"bleu": 0.04756300118196289, |
|
"chrf": 21.060764155029197 |
|
} |
|
], |
|
"bleu": 0.13921909338015664, |
|
"chrf": 30.144285317252095, |
|
"commonvoice_hours": null, |
|
"commonvoice_locale": null, |
|
"population": { |
|
"AS": 48943, |
|
"WS": 203774 |
|
} |
|
}, |
|
{ |
|
"language_name": "Crimean Tatar", |
|
"bcp_47": "crh", |
|
"speakers": 245968, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.22725256040555009, |
|
"chrf": 42.07005703444819 |
|
} |
|
], |
|
"bleu": 0.22725256040555009, |
|
"chrf": 42.07005703444819, |
|
"commonvoice_hours": 0.0, |
|
"commonvoice_locale": "crh", |
|
"population": { |
|
"UA": 245968 |
|
} |
|
}, |
|
{ |
|
"language_name": "Papiamento", |
|
"bcp_47": "pap", |
|
"speakers": 211640, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.21648792499796674, |
|
"chrf": 41.57061175824069 |
|
} |
|
], |
|
"bleu": 0.21648792499796674, |
|
"chrf": 41.57061175824069, |
|
"commonvoice_hours": 0.0, |
|
"commonvoice_locale": "pap-AW", |
|
"population": { |
|
"AW": 72851, |
|
"BQ": 16200, |
|
"CW": 122589 |
|
} |
|
}, |
|
{ |
|
"language_name": "Latgalian", |
|
"bcp_47": "ltg", |
|
"speakers": 167429, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.13475273241606922, |
|
"chrf": 32.044009672423776 |
|
} |
|
], |
|
"bleu": 0.13475273241606922, |
|
"chrf": 32.044009672423776, |
|
"commonvoice_hours": 28.0, |
|
"commonvoice_locale": "ltg", |
|
"population": { |
|
"LV": 167429 |
|
} |
|
}, |
|
{ |
|
"language_name": "Māori", |
|
"bcp_47": "mi", |
|
"speakers": 137913, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.17610729049259877, |
|
"chrf": 35.01961886760811 |
|
} |
|
], |
|
"bleu": 0.17610729049259877, |
|
"chrf": 35.01961886760811, |
|
"commonvoice_hours": null, |
|
"commonvoice_locale": null, |
|
"population": { |
|
"NZ": 137913 |
|
} |
|
}, |
|
{ |
|
"language_name": "Scottish Gaelic", |
|
"bcp_47": "gd", |
|
"speakers": 72337, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.2154279041570466, |
|
"chrf": 37.40630914857015 |
|
} |
|
], |
|
"bleu": 0.2154279041570466, |
|
"chrf": 37.40630914857015, |
|
"commonvoice_hours": null, |
|
"commonvoice_locale": null, |
|
"population": { |
|
"GB": 72337 |
|
} |
|
}, |
|
{ |
|
"language_name": "Faroese", |
|
"bcp_47": "fo", |
|
"speakers": 71351, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.21180629663838063, |
|
"chrf": 39.28673819745006 |
|
} |
|
], |
|
"bleu": 0.21180629663838063, |
|
"chrf": 39.28673819745006, |
|
"commonvoice_hours": 0.0, |
|
"commonvoice_locale": "fo", |
|
"population": { |
|
"DK": 22304, |
|
"FO": 49047 |
|
} |
|
}, |
|
{ |
|
"language_name": "Friulian", |
|
"bcp_47": "fur", |
|
"speakers": 37442, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.2255876860328074, |
|
"chrf": 40.6191779521821 |
|
} |
|
], |
|
"bleu": 0.2255876860328074, |
|
"chrf": 40.6191779521821, |
|
"commonvoice_hours": null, |
|
"commonvoice_locale": null, |
|
"population": { |
|
"IT": 37442 |
|
} |
|
}, |
|
{ |
|
"language_name": "Sanskrit", |
|
"bcp_47": "sa", |
|
"speakers": 15913, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.14313294345831834, |
|
"chrf": 32.44676491537583 |
|
} |
|
], |
|
"bleu": 0.14313294345831834, |
|
"chrf": 32.44676491537583, |
|
"commonvoice_hours": null, |
|
"commonvoice_locale": null, |
|
"population": { |
|
"IN": 15913 |
|
} |
|
}, |
|
{ |
|
"language_name": "Esperanto", |
|
"bcp_47": "eo", |
|
"speakers": 301, |
|
"scores": [ |
|
{ |
|
"model": "meta-llama/llama-3.3-70b-instruct", |
|
"bleu": 0.27440987441620224, |
|
"chrf": 44.40715599582661 |
|
} |
|
], |
|
"bleu": 0.27440987441620224, |
|
"chrf": 44.40715599582661, |
|
"commonvoice_hours": 1436.0, |
|
"commonvoice_locale": "eo", |
|
"population": { |
|
"SM": 301 |
|
} |
|
} |
|
] |