diff --git "a/results.json" "b/results.json" new file mode 100644--- /dev/null +++ "b/results.json" @@ -0,0 +1,13710 @@ +{ + "tasks": [ + { + "task": "classification", + "metric": "accuracy", + "score": 0.5671296296296297, + "bcp_47": 42, + "model": 4 + }, + { + "task": "language_modeling", + "metric": "chrf", + "score": 0.9370067182020132, + "bcp_47": 42, + "model": 4 + }, + { + "task": "translation", + "metric": "bleu", + "score": 0.27639322299355507, + "bcp_47": 42, + "model": 4 + }, + { + "task": "translation", + "metric": "chrf", + "score": 0.44833214505324764, + "bcp_47": 42, + "model": 4 + } + ], + "models": [ + { + "model": "google/gemini-2.0-flash-001", + "task": "classification", + "metric": "accuracy", + "score": 0.8700000000000001, + "bcp_47": 10 + }, + { + "model": "google/gemini-2.0-flash-001", + "task": "language_modeling", + "metric": "chrf", + "score": 0.9555263008516499, + "bcp_47": 10 + }, + { + "model": "google/gemini-2.0-flash-001", + "task": "translation", + "metric": "bleu", + "score": 0.36418986768393896, + "bcp_47": 10 + }, + { + "model": "google/gemini-2.0-flash-001", + "task": "translation", + "metric": "chrf", + "score": 0.5257896349203012, + "bcp_47": 10 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "task": "classification", + "metric": "accuracy", + "score": 0.5087301587301587, + "bcp_47": 42 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "task": "language_modeling", + "metric": "chrf", + "score": 0.9382523459554147, + "bcp_47": 42 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "task": "translation", + "metric": "bleu", + "score": 0.2511829155327205, + "bcp_47": 42 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "task": "translation", + "metric": "chrf", + "score": 0.4313353245284424, + "bcp_47": 42 + }, + { + "model": "mistralai/mistral-small-24b-instruct-2501", + "task": "classification", + "metric": "accuracy", + "score": 0.5666666666666667, + "bcp_47": 10 + }, + { + "model": "mistralai/mistral-small-24b-instruct-2501", + "task": "language_modeling", + "metric": "chrf", + "score": 0.9046559534191477, + "bcp_47": 10 + }, + { + "model": "mistralai/mistral-small-24b-instruct-2501", + "task": "translation", + "metric": "bleu", + "score": 0.2612972853503233, + "bcp_47": 10 + }, + { + "model": "mistralai/mistral-small-24b-instruct-2501", + "task": "translation", + "metric": "chrf", + "score": 0.41659663566434596, + "bcp_47": 10 + }, + { + "model": "openai/gpt-4o-mini", + "task": "classification", + "metric": "accuracy", + "score": 0.51, + "bcp_47": 10 + }, + { + "model": "openai/gpt-4o-mini", + "task": "language_modeling", + "metric": "chrf", + "score": 0.9456062637709552, + "bcp_47": 10 + }, + { + "model": "openai/gpt-4o-mini", + "task": "translation", + "metric": "bleu", + "score": 0.30957580728190814, + "bcp_47": 10 + }, + { + "model": "openai/gpt-4o-mini", + "task": "translation", + "metric": "chrf", + "score": 0.4739968107792783, + "bcp_47": 10 + } + ], + "languages": [ + { + "bcp_47": "aa", + "speakers": 2119663, + "language_name": "Afar", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 0.0, + "commonvoice_locale": "aa", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "ab", + "speakers": 91953, + "language_name": "Abkhazian", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 67.0, + "commonvoice_locale": "ab", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "abr", + "speakers": 1467010, + "language_name": "Abron", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "ace", + "speakers": 3738364, + "language_name": "Achinese", + "flores_path": "ace_Latn", + "fleurs_tag": null, + "commonvoice_hours": 0.0, + "commonvoice_locale": "ace", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "ach", + "speakers": 1600361, + "language_name": "Acoli", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "ada", + "speakers": 880206, + "language_name": "Adangme", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "ady", + "speakers": 444583, + "language_name": "Adyghe", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 12.0, + "commonvoice_locale": "ady", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "aeb", + "speakers": 10549080, + "language_name": "Tunisian Arabic", + "flores_path": "aeb_Arab", + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "af", + "speakers": 9318845, + "language_name": "Afrikaans", + "flores_path": "afr_Latn", + "fleurs_tag": "af_za", + "commonvoice_hours": 0.5, + "commonvoice_locale": "af", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "agq", + "speakers": 38843, + "language_name": "Aghem", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "ak", + "speakers": 11442678, + "language_name": "Akan", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 0.1, + "commonvoice_locale": "tw", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "aln", + "speakers": 1430250, + "language_name": "Gheg Albanian", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 0.0, + "commonvoice_locale": "aln", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "alt", + "speakers": 19841, + "language_name": "Southern Altai", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "am", + "speakers": 35728475, + "language_name": "Amharic", + "flores_path": "amh_Ethi", + "fleurs_tag": "am_et", + "commonvoice_hours": 1.8, + "commonvoice_locale": "am", + "in_benchmark": true, + "task": "classification", + "metric": "accuracy", + "score": 0.36666666666666664, + "model": 1.0 + }, + { + "bcp_47": "am", + "speakers": 35728475, + "language_name": "Amharic", + "flores_path": "amh_Ethi", + "fleurs_tag": "am_et", + "commonvoice_hours": 1.8, + "commonvoice_locale": "am", + "in_benchmark": true, + "task": "language_modeling", + "metric": "chrf", + "score": 0.9031129205404201, + "model": 1.0 + }, + { + "bcp_47": "am", + "speakers": 35728475, + "language_name": "Amharic", + "flores_path": "amh_Ethi", + "fleurs_tag": "am_et", + "commonvoice_hours": 1.8, + "commonvoice_locale": "am", + "in_benchmark": true, + "task": "translation", + "metric": "bleu", + "score": 0.15002522598066087, + "model": 1.0 + }, + { + "bcp_47": "am", + "speakers": 35728475, + "language_name": "Amharic", + "flores_path": "amh_Ethi", + "fleurs_tag": "am_et", + "commonvoice_hours": 1.8, + "commonvoice_locale": "am", + "in_benchmark": true, + "task": "translation", + "metric": "chrf", + "score": 0.3344555209113584, + "model": 1.0 + }, + { + "bcp_47": "amo", + "speakers": 18620, + "language_name": "Amo", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "an", + "speakers": 26008, + "language_name": "Aragonese", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 13.0, + "commonvoice_locale": "an", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "ann", + "speakers": 0, + "language_name": "Obolo", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "aoz", + "speakers": 720970, + "language_name": "Uab Meto", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "apc", + "speakers": 39031474, + "language_name": "North Levantine Arabic", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "ar", + "speakers": 351664197, + "language_name": "Arabic", + "flores_path": "arb_Arab", + "fleurs_tag": "ar_eg", + "commonvoice_hours": 92.0, + "commonvoice_locale": "ar", + "in_benchmark": true, + "task": "classification", + "metric": "accuracy", + "score": 0.6666666666666666, + "model": 4.0 + }, + { + "bcp_47": "ar", + "speakers": 351664197, + "language_name": "Arabic", + "flores_path": "arb_Arab", + "fleurs_tag": "ar_eg", + "commonvoice_hours": 92.0, + "commonvoice_locale": "ar", + "in_benchmark": true, + "task": "language_modeling", + "metric": "chrf", + "score": 0.9505580315120445, + "model": 4.0 + }, + { + "bcp_47": "ar", + "speakers": 351664197, + "language_name": "Arabic", + "flores_path": "arb_Arab", + "fleurs_tag": "ar_eg", + "commonvoice_hours": 92.0, + "commonvoice_locale": "ar", + "in_benchmark": true, + "task": "translation", + "metric": "bleu", + "score": 0.272695032954275, + "model": 4.0 + }, + { + "bcp_47": "ar", + "speakers": 351664197, + "language_name": "Arabic", + "flores_path": "arb_Arab", + "fleurs_tag": "ar_eg", + "commonvoice_hours": 92.0, + "commonvoice_locale": "ar", + "in_benchmark": true, + "task": "translation", + "metric": "chrf", + "score": 0.45513349114063173, + "model": 4.0 + }, + { + "bcp_47": "arn", + "speakers": 272802, + "language_name": "Mapuche", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 0.0, + "commonvoice_locale": "arn", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "aro", + "speakers": 105, + "language_name": "Araona", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "arq", + "speakers": 35667507, + "language_name": "Algerian Arabic", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "ars", + "speakers": 1025205, + "language_name": "Najdi Arabic", + "flores_path": "ars_Arab", + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "ary", + "speakers": 30938679, + "language_name": "Moroccan Arabic", + "flores_path": "ary_Arab", + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "arz", + "speakers": 66639360, + "language_name": "Egyptian Arabic", + "flores_path": "arz_Arab", + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": true, + "task": "classification", + "metric": "accuracy", + "score": 0.5666666666666667, + "model": 1.0 + }, + { + "bcp_47": "arz", + "speakers": 66639360, + "language_name": "Egyptian Arabic", + "flores_path": "arz_Arab", + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": true, + "task": "language_modeling", + "metric": "chrf", + "score": 0.9319821809429131, + "model": 1.0 + }, + { + "bcp_47": "arz", + "speakers": 66639360, + "language_name": "Egyptian Arabic", + "flores_path": "arz_Arab", + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": true, + "task": "translation", + "metric": "bleu", + "score": 0.20127691717583826, + "model": 1.0 + }, + { + "bcp_47": "arz", + "speakers": 66639360, + "language_name": "Egyptian Arabic", + "flores_path": "arz_Arab", + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": true, + "task": "translation", + "metric": "chrf", + "score": 0.38780198426317497, + "model": 1.0 + }, + { + "bcp_47": "as", + "speakers": 17239170, + "language_name": "Assamese", + "flores_path": "asm_Beng", + "fleurs_tag": "as_in", + "commonvoice_hours": 2.8, + "commonvoice_locale": "as", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "asa", + "speakers": 702634, + "language_name": "Asu", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "ast", + "speakers": 650205, + "language_name": "Asturian", + "flores_path": "ast_Latn", + "fleurs_tag": "ast_es", + "commonvoice_hours": 0.8, + "commonvoice_locale": "ast", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "atj", + "speakers": 6408, + "language_name": "Atikamekw", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "av", + "speakers": 552716, + "language_name": "Avaric", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "awa", + "speakers": 25862924, + "language_name": "Awadhi", + "flores_path": "awa_Deva", + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "ay", + "speakers": 2838620, + "language_name": "Aymara", + "flores_path": "ayr_Latn", + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "az", + "speakers": 32446682, + "language_name": "Azerbaijani", + "flores_path": "azj_Latn", + "fleurs_tag": "az_az", + "commonvoice_hours": 0.5, + "commonvoice_locale": "az", + "in_benchmark": true, + "task": "classification", + "metric": "accuracy", + "score": 0.5333333333333333, + "model": 1.0 + }, + { + "bcp_47": "az", + "speakers": 32446682, + "language_name": "Azerbaijani", + "flores_path": "azj_Latn", + "fleurs_tag": "az_az", + "commonvoice_hours": 0.5, + "commonvoice_locale": "az", + "in_benchmark": true, + "task": "language_modeling", + "metric": "chrf", + "score": 0.9439975775415789, + "model": 1.0 + }, + { + "bcp_47": "az", + "speakers": 32446682, + "language_name": "Azerbaijani", + "flores_path": "azj_Latn", + "fleurs_tag": "az_az", + "commonvoice_hours": 0.5, + "commonvoice_locale": "az", + "in_benchmark": true, + "task": "translation", + "metric": "bleu", + "score": 0.18364881639775618, + "model": 1.0 + }, + { + "bcp_47": "az", + "speakers": 32446682, + "language_name": "Azerbaijani", + "flores_path": "azj_Latn", + "fleurs_tag": "az_az", + "commonvoice_hours": 0.5, + "commonvoice_locale": "az", + "in_benchmark": true, + "task": "translation", + "metric": "chrf", + "score": 0.3791669348856303, + "model": 1.0 + }, + { + "bcp_47": "ba", + "speakers": 1842386, + "language_name": "Bashkir", + "flores_path": "bak_Cyrl", + "fleurs_tag": null, + "commonvoice_hours": 259.0, + "commonvoice_locale": "ba", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "bal", + "speakers": 8227887, + "language_name": "Baluchi", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 0.0, + "commonvoice_locale": "bal", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "ban", + "speakers": 4806468, + "language_name": "Balinese", + "flores_path": "ban_Latn", + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "bap", + "speakers": 454918, + "language_name": "Bantawa", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "bar", + "speakers": 22043627, + "language_name": "Bavarian", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "bas", + "speakers": 332940, + "language_name": "Basaa", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 12.0, + "commonvoice_locale": "bas", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "bax", + "speakers": 332940, + "language_name": "Bamun", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 11.0, + "commonvoice_locale": "bax", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "bbc", + "speakers": 2456639, + "language_name": "Batak Toba", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "bbj", + "speakers": 388430, + "language_name": "Ghomala", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 13.0, + "commonvoice_locale": "bbj", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "bci", + "speakers": 3022921, + "language_name": "Baoulé", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 2.0, + "commonvoice_locale": "bci", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "be", + "speakers": 10064517, + "language_name": "Belarusian", + "flores_path": "bel_Cyrl", + "fleurs_tag": "be_by", + "commonvoice_hours": 1805.0, + "commonvoice_locale": "be", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "bej", + "speakers": 2460326, + "language_name": "Beja", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "bem", + "speakers": 5402246, + "language_name": "Bemba", + "flores_path": "bem_Latn", + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "bew", + "speakers": 5607546, + "language_name": "Betawi", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 0.0, + "commonvoice_locale": "bew", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "bez", + "speakers": 995398, + "language_name": "Bena", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "bfd", + "speakers": 158146, + "language_name": "Bafut", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 11.0, + "commonvoice_locale": "bfd", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "bfq", + "speakers": 305001, + "language_name": "Badaga", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "bft", + "speakers": 502520, + "language_name": "Balti", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 18.0, + "commonvoice_locale": "bft", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "bfy", + "speakers": 654424, + "language_name": "Bagheli", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "bg", + "speakers": 7878315, + "language_name": "Bulgarian", + "flores_path": "bul_Cyrl", + "fleurs_tag": "bg_bg", + "commonvoice_hours": 16.0, + "commonvoice_locale": "bg", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "bgc", + "speakers": 15913080, + "language_name": "Haryanvi", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "bgn", + "speakers": 2037382, + "language_name": "Western Balochi", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "bgx", + "speakers": 377280, + "language_name": "Balkan Gagauz Turkish", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "bhb", + "speakers": 1591308, + "language_name": "Bhili", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "bhi", + "speakers": 1220003, + "language_name": "Bhilali", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "bho", + "speakers": 32934797, + "language_name": "Bhojpuri", + "flores_path": "bho_Deva", + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": true, + "task": "classification", + "metric": "accuracy", + "score": 0.3333333333333333, + "model": 1.0 + }, + { + "bcp_47": "bho", + "speakers": 32934797, + "language_name": "Bhojpuri", + "flores_path": "bho_Deva", + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": true, + "task": "language_modeling", + "metric": "chrf", + "score": 0.9334228689163548, + "model": 1.0 + }, + { + "bcp_47": "bho", + "speakers": 32934797, + "language_name": "Bhojpuri", + "flores_path": "bho_Deva", + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": true, + "task": "translation", + "metric": "bleu", + "score": 0.24092898437545654, + "model": 1.0 + }, + { + "bcp_47": "bho", + "speakers": 32934797, + "language_name": "Bhojpuri", + "flores_path": "bho_Deva", + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": true, + "task": "translation", + "metric": "chrf", + "score": 0.41894143077328727, + "model": 1.0 + }, + { + "bcp_47": "bi", + "speakers": 268500, + "language_name": "Bislama", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "bik", + "speakers": 3275430, + "language_name": "Bikol", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "bin", + "speakers": 1519599, + "language_name": "Bini", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "bjj", + "speakers": 7426104, + "language_name": "Kanauji", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "bjn", + "speakers": 4010288, + "language_name": "Banjar", + "flores_path": "bjn_Latn", + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "bjt", + "speakers": 95992, + "language_name": "Balanta-Ganja", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "bkm", + "speakers": 360685, + "language_name": "Kom", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 13.0, + "commonvoice_locale": "bkm", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "bku", + "speakers": 7970, + "language_name": "Buhid", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "bla", + "speakers": 4900, + "language_name": "Siksiká", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "blo", + "speakers": 51507, + "language_name": "Anii", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "blt", + "speakers": 681177, + "language_name": "Tai Dam", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "bm", + "speakers": 9385632, + "language_name": "Bambara", + "flores_path": "bam_Latn", + "fleurs_tag": null, + "commonvoice_hours": 0.0, + "commonvoice_locale": "bm", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "bmq", + "speakers": 168159, + "language_name": "Bomu", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "bn", + "speakers": 267193288, + "language_name": "Bangla", + "flores_path": "ben_Beng", + "fleurs_tag": "bn_in", + "commonvoice_hours": 49.0, + "commonvoice_locale": "bn", + "in_benchmark": true, + "task": "classification", + "metric": "accuracy", + "score": 0.5, + "model": 4.0 + }, + { + "bcp_47": "bn", + "speakers": 267193288, + "language_name": "Bangla", + "flores_path": "ben_Beng", + "fleurs_tag": "bn_in", + "commonvoice_hours": 49.0, + "commonvoice_locale": "bn", + "in_benchmark": true, + "task": "language_modeling", + "metric": "chrf", + "score": 0.8930948406963347, + "model": 4.0 + }, + { + "bcp_47": "bn", + "speakers": 267193288, + "language_name": "Bangla", + "flores_path": "ben_Beng", + "fleurs_tag": "bn_in", + "commonvoice_hours": 49.0, + "commonvoice_locale": "bn", + "in_benchmark": true, + "task": "translation", + "metric": "bleu", + "score": 0.22867663633876684, + "model": 4.0 + }, + { + "bcp_47": "bn", + "speakers": 267193288, + "language_name": "Bangla", + "flores_path": "ben_Beng", + "fleurs_tag": "bn_in", + "commonvoice_hours": 49.0, + "commonvoice_locale": "bn", + "in_benchmark": true, + "task": "translation", + "metric": "chrf", + "score": 0.40541764389945456, + "model": 4.0 + }, + { + "bcp_47": "bo", + "speakers": 3006697, + "language_name": "Tibetan", + "flores_path": "bod_Tibt", + "fleurs_tag": null, + "commonvoice_hours": 0.0, + "commonvoice_locale": "bo", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "bpy", + "speakers": 90174, + "language_name": "Bishnupriya", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "bqi", + "speakers": 1188926, + "language_name": "Bakhtiari", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "bqv", + "speakers": 46718, + "language_name": "Koro Wachi", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "br", + "speakers": 563140, + "language_name": "Breton", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 27.0, + "commonvoice_locale": "br", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "bra", + "speakers": 54370, + "language_name": "Braj", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "brh", + "speakers": 3035513, + "language_name": "Brahui", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "brx", + "speakers": 1856526, + "language_name": "Bodo", + "flores_path": "brx_Deva", + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "bs", + "speakers": 7594468, + "language_name": "Bosnian", + "flores_path": "bos_Latn", + "fleurs_tag": "bs_ba", + "commonvoice_hours": 0.0, + "commonvoice_locale": "bs", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "bsc", + "speakers": 15264, + "language_name": "Bassari", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "bss", + "speakers": 149823, + "language_name": "Akoose", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "bto", + "speakers": 305707, + "language_name": "Rinconada Bikol", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "btv", + "speakers": 78843, + "language_name": "Bateri", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "bua", + "speakers": 311788, + "language_name": "Buriat", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 0.0, + "commonvoice_locale": "bxr", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "buc", + "speakers": 44620, + "language_name": "Bushi", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "bug", + "speakers": 4298211, + "language_name": "Buginese", + "flores_path": "bug_Latn", + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "bum", + "speakers": 1276270, + "language_name": "Bulu", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 9.5, + "commonvoice_locale": "bum", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "bvb", + "speakers": 66058, + "language_name": "Bube", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "byn", + "speakers": 79056, + "language_name": "Blin", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "byv", + "speakers": 305195, + "language_name": "Medumba", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 14.0, + "commonvoice_locale": "byv", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "bze", + "speakers": 166204, + "language_name": "Jenaama Bozo", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "ca", + "speakers": 8679139, + "language_name": "Catalan", + "flores_path": "cat_Latn", + "fleurs_tag": "ca_es", + "commonvoice_hours": 2842.0, + "commonvoice_locale": "ca", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "cad", + "speakers": 0, + "language_name": "Caddo", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "cch", + "speakers": 44946, + "language_name": "Atsam", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "ccp", + "speakers": 729137, + "language_name": "Chakma", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "ce", + "speakers": 935365, + "language_name": "Chechen", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "ceb", + "speakers": 26203440, + "language_name": "Cebuano", + "flores_path": "ceb_Latn", + "fleurs_tag": "ceb_ph", + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "cgg", + "speakers": 2335662, + "language_name": "Chiga", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "ch", + "speakers": 46325, + "language_name": "Chamorro", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "chk", + "speakers": 30731, + "language_name": "Chuukese", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "chm", + "speakers": 524371, + "language_name": "Mari", + "flores_path": "mhr_Cyrl", + "fleurs_tag": null, + "commonvoice_hours": 282.0, + "commonvoice_locale": "mhr", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "cho", + "speakers": 10977, + "language_name": "Choctaw", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "chp", + "speakers": 12816, + "language_name": "Chipewyan", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "chr", + "speakers": 25613, + "language_name": "Cherokee", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "cic", + "speakers": 0, + "language_name": "Chickasaw", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "cja", + "speakers": 270832, + "language_name": "Western Cham", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "cjm", + "speakers": 87862, + "language_name": "Eastern Cham", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "ckb", + "speakers": 11086549, + "language_name": "Central Kurdish", + "flores_path": "ckb_Arab", + "fleurs_tag": "ckb_iq", + "commonvoice_hours": 135.0, + "commonvoice_locale": "ckb", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "clc", + "speakers": 867, + "language_name": "Chilcotin", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "co", + "speakers": 162836, + "language_name": "Corsican", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 0.0, + "commonvoice_locale": "co", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "cps", + "speakers": 720595, + "language_name": "Capiznon", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "cr", + "speakers": 9047, + "language_name": "Cree", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "crg", + "speakers": 678, + "language_name": "Michif", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "crh", + "speakers": 245968, + "language_name": "Crimean Tatar", + "flores_path": "crh_Latn", + "fleurs_tag": null, + "commonvoice_hours": 0.0, + "commonvoice_locale": "crh", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "crk", + "speakers": 4146, + "language_name": "Plains Cree", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "crl", + "speakers": 377, + "language_name": "Northern East Cree", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "crs", + "speakers": 94061, + "language_name": "Seselwa Creole French", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "cs", + "speakers": 13045532, + "language_name": "Czech", + "flores_path": "ces_Latn", + "fleurs_tag": "cs_cz", + "commonvoice_hours": 74.0, + "commonvoice_locale": "cs", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "csb", + "speakers": 49767, + "language_name": "Kashubian", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "csw", + "speakers": 1809, + "language_name": "Swampy Cree", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "cu", + "speakers": 0, + "language_name": "Church Slavic", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "cv", + "speakers": 1842386, + "language_name": "Chuvash", + "flores_path": "chv_Cyrl", + "fleurs_tag": null, + "commonvoice_hours": 27.0, + "commonvoice_locale": "cv", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "cy", + "speakers": 884910, + "language_name": "Welsh", + "flores_path": "cym_Latn", + "fleurs_tag": "cy_gb", + "commonvoice_hours": 124.0, + "commonvoice_locale": "cy", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "da", + "speakers": 7072056, + "language_name": "Danish", + "flores_path": "dan_Latn", + "fleurs_tag": "da_dk", + "commonvoice_hours": 13.0, + "commonvoice_locale": "da", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "dak", + "speakers": 20832, + "language_name": "Dakota", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "dar", + "speakers": 368477, + "language_name": "Dargwa", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 0.0, + "commonvoice_locale": "dar", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "dav", + "speakers": 438929, + "language_name": "Taita", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 9.3, + "commonvoice_locale": "dav", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "dcc", + "speakers": 13128291, + "language_name": "Deccan", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "de", + "speakers": 136350226, + "language_name": "German", + "flores_path": "deu_Latn", + "fleurs_tag": "de_de", + "commonvoice_hours": 1359.0, + "commonvoice_locale": "de", + "in_benchmark": true, + "task": "classification", + "metric": "accuracy", + "score": 0.6666666666666666, + "model": 1.0 + }, + { + "bcp_47": "de", + "speakers": 136350226, + "language_name": "German", + "flores_path": "deu_Latn", + "fleurs_tag": "de_de", + "commonvoice_hours": 1359.0, + "commonvoice_locale": "de", + "in_benchmark": true, + "task": "language_modeling", + "metric": "chrf", + "score": 0.9788487181545229, + "model": 1.0 + }, + { + "bcp_47": "de", + "speakers": 136350226, + "language_name": "German", + "flores_path": "deu_Latn", + "fleurs_tag": "de_de", + "commonvoice_hours": 1359.0, + "commonvoice_locale": "de", + "in_benchmark": true, + "task": "translation", + "metric": "bleu", + "score": 0.31823711841849855, + "model": 1.0 + }, + { + "bcp_47": "de", + "speakers": 136350226, + "language_name": "German", + "flores_path": "deu_Latn", + "fleurs_tag": "de_de", + "commonvoice_hours": 1359.0, + "commonvoice_locale": "de", + "in_benchmark": true, + "task": "translation", + "metric": "chrf", + "score": 0.49174647549269207, + "model": 1.0 + }, + { + "bcp_47": "den", + "speakers": 2299, + "language_name": "Slave", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "dgr", + "speakers": 2111, + "language_name": "Dogrib", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "dje", + "speakers": 3871308, + "language_name": "Zarma", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "dnj", + "speakers": 1099244, + "language_name": "Dan", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "doi", + "speakers": 2652180, + "language_name": "Dogri", + "flores_path": "dgo_Deva", + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "dsb", + "speakers": 6974, + "language_name": "Lower Sorbian", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 0.0, + "commonvoice_locale": "dsb", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "dtm", + "speakers": 215087, + "language_name": "Tomo Kan Dogon", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "dtp", + "speakers": 182852, + "language_name": "Central Dusun", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "dty", + "speakers": 758198, + "language_name": "Dotyali", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "dua", + "speakers": 133176, + "language_name": "Duala", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 14.0, + "commonvoice_locale": "dua", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "dv", + "speakers": 388044, + "language_name": "Divehi", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 39.0, + "commonvoice_locale": "dv", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "dyo", + "speakers": 409146, + "language_name": "Jola-Fonyi", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "dyu", + "speakers": 6667328, + "language_name": "Dyula", + "flores_path": "dyu_Latn", + "fleurs_tag": null, + "commonvoice_hours": 0.4, + "commonvoice_locale": "dyu", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "dz", + "speakers": 370341, + "language_name": "Dzongkha", + "flores_path": "dzo_Tibt", + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "ebu", + "speakers": 802918, + "language_name": "Embu", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "ee", + "speakers": 4690857, + "language_name": "Ewe", + "flores_path": "ewe_Latn", + "fleurs_tag": null, + "commonvoice_hours": 0.0, + "commonvoice_locale": "ee", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "efi", + "speakers": 2996392, + "language_name": "Efik", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "egl", + "speakers": 31201, + "language_name": "Emilian", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "el", + "speakers": 12292242, + "language_name": "Greek", + "flores_path": "ell_Grek", + "fleurs_tag": "el_gr", + "commonvoice_hours": 20.0, + "commonvoice_locale": "el", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "en", + "speakers": 1636485840, + "language_name": "English", + "flores_path": "eng_Latn", + "fleurs_tag": "en_us", + "commonvoice_hours": 2651.0, + "commonvoice_locale": "en", + "in_benchmark": true, + "task": "classification", + "metric": "accuracy", + "score": 0.5916666666666667, + "model": 4.0 + }, + { + "bcp_47": "en", + "speakers": 1636485840, + "language_name": "English", + "flores_path": "eng_Latn", + "fleurs_tag": "en_us", + "commonvoice_hours": 2651.0, + "commonvoice_locale": "en", + "in_benchmark": true, + "task": "language_modeling", + "metric": "chrf", + "score": 0.9225354470067261, + "model": 4.0 + }, + { + "bcp_47": "en", + "speakers": 1636485840, + "language_name": "English", + "flores_path": "eng_Latn", + "fleurs_tag": "en_us", + "commonvoice_hours": 2651.0, + "commonvoice_locale": "en", + "in_benchmark": true, + "task": "translation", + "metric": "bleu", + "score": 0.4289895608958245, + "model": 4.0 + }, + { + "bcp_47": "en", + "speakers": 1636485840, + "language_name": "English", + "flores_path": "eng_Latn", + "fleurs_tag": "en_us", + "commonvoice_hours": 2651.0, + "commonvoice_locale": "en", + "in_benchmark": true, + "task": "translation", + "metric": "chrf", + "score": 0.5437014634491315, + "model": 4.0 + }, + { + "bcp_47": "eo", + "speakers": 301, + "language_name": "Esperanto", + "flores_path": "epo_Latn", + "fleurs_tag": null, + "commonvoice_hours": 1436.0, + "commonvoice_locale": "eo", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "es", + "speakers": 493528077, + "language_name": "Spanish", + "flores_path": "spa_Latn", + "fleurs_tag": "es_419", + "commonvoice_hours": 446.0, + "commonvoice_locale": "es", + "in_benchmark": true, + "task": "classification", + "metric": "accuracy", + "score": 0.6583333333333333, + "model": 4.0 + }, + { + "bcp_47": "es", + "speakers": 493528077, + "language_name": "Spanish", + "flores_path": "spa_Latn", + "fleurs_tag": "es_419", + "commonvoice_hours": 446.0, + "commonvoice_locale": "es", + "in_benchmark": true, + "task": "language_modeling", + "metric": "chrf", + "score": 0.9561525839092082, + "model": 4.0 + }, + { + "bcp_47": "es", + "speakers": 493528077, + "language_name": "Spanish", + "flores_path": "spa_Latn", + "fleurs_tag": "es_419", + "commonvoice_hours": 446.0, + "commonvoice_locale": "es", + "in_benchmark": true, + "task": "translation", + "metric": "bleu", + "score": 0.2984596316936459, + "model": 4.0 + }, + { + "bcp_47": "es", + "speakers": 493528077, + "language_name": "Spanish", + "flores_path": "spa_Latn", + "fleurs_tag": "es_419", + "commonvoice_hours": 446.0, + "commonvoice_locale": "es", + "in_benchmark": true, + "task": "translation", + "metric": "chrf", + "score": 0.46243613105820586, + "model": 4.0 + }, + { + "bcp_47": "esu", + "speakers": 20956, + "language_name": "Central Yupik", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 0.0, + "commonvoice_locale": "esu", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "et", + "speakers": 878449, + "language_name": "Estonian", + "flores_path": "ekk_Latn", + "fleurs_tag": "et_ee", + "commonvoice_hours": 58.0, + "commonvoice_locale": "et", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "eu", + "speakers": 1088519, + "language_name": "Basque", + "flores_path": "eus_Latn", + "fleurs_tag": null, + "commonvoice_hours": 335.0, + "commonvoice_locale": "eu", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "ewo", + "speakers": 860095, + "language_name": "Ewondo", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 19.0, + "commonvoice_locale": "ewo", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "ext", + "speakers": 245077, + "language_name": "Extremaduran", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "fa", + "speakers": 84710459, + "language_name": "Persian", + "flores_path": "pes_Arab", + "fleurs_tag": "fa_ir", + "commonvoice_hours": 370.0, + "commonvoice_locale": "fa", + "in_benchmark": true, + "task": "classification", + "metric": "accuracy", + "score": 0.4666666666666667, + "model": 1.0 + }, + { + "bcp_47": "fa", + "speakers": 84710459, + "language_name": "Persian", + "flores_path": "pes_Arab", + "fleurs_tag": "fa_ir", + "commonvoice_hours": 370.0, + "commonvoice_locale": "fa", + "in_benchmark": true, + "task": "language_modeling", + "metric": "chrf", + "score": 0.9396649061437635, + "model": 1.0 + }, + { + "bcp_47": "fa", + "speakers": 84710459, + "language_name": "Persian", + "flores_path": "pes_Arab", + "fleurs_tag": "fa_ir", + "commonvoice_hours": 370.0, + "commonvoice_locale": "fa", + "in_benchmark": true, + "task": "translation", + "metric": "bleu", + "score": 0.2516753344674677, + "model": 1.0 + }, + { + "bcp_47": "fa", + "speakers": 84710459, + "language_name": "Persian", + "flores_path": "pes_Arab", + "fleurs_tag": "fa_ir", + "commonvoice_hours": 370.0, + "commonvoice_locale": "fa", + "in_benchmark": true, + "task": "translation", + "metric": "chrf", + "score": 0.4448545956789697, + "model": 1.0 + }, + { + "bcp_47": "fan", + "speakers": 426451, + "language_name": "Fang", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 9.3, + "commonvoice_locale": "fan", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "fbl", + "speakers": 2511163, + "language_name": "West Albay Bikol", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "ff", + "speakers": 7788904, + "language_name": "Fula", + "flores_path": null, + "fleurs_tag": "ff_sn", + "commonvoice_hours": 0.0, + "commonvoice_locale": "ff", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "ffm", + "speakers": 1505612, + "language_name": "Maasina Fulfulde", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "fi", + "speakers": 5736842, + "language_name": "Finnish", + "flores_path": "fin_Latn", + "fleurs_tag": "fi_fi", + "commonvoice_hours": 15.0, + "commonvoice_locale": "fi", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "fia", + "speakers": 378161, + "language_name": "Nobiin", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "fil", + "speakers": 67471096, + "language_name": "Filipino", + "flores_path": "fil_Latn", + "fleurs_tag": "fil_ph", + "commonvoice_hours": 0.0, + "commonvoice_locale": "tl", + "in_benchmark": true, + "task": "classification", + "metric": "accuracy", + "score": 0.4666666666666667, + "model": 1.0 + }, + { + "bcp_47": "fil", + "speakers": 67471096, + "language_name": "Filipino", + "flores_path": "fil_Latn", + "fleurs_tag": "fil_ph", + "commonvoice_hours": 0.0, + "commonvoice_locale": "tl", + "in_benchmark": true, + "task": "language_modeling", + "metric": "chrf", + "score": 0.9553160038255677, + "model": 1.0 + }, + { + "bcp_47": "fil", + "speakers": 67471096, + "language_name": "Filipino", + "flores_path": "fil_Latn", + "fleurs_tag": "fil_ph", + "commonvoice_hours": 0.0, + "commonvoice_locale": "tl", + "in_benchmark": true, + "task": "translation", + "metric": "bleu", + "score": 0.3248927726984041, + "model": 1.0 + }, + { + "bcp_47": "fil", + "speakers": 67471096, + "language_name": "Filipino", + "flores_path": "fil_Latn", + "fleurs_tag": "fil_ph", + "commonvoice_hours": 0.0, + "commonvoice_locale": "tl", + "in_benchmark": true, + "task": "translation", + "metric": "chrf", + "score": 0.4689020729383555, + "model": 1.0 + }, + { + "bcp_47": "fit", + "speakers": 56114, + "language_name": "Tornedalen Finnish", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "fj", + "speakers": 365030, + "language_name": "Fijian", + "flores_path": "fij_Latn", + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "fo", + "speakers": 71351, + "language_name": "Faroese", + "flores_path": "fao_Latn", + "fleurs_tag": null, + "commonvoice_hours": 0.0, + "commonvoice_locale": "fo", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "fon", + "speakers": 3216150, + "language_name": "Fon", + "flores_path": "fon_Latn", + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "fr", + "speakers": 278611507, + "language_name": "French", + "flores_path": "fra_Latn", + "fleurs_tag": "fr_fr", + "commonvoice_hours": 1052.0, + "commonvoice_locale": "fr", + "in_benchmark": true, + "task": "classification", + "metric": "accuracy", + "score": 0.7166666666666667, + "model": 4.0 + }, + { + "bcp_47": "fr", + "speakers": 278611507, + "language_name": "French", + "flores_path": "fra_Latn", + "fleurs_tag": "fr_fr", + "commonvoice_hours": 1052.0, + "commonvoice_locale": "fr", + "in_benchmark": true, + "task": "language_modeling", + "metric": "chrf", + "score": 0.9718447009224642, + "model": 4.0 + }, + { + "bcp_47": "fr", + "speakers": 278611507, + "language_name": "French", + "flores_path": "fra_Latn", + "fleurs_tag": "fr_fr", + "commonvoice_hours": 1052.0, + "commonvoice_locale": "fr", + "in_benchmark": true, + "task": "translation", + "metric": "bleu", + "score": 0.3187714613657571, + "model": 4.0 + }, + { + "bcp_47": "fr", + "speakers": 278611507, + "language_name": "French", + "flores_path": "fra_Latn", + "fleurs_tag": "fr_fr", + "commonvoice_hours": 1052.0, + "commonvoice_locale": "fr", + "in_benchmark": true, + "task": "translation", + "metric": "chrf", + "score": 0.4845347359298269, + "model": 4.0 + }, + { + "bcp_47": "frc", + "speakers": 27942, + "language_name": "Cajun French", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "frp", + "speakers": 63777, + "language_name": "Arpitan", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "frr", + "speakers": 9619, + "language_name": "Northern Frisian", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "frs", + "speakers": 2004, + "language_name": "Eastern Frisian", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "fud", + "speakers": 4756, + "language_name": "East Futuna", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "fuq", + "speakers": 1594068, + "language_name": "Central-Eastern Niger Fulfulde", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "fur", + "speakers": 37442, + "language_name": "Friulian", + "flores_path": "fur_Latn", + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "fuv", + "speakers": 14339876, + "language_name": "Nigerian Fulfulde", + "flores_path": "fuv_Latn", + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "fvr", + "speakers": 1230163, + "language_name": "Fur", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "fy", + "speakers": 743057, + "language_name": "Western Frisian", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 66.0, + "commonvoice_locale": "fy-NL", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "ga", + "speakers": 1237487, + "language_name": "Irish", + "flores_path": "gle_Latn", + "fleurs_tag": "ga_ie", + "commonvoice_hours": 5.9, + "commonvoice_locale": "ga-IE", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "gaa", + "speakers": 821526, + "language_name": "Ga", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "gag", + "speakers": 111028, + "language_name": "Gagauz", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "gan", + "speakers": 23698340, + "language_name": "Gan Chinese", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "gay", + "speakers": 320431, + "language_name": "Gayo", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "gbm", + "speakers": 3580443, + "language_name": "Garhwali", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "gbz", + "speakers": 7983, + "language_name": "Zoroastrian Dari", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "gcr", + "speakers": 51872, + "language_name": "Guianese Creole French", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "gd", + "speakers": 72337, + "language_name": "Scottish Gaelic", + "flores_path": "gla_Latn", + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "gez", + "speakers": 0, + "language_name": "Geez", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "gil", + "speakers": 67078, + "language_name": "Gilbertese", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "gjk", + "speakers": 256851, + "language_name": "Kachi Koli", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "gju", + "speakers": 467002, + "language_name": "Gujari", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 11.0, + "commonvoice_locale": "gju", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "gl", + "speakers": 3515530, + "language_name": "Galician", + "flores_path": "glg_Latn", + "fleurs_tag": "gl_es", + "commonvoice_hours": 111.0, + "commonvoice_locale": "gl", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "glk", + "speakers": 3906472, + "language_name": "Gilaki", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "gn", + "speakers": 5827107, + "language_name": "Guarani", + "flores_path": "gug_Latn", + "fleurs_tag": null, + "commonvoice_hours": 3.7, + "commonvoice_locale": "gn", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "gom", + "speakers": 4243488, + "language_name": "Goan Konkani", + "flores_path": "gom_Deva", + "fleurs_tag": null, + "commonvoice_hours": 0.0, + "commonvoice_locale": "gom", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "gon", + "speakers": 3182616, + "language_name": "Gondi", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "gor", + "speakers": 1094807, + "language_name": "Gorontalo", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "gos", + "speakers": 622094, + "language_name": "Gronings", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 0.0, + "commonvoice_locale": "gos", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "grt", + "speakers": 821563, + "language_name": "Garo", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "gsw", + "speakers": 7956952, + "language_name": "Swiss German", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 0.0, + "commonvoice_locale": "gsw", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "gu", + "speakers": 61721799, + "language_name": "Gujarati", + "flores_path": "guj_Gujr", + "fleurs_tag": "gu_in", + "commonvoice_hours": 0.0, + "commonvoice_locale": "gu-IN", + "in_benchmark": true, + "task": "classification", + "metric": "accuracy", + "score": 0.4666666666666667, + "model": 1.0 + }, + { + "bcp_47": "gu", + "speakers": 61721799, + "language_name": "Gujarati", + "flores_path": "guj_Gujr", + "fleurs_tag": "gu_in", + "commonvoice_hours": 0.0, + "commonvoice_locale": "gu-IN", + "in_benchmark": true, + "task": "language_modeling", + "metric": "chrf", + "score": 0.9421488818900206, + "model": 1.0 + }, + { + "bcp_47": "gu", + "speakers": 61721799, + "language_name": "Gujarati", + "flores_path": "guj_Gujr", + "fleurs_tag": "gu_in", + "commonvoice_hours": 0.0, + "commonvoice_locale": "gu-IN", + "in_benchmark": true, + "task": "translation", + "metric": "bleu", + "score": 0.24812610549809738, + "model": 1.0 + }, + { + "bcp_47": "gu", + "speakers": 61721799, + "language_name": "Gujarati", + "flores_path": "guj_Gujr", + "fleurs_tag": "gu_in", + "commonvoice_hours": 0.0, + "commonvoice_locale": "gu-IN", + "in_benchmark": true, + "task": "translation", + "metric": "chrf", + "score": 0.4318359636701651, + "model": 1.0 + }, + { + "bcp_47": "gub", + "speakers": 17784, + "language_name": "Guajajára", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "guc", + "speakers": 132529, + "language_name": "Wayuu", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 0.0, + "commonvoice_locale": "guc", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "gur", + "speakers": 1026907, + "language_name": "Frafra", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "guz", + "speakers": 2622867, + "language_name": "Gusii", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "gv", + "speakers": 1719, + "language_name": "Manx", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 8.6, + "commonvoice_locale": "gv", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "gvr", + "speakers": 87951, + "language_name": "Gurung", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "gwi", + "speakers": 302, + "language_name": "Gwichʼin", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "ha", + "speakers": 40411882, + "language_name": "Hausa", + "flores_path": "hau_Latn", + "fleurs_tag": "ha_ng", + "commonvoice_hours": 4.1, + "commonvoice_locale": "ha", + "in_benchmark": true, + "task": "classification", + "metric": "accuracy", + "score": 0.6, + "model": 1.0 + }, + { + "bcp_47": "ha", + "speakers": 40411882, + "language_name": "Hausa", + "flores_path": "hau_Latn", + "fleurs_tag": "ha_ng", + "commonvoice_hours": 4.1, + "commonvoice_locale": "ha", + "in_benchmark": true, + "task": "language_modeling", + "metric": "chrf", + "score": 0.945704338611724, + "model": 1.0 + }, + { + "bcp_47": "ha", + "speakers": 40411882, + "language_name": "Hausa", + "flores_path": "hau_Latn", + "fleurs_tag": "ha_ng", + "commonvoice_hours": 4.1, + "commonvoice_locale": "ha", + "in_benchmark": true, + "task": "translation", + "metric": "bleu", + "score": 0.14767816277169443, + "model": 1.0 + }, + { + "bcp_47": "ha", + "speakers": 40411882, + "language_name": "Hausa", + "flores_path": "hau_Latn", + "fleurs_tag": "ha_ng", + "commonvoice_hours": 4.1, + "commonvoice_locale": "ha", + "in_benchmark": true, + "task": "translation", + "metric": "chrf", + "score": 0.34353973347368816, + "model": 1.0 + }, + { + "bcp_47": "hak", + "speakers": 32062460, + "language_name": "Hakka Chinese", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "haw", + "speakers": 29605, + "language_name": "Hawaiian", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "haz", + "speakers": 2161984, + "language_name": "Hazaragi", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "he", + "speakers": 8675480, + "language_name": "Hebrew", + "flores_path": "heb_Hebr", + "fleurs_tag": "he_il", + "commonvoice_hours": 1.1, + "commonvoice_locale": "he", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "hi", + "speakers": 546882144, + "language_name": "Hindi", + "flores_path": "hin_Deva", + "fleurs_tag": "hi_in", + "commonvoice_hours": 16.0, + "commonvoice_locale": "hi-IN", + "in_benchmark": true, + "task": "classification", + "metric": "accuracy", + "score": 0.6083333333333334, + "model": 4.0 + }, + { + "bcp_47": "hi", + "speakers": 546882144, + "language_name": "Hindi", + "flores_path": "hin_Deva", + "fleurs_tag": "hi_in", + "commonvoice_hours": 16.0, + "commonvoice_locale": "hi-IN", + "in_benchmark": true, + "task": "language_modeling", + "metric": "chrf", + "score": 0.935107298962707, + "model": 4.0 + }, + { + "bcp_47": "hi", + "speakers": 546882144, + "language_name": "Hindi", + "flores_path": "hin_Deva", + "fleurs_tag": "hi_in", + "commonvoice_hours": 16.0, + "commonvoice_locale": "hi-IN", + "in_benchmark": true, + "task": "translation", + "metric": "bleu", + "score": 0.29263068330216335, + "model": 4.0 + }, + { + "bcp_47": "hi", + "speakers": 546882144, + "language_name": "Hindi", + "flores_path": "hin_Deva", + "fleurs_tag": "hi_in", + "commonvoice_hours": 16.0, + "commonvoice_locale": "hi-IN", + "in_benchmark": true, + "task": "translation", + "metric": "chrf", + "score": 0.45579369454961405, + "model": 4.0 + }, + { + "bcp_47": "hif", + "speakers": 383749, + "language_name": "Fiji Hindi", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "hil", + "speakers": 9171204, + "language_name": "Hiligaynon", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 0.0, + "commonvoice_locale": "hil", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "hnd", + "speakers": 957354, + "language_name": "Southern Hindko", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "hne", + "speakers": 14586990, + "language_name": "Chhattisgarhi", + "flores_path": "hne_Deva", + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "hnj", + "speakers": 781687, + "language_name": "Hmong Njua", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "hnn", + "speakers": 17469, + "language_name": "Hanunoo", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "hno", + "speakers": 3969517, + "language_name": "Northern Hindko", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 11.0, + "commonvoice_locale": "hno", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "ho", + "speakers": 152449, + "language_name": "Hiri Motu", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "hoc", + "speakers": 1312829, + "language_name": "Ho", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "hoj", + "speakers": 1087394, + "language_name": "Hadothi", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "hr", + "speakers": 6813164, + "language_name": "Croatian", + "flores_path": "hrv_Latn", + "fleurs_tag": "hr_hr", + "commonvoice_hours": 0.0, + "commonvoice_locale": "hr", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "hsb", + "speakers": 12826, + "language_name": "Upper Sorbian", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 2.9, + "commonvoice_locale": "hsb", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "hsn", + "speakers": 40426580, + "language_name": "Xiang Chinese", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "ht", + "speakers": 8964918, + "language_name": "Haitian Creole", + "flores_path": "hat_Latn", + "fleurs_tag": null, + "commonvoice_hours": 0.0, + "commonvoice_locale": "ht", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "hu", + "speakers": 12443430, + "language_name": "Hungarian", + "flores_path": "hun_Latn", + "fleurs_tag": "hu_hu", + "commonvoice_hours": 92.0, + "commonvoice_locale": "hu", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "hur", + "speakers": 716, + "language_name": "Halkomelem", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "hy", + "speakers": 5317273, + "language_name": "Armenian", + "flores_path": "hye_Armn", + "fleurs_tag": "hy_am", + "commonvoice_hours": 31.0, + "commonvoice_locale": "hy-AM", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "hz", + "speakers": 239336, + "language_name": "Herero", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "ia", + "speakers": 136, + "language_name": "Interlingua", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 14.0, + "commonvoice_locale": "ia", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "iba", + "speakers": 816302, + "language_name": "Iban", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "ibb", + "speakers": 2996392, + "language_name": "Ibibio", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 2.6, + "commonvoice_locale": "ibb", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "id", + "speakers": 171207687, + "language_name": "Indonesian", + "flores_path": "ind_Latn", + "fleurs_tag": "id_id", + "commonvoice_hours": 33.0, + "commonvoice_locale": "id", + "in_benchmark": true, + "task": "classification", + "metric": "accuracy", + "score": 0.6, + "model": 1.0 + }, + { + "bcp_47": "id", + "speakers": 171207687, + "language_name": "Indonesian", + "flores_path": "ind_Latn", + "fleurs_tag": "id_id", + "commonvoice_hours": 33.0, + "commonvoice_locale": "id", + "in_benchmark": true, + "task": "language_modeling", + "metric": "chrf", + "score": 0.9441891794331471, + "model": 1.0 + }, + { + "bcp_47": "id", + "speakers": 171207687, + "language_name": "Indonesian", + "flores_path": "ind_Latn", + "fleurs_tag": "id_id", + "commonvoice_hours": 33.0, + "commonvoice_locale": "id", + "in_benchmark": true, + "task": "translation", + "metric": "bleu", + "score": 0.28485630651027877, + "model": 1.0 + }, + { + "bcp_47": "id", + "speakers": 171207687, + "language_name": "Indonesian", + "flores_path": "ind_Latn", + "fleurs_tag": "id_id", + "commonvoice_hours": 33.0, + "commonvoice_locale": "id", + "in_benchmark": true, + "task": "translation", + "metric": "chrf", + "score": 0.4561447909933971, + "model": 1.0 + }, + { + "bcp_47": "ie", + "speakers": 1, + "language_name": "Interlingue", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 0.0, + "commonvoice_locale": "ie", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "ife", + "speakers": 111910, + "language_name": "Ifè", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "ig", + "speakers": 27823640, + "language_name": "Igbo", + "flores_path": "ibo_Latn", + "fleurs_tag": "ig_ng", + "commonvoice_hours": 0.0, + "commonvoice_locale": "ig", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "ii", + "speakers": 8364120, + "language_name": "Sichuan Yi", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "ik", + "speakers": 7983, + "language_name": "Inupiaq", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 3.2, + "commonvoice_locale": "ipk", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "ilo", + "speakers": 10481376, + "language_name": "Iloko", + "flores_path": "ilo_Latn", + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "inh", + "speakers": 226755, + "language_name": "Ingush", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "io", + "speakers": 0, + "language_name": "Ido", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "is", + "speakers": 350734, + "language_name": "Icelandic", + "flores_path": "isl_Latn", + "fleurs_tag": "is_is", + "commonvoice_hours": 0.1, + "commonvoice_locale": "is", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "it", + "speakers": 70247060, + "language_name": "Italian", + "flores_path": "ita_Latn", + "fleurs_tag": "it_it", + "commonvoice_hours": 362.0, + "commonvoice_locale": "it", + "in_benchmark": true, + "task": "classification", + "metric": "accuracy", + "score": 0.6333333333333333, + "model": 1.0 + }, + { + "bcp_47": "it", + "speakers": 70247060, + "language_name": "Italian", + "flores_path": "ita_Latn", + "fleurs_tag": "it_it", + "commonvoice_hours": 362.0, + "commonvoice_locale": "it", + "in_benchmark": true, + "task": "language_modeling", + "metric": "chrf", + "score": 0.96965822717479, + "model": 1.0 + }, + { + "bcp_47": "it", + "speakers": 70247060, + "language_name": "Italian", + "flores_path": "ita_Latn", + "fleurs_tag": "it_it", + "commonvoice_hours": 362.0, + "commonvoice_locale": "it", + "in_benchmark": true, + "task": "translation", + "metric": "bleu", + "score": 0.27748101044407486, + "model": 1.0 + }, + { + "bcp_47": "it", + "speakers": 70247060, + "language_name": "Italian", + "flores_path": "ita_Latn", + "fleurs_tag": "it_it", + "commonvoice_hours": 362.0, + "commonvoice_locale": "it", + "in_benchmark": true, + "task": "translation", + "metric": "chrf", + "score": 0.46396483435604213, + "model": 1.0 + }, + { + "bcp_47": "iu", + "speakers": 90466, + "language_name": "Inuktitut", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "izh", + "speakers": 142, + "language_name": "Ingrian", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 0.0, + "commonvoice_locale": "izh", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "ja", + "speakers": 119729026, + "language_name": "Japanese", + "flores_path": "jpn_Jpan", + "fleurs_tag": "ja_jp", + "commonvoice_hours": 222.0, + "commonvoice_locale": "ja", + "in_benchmark": true, + "task": "classification", + "metric": "accuracy", + "score": 0.5333333333333333, + "model": 1.0 + }, + { + "bcp_47": "ja", + "speakers": 119729026, + "language_name": "Japanese", + "flores_path": "jpn_Jpan", + "fleurs_tag": "ja_jp", + "commonvoice_hours": 222.0, + "commonvoice_locale": "ja", + "in_benchmark": true, + "task": "language_modeling", + "metric": "chrf", + "score": 0.9339719005290334, + "model": 1.0 + }, + { + "bcp_47": "ja", + "speakers": 119729026, + "language_name": "Japanese", + "flores_path": "jpn_Jpan", + "fleurs_tag": "ja_jp", + "commonvoice_hours": 222.0, + "commonvoice_locale": "ja", + "in_benchmark": true, + "task": "translation", + "metric": "bleu", + "score": 0.26835607046224613, + "model": 1.0 + }, + { + "bcp_47": "ja", + "speakers": 119729026, + "language_name": "Japanese", + "flores_path": "jpn_Jpan", + "fleurs_tag": "ja_jp", + "commonvoice_hours": 222.0, + "commonvoice_locale": "ja", + "in_benchmark": true, + "task": "translation", + "metric": "chrf", + "score": 0.4411714629040183, + "model": 1.0 + }, + { + "bcp_47": "jam", + "speakers": 2668142, + "language_name": "Jamaican Creole English", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "jbo", + "speakers": 0, + "language_name": "Lojban", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 0.0, + "commonvoice_locale": "jbo", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "jgo", + "speakers": 94333, + "language_name": "Ngomba", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "jmc", + "speakers": 433291, + "language_name": "Machame", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "jml", + "speakers": 970493, + "language_name": "Jumli", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "jut", + "speakers": 0, + "language_name": "Jutish", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "jv", + "speakers": 91180665, + "language_name": "Javanese", + "flores_path": "jav_Latn", + "fleurs_tag": "jv_id", + "commonvoice_hours": 0.0, + "commonvoice_locale": "jv", + "in_benchmark": true, + "task": "classification", + "metric": "accuracy", + "score": 0.5666666666666667, + "model": 1.0 + }, + { + "bcp_47": "jv", + "speakers": 91180665, + "language_name": "Javanese", + "flores_path": "jav_Latn", + "fleurs_tag": "jv_id", + "commonvoice_hours": 0.0, + "commonvoice_locale": "jv", + "in_benchmark": true, + "task": "language_modeling", + "metric": "chrf", + "score": 0.9274301130074318, + "model": 1.0 + }, + { + "bcp_47": "jv", + "speakers": 91180665, + "language_name": "Javanese", + "flores_path": "jav_Latn", + "fleurs_tag": "jv_id", + "commonvoice_hours": 0.0, + "commonvoice_locale": "jv", + "in_benchmark": true, + "task": "translation", + "metric": "bleu", + "score": 0.25461973194021953, + "model": 1.0 + }, + { + "bcp_47": "jv", + "speakers": 91180665, + "language_name": "Javanese", + "flores_path": "jav_Latn", + "fleurs_tag": "jv_id", + "commonvoice_hours": 0.0, + "commonvoice_locale": "jv", + "in_benchmark": true, + "task": "translation", + "metric": "chrf", + "score": 0.4296209828775689, + "model": 1.0 + }, + { + "bcp_47": "ka", + "speakers": 3543646, + "language_name": "Georgian", + "flores_path": "kat_Geor", + "fleurs_tag": "ka_ge", + "commonvoice_hours": 158.0, + "commonvoice_locale": "ka", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "kaa", + "speakers": 489046, + "language_name": "Kara-Kalpak", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 0.0, + "commonvoice_locale": "kaa", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "kab", + "speakers": 3351886, + "language_name": "Kabyle", + "flores_path": "kab_Latn", + "fleurs_tag": null, + "commonvoice_hours": 571.0, + "commonvoice_locale": "kab", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "kac", + "speakers": 962032, + "language_name": "Kachin", + "flores_path": "kac_Latn", + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "kaj", + "speakers": 449459, + "language_name": "Jju", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "kam", + "speakers": 4068120, + "language_name": "Kamba", + "flores_path": "kam_Latn", + "fleurs_tag": "kam_ke", + "commonvoice_hours": 0.0, + "commonvoice_locale": "kam", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "kao", + "speakers": 195534, + "language_name": "Xaasongaxango", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "kbd", + "speakers": 1070873, + "language_name": "Kabardian", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 16.0, + "commonvoice_locale": "kbd", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "kcg", + "speakers": 199046, + "language_name": "Tyap", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "kck", + "speakers": 770954, + "language_name": "Kalanga", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "kde", + "speakers": 1463820, + "language_name": "Makonde", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "kdt", + "speakers": 421207, + "language_name": "Kuy", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "kea", + "speakers": 530762, + "language_name": "Kabuverdianu", + "flores_path": "kea_Latn", + "fleurs_tag": "kea_cv", + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "ken", + "speakers": 69362, + "language_name": "Kenyang", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "kfo", + "speakers": 63207, + "language_name": "Koro", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "kfr", + "speakers": 994568, + "language_name": "Kachhi", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "kfy", + "speakers": 2917398, + "language_name": "Kumaoni", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "kg", + "speakers": 1526700, + "language_name": "Kongo", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "kge", + "speakers": 854483, + "language_name": "Komering", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "kgp", + "speakers": 50812, + "language_name": "Kaingang", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "kha", + "speakers": 1060872, + "language_name": "Khasi", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "khb", + "speakers": 264864, + "language_name": "Lü", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "khn", + "speakers": 1989135, + "language_name": "Khandesi", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "khq", + "speakers": 332408, + "language_name": "Koyra Chiini", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "kht", + "speakers": 13527, + "language_name": "Khamti", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "khw", + "speakers": 350252, + "language_name": "Khowar", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 18.0, + "commonvoice_locale": "khw", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "ki", + "speakers": 9099743, + "language_name": "Kikuyu", + "flores_path": "kik_Latn", + "fleurs_tag": null, + "commonvoice_hours": 0.0, + "commonvoice_locale": "ki", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "kiu", + "speakers": 155833, + "language_name": "Kirmanjki", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "kj", + "speakers": 920524, + "language_name": "Kuanyama", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "kjg", + "speakers": 431949, + "language_name": "Khmu", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "kk", + "speakers": 13637392, + "language_name": "Kazakh", + "flores_path": "kaz_Cyrl", + "fleurs_tag": "kk_kz", + "commonvoice_hours": 2.1, + "commonvoice_locale": "kk", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "kkj", + "speakers": 149823, + "language_name": "Kako", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "kl", + "speakers": 55440, + "language_name": "Kalaallisut", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "kln", + "speakers": 4068120, + "language_name": "Kalenjin", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 43.0, + "commonvoice_locale": "kln", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "km", + "speakers": 15065030, + "language_name": "Khmer", + "flores_path": "khm_Khmr", + "fleurs_tag": "km_kh", + "commonvoice_hours": 0.0, + "commonvoice_locale": "km", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "kmb", + "speakers": 8130575, + "language_name": "Kimbundu", + "flores_path": "kmb_Latn", + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "kn", + "speakers": 49065330, + "language_name": "Kannada", + "flores_path": "kan_Knda", + "fleurs_tag": "kn_in", + "commonvoice_hours": 0.0, + "commonvoice_locale": "kn", + "in_benchmark": true, + "task": "classification", + "metric": "accuracy", + "score": 0.4, + "model": 1.0 + }, + { + "bcp_47": "kn", + "speakers": 49065330, + "language_name": "Kannada", + "flores_path": "kan_Knda", + "fleurs_tag": "kn_in", + "commonvoice_hours": 0.0, + "commonvoice_locale": "kn", + "in_benchmark": true, + "task": "language_modeling", + "metric": "chrf", + "score": 0.9422502494463877, + "model": 1.0 + }, + { + "bcp_47": "kn", + "speakers": 49065330, + "language_name": "Kannada", + "flores_path": "kan_Knda", + "fleurs_tag": "kn_in", + "commonvoice_hours": 0.0, + "commonvoice_locale": "kn", + "in_benchmark": true, + "task": "translation", + "metric": "bleu", + "score": 0.2550718176103704, + "model": 1.0 + }, + { + "bcp_47": "kn", + "speakers": 49065330, + "language_name": "Kannada", + "flores_path": "kan_Knda", + "fleurs_tag": "kn_in", + "commonvoice_hours": 0.0, + "commonvoice_locale": "kn", + "in_benchmark": true, + "task": "translation", + "metric": "chrf", + "score": 0.44555883949922764, + "model": 1.0 + }, + { + "bcp_47": "knf", + "speakers": 83151, + "language_name": "Mankanya", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "ko", + "speakers": 78357046, + "language_name": "Korean", + "flores_path": "kor_Hang", + "fleurs_tag": "ko_kr", + "commonvoice_hours": 1.7, + "commonvoice_locale": "ko", + "in_benchmark": true, + "task": "classification", + "metric": "accuracy", + "score": 0.5666666666666667, + "model": 1.0 + }, + { + "bcp_47": "ko", + "speakers": 78357046, + "language_name": "Korean", + "flores_path": "kor_Hang", + "fleurs_tag": "ko_kr", + "commonvoice_hours": 1.7, + "commonvoice_locale": "ko", + "in_benchmark": true, + "task": "language_modeling", + "metric": "chrf", + "score": 0.9384158016197498, + "model": 1.0 + }, + { + "bcp_47": "ko", + "speakers": 78357046, + "language_name": "Korean", + "flores_path": "kor_Hang", + "fleurs_tag": "ko_kr", + "commonvoice_hours": 1.7, + "commonvoice_locale": "ko", + "in_benchmark": true, + "task": "translation", + "metric": "bleu", + "score": 0.21969579072372616, + "model": 1.0 + }, + { + "bcp_47": "ko", + "speakers": 78357046, + "language_name": "Korean", + "flores_path": "kor_Hang", + "fleurs_tag": "ko_kr", + "commonvoice_hours": 1.7, + "commonvoice_locale": "ko", + "in_benchmark": true, + "task": "translation", + "metric": "chrf", + "score": 0.4134343535369622, + "model": 1.0 + }, + { + "bcp_47": "koi", + "speakers": 63775, + "language_name": "Komi-Permyak", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "kok", + "speakers": 4906533, + "language_name": "Konkani", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 0.0, + "commonvoice_locale": "knn", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "kos", + "speakers": 7990, + "language_name": "Kosraean", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "kpe", + "speakers": 1186303, + "language_name": "Kpelle", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "krc", + "speakers": 240927, + "language_name": "Karachay-Balkar", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 0.0, + "commonvoice_locale": "krc", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "kri", + "speakers": 6293684, + "language_name": "Krio", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "krj", + "speakers": 425806, + "language_name": "Kinaray-a", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "krl", + "speakers": 116212, + "language_name": "Karelian", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "kru", + "speakers": 2519571, + "language_name": "Kurukh", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "ks", + "speakers": 5598085, + "language_name": "Kashmiri", + "flores_path": "kas_Arab", + "fleurs_tag": null, + "commonvoice_hours": 0.0, + "commonvoice_locale": "ks", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "ksb", + "speakers": 995398, + "language_name": "Shambala", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "ksf", + "speakers": 88784, + "language_name": "Bafia", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 20.0, + "commonvoice_locale": "ksf", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "ksh", + "speakers": 240479, + "language_name": "Colognian", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "ku", + "speakers": 6866757, + "language_name": "Kurdish", + "flores_path": "kmr_Latn", + "fleurs_tag": null, + "commonvoice_hours": 69.0, + "commonvoice_locale": "kmr", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "kum", + "speakers": 283444, + "language_name": "Kumyk", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "kv", + "speakers": 255100, + "language_name": "Komi", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 0.0, + "commonvoice_locale": "kpv", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "kvr", + "speakers": 373836, + "language_name": "Kerinci", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "kvx", + "speakers": 373602, + "language_name": "Parkari Koli", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "kw", + "speakers": 1973, + "language_name": "Cornish", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 2.9, + "commonvoice_locale": "kw", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "kwk", + "speakers": 377, + "language_name": "Kwakʼwala", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "kxm", + "speakers": 1172616, + "language_name": "Northern Khmer", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "kxp", + "speakers": 256851, + "language_name": "Wadiyara Koli", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "kxv", + "speakers": 38457, + "language_name": "Kuvi", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "ky", + "speakers": 3338267, + "language_name": "Kyrgyz", + "flores_path": "kir_Cyrl", + "fleurs_tag": "ky_kg", + "commonvoice_hours": 39.0, + "commonvoice_locale": "ky", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "la", + "speakers": 820, + "language_name": "Latin", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "lad", + "speakers": 112781, + "language_name": "Ladino", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "lag", + "speakers": 509409, + "language_name": "Langi", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "lah", + "speakers": 93433552, + "language_name": "Western Panjabi", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "laj", + "speakers": 1643614, + "language_name": "Lango (Uganda)", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "lb", + "speakers": 421015, + "language_name": "Luxembourgish", + "flores_path": "ltz_Latn", + "fleurs_tag": "lb_lu", + "commonvoice_hours": 0.0, + "commonvoice_locale": "lb", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "lbe", + "speakers": 110543, + "language_name": "Lak", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "lbw", + "speakers": 347134, + "language_name": "Tolaki", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "lcp", + "speakers": 87751, + "language_name": "Western Lawa", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "lep", + "speakers": 79743, + "language_name": "Lepcha", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "lez", + "speakers": 255100, + "language_name": "Lezghian", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "lg", + "speakers": 5622890, + "language_name": "Ganda", + "flores_path": "lug_Latn", + "fleurs_tag": "lg_ug", + "commonvoice_hours": 437.0, + "commonvoice_locale": "lg", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "li", + "speakers": 950422, + "language_name": "Limburgish", + "flores_path": "lim_Latn", + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "lif", + "speakers": 368085, + "language_name": "Limbu", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "lij", + "speakers": 536663, + "language_name": "Ligurian", + "flores_path": "lij_Latn", + "fleurs_tag": null, + "commonvoice_hours": 5.1, + "commonvoice_locale": "lij", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "lil", + "speakers": 528, + "language_name": "Lillooet", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "lis", + "speakers": 627309, + "language_name": "Lisu", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "ljp", + "speakers": 1842479, + "language_name": "Lampung Api", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "lki", + "speakers": 645417, + "language_name": "Laki", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "lkt", + "speakers": 8316, + "language_name": "Lakota", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "lmn", + "speakers": 3580443, + "language_name": "Lambadi", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "lmo", + "speakers": 3901518, + "language_name": "Lombard", + "flores_path": "lmo_Latn", + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "ln", + "speakers": 3514491, + "language_name": "Lingala", + "flores_path": "lin_Latn", + "fleurs_tag": "ln_cd", + "commonvoice_hours": 0.0, + "commonvoice_locale": "ln", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "lo", + "speakers": 5138706, + "language_name": "Lao", + "flores_path": "lao_Laoo", + "fleurs_tag": "lo_la", + "commonvoice_hours": 0.2, + "commonvoice_locale": "lo", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "lol", + "speakers": 620858, + "language_name": "Mongo", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "loz", + "speakers": 1045596, + "language_name": "Lozi", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "lrc", + "speakers": 2020512, + "language_name": "Northern Luri", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "lt", + "speakers": 2488617, + "language_name": "Lithuanian", + "flores_path": "lit_Latn", + "fleurs_tag": "lt_lt", + "commonvoice_hours": 25.0, + "commonvoice_locale": "lt", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "ltg", + "speakers": 167429, + "language_name": "Latgalian", + "flores_path": "ltg_Latn", + "fleurs_tag": null, + "commonvoice_hours": 28.0, + "commonvoice_locale": "ltg", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "lu", + "speakers": 2340940, + "language_name": "Luba-Katanga", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "lua", + "speakers": 9770880, + "language_name": "Luba-Lulua", + "flores_path": "lua_Latn", + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "luo", + "speakers": 5245734, + "language_name": "Luo (Kenya and Tanzania)", + "flores_path": "luo_Latn", + "fleurs_tag": "luo_ke", + "commonvoice_hours": 30.0, + "commonvoice_locale": "luo", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "luy", + "speakers": 5888069, + "language_name": "Luyia", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "luz", + "speakers": 1019080, + "language_name": "Southern Luri", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "lv", + "speakers": 1147550, + "language_name": "Latvian", + "flores_path": "lvs_Latn", + "fleurs_tag": "lv_lv", + "commonvoice_hours": 260.0, + "commonvoice_locale": "lv", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "lwl", + "speakers": 6898, + "language_name": "Eastern Lawa", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "lzh", + "speakers": 0, + "language_name": "Literary Chinese", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "lzz", + "speakers": 22965, + "language_name": "Laz", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 0.0, + "commonvoice_locale": "lzz", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "mad", + "speakers": 16822638, + "language_name": "Madurese", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "maf", + "speakers": 205313, + "language_name": "Mafa", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "mag", + "speakers": 15913080, + "language_name": "Magahi", + "flores_path": "mag_Deva", + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "mai", + "speakers": 19249149, + "language_name": "Maithili", + "flores_path": "mai_Deva", + "fleurs_tag": null, + "commonvoice_hours": 0.0, + "commonvoice_locale": "mai", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "mak", + "speakers": 1949290, + "language_name": "Makasar", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "man", + "speakers": 3511762, + "language_name": "Mandingo", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "mas", + "speakers": 1734738, + "language_name": "Masai", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "maz", + "speakers": 437410, + "language_name": "Central Mazahua", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "mdf", + "speakers": 297616, + "language_name": "Moksha", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 0.5, + "commonvoice_locale": "mdf", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "mdh", + "speakers": 1310172, + "language_name": "Maguindanaon", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "mdr", + "speakers": 245664, + "language_name": "Mandar", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "men", + "speakers": 1813083, + "language_name": "Mende", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "mer", + "speakers": 2141116, + "language_name": "Meru", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "mey", + "speakers": 7239, + "language_name": "Hassaniyya", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "mfa", + "speakers": 3448870, + "language_name": "Pattani Malay", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "mfe", + "speakers": 1241433, + "language_name": "Morisyen", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "mfv", + "speakers": 121170, + "language_name": "Mandjak", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "mg", + "speakers": 24260130, + "language_name": "Malagasy", + "flores_path": "plt_Latn", + "fleurs_tag": null, + "commonvoice_hours": 0.0, + "commonvoice_locale": "mg", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "mgh", + "speakers": 1354419, + "language_name": "Makhuwa-Meetto", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "mgo", + "speakers": 130401, + "language_name": "Metaʼ", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "mgp", + "speakers": 333607, + "language_name": "Eastern Magar", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "mgy", + "speakers": 819739, + "language_name": "Mbunga", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "mh", + "speakers": 56879, + "language_name": "Marshallese", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "mi", + "speakers": 137913, + "language_name": "Māori", + "flores_path": "mri_Latn", + "fleurs_tag": "mi_nz", + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "mic", + "speakers": 7916, + "language_name": "Mi'kmaw", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "min", + "speakers": 8010780, + "language_name": "Minangkabau", + "flores_path": "min_Latn", + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "mk", + "speakers": 1608565, + "language_name": "Macedonian", + "flores_path": "mkd_Cyrl", + "fleurs_tag": "mk_mk", + "commonvoice_hours": 18.0, + "commonvoice_locale": "mk", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "ml", + "speakers": 43257484, + "language_name": "Malayalam", + "flores_path": "mal_Mlym", + "fleurs_tag": "ml_in", + "commonvoice_hours": 2.8, + "commonvoice_locale": "ml", + "in_benchmark": true, + "task": "classification", + "metric": "accuracy", + "score": 0.43333333333333335, + "model": 1.0 + }, + { + "bcp_47": "ml", + "speakers": 43257484, + "language_name": "Malayalam", + "flores_path": "mal_Mlym", + "fleurs_tag": "ml_in", + "commonvoice_hours": 2.8, + "commonvoice_locale": "ml", + "in_benchmark": true, + "task": "language_modeling", + "metric": "chrf", + "score": 0.9372865200487422, + "model": 1.0 + }, + { + "bcp_47": "ml", + "speakers": 43257484, + "language_name": "Malayalam", + "flores_path": "mal_Mlym", + "fleurs_tag": "ml_in", + "commonvoice_hours": 2.8, + "commonvoice_locale": "ml", + "in_benchmark": true, + "task": "translation", + "metric": "bleu", + "score": 0.20114751241051923, + "model": 1.0 + }, + { + "bcp_47": "ml", + "speakers": 43257484, + "language_name": "Malayalam", + "flores_path": "mal_Mlym", + "fleurs_tag": "ml_in", + "commonvoice_hours": 2.8, + "commonvoice_locale": "ml", + "in_benchmark": true, + "task": "translation", + "metric": "chrf", + "score": 0.39404171184956394, + "model": 1.0 + }, + { + "bcp_47": "mls", + "speakers": 451060, + "language_name": "Masalit", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "mn", + "speakers": 6572846, + "language_name": "Mongolian", + "flores_path": "khk_Cyrl", + "fleurs_tag": "mn_mn", + "commonvoice_hours": 46.0, + "commonvoice_locale": "mn", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "mni", + "speakers": 1476591, + "language_name": "Manipuri", + "flores_path": "mni_Beng", + "fleurs_tag": null, + "commonvoice_hours": 0.0, + "commonvoice_locale": "mni", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "mnw", + "speakers": 966114, + "language_name": "Mon", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "moe", + "speakers": 12062, + "language_name": "Innu-aimun", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "moh", + "speakers": 1772, + "language_name": "Mohawk", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "mos", + "speakers": 8334160, + "language_name": "Mossi", + "flores_path": "mos_Latn", + "fleurs_tag": null, + "commonvoice_hours": 0.0, + "commonvoice_locale": "mos", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "mr", + "speakers": 92826300, + "language_name": "Marathi", + "flores_path": "mar_Deva", + "fleurs_tag": "mr_in", + "commonvoice_hours": 20.0, + "commonvoice_locale": "mr", + "in_benchmark": true, + "task": "classification", + "metric": "accuracy", + "score": 0.6333333333333333, + "model": 1.0 + }, + { + "bcp_47": "mr", + "speakers": 92826300, + "language_name": "Marathi", + "flores_path": "mar_Deva", + "fleurs_tag": "mr_in", + "commonvoice_hours": 20.0, + "commonvoice_locale": "mr", + "in_benchmark": true, + "task": "language_modeling", + "metric": "chrf", + "score": 0.9493846554320581, + "model": 1.0 + }, + { + "bcp_47": "mr", + "speakers": 92826300, + "language_name": "Marathi", + "flores_path": "mar_Deva", + "fleurs_tag": "mr_in", + "commonvoice_hours": 20.0, + "commonvoice_locale": "mr", + "in_benchmark": true, + "task": "translation", + "metric": "bleu", + "score": 0.22832077978859452, + "model": 1.0 + }, + { + "bcp_47": "mr", + "speakers": 92826300, + "language_name": "Marathi", + "flores_path": "mar_Deva", + "fleurs_tag": "mr_in", + "commonvoice_hours": 20.0, + "commonvoice_locale": "mr", + "in_benchmark": true, + "task": "translation", + "metric": "chrf", + "score": 0.4245203296342906, + "model": 1.0 + }, + { + "bcp_47": "mrd", + "speakers": 251722, + "language_name": "Western Magar", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "mrj", + "speakers": 29762, + "language_name": "Western Mari", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 34.0, + "commonvoice_locale": "mrj", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "mro", + "speakers": 29277, + "language_name": "Mru", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "ms", + "speakers": 38097307, + "language_name": "Malay", + "flores_path": "zsm_Latn", + "fleurs_tag": "ms_my", + "commonvoice_hours": 0.0, + "commonvoice_locale": "ms", + "in_benchmark": true, + "task": "classification", + "metric": "accuracy", + "score": 0.6, + "model": 1.0 + }, + { + "bcp_47": "ms", + "speakers": 38097307, + "language_name": "Malay", + "flores_path": "zsm_Latn", + "fleurs_tag": "ms_my", + "commonvoice_hours": 0.0, + "commonvoice_locale": "ms", + "in_benchmark": true, + "task": "language_modeling", + "metric": "chrf", + "score": 0.9449541544914151, + "model": 1.0 + }, + { + "bcp_47": "ms", + "speakers": 38097307, + "language_name": "Malay", + "flores_path": "zsm_Latn", + "fleurs_tag": "ms_my", + "commonvoice_hours": 0.0, + "commonvoice_locale": "ms", + "in_benchmark": true, + "task": "translation", + "metric": "bleu", + "score": 0.26403874316694886, + "model": 1.0 + }, + { + "bcp_47": "ms", + "speakers": 38097307, + "language_name": "Malay", + "flores_path": "zsm_Latn", + "fleurs_tag": "ms_my", + "commonvoice_hours": 0.0, + "commonvoice_locale": "ms", + "in_benchmark": true, + "task": "translation", + "metric": "chrf", + "score": 0.45903065670305854, + "model": 1.0 + }, + { + "bcp_47": "mt", + "speakers": 457267, + "language_name": "Maltese", + "flores_path": "mlt_Latn", + "fleurs_tag": "mt_mt", + "commonvoice_hours": 8.7, + "commonvoice_locale": "mt", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "mtr", + "speakers": 1286307, + "language_name": "Mewari", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "mua", + "speakers": 277450, + "language_name": "Mundang", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "mus", + "speakers": 3992, + "language_name": "Muscogee", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "mvy", + "speakers": 326901, + "language_name": "Indus Kohistani", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 23.0, + "commonvoice_locale": "mvy", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "mwk", + "speakers": 977670, + "language_name": "Kita Maninkakan", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "mwr", + "speakers": 15913080, + "language_name": "Marwari", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "mwv", + "speakers": 64086, + "language_name": "Mentawai", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "mxc", + "speakers": 945510, + "language_name": "Manyika", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "my", + "speakers": 36559231, + "language_name": "Burmese", + "flores_path": "mya_Mymr", + "fleurs_tag": "my_mm", + "commonvoice_hours": 0.0, + "commonvoice_locale": "my", + "in_benchmark": true, + "task": "classification", + "metric": "accuracy", + "score": 0.4, + "model": 1.0 + }, + { + "bcp_47": "my", + "speakers": 36559231, + "language_name": "Burmese", + "flores_path": "mya_Mymr", + "fleurs_tag": "my_mm", + "commonvoice_hours": 0.0, + "commonvoice_locale": "my", + "in_benchmark": true, + "task": "language_modeling", + "metric": "chrf", + "score": 0.918432369873729, + "model": 1.0 + }, + { + "bcp_47": "my", + "speakers": 36559231, + "language_name": "Burmese", + "flores_path": "mya_Mymr", + "fleurs_tag": "my_mm", + "commonvoice_hours": 0.0, + "commonvoice_locale": "my", + "in_benchmark": true, + "task": "translation", + "metric": "bleu", + "score": 0.18617334539824332, + "model": 1.0 + }, + { + "bcp_47": "my", + "speakers": 36559231, + "language_name": "Burmese", + "flores_path": "mya_Mymr", + "fleurs_tag": "my_mm", + "commonvoice_hours": 0.0, + "commonvoice_locale": "my", + "in_benchmark": true, + "task": "translation", + "metric": "chrf", + "score": 0.3705060280208132, + "model": 1.0 + }, + { + "bcp_47": "myv", + "speakers": 439338, + "language_name": "Erzya", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 3.8, + "commonvoice_locale": "myv", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "myx", + "speakers": 1254337, + "language_name": "Masaaba", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "mzn", + "speakers": 4246165, + "language_name": "Mazanderani", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "na", + "speakers": 6930, + "language_name": "Nauru", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "nan", + "speakers": 26486380, + "language_name": "Min Nan Chinese", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "nap", + "speakers": 605306, + "language_name": "Neapolitan", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "naq", + "speakers": 289308, + "language_name": "Nama", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "nb", + "speakers": 5468932, + "language_name": "Norwegian Bokmål", + "flores_path": "nob_Latn", + "fleurs_tag": "nb_no", + "commonvoice_hours": 0.1, + "commonvoice_locale": "nb-NO", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "nch", + "speakers": 244435, + "language_name": "Central Huasteca Nahuatl", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "nd", + "speakers": 1745556, + "language_name": "North Ndebele", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 0.0, + "commonvoice_locale": "nd", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "ndc", + "speakers": 3867046, + "language_name": "Ndau", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "nds", + "speakers": 11520008, + "language_name": "Low German", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "ne", + "speakers": 20903374, + "language_name": "Nepali", + "flores_path": "npi_Deva", + "fleurs_tag": "ne_np", + "commonvoice_hours": 1.3, + "commonvoice_locale": "ne-NP", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "new", + "speakers": 1000821, + "language_name": "Newari", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 0.0, + "commonvoice_locale": "new", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "ng", + "speakers": 552315, + "language_name": "Ndonga", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "ngl", + "speakers": 2046678, + "language_name": "Lomwe", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "nhe", + "speakers": 501735, + "language_name": "Eastern Huasteca Nahuatl", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 0.0, + "commonvoice_locale": "nhe", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "nhw", + "speakers": 501735, + "language_name": "Western Huasteca Nahuatl", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "nij", + "speakers": 987996, + "language_name": "Ngaju", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "niu", + "speakers": 1120, + "language_name": "Niuean", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "njo", + "speakers": 305001, + "language_name": "Ao Naga", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "nl", + "speakers": 31765645, + "language_name": "Dutch", + "flores_path": "nld_Latn", + "fleurs_tag": "nl_nl", + "commonvoice_hours": 114.0, + "commonvoice_locale": "nl", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "nmg", + "speakers": 8878, + "language_name": "Kwasio", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "nn", + "speakers": 1366860, + "language_name": "Norwegian Nynorsk", + "flores_path": "nno_Latn", + "fleurs_tag": null, + "commonvoice_hours": 1.5, + "commonvoice_locale": "nn-NO", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "nnh", + "speakers": 388430, + "language_name": "Ngiemboon", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 23.0, + "commonvoice_locale": "nnh", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "no", + "speakers": 5467440, + "language_name": "Norwegian", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "nod", + "speakers": 6621830, + "language_name": "Northern Thai", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "noe", + "speakers": 1723917, + "language_name": "Nimadi", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "nqo", + "speakers": 626370, + "language_name": "N’Ko", + "flores_path": "nqo_Nkoo", + "fleurs_tag": null, + "commonvoice_hours": 0.0, + "commonvoice_locale": "nqo", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "nr", + "speakers": 903418, + "language_name": "South Ndebele", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 0.0, + "commonvoice_locale": "nr", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "nsk", + "speakers": 1395, + "language_name": "Naskapi", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "nso", + "speakers": 5307578, + "language_name": "Northern Sotho", + "flores_path": "nso_Latn", + "fleurs_tag": "nso_za", + "commonvoice_hours": 0.0, + "commonvoice_locale": "nso", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "nus", + "speakers": 591427, + "language_name": "Nuer", + "flores_path": "nus_Latn", + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "nv", + "speakers": 166320, + "language_name": "Navajo", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "nxq", + "speakers": 334565, + "language_name": "Naxi", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "ny", + "speakers": 17026781, + "language_name": "Nyanja", + "flores_path": "nya_Latn", + "fleurs_tag": "ny_mw", + "commonvoice_hours": 0.0, + "commonvoice_locale": "ny", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "nym", + "speakers": 1932242, + "language_name": "Nyamwezi", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "nyn", + "speakers": 2724939, + "language_name": "Nyankole", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 0.0, + "commonvoice_locale": "nyn", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "nzi", + "speakers": 293402, + "language_name": "Nzima", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "oc", + "speakers": 2040398, + "language_name": "Occitan", + "flores_path": "oci_Latn", + "fleurs_tag": "oc_fr", + "commonvoice_hours": 1.8, + "commonvoice_locale": "oc", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "oj", + "speakers": 23747, + "language_name": "Ojibwa", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "ojs", + "speakers": 15078, + "language_name": "Oji-Cree", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "oka", + "speakers": 490, + "language_name": "Okanagan", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "om", + "speakers": 34897121, + "language_name": "Oromo", + "flores_path": "gaz_Latn", + "fleurs_tag": "om_et", + "commonvoice_hours": 0.0, + "commonvoice_locale": "om", + "in_benchmark": true, + "task": "classification", + "metric": "accuracy", + "score": 0.4666666666666667, + "model": 1.0 + }, + { + "bcp_47": "om", + "speakers": 34897121, + "language_name": "Oromo", + "flores_path": "gaz_Latn", + "fleurs_tag": "om_et", + "commonvoice_hours": 0.0, + "commonvoice_locale": "om", + "in_benchmark": true, + "task": "language_modeling", + "metric": "chrf", + "score": 0.9359301483225031, + "model": 1.0 + }, + { + "bcp_47": "om", + "speakers": 34897121, + "language_name": "Oromo", + "flores_path": "gaz_Latn", + "fleurs_tag": "om_et", + "commonvoice_hours": 0.0, + "commonvoice_locale": "om", + "in_benchmark": true, + "task": "translation", + "metric": "bleu", + "score": 0.06509147151730071, + "model": 1.0 + }, + { + "bcp_47": "om", + "speakers": 34897121, + "language_name": "Oromo", + "flores_path": "gaz_Latn", + "fleurs_tag": "om_et", + "commonvoice_hours": 0.0, + "commonvoice_locale": "om", + "in_benchmark": true, + "task": "translation", + "metric": "chrf", + "score": 0.22674886804446037, + "model": 1.0 + }, + { + "bcp_47": "or", + "speakers": 42434880, + "language_name": "Odia", + "flores_path": "ory_Orya", + "fleurs_tag": "or_in", + "commonvoice_hours": 2.8, + "commonvoice_locale": "or", + "in_benchmark": true, + "task": "classification", + "metric": "accuracy", + "score": 0.4666666666666667, + "model": 1.0 + }, + { + "bcp_47": "or", + "speakers": 42434880, + "language_name": "Odia", + "flores_path": "ory_Orya", + "fleurs_tag": "or_in", + "commonvoice_hours": 2.8, + "commonvoice_locale": "or", + "in_benchmark": true, + "task": "language_modeling", + "metric": "chrf", + "score": 0.9211968327986088, + "model": 1.0 + }, + { + "bcp_47": "or", + "speakers": 42434880, + "language_name": "Odia", + "flores_path": "ory_Orya", + "fleurs_tag": "or_in", + "commonvoice_hours": 2.8, + "commonvoice_locale": "or", + "in_benchmark": true, + "task": "translation", + "metric": "bleu", + "score": 0.2521285657827072, + "model": 1.0 + }, + { + "bcp_47": "or", + "speakers": 42434880, + "language_name": "Odia", + "flores_path": "ory_Orya", + "fleurs_tag": "or_in", + "commonvoice_hours": 2.8, + "commonvoice_locale": "or", + "in_benchmark": true, + "task": "translation", + "metric": "chrf", + "score": 0.4422326291663304, + "model": 1.0 + }, + { + "bcp_47": "os", + "speakers": 541444, + "language_name": "Ossetic", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 0.7, + "commonvoice_locale": "os", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "osa", + "speakers": 0, + "language_name": "Osage", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "pa", + "speakers": 203571210, + "language_name": "Punjabi", + "flores_path": "pan_Guru", + "fleurs_tag": "pa_in", + "commonvoice_hours": 2.3, + "commonvoice_locale": "pa-IN", + "in_benchmark": true, + "task": "classification", + "metric": "accuracy", + "score": 0.4666666666666667, + "model": 4.0 + }, + { + "bcp_47": "pa", + "speakers": 203571210, + "language_name": "Punjabi", + "flores_path": "pan_Guru", + "fleurs_tag": "pa_in", + "commonvoice_hours": 2.3, + "commonvoice_locale": "pa-IN", + "in_benchmark": true, + "task": "language_modeling", + "metric": "chrf", + "score": 0.9013087100801337, + "model": 4.0 + }, + { + "bcp_47": "pa", + "speakers": 203571210, + "language_name": "Punjabi", + "flores_path": "pan_Guru", + "fleurs_tag": "pa_in", + "commonvoice_hours": 2.3, + "commonvoice_locale": "pa-IN", + "in_benchmark": true, + "task": "translation", + "metric": "bleu", + "score": 0.3099562778912564, + "model": 4.0 + }, + { + "bcp_47": "pa", + "speakers": 203571210, + "language_name": "Punjabi", + "flores_path": "pan_Guru", + "fleurs_tag": "pa_in", + "commonvoice_hours": 2.3, + "commonvoice_locale": "pa-IN", + "in_benchmark": true, + "task": "translation", + "metric": "chrf", + "score": 0.4604060151149361, + "model": 4.0 + }, + { + "bcp_47": "pag", + "speakers": 1528534, + "language_name": "Pangasinan", + "flores_path": "pag_Latn", + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "pam", + "speakers": 2511163, + "language_name": "Pampanga", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "pap", + "speakers": 211640, + "language_name": "Papiamento", + "flores_path": "pap_Latn", + "fleurs_tag": null, + "commonvoice_hours": 0.0, + "commonvoice_locale": "pap-AW", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "pau", + "speakers": 16047, + "language_name": "Palauan", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "pcd", + "speakers": 746330, + "language_name": "Picard", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "pcm", + "speakers": 44945880, + "language_name": "Nigerian Pidgin", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 14.0, + "commonvoice_locale": "pcm", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "pdc", + "speakers": 129729, + "language_name": "Pennsylvania German", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "pdt", + "speakers": 90466, + "language_name": "Plautdietsch", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "pfl", + "speakers": 0, + "language_name": "Palatine German", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "pis", + "speakers": 561780, + "language_name": "Pijin", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "pko", + "speakers": 369343, + "language_name": "Pökoot", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "pl", + "speakers": 41077399, + "language_name": "Polish", + "flores_path": "pol_Latn", + "fleurs_tag": "pl_pl", + "commonvoice_hours": 174.0, + "commonvoice_locale": "pl", + "in_benchmark": true, + "task": "classification", + "metric": "accuracy", + "score": 0.6, + "model": 1.0 + }, + { + "bcp_47": "pl", + "speakers": 41077399, + "language_name": "Polish", + "flores_path": "pol_Latn", + "fleurs_tag": "pl_pl", + "commonvoice_hours": 174.0, + "commonvoice_locale": "pl", + "in_benchmark": true, + "task": "language_modeling", + "metric": "chrf", + "score": 0.9603182772393537, + "model": 1.0 + }, + { + "bcp_47": "pl", + "speakers": 41077399, + "language_name": "Polish", + "flores_path": "pol_Latn", + "fleurs_tag": "pl_pl", + "commonvoice_hours": 174.0, + "commonvoice_locale": "pl", + "in_benchmark": true, + "task": "translation", + "metric": "bleu", + "score": 0.26987204535648013, + "model": 1.0 + }, + { + "bcp_47": "pl", + "speakers": 41077399, + "language_name": "Polish", + "flores_path": "pol_Latn", + "fleurs_tag": "pl_pl", + "commonvoice_hours": 174.0, + "commonvoice_locale": "pl", + "in_benchmark": true, + "task": "translation", + "metric": "chrf", + "score": 0.45624928163848544, + "model": 1.0 + }, + { + "bcp_47": "pms", + "speakers": 6178, + "language_name": "Piedmontese", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "pnt", + "speakers": 392463, + "language_name": "Pontic", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "pon", + "speakers": 23560, + "language_name": "Pohnpeian", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "pqm", + "speakers": 490, + "language_name": "Maliseet-Passamaquoddy", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "prd", + "speakers": 864342, + "language_name": "Parsi-Dari", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "prg", + "speakers": 38, + "language_name": "Prussian", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "ps", + "speakers": 53542641, + "language_name": "Pashto", + "flores_path": null, + "fleurs_tag": "ps_af", + "commonvoice_hours": 79.0, + "commonvoice_locale": "ps", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "pt", + "speakers": 237496885, + "language_name": "Portuguese", + "flores_path": "por_Latn", + "fleurs_tag": "pt_br", + "commonvoice_hours": 177.0, + "commonvoice_locale": "pt", + "in_benchmark": true, + "task": "classification", + "metric": "accuracy", + "score": 0.65, + "model": 4.0 + }, + { + "bcp_47": "pt", + "speakers": 237496885, + "language_name": "Portuguese", + "flores_path": "por_Latn", + "fleurs_tag": "pt_br", + "commonvoice_hours": 177.0, + "commonvoice_locale": "pt", + "in_benchmark": true, + "task": "language_modeling", + "metric": "chrf", + "score": 0.9598364847166063, + "model": 4.0 + }, + { + "bcp_47": "pt", + "speakers": 237496885, + "language_name": "Portuguese", + "flores_path": "por_Latn", + "fleurs_tag": "pt_br", + "commonvoice_hours": 177.0, + "commonvoice_locale": "pt", + "in_benchmark": true, + "task": "translation", + "metric": "bleu", + "score": 0.3232823660730954, + "model": 4.0 + }, + { + "bcp_47": "pt", + "speakers": 237496885, + "language_name": "Portuguese", + "flores_path": "por_Latn", + "fleurs_tag": "pt_br", + "commonvoice_hours": 177.0, + "commonvoice_locale": "pt", + "in_benchmark": true, + "task": "translation", + "metric": "chrf", + "score": 0.4828937591427408, + "model": 4.0 + }, + { + "bcp_47": "puu", + "speakers": 200782, + "language_name": "Punu", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "qu", + "speakers": 11385851, + "language_name": "Quechua", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "quc", + "speakers": 1200731, + "language_name": "Kʼicheʼ", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 0.0, + "commonvoice_locale": "quc", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "qug", + "speakers": 963579, + "language_name": "Chimborazo Highland Quichua", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "raj", + "speakers": 1326090, + "language_name": "Rajasthani", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "rcf", + "speakers": 559185, + "language_name": "Réunion Creole French", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "rej", + "speakers": 1228320, + "language_name": "Rejang", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "rgn", + "speakers": 0, + "language_name": "Romagnol", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "rhg", + "speakers": 1824082, + "language_name": "Rohingya", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "ria", + "speakers": 172392, + "language_name": "Riang (India)", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "rif", + "speakers": 3692411, + "language_name": "Riffian", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 0.0, + "commonvoice_locale": "rif", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "rjs", + "speakers": 133443, + "language_name": "Rajbanshi", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "rkt", + "speakers": 16274502, + "language_name": "Rangpuri", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "rm", + "speakers": 42020, + "language_name": "Romansh", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "rmf", + "speakers": 5015, + "language_name": "Kalo Finnish Romani", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "rmo", + "speakers": 24372, + "language_name": "Sinte Romani", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "rmt", + "speakers": 1613543, + "language_name": "Domari", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "rmu", + "speakers": 9488, + "language_name": "Tavringer Romani", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "rn", + "speakers": 7475454, + "language_name": "Rundi", + "flores_path": "run_Latn", + "fleurs_tag": null, + "commonvoice_hours": 0.0, + "commonvoice_locale": "rn", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "rng", + "speakers": 1023339, + "language_name": "Ronga", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "ro", + "speakers": 22187408, + "language_name": "Romanian", + "flores_path": "ron_Latn", + "fleurs_tag": "ro_ro", + "commonvoice_hours": 21.0, + "commonvoice_locale": "ro", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "rob", + "speakers": 293729, + "language_name": "Tae'", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "rof", + "speakers": 433291, + "language_name": "Rombo", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "rtm", + "speakers": 2527, + "language_name": "Rotuman", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "ru", + "speakers": 195841151, + "language_name": "Russian", + "flores_path": "rus_Cyrl", + "fleurs_tag": "ru_ru", + "commonvoice_hours": 242.0, + "commonvoice_locale": "ru", + "in_benchmark": true, + "task": "classification", + "metric": "accuracy", + "score": 0.6333333333333333, + "model": 1.0 + }, + { + "bcp_47": "ru", + "speakers": 195841151, + "language_name": "Russian", + "flores_path": "rus_Cyrl", + "fleurs_tag": "ru_ru", + "commonvoice_hours": 242.0, + "commonvoice_locale": "ru", + "in_benchmark": true, + "task": "language_modeling", + "metric": "chrf", + "score": 0.9702818211253317, + "model": 1.0 + }, + { + "bcp_47": "ru", + "speakers": 195841151, + "language_name": "Russian", + "flores_path": "rus_Cyrl", + "fleurs_tag": "ru_ru", + "commonvoice_hours": 242.0, + "commonvoice_locale": "ru", + "in_benchmark": true, + "task": "translation", + "metric": "bleu", + "score": 0.21923866610511514, + "model": 1.0 + }, + { + "bcp_47": "ru", + "speakers": 195841151, + "language_name": "Russian", + "flores_path": "rus_Cyrl", + "fleurs_tag": "ru_ru", + "commonvoice_hours": 242.0, + "commonvoice_locale": "ru", + "in_benchmark": true, + "task": "translation", + "metric": "chrf", + "score": 0.41987611292148114, + "model": 1.0 + }, + { + "bcp_47": "rue", + "speakers": 527075, + "language_name": "Rusyn", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "rug", + "speakers": 9591, + "language_name": "Roviana", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "rw", + "speakers": 11083625, + "language_name": "Kinyarwanda", + "flores_path": "kin_Latn", + "fleurs_tag": null, + "commonvoice_hours": 2002.0, + "commonvoice_locale": "rw", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "rwk", + "speakers": 128816, + "language_name": "Rwa", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "ryu", + "speakers": 966404, + "language_name": "Central Okinawan", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "sa", + "speakers": 15913, + "language_name": "Sanskrit", + "flores_path": "san_Deva", + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "saf", + "speakers": 4108, + "language_name": "Safaliba", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "sah", + "speakers": 453510, + "language_name": "Yakut", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 9.5, + "commonvoice_locale": "sah", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "saq", + "speakers": 246228, + "language_name": "Samburu", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "sas", + "speakers": 2590152, + "language_name": "Sasak", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "sat", + "speakers": 7293495, + "language_name": "Santali", + "flores_path": "sat_Olck", + "fleurs_tag": null, + "commonvoice_hours": 0.5, + "commonvoice_locale": "sat", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "sav", + "speakers": 236046, + "language_name": "Saafi-Saafi", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "saz", + "speakers": 384566, + "language_name": "Saurashtra", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "sbp", + "speakers": 117106, + "language_name": "Sangu", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "sc", + "speakers": 1060846, + "language_name": "Sardinian", + "flores_path": "srd_Latn", + "fleurs_tag": null, + "commonvoice_hours": 2.9, + "commonvoice_locale": "sc", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "sck", + "speakers": 2386962, + "language_name": "Sadri", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "scn", + "speakers": 511702, + "language_name": "Sicilian", + "flores_path": "scn_Latn", + "fleurs_tag": null, + "commonvoice_hours": 0.0, + "commonvoice_locale": "scn", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "sco", + "speakers": 1644028, + "language_name": "Scots", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 0.0, + "commonvoice_locale": "sco", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "sd", + "speakers": 40329510, + "language_name": "Sindhi", + "flores_path": "snd_Arab", + "fleurs_tag": "sd_in", + "commonvoice_hours": 0.4, + "commonvoice_locale": "sd", + "in_benchmark": true, + "task": "classification", + "metric": "accuracy", + "score": 0.3333333333333333, + "model": 1.0 + }, + { + "bcp_47": "sd", + "speakers": 40329510, + "language_name": "Sindhi", + "flores_path": "snd_Arab", + "fleurs_tag": "sd_in", + "commonvoice_hours": 0.4, + "commonvoice_locale": "sd", + "in_benchmark": true, + "task": "language_modeling", + "metric": "chrf", + "score": 0.9075877951969867, + "model": 1.0 + }, + { + "bcp_47": "sd", + "speakers": 40329510, + "language_name": "Sindhi", + "flores_path": "snd_Arab", + "fleurs_tag": "sd_in", + "commonvoice_hours": 0.4, + "commonvoice_locale": "sd", + "in_benchmark": true, + "task": "translation", + "metric": "bleu", + "score": 0.21679684560539594, + "model": 1.0 + }, + { + "bcp_47": "sd", + "speakers": 40329510, + "language_name": "Sindhi", + "flores_path": "snd_Arab", + "fleurs_tag": "sd_in", + "commonvoice_hours": 0.4, + "commonvoice_locale": "sd", + "in_benchmark": true, + "task": "translation", + "metric": "chrf", + "score": 0.4130326388570076, + "model": 1.0 + }, + { + "bcp_47": "sdc", + "speakers": 106085, + "language_name": "Sassarese Sardinian", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "sdh", + "speakers": 3142162, + "language_name": "Southern Kurdish", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 0.0, + "commonvoice_locale": "sdh", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "se", + "speakers": 51530, + "language_name": "Northern Sami", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "sef", + "speakers": 1181687, + "language_name": "Cebaara Senoufo", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "seh", + "speakers": 1384517, + "language_name": "Sena", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "sei", + "speakers": 901, + "language_name": "Seri", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 1.2, + "commonvoice_locale": "sei", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "ses", + "speakers": 664816, + "language_name": "Koyraboro Senni", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "sg", + "speakers": 2935521, + "language_name": "Sango", + "flores_path": "sag_Latn", + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "sgs", + "speakers": 0, + "language_name": "Samogitian", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "shi", + "speakers": 6187736, + "language_name": "Tachelhit", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 0.0, + "commonvoice_locale": "shi", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "shn", + "speakers": 3687984, + "language_name": "Shan", + "flores_path": "shn_Mymr", + "fleurs_tag": null, + "commonvoice_hours": 0.0, + "commonvoice_locale": "shn", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "si", + "speakers": 15564656, + "language_name": "Sinhala", + "flores_path": "sin_Sinh", + "fleurs_tag": null, + "commonvoice_hours": 0.0, + "commonvoice_locale": "si", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "sid", + "speakers": 3783955, + "language_name": "Sidamo", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "sk", + "speakers": 6680269, + "language_name": "Slovak", + "flores_path": "slk_Latn", + "fleurs_tag": "sk_sk", + "commonvoice_hours": 46.0, + "commonvoice_locale": "sk", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "skr", + "speakers": 28020120, + "language_name": "Saraiki", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 4.3, + "commonvoice_locale": "skr", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "sl", + "speakers": 1973181, + "language_name": "Slovenian", + "flores_path": "slv_Latn", + "fleurs_tag": "sl_si", + "commonvoice_hours": 17.0, + "commonvoice_locale": "sl", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "sli", + "speakers": 11868, + "language_name": "Lower Silesian", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "sly", + "speakers": 144194, + "language_name": "Selayar", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "sm", + "speakers": 252717, + "language_name": "Samoan", + "flores_path": "smo_Latn", + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "sma", + "speakers": 296, + "language_name": "Southern Sami", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "smj", + "speakers": 1530, + "language_name": "Lule Sami", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "smn", + "speakers": 613, + "language_name": "Inari Sami", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "sms", + "speakers": 613, + "language_name": "Skolt Sami", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "sn", + "speakers": 11782503, + "language_name": "Shona", + "flores_path": "sna_Latn", + "fleurs_tag": "sn_zw", + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "snf", + "speakers": 37767, + "language_name": "Noon", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "snk", + "speakers": 1153651, + "language_name": "Soninke", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 0.0, + "commonvoice_locale": "snk", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "so", + "speakers": 16911645, + "language_name": "Somali", + "flores_path": "som_Latn", + "fleurs_tag": "so_so", + "commonvoice_hours": 0.0, + "commonvoice_locale": "so", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "sou", + "speakers": 5518192, + "language_name": "Southern Thai", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "sq", + "speakers": 6791906, + "language_name": "Albanian", + "flores_path": "als_Latn", + "fleurs_tag": null, + "commonvoice_hours": 8.8, + "commonvoice_locale": "sq", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "sr", + "speakers": 15602410, + "language_name": "Serbian", + "flores_path": "srp_Cyrl", + "fleurs_tag": "sr_rs", + "commonvoice_hours": 7.5, + "commonvoice_locale": "sr", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "srn", + "speakers": 414507, + "language_name": "Sranan Tongo", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "srr", + "speakers": 1731004, + "language_name": "Serer", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "srx", + "speakers": 464132, + "language_name": "Sirmauri", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "ss", + "speakers": 2212379, + "language_name": "Swati", + "flores_path": "ssw_Latn", + "fleurs_tag": null, + "commonvoice_hours": 0.0, + "commonvoice_locale": "ss", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "ssy", + "speakers": 218923, + "language_name": "Saho", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "st", + "speakers": 6390567, + "language_name": "Southern Sotho", + "flores_path": "sot_Latn", + "fleurs_tag": null, + "commonvoice_hours": 0.0, + "commonvoice_locale": "st", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "stq", + "speakers": 962, + "language_name": "Saterland Frisian", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "su", + "speakers": 32043120, + "language_name": "Sundanese", + "flores_path": "sun_Latn", + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "suk", + "speakers": 5094094, + "language_name": "Sukuma", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "sus", + "speakers": 1378014, + "language_name": "Susu", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "sv", + "speakers": 12932871, + "language_name": "Swedish", + "flores_path": "swe_Latn", + "fleurs_tag": "sv_se", + "commonvoice_hours": 47.0, + "commonvoice_locale": "sv-SE", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "sw", + "speakers": 171610296, + "language_name": "Swahili", + "flores_path": "swh_Latn", + "fleurs_tag": "sw_ke", + "commonvoice_hours": 411.0, + "commonvoice_locale": "sw", + "in_benchmark": true, + "task": "classification", + "metric": "accuracy", + "score": 0.6, + "model": 1.0 + }, + { + "bcp_47": "sw", + "speakers": 171610296, + "language_name": "Swahili", + "flores_path": "swh_Latn", + "fleurs_tag": "sw_ke", + "commonvoice_hours": 411.0, + "commonvoice_locale": "sw", + "in_benchmark": true, + "task": "language_modeling", + "metric": "chrf", + "score": 0.9363185104933659, + "model": 1.0 + }, + { + "bcp_47": "sw", + "speakers": 171610296, + "language_name": "Swahili", + "flores_path": "swh_Latn", + "fleurs_tag": "sw_ke", + "commonvoice_hours": 411.0, + "commonvoice_locale": "sw", + "in_benchmark": true, + "task": "translation", + "metric": "bleu", + "score": 0.2687578645492076, + "model": 1.0 + }, + { + "bcp_47": "sw", + "speakers": 171610296, + "language_name": "Swahili", + "flores_path": "swh_Latn", + "fleurs_tag": "sw_ke", + "commonvoice_hours": 411.0, + "commonvoice_locale": "sw", + "in_benchmark": true, + "task": "translation", + "metric": "chrf", + "score": 0.435973049682813, + "model": 1.0 + }, + { + "bcp_47": "swb", + "speakers": 170720, + "language_name": "Comorian", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "swg", + "speakers": 801597, + "language_name": "Swabian", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "swv", + "speakers": 3713052, + "language_name": "Shekhawati", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "sxn", + "speakers": 245664, + "language_name": "Sangir", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "syl", + "speakers": 8132550, + "language_name": "Sylheti", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "syr", + "speakers": 210659, + "language_name": "Syriac", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 0.0, + "commonvoice_locale": "syr", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "szl", + "speakers": 497670, + "language_name": "Silesian", + "flores_path": "szl_Latn", + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "ta", + "speakers": 85616159, + "language_name": "Tamil", + "flores_path": "tam_Taml", + "fleurs_tag": "ta_in", + "commonvoice_hours": 234.0, + "commonvoice_locale": "ta", + "in_benchmark": true, + "task": "classification", + "metric": "accuracy", + "score": 0.43333333333333335, + "model": 1.0 + }, + { + "bcp_47": "ta", + "speakers": 85616159, + "language_name": "Tamil", + "flores_path": "tam_Taml", + "fleurs_tag": "ta_in", + "commonvoice_hours": 234.0, + "commonvoice_locale": "ta", + "in_benchmark": true, + "task": "language_modeling", + "metric": "chrf", + "score": 0.9604137478864351, + "model": 1.0 + }, + { + "bcp_47": "ta", + "speakers": 85616159, + "language_name": "Tamil", + "flores_path": "tam_Taml", + "fleurs_tag": "ta_in", + "commonvoice_hours": 234.0, + "commonvoice_locale": "ta", + "in_benchmark": true, + "task": "translation", + "metric": "bleu", + "score": 0.22755903113370943, + "model": 1.0 + }, + { + "bcp_47": "ta", + "speakers": 85616159, + "language_name": "Tamil", + "flores_path": "tam_Taml", + "fleurs_tag": "ta_in", + "commonvoice_hours": 234.0, + "commonvoice_locale": "ta", + "in_benchmark": true, + "task": "translation", + "metric": "chrf", + "score": 0.3968691612249629, + "model": 1.0 + }, + { + "bcp_47": "taj", + "speakers": 130410, + "language_name": "Eastern Tamang", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "tbw", + "speakers": 10045, + "language_name": "Tagbanwa", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "tcy", + "speakers": 1989135, + "language_name": "Tulu", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "tdd", + "speakers": 264864, + "language_name": "Tai Nüa", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "tdg", + "speakers": 394263, + "language_name": "Western Tamang", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "tdh", + "speakers": 36393, + "language_name": "Thulung", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "te", + "speakers": 95478480, + "language_name": "Telugu", + "flores_path": "tel_Telu", + "fleurs_tag": "te_in", + "commonvoice_hours": 0.3, + "commonvoice_locale": "te", + "in_benchmark": true, + "task": "classification", + "metric": "accuracy", + "score": 0.36666666666666664, + "model": 1.0 + }, + { + "bcp_47": "te", + "speakers": 95478480, + "language_name": "Telugu", + "flores_path": "tel_Telu", + "fleurs_tag": "te_in", + "commonvoice_hours": 0.3, + "commonvoice_locale": "te", + "in_benchmark": true, + "task": "language_modeling", + "metric": "chrf", + "score": 0.9017537718464212, + "model": 1.0 + }, + { + "bcp_47": "te", + "speakers": 95478480, + "language_name": "Telugu", + "flores_path": "tel_Telu", + "fleurs_tag": "te_in", + "commonvoice_hours": 0.3, + "commonvoice_locale": "te", + "in_benchmark": true, + "task": "translation", + "metric": "bleu", + "score": 0.2660789099709258, + "model": 1.0 + }, + { + "bcp_47": "te", + "speakers": 95478480, + "language_name": "Telugu", + "flores_path": "tel_Telu", + "fleurs_tag": "te_in", + "commonvoice_hours": 0.3, + "commonvoice_locale": "te", + "in_benchmark": true, + "task": "translation", + "metric": "chrf", + "score": 0.4454927673606575, + "model": 1.0 + }, + { + "bcp_47": "tem", + "speakers": 1722482, + "language_name": "Timne", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "teo", + "speakers": 2082973, + "language_name": "Teso", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "tet", + "speakers": 816395, + "language_name": "Tetum", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "tg", + "speakers": 9644223, + "language_name": "Tajik", + "flores_path": "tgk_Cyrl", + "fleurs_tag": "tg_tj", + "commonvoice_hours": 0.0, + "commonvoice_locale": "tg", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "th", + "speakers": 55181920, + "language_name": "Thai", + "flores_path": "tha_Thai", + "fleurs_tag": "th_th", + "commonvoice_hours": 172.0, + "commonvoice_locale": "th", + "in_benchmark": true, + "task": "classification", + "metric": "accuracy", + "score": 0.5333333333333333, + "model": 1.0 + }, + { + "bcp_47": "th", + "speakers": 55181920, + "language_name": "Thai", + "flores_path": "tha_Thai", + "fleurs_tag": "th_th", + "commonvoice_hours": 172.0, + "commonvoice_locale": "th", + "in_benchmark": true, + "task": "language_modeling", + "metric": "chrf", + "score": 0.9492189440417714, + "model": 1.0 + }, + { + "bcp_47": "th", + "speakers": 55181920, + "language_name": "Thai", + "flores_path": "tha_Thai", + "fleurs_tag": "th_th", + "commonvoice_hours": 172.0, + "commonvoice_locale": "th", + "in_benchmark": true, + "task": "translation", + "metric": "bleu", + "score": 0.22673808962220887, + "model": 1.0 + }, + { + "bcp_47": "th", + "speakers": 55181920, + "language_name": "Thai", + "flores_path": "tha_Thai", + "fleurs_tag": "th_th", + "commonvoice_hours": 172.0, + "commonvoice_locale": "th", + "in_benchmark": true, + "task": "translation", + "metric": "chrf", + "score": 0.41961494547318173, + "model": 1.0 + }, + { + "bcp_47": "thl", + "speakers": 606558, + "language_name": "Dangaura Tharu", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "thq", + "speakers": 303279, + "language_name": "Kochila Tharu", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "thr", + "speakers": 363935, + "language_name": "Rana Tharu", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "ti", + "speakers": 10145911, + "language_name": "Tigrinya", + "flores_path": "tir_Ethi", + "fleurs_tag": null, + "commonvoice_hours": 0.0, + "commonvoice_locale": "ti", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "tig", + "speakers": 1094616, + "language_name": "Tigre", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 5.2, + "commonvoice_locale": "tig", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "tiv", + "speakers": 3424448, + "language_name": "Tiv", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "tk", + "speakers": 6870838, + "language_name": "Turkmen", + "flores_path": "tuk_Latn", + "fleurs_tag": null, + "commonvoice_hours": 2.8, + "commonvoice_locale": "tk", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "tkl", + "speakers": 1285, + "language_name": "Tokelau", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "tkr", + "speakers": 16329, + "language_name": "Tsakhur", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "tkt", + "speakers": 72787, + "language_name": "Kathoriya Tharu", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "tly", + "speakers": 1000168, + "language_name": "Talysh", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "tmh", + "speakers": 1776965, + "language_name": "Tamashek", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "tn", + "speakers": 6113428, + "language_name": "Tswana", + "flores_path": "tsn_Latn", + "fleurs_tag": null, + "commonvoice_hours": 4.2, + "commonvoice_locale": "tn", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "tnr", + "speakers": 3305, + "language_name": "Ménik", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "to", + "speakers": 100790, + "language_name": "Tongan", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "tog", + "speakers": 207727, + "language_name": "Nyasa Tonga", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "tpi", + "speakers": 5154217, + "language_name": "Tok Pisin", + "flores_path": "tpi_Latn", + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "tr", + "speakers": 80360704, + "language_name": "Turkish", + "flores_path": "tur_Latn", + "fleurs_tag": "tr_tr", + "commonvoice_hours": 128.0, + "commonvoice_locale": "tr", + "in_benchmark": true, + "task": "classification", + "metric": "accuracy", + "score": 0.5333333333333333, + "model": 1.0 + }, + { + "bcp_47": "tr", + "speakers": 80360704, + "language_name": "Turkish", + "flores_path": "tur_Latn", + "fleurs_tag": "tr_tr", + "commonvoice_hours": 128.0, + "commonvoice_locale": "tr", + "in_benchmark": true, + "task": "language_modeling", + "metric": "chrf", + "score": 0.9329665937492929, + "model": 1.0 + }, + { + "bcp_47": "tr", + "speakers": 80360704, + "language_name": "Turkish", + "flores_path": "tur_Latn", + "fleurs_tag": "tr_tr", + "commonvoice_hours": 128.0, + "commonvoice_locale": "tr", + "in_benchmark": true, + "task": "translation", + "metric": "bleu", + "score": 0.28856187360515456, + "model": 1.0 + }, + { + "bcp_47": "tr", + "speakers": 80360704, + "language_name": "Turkish", + "flores_path": "tur_Latn", + "fleurs_tag": "tr_tr", + "commonvoice_hours": 128.0, + "commonvoice_locale": "tr", + "in_benchmark": true, + "task": "translation", + "metric": "chrf", + "score": 0.4483834465978942, + "model": 1.0 + }, + { + "bcp_47": "tru", + "speakers": 3035, + "language_name": "Turoyo", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "trv", + "speakers": 4721, + "language_name": "Taroko", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 8.9, + "commonvoice_locale": "trv", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "trw", + "speakers": 123756, + "language_name": "Torwali", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 19.0, + "commonvoice_locale": "trw", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "ts", + "speakers": 4880932, + "language_name": "Tsonga", + "flores_path": "tso_Latn", + "fleurs_tag": null, + "commonvoice_hours": 0.0, + "commonvoice_locale": "ts", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "tsd", + "speakers": 202, + "language_name": "Tsakonian", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "tsg", + "speakers": 1200991, + "language_name": "Tausug", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "tsj", + "speakers": 117348, + "language_name": "Tshangla", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "tt", + "speakers": 1984108, + "language_name": "Tatar", + "flores_path": "tat_Cyrl", + "fleurs_tag": null, + "commonvoice_hours": 32.0, + "commonvoice_locale": "tt", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "ttj", + "speakers": 821807, + "language_name": "Tooro", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "tts", + "speakers": 16554576, + "language_name": "Northeastern Thai", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "ttt", + "speakers": 22453, + "language_name": "Muslim Tat", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "tum", + "speakers": 1780514, + "language_name": "Tumbuka", + "flores_path": "tum_Latn", + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "tvl", + "speakers": 9868, + "language_name": "Tuvalu", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "twq", + "speakers": 7970, + "language_name": "Tasawaq", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "ty", + "speakers": 91488, + "language_name": "Tahitian", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 0.0, + "commonvoice_locale": "ty", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "tyv", + "speakers": 184239, + "language_name": "Tuvinian", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 0.0, + "commonvoice_locale": "tyv", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "tzm", + "speakers": 3485047, + "language_name": "Central Atlas Tamazight", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "udm", + "speakers": 538544, + "language_name": "Udmurt", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 0.0, + "commonvoice_locale": "udm", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "ug", + "speakers": 8052967, + "language_name": "Uyghur", + "flores_path": "uig_Arab", + "fleurs_tag": null, + "commonvoice_hours": 364.0, + "commonvoice_locale": "ug", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "uk", + "speakers": 29348975, + "language_name": "Ukrainian", + "flores_path": "ukr_Cyrl", + "fleurs_tag": "uk_ua", + "commonvoice_hours": 98.0, + "commonvoice_locale": "uk", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "uli", + "speakers": 2971, + "language_name": "Ulithian", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "umb", + "speakers": 9431467, + "language_name": "Umbundu", + "flores_path": "umb_Latn", + "fleurs_tag": "umb_ao", + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "unr", + "speakers": 1252287, + "language_name": "Mundari", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "unx", + "speakers": 636523, + "language_name": "Munda", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "ur", + "speakers": 290790290, + "language_name": "Urdu", + "flores_path": "urd_Arab", + "fleurs_tag": "ur_pk", + "commonvoice_hours": 77.0, + "commonvoice_locale": "ur", + "in_benchmark": true, + "task": "classification", + "metric": "accuracy", + "score": 0.6166666666666667, + "model": 4.0 + }, + { + "bcp_47": "ur", + "speakers": 290790290, + "language_name": "Urdu", + "flores_path": "urd_Arab", + "fleurs_tag": "ur_pk", + "commonvoice_hours": 77.0, + "commonvoice_locale": "ur", + "in_benchmark": true, + "task": "language_modeling", + "metric": "chrf", + "score": 0.9375650463557482, + "model": 4.0 + }, + { + "bcp_47": "ur", + "speakers": 290790290, + "language_name": "Urdu", + "flores_path": "urd_Arab", + "fleurs_tag": "ur_pk", + "commonvoice_hours": 77.0, + "commonvoice_locale": "ur", + "in_benchmark": true, + "task": "translation", + "metric": "bleu", + "score": 0.24342394573959453, + "model": 4.0 + }, + { + "bcp_47": "ur", + "speakers": 290790290, + "language_name": "Urdu", + "flores_path": "urd_Arab", + "fleurs_tag": "ur_pk", + "commonvoice_hours": 77.0, + "commonvoice_locale": "ur", + "in_benchmark": true, + "task": "translation", + "metric": "chrf", + "score": 0.4181802717137555, + "model": 4.0 + }, + { + "bcp_47": "uz", + "speakers": 32792780, + "language_name": "Uzbek", + "flores_path": "uzn_Latn", + "fleurs_tag": "uz_uz", + "commonvoice_hours": 100.0, + "commonvoice_locale": "uz", + "in_benchmark": true, + "task": "classification", + "metric": "accuracy", + "score": 0.5, + "model": 1.0 + }, + { + "bcp_47": "uz", + "speakers": 32792780, + "language_name": "Uzbek", + "flores_path": "uzn_Latn", + "fleurs_tag": "uz_uz", + "commonvoice_hours": 100.0, + "commonvoice_locale": "uz", + "in_benchmark": true, + "task": "language_modeling", + "metric": "chrf", + "score": 0.9448611053734804, + "model": 1.0 + }, + { + "bcp_47": "uz", + "speakers": 32792780, + "language_name": "Uzbek", + "flores_path": "uzn_Latn", + "fleurs_tag": "uz_uz", + "commonvoice_hours": 100.0, + "commonvoice_locale": "uz", + "in_benchmark": true, + "task": "translation", + "metric": "bleu", + "score": 0.21766825893077738, + "model": 1.0 + }, + { + "bcp_47": "uz", + "speakers": 32792780, + "language_name": "Uzbek", + "flores_path": "uzn_Latn", + "fleurs_tag": "uz_uz", + "commonvoice_hours": 100.0, + "commonvoice_locale": "uz", + "in_benchmark": true, + "task": "translation", + "metric": "chrf", + "score": 0.4195087994775591, + "model": 1.0 + }, + { + "bcp_47": "vai", + "speakers": 131906, + "language_name": "Vai", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "ve", + "speakers": 1391759, + "language_name": "Venda", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 0.0, + "commonvoice_locale": "ve", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "vec", + "speakers": 1380829, + "language_name": "Venetian", + "flores_path": "vec_Latn", + "fleurs_tag": null, + "commonvoice_hours": 0.0, + "commonvoice_locale": "vec", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "vep", + "speakers": 3543, + "language_name": "Veps", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "vi", + "speakers": 86222962, + "language_name": "Vietnamese", + "flores_path": "vie_Latn", + "fleurs_tag": "vi_vn", + "commonvoice_hours": 5.9, + "commonvoice_locale": "vi", + "in_benchmark": true, + "task": "classification", + "metric": "accuracy", + "score": 0.4666666666666667, + "model": 1.0 + }, + { + "bcp_47": "vi", + "speakers": 86222962, + "language_name": "Vietnamese", + "flores_path": "vie_Latn", + "fleurs_tag": "vi_vn", + "commonvoice_hours": 5.9, + "commonvoice_locale": "vi", + "in_benchmark": true, + "task": "language_modeling", + "metric": "chrf", + "score": 0.9478434905295018, + "model": 1.0 + }, + { + "bcp_47": "vi", + "speakers": 86222962, + "language_name": "Vietnamese", + "flores_path": "vie_Latn", + "fleurs_tag": "vi_vn", + "commonvoice_hours": 5.9, + "commonvoice_locale": "vi", + "in_benchmark": true, + "task": "translation", + "metric": "bleu", + "score": 0.23107984716515415, + "model": 1.0 + }, + { + "bcp_47": "vi", + "speakers": 86222962, + "language_name": "Vietnamese", + "flores_path": "vie_Latn", + "fleurs_tag": "vi_vn", + "commonvoice_hours": 5.9, + "commonvoice_locale": "vi", + "in_benchmark": true, + "task": "translation", + "metric": "chrf", + "score": 0.4169594776564998, + "model": 1.0 + }, + { + "bcp_47": "vic", + "speakers": 3113, + "language_name": "Virgin Islands Creole English", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "vls", + "speakers": 1172070, + "language_name": "West Flemish", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "vmf", + "speakers": 4809582, + "language_name": "Main-Franconian", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "vmw", + "speakers": 3912766, + "language_name": "Makhuwa", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 0.0, + "commonvoice_locale": "vmw", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "vot", + "speakers": 0, + "language_name": "Votic", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 0.1, + "commonvoice_locale": "vot", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "vro", + "speakers": 70031, + "language_name": "Võro", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "vun", + "speakers": 433291, + "language_name": "Vunjo", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "wa", + "speakers": 679801, + "language_name": "Walloon", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "wae", + "speakers": 11377, + "language_name": "Walser", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "wal", + "speakers": 1946034, + "language_name": "Wolaytta", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "war", + "speakers": 3166927, + "language_name": "Waray", + "flores_path": "war_Latn", + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "wbp", + "speakers": 2496, + "language_name": "Warlpiri", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "wbq", + "speakers": 2386962, + "language_name": "Waddar", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "wbr", + "speakers": 1989135, + "language_name": "Wagdi", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "wls", + "speakers": 9512, + "language_name": "Wallisian", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "wni", + "speakers": 287736, + "language_name": "Ndzwani Comorian", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "wo", + "speakers": 11025494, + "language_name": "Wolof", + "flores_path": "wol_Latn", + "fleurs_tag": "wo_sn", + "commonvoice_hours": 0.0, + "commonvoice_locale": "wo", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "wtm", + "speakers": 6100014, + "language_name": "Mewati", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "wuu", + "speakers": 83641200, + "language_name": "Wu Chinese", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "xav", + "speakers": 9951, + "language_name": "Xavánte", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "xh", + "speakers": 10182944, + "language_name": "Xhosa", + "flores_path": "xho_Latn", + "fleurs_tag": "xh_za", + "commonvoice_hours": 0.0, + "commonvoice_locale": "xh", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "xmf", + "speakers": 439670, + "language_name": "Mingrelian", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 11.0, + "commonvoice_locale": "xmf", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "xnr", + "speakers": 2121744, + "language_name": "Kangri", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "xog", + "speakers": 2292409, + "language_name": "Soga", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "xsr", + "speakers": 157705, + "language_name": "Sherpa", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "yao", + "speakers": 722357, + "language_name": "Yao", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "yap", + "speakers": 6556, + "language_name": "Yapese", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "yav", + "speakers": 2303, + "language_name": "Yangben", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "ybb", + "speakers": 443920, + "language_name": "Yemba", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "yi", + "speakers": 997214, + "language_name": "Yiddish", + "flores_path": "ydd_Hebr", + "fleurs_tag": null, + "commonvoice_hours": 0.5, + "commonvoice_locale": "yi", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "yo", + "speakers": 28685568, + "language_name": "Yoruba", + "flores_path": "yor_Latn", + "fleurs_tag": "yo_ng", + "commonvoice_hours": 6.0, + "commonvoice_locale": "yo", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "yrl", + "speakers": 26171, + "language_name": "Nheengatu", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "yua", + "speakers": 861955, + "language_name": "Yucateco", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "yue", + "speakers": 79654759, + "language_name": "Cantonese", + "flores_path": "yue_Hant", + "fleurs_tag": "yue_hant_hk", + "commonvoice_hours": 203.0, + "commonvoice_locale": "yue", + "in_benchmark": true, + "task": "classification", + "metric": "accuracy", + "score": 0.6, + "model": 1.0 + }, + { + "bcp_47": "yue", + "speakers": 79654759, + "language_name": "Cantonese", + "flores_path": "yue_Hant", + "fleurs_tag": "yue_hant_hk", + "commonvoice_hours": 203.0, + "commonvoice_locale": "yue", + "in_benchmark": true, + "task": "language_modeling", + "metric": "chrf", + "score": 0.8955168718505389, + "model": 1.0 + }, + { + "bcp_47": "yue", + "speakers": 79654759, + "language_name": "Cantonese", + "flores_path": "yue_Hant", + "fleurs_tag": "yue_hant_hk", + "commonvoice_hours": 203.0, + "commonvoice_locale": "yue", + "in_benchmark": true, + "task": "translation", + "metric": "bleu", + "score": 0.24293503135220604, + "model": 1.0 + }, + { + "bcp_47": "yue", + "speakers": 79654759, + "language_name": "Cantonese", + "flores_path": "yue_Hant", + "fleurs_tag": "yue_hant_hk", + "commonvoice_hours": 203.0, + "commonvoice_locale": "yue", + "in_benchmark": true, + "task": "translation", + "metric": "chrf", + "score": 0.43687518387422897, + "model": 1.0 + }, + { + "bcp_47": "za", + "speakers": 4321462, + "language_name": "Zhuang", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "zag", + "speakers": 232364, + "language_name": "Zaghawa", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "zdj", + "speakers": 313124, + "language_name": "Ngazidja Comorian", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "zea", + "speakers": 241926, + "language_name": "Zeelandic", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "zgh", + "speakers": 7823574, + "language_name": "Standard Moroccan Tamazight", + "flores_path": "zgh_Tfng", + "fleurs_tag": null, + "commonvoice_hours": 1.3, + "commonvoice_locale": "zgh", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "zh", + "speakers": 1304678914, + "language_name": "Chinese", + "flores_path": "cmn_Hans", + "fleurs_tag": "cmn_hans_cn", + "commonvoice_hours": 422.0, + "commonvoice_locale": "zh-TW", + "in_benchmark": true, + "task": "classification", + "metric": "accuracy", + "score": 0.6416666666666666, + "model": 4.0 + }, + { + "bcp_47": "zh", + "speakers": 1304678914, + "language_name": "Chinese", + "flores_path": "cmn_Hans", + "fleurs_tag": "cmn_hans_cn", + "commonvoice_hours": 422.0, + "commonvoice_locale": "zh-TW", + "in_benchmark": true, + "task": "language_modeling", + "metric": "chrf", + "score": 0.9270229139550292, + "model": 4.0 + }, + { + "bcp_47": "zh", + "speakers": 1304678914, + "language_name": "Chinese", + "flores_path": "cmn_Hans", + "fleurs_tag": "cmn_hans_cn", + "commonvoice_hours": 422.0, + "commonvoice_locale": "zh-TW", + "in_benchmark": true, + "task": "translation", + "metric": "bleu", + "score": 0.3835031558957527, + "model": 4.0 + }, + { + "bcp_47": "zh", + "speakers": 1304678914, + "language_name": "Chinese", + "flores_path": "cmn_Hans", + "fleurs_tag": "cmn_hans_cn", + "commonvoice_hours": 422.0, + "commonvoice_locale": "zh-TW", + "in_benchmark": true, + "task": "translation", + "metric": "chrf", + "score": 0.557217638850705, + "model": 4.0 + }, + { + "bcp_47": "zmi", + "speakers": 391825, + "language_name": "Negeri Sembilan Malay", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": null, + "commonvoice_locale": null, + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "zu", + "speakers": 13973830, + "language_name": "Zulu", + "flores_path": "zul_Latn", + "fleurs_tag": "zu_za", + "commonvoice_hours": 0.0, + "commonvoice_locale": "zu", + "in_benchmark": true, + "task": null, + "metric": null, + "score": null, + "model": null + }, + { + "bcp_47": "zza", + "speakers": 1148245, + "language_name": "Zaza", + "flores_path": null, + "fleurs_tag": null, + "commonvoice_hours": 1.8, + "commonvoice_locale": "zza", + "in_benchmark": false, + "task": null, + "metric": null, + "score": null, + "model": null + } + ], + "scores": [ + { + "model": "google/gemini-2.0-flash-001", + "bcp_47": "ar", + "task": "classification", + "metric": "accuracy", + "score": 0.9, + "sentence_nr": 14.5 + }, + { + "model": "google/gemini-2.0-flash-001", + "bcp_47": "ar", + "task": "language_modeling", + "metric": "chrf", + "score": 0.9662394255427802, + "sentence_nr": 14.5 + }, + { + "model": "google/gemini-2.0-flash-001", + "bcp_47": "ar", + "task": "translation", + "metric": "bleu", + "score": 0.33684899445707545, + "sentence_nr": 14.5 + }, + { + "model": "google/gemini-2.0-flash-001", + "bcp_47": "ar", + "task": "translation", + "metric": "chrf", + "score": 0.5132383488065385, + "sentence_nr": 14.5 + }, + { + "model": "google/gemini-2.0-flash-001", + "bcp_47": "bn", + "task": "classification", + "metric": "accuracy", + "score": 0.9, + "sentence_nr": 14.5 + }, + { + "model": "google/gemini-2.0-flash-001", + "bcp_47": "bn", + "task": "language_modeling", + "metric": "chrf", + "score": 0.9157239945539242, + "sentence_nr": 14.5 + }, + { + "model": "google/gemini-2.0-flash-001", + "bcp_47": "bn", + "task": "translation", + "metric": "bleu", + "score": 0.2946937518705462, + "sentence_nr": 14.5 + }, + { + "model": "google/gemini-2.0-flash-001", + "bcp_47": "bn", + "task": "translation", + "metric": "chrf", + "score": 0.47901362996280916, + "sentence_nr": 14.5 + }, + { + "model": "google/gemini-2.0-flash-001", + "bcp_47": "en", + "task": "classification", + "metric": "accuracy", + "score": 0.8666666666666667, + "sentence_nr": 14.5 + }, + { + "model": "google/gemini-2.0-flash-001", + "bcp_47": "en", + "task": "language_modeling", + "metric": "chrf", + "score": 0.9800307455880838, + "sentence_nr": 14.5 + }, + { + "model": "google/gemini-2.0-flash-001", + "bcp_47": "en", + "task": "translation", + "metric": "bleu", + "score": 0.5005636231739998, + "sentence_nr": 14.5 + }, + { + "model": "google/gemini-2.0-flash-001", + "bcp_47": "en", + "task": "translation", + "metric": "chrf", + "score": 0.6083608181074219, + "sentence_nr": 14.5 + }, + { + "model": "google/gemini-2.0-flash-001", + "bcp_47": "es", + "task": "classification", + "metric": "accuracy", + "score": 0.8666666666666667, + "sentence_nr": 14.5 + }, + { + "model": "google/gemini-2.0-flash-001", + "bcp_47": "es", + "task": "language_modeling", + "metric": "chrf", + "score": 0.9398094019787611, + "sentence_nr": 14.5 + }, + { + "model": "google/gemini-2.0-flash-001", + "bcp_47": "es", + "task": "translation", + "metric": "bleu", + "score": 0.341382728522014, + "sentence_nr": 14.5 + }, + { + "model": "google/gemini-2.0-flash-001", + "bcp_47": "es", + "task": "translation", + "metric": "chrf", + "score": 0.5025141961861047, + "sentence_nr": 14.5 + }, + { + "model": "google/gemini-2.0-flash-001", + "bcp_47": "fr", + "task": "classification", + "metric": "accuracy", + "score": 0.8666666666666667, + "sentence_nr": 14.5 + }, + { + "model": "google/gemini-2.0-flash-001", + "bcp_47": "fr", + "task": "language_modeling", + "metric": "chrf", + "score": 0.9883846649306203, + "sentence_nr": 14.5 + }, + { + "model": "google/gemini-2.0-flash-001", + "bcp_47": "fr", + "task": "translation", + "metric": "bleu", + "score": 0.340773340614899, + "sentence_nr": 14.5 + }, + { + "model": "google/gemini-2.0-flash-001", + "bcp_47": "fr", + "task": "translation", + "metric": "chrf", + "score": 0.5123861936301051, + "sentence_nr": 14.5 + }, + { + "model": "google/gemini-2.0-flash-001", + "bcp_47": "hi", + "task": "classification", + "metric": "accuracy", + "score": 0.8666666666666667, + "sentence_nr": 14.5 + }, + { + "model": "google/gemini-2.0-flash-001", + "bcp_47": "hi", + "task": "language_modeling", + "metric": "chrf", + "score": 0.9603938002806427, + "sentence_nr": 14.5 + }, + { + "model": "google/gemini-2.0-flash-001", + "bcp_47": "hi", + "task": "translation", + "metric": "bleu", + "score": 0.34270244014502865, + "sentence_nr": 14.5 + }, + { + "model": "google/gemini-2.0-flash-001", + "bcp_47": "hi", + "task": "translation", + "metric": "chrf", + "score": 0.5241272552859136, + "sentence_nr": 14.5 + }, + { + "model": "google/gemini-2.0-flash-001", + "bcp_47": "pa", + "task": "classification", + "metric": "accuracy", + "score": 0.8666666666666667, + "sentence_nr": 14.5 + }, + { + "model": "google/gemini-2.0-flash-001", + "bcp_47": "pa", + "task": "language_modeling", + "metric": "chrf", + "score": 0.9170681035031951, + "sentence_nr": 14.5 + }, + { + "model": "google/gemini-2.0-flash-001", + "bcp_47": "pa", + "task": "translation", + "metric": "bleu", + "score": 0.37789354848061457, + "sentence_nr": 14.5 + }, + { + "model": "google/gemini-2.0-flash-001", + "bcp_47": "pa", + "task": "translation", + "metric": "chrf", + "score": 0.5344045974435819, + "sentence_nr": 14.5 + }, + { + "model": "google/gemini-2.0-flash-001", + "bcp_47": "pt", + "task": "classification", + "metric": "accuracy", + "score": 0.8, + "sentence_nr": 14.5 + }, + { + "model": "google/gemini-2.0-flash-001", + "bcp_47": "pt", + "task": "language_modeling", + "metric": "chrf", + "score": 0.9780371913896582, + "sentence_nr": 14.5 + }, + { + "model": "google/gemini-2.0-flash-001", + "bcp_47": "pt", + "task": "translation", + "metric": "bleu", + "score": 0.3794780275173, + "sentence_nr": 14.5 + }, + { + "model": "google/gemini-2.0-flash-001", + "bcp_47": "pt", + "task": "translation", + "metric": "chrf", + "score": 0.5349002453164619, + "sentence_nr": 14.5 + }, + { + "model": "google/gemini-2.0-flash-001", + "bcp_47": "ur", + "task": "classification", + "metric": "accuracy", + "score": 0.9, + "sentence_nr": 14.5 + }, + { + "model": "google/gemini-2.0-flash-001", + "bcp_47": "ur", + "task": "language_modeling", + "metric": "chrf", + "score": 0.9555863990700229, + "sentence_nr": 14.5 + }, + { + "model": "google/gemini-2.0-flash-001", + "bcp_47": "ur", + "task": "translation", + "metric": "bleu", + "score": 0.31728190361318, + "sentence_nr": 14.5 + }, + { + "model": "google/gemini-2.0-flash-001", + "bcp_47": "ur", + "task": "translation", + "metric": "chrf", + "score": 0.4881878357149611, + "sentence_nr": 14.5 + }, + { + "model": "google/gemini-2.0-flash-001", + "bcp_47": "zh", + "task": "classification", + "metric": "accuracy", + "score": 0.8666666666666667, + "sentence_nr": 14.5 + }, + { + "model": "google/gemini-2.0-flash-001", + "bcp_47": "zh", + "task": "language_modeling", + "metric": "chrf", + "score": 0.9539892816788119, + "sentence_nr": 14.5 + }, + { + "model": "google/gemini-2.0-flash-001", + "bcp_47": "zh", + "task": "translation", + "metric": "bleu", + "score": 0.41028031844473206, + "sentence_nr": 14.5 + }, + { + "model": "google/gemini-2.0-flash-001", + "bcp_47": "zh", + "task": "translation", + "metric": "chrf", + "score": 0.5607632287491137, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "am", + "task": "classification", + "metric": "accuracy", + "score": 0.36666666666666664, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "am", + "task": "language_modeling", + "metric": "chrf", + "score": 0.9031129205404201, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "am", + "task": "translation", + "metric": "bleu", + "score": 0.15002522598066087, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "am", + "task": "translation", + "metric": "chrf", + "score": 0.3344555209113584, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "ar", + "task": "classification", + "metric": "accuracy", + "score": 0.4666666666666667, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "ar", + "task": "language_modeling", + "metric": "chrf", + "score": 0.9551956628433433, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "ar", + "task": "translation", + "metric": "bleu", + "score": 0.2811587891139184, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "ar", + "task": "translation", + "metric": "chrf", + "score": 0.46109033782928127, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "arz", + "task": "classification", + "metric": "accuracy", + "score": 0.5666666666666667, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "arz", + "task": "language_modeling", + "metric": "chrf", + "score": 0.9319821809429131, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "arz", + "task": "translation", + "metric": "bleu", + "score": 0.20127691717583826, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "arz", + "task": "translation", + "metric": "chrf", + "score": 0.38780198426317497, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "az", + "task": "classification", + "metric": "accuracy", + "score": 0.5333333333333333, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "az", + "task": "language_modeling", + "metric": "chrf", + "score": 0.9439975775415789, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "az", + "task": "translation", + "metric": "bleu", + "score": 0.18364881639775618, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "az", + "task": "translation", + "metric": "chrf", + "score": 0.3791669348856303, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "bho", + "task": "classification", + "metric": "accuracy", + "score": 0.3333333333333333, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "bho", + "task": "language_modeling", + "metric": "chrf", + "score": 0.9334228689163548, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "bho", + "task": "translation", + "metric": "bleu", + "score": 0.24092898437545654, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "bho", + "task": "translation", + "metric": "chrf", + "score": 0.41894143077328727, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "bn", + "task": "classification", + "metric": "accuracy", + "score": 0.36666666666666664, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "bn", + "task": "language_modeling", + "metric": "chrf", + "score": 0.8847379468653113, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "bn", + "task": "translation", + "metric": "bleu", + "score": 0.23230854865261913, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "bn", + "task": "translation", + "metric": "chrf", + "score": 0.42063939652271853, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "de", + "task": "classification", + "metric": "accuracy", + "score": 0.6666666666666666, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "de", + "task": "language_modeling", + "metric": "chrf", + "score": 0.9788487181545229, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "de", + "task": "translation", + "metric": "bleu", + "score": 0.31823711841849855, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "de", + "task": "translation", + "metric": "chrf", + "score": 0.49174647549269207, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "en", + "task": "classification", + "metric": "accuracy", + "score": 0.5, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "en", + "task": "language_modeling", + "metric": "chrf", + "score": 0.9685562893433212, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "en", + "task": "translation", + "metric": "bleu", + "score": 0.4203985756610074, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "en", + "task": "translation", + "metric": "chrf", + "score": 0.5300571003447904, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "es", + "task": "classification", + "metric": "accuracy", + "score": 0.5333333333333333, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "es", + "task": "language_modeling", + "metric": "chrf", + "score": 0.961354451644757, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "es", + "task": "translation", + "metric": "bleu", + "score": 0.26818936209357325, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "es", + "task": "translation", + "metric": "chrf", + "score": 0.4507327709042758, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "fa", + "task": "classification", + "metric": "accuracy", + "score": 0.4666666666666667, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "fa", + "task": "language_modeling", + "metric": "chrf", + "score": 0.9396649061437635, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "fa", + "task": "translation", + "metric": "bleu", + "score": 0.2516753344674677, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "fa", + "task": "translation", + "metric": "chrf", + "score": 0.4448545956789697, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "fil", + "task": "classification", + "metric": "accuracy", + "score": 0.4666666666666667, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "fil", + "task": "language_modeling", + "metric": "chrf", + "score": 0.9553160038255677, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "fil", + "task": "translation", + "metric": "bleu", + "score": 0.3248927726984041, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "fil", + "task": "translation", + "metric": "chrf", + "score": 0.4689020729383555, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "fr", + "task": "classification", + "metric": "accuracy", + "score": 0.5666666666666667, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "fr", + "task": "language_modeling", + "metric": "chrf", + "score": 0.9659586250799681, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "fr", + "task": "translation", + "metric": "bleu", + "score": 0.32618133837885355, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "fr", + "task": "translation", + "metric": "chrf", + "score": 0.49526445590376544, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "gu", + "task": "classification", + "metric": "accuracy", + "score": 0.4666666666666667, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "gu", + "task": "language_modeling", + "metric": "chrf", + "score": 0.9421488818900206, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "gu", + "task": "translation", + "metric": "bleu", + "score": 0.24812610549809738, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "gu", + "task": "translation", + "metric": "chrf", + "score": 0.4318359636701651, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "ha", + "task": "classification", + "metric": "accuracy", + "score": 0.6, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "ha", + "task": "language_modeling", + "metric": "chrf", + "score": 0.945704338611724, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "ha", + "task": "translation", + "metric": "bleu", + "score": 0.14767816277169443, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "ha", + "task": "translation", + "metric": "chrf", + "score": 0.34353973347368816, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "hi", + "task": "classification", + "metric": "accuracy", + "score": 0.5666666666666667, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "hi", + "task": "language_modeling", + "metric": "chrf", + "score": 0.9521896068400092, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "hi", + "task": "translation", + "metric": "bleu", + "score": 0.30694468553453214, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "hi", + "task": "translation", + "metric": "chrf", + "score": 0.4717417673162039, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "id", + "task": "classification", + "metric": "accuracy", + "score": 0.6, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "id", + "task": "language_modeling", + "metric": "chrf", + "score": 0.9441891794331471, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "id", + "task": "translation", + "metric": "bleu", + "score": 0.28485630651027877, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "id", + "task": "translation", + "metric": "chrf", + "score": 0.4561447909933971, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "it", + "task": "classification", + "metric": "accuracy", + "score": 0.6333333333333333, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "it", + "task": "language_modeling", + "metric": "chrf", + "score": 0.96965822717479, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "it", + "task": "translation", + "metric": "bleu", + "score": 0.27748101044407486, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "it", + "task": "translation", + "metric": "chrf", + "score": 0.46396483435604213, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "ja", + "task": "classification", + "metric": "accuracy", + "score": 0.5333333333333333, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "ja", + "task": "language_modeling", + "metric": "chrf", + "score": 0.9339719005290334, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "ja", + "task": "translation", + "metric": "bleu", + "score": 0.26835607046224613, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "ja", + "task": "translation", + "metric": "chrf", + "score": 0.4411714629040183, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "jv", + "task": "classification", + "metric": "accuracy", + "score": 0.5666666666666667, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "jv", + "task": "language_modeling", + "metric": "chrf", + "score": 0.9274301130074318, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "jv", + "task": "translation", + "metric": "bleu", + "score": 0.25461973194021953, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "jv", + "task": "translation", + "metric": "chrf", + "score": 0.4296209828775689, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "kn", + "task": "classification", + "metric": "accuracy", + "score": 0.4, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "kn", + "task": "language_modeling", + "metric": "chrf", + "score": 0.9422502494463877, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "kn", + "task": "translation", + "metric": "bleu", + "score": 0.2550718176103704, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "kn", + "task": "translation", + "metric": "chrf", + "score": 0.44555883949922764, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "ko", + "task": "classification", + "metric": "accuracy", + "score": 0.5666666666666667, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "ko", + "task": "language_modeling", + "metric": "chrf", + "score": 0.9384158016197498, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "ko", + "task": "translation", + "metric": "bleu", + "score": 0.21969579072372616, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "ko", + "task": "translation", + "metric": "chrf", + "score": 0.4134343535369622, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "ml", + "task": "classification", + "metric": "accuracy", + "score": 0.43333333333333335, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "ml", + "task": "language_modeling", + "metric": "chrf", + "score": 0.9372865200487422, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "ml", + "task": "translation", + "metric": "bleu", + "score": 0.20114751241051923, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "ml", + "task": "translation", + "metric": "chrf", + "score": 0.39404171184956394, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "mr", + "task": "classification", + "metric": "accuracy", + "score": 0.6333333333333333, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "mr", + "task": "language_modeling", + "metric": "chrf", + "score": 0.9493846554320581, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "mr", + "task": "translation", + "metric": "bleu", + "score": 0.22832077978859452, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "mr", + "task": "translation", + "metric": "chrf", + "score": 0.4245203296342906, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "ms", + "task": "classification", + "metric": "accuracy", + "score": 0.6, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "ms", + "task": "language_modeling", + "metric": "chrf", + "score": 0.9449541544914151, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "ms", + "task": "translation", + "metric": "bleu", + "score": 0.26403874316694886, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "ms", + "task": "translation", + "metric": "chrf", + "score": 0.45903065670305854, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "my", + "task": "classification", + "metric": "accuracy", + "score": 0.4, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "my", + "task": "language_modeling", + "metric": "chrf", + "score": 0.918432369873729, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "my", + "task": "translation", + "metric": "bleu", + "score": 0.18617334539824332, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "my", + "task": "translation", + "metric": "chrf", + "score": 0.3705060280208132, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "om", + "task": "classification", + "metric": "accuracy", + "score": 0.4666666666666667, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "om", + "task": "language_modeling", + "metric": "chrf", + "score": 0.9359301483225031, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "om", + "task": "translation", + "metric": "bleu", + "score": 0.06509147151730071, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "om", + "task": "translation", + "metric": "chrf", + "score": 0.22674886804446037, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "or", + "task": "classification", + "metric": "accuracy", + "score": 0.4666666666666667, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "or", + "task": "language_modeling", + "metric": "chrf", + "score": 0.9211968327986088, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "or", + "task": "translation", + "metric": "bleu", + "score": 0.2521285657827072, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "or", + "task": "translation", + "metric": "chrf", + "score": 0.4422326291663304, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "pa", + "task": "classification", + "metric": "accuracy", + "score": 0.4, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "pa", + "task": "language_modeling", + "metric": "chrf", + "score": 0.8971009455771796, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "pa", + "task": "translation", + "metric": "bleu", + "score": 0.3260979917168239, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "pa", + "task": "translation", + "metric": "chrf", + "score": 0.48620285493698817, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "pl", + "task": "classification", + "metric": "accuracy", + "score": 0.6, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "pl", + "task": "language_modeling", + "metric": "chrf", + "score": 0.9603182772393537, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "pl", + "task": "translation", + "metric": "bleu", + "score": 0.26987204535648013, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "pl", + "task": "translation", + "metric": "chrf", + "score": 0.45624928163848544, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "pt", + "task": "classification", + "metric": "accuracy", + "score": 0.5666666666666667, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "pt", + "task": "language_modeling", + "metric": "chrf", + "score": 0.9510604972420862, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "pt", + "task": "translation", + "metric": "bleu", + "score": 0.2806919135940658, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "pt", + "task": "translation", + "metric": "chrf", + "score": 0.45314727718184383, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "ru", + "task": "classification", + "metric": "accuracy", + "score": 0.6333333333333333, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "ru", + "task": "language_modeling", + "metric": "chrf", + "score": 0.9702818211253317, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "ru", + "task": "translation", + "metric": "bleu", + "score": 0.21923866610511514, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "ru", + "task": "translation", + "metric": "chrf", + "score": 0.41987611292148114, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "sd", + "task": "classification", + "metric": "accuracy", + "score": 0.3333333333333333, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "sd", + "task": "language_modeling", + "metric": "chrf", + "score": 0.9075877951969867, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "sd", + "task": "translation", + "metric": "bleu", + "score": 0.21679684560539594, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "sd", + "task": "translation", + "metric": "chrf", + "score": 0.4130326388570076, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "sw", + "task": "classification", + "metric": "accuracy", + "score": 0.6, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "sw", + "task": "language_modeling", + "metric": "chrf", + "score": 0.9363185104933659, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "sw", + "task": "translation", + "metric": "bleu", + "score": 0.2687578645492076, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "sw", + "task": "translation", + "metric": "chrf", + "score": 0.435973049682813, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "ta", + "task": "classification", + "metric": "accuracy", + "score": 0.43333333333333335, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "ta", + "task": "language_modeling", + "metric": "chrf", + "score": 0.9604137478864351, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "ta", + "task": "translation", + "metric": "bleu", + "score": 0.22755903113370943, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "ta", + "task": "translation", + "metric": "chrf", + "score": 0.3968691612249629, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "te", + "task": "classification", + "metric": "accuracy", + "score": 0.36666666666666664, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "te", + "task": "language_modeling", + "metric": "chrf", + "score": 0.9017537718464212, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "te", + "task": "translation", + "metric": "bleu", + "score": 0.2660789099709258, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "te", + "task": "translation", + "metric": "chrf", + "score": 0.4454927673606575, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "th", + "task": "classification", + "metric": "accuracy", + "score": 0.5333333333333333, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "th", + "task": "language_modeling", + "metric": "chrf", + "score": 0.9492189440417714, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "th", + "task": "translation", + "metric": "bleu", + "score": 0.22673808962220887, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "th", + "task": "translation", + "metric": "chrf", + "score": 0.41961494547318173, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "tr", + "task": "classification", + "metric": "accuracy", + "score": 0.5333333333333333, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "tr", + "task": "language_modeling", + "metric": "chrf", + "score": 0.9329665937492929, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "tr", + "task": "translation", + "metric": "bleu", + "score": 0.28856187360515456, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "tr", + "task": "translation", + "metric": "chrf", + "score": 0.4483834465978942, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "ur", + "task": "classification", + "metric": "accuracy", + "score": 0.4666666666666667, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "ur", + "task": "language_modeling", + "metric": "chrf", + "score": 0.9128780231729426, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "ur", + "task": "translation", + "metric": "bleu", + "score": 0.21847309277555946, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "ur", + "task": "translation", + "metric": "chrf", + "score": 0.40360616182971726, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "uz", + "task": "classification", + "metric": "accuracy", + "score": 0.5, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "uz", + "task": "language_modeling", + "metric": "chrf", + "score": 0.9448611053734804, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "uz", + "task": "translation", + "metric": "bleu", + "score": 0.21766825893077738, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "uz", + "task": "translation", + "metric": "chrf", + "score": 0.4195087994775591, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "vi", + "task": "classification", + "metric": "accuracy", + "score": 0.4666666666666667, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "vi", + "task": "language_modeling", + "metric": "chrf", + "score": 0.9478434905295018, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "vi", + "task": "translation", + "metric": "bleu", + "score": 0.23107984716515415, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "vi", + "task": "translation", + "metric": "chrf", + "score": 0.4169594776564998, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "yue", + "task": "classification", + "metric": "accuracy", + "score": 0.6, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "yue", + "task": "language_modeling", + "metric": "chrf", + "score": 0.8955168718505389, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "yue", + "task": "translation", + "metric": "bleu", + "score": 0.24293503135220604, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "yue", + "task": "translation", + "metric": "chrf", + "score": 0.43687518387422897, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "zh", + "task": "classification", + "metric": "accuracy", + "score": 0.5666666666666667, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "zh", + "task": "language_modeling", + "metric": "chrf", + "score": 0.9131870034415596, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "zh", + "task": "translation", + "metric": "bleu", + "score": 0.39048110791786933, + "sentence_nr": 14.5 + }, + { + "model": "meta-llama/llama-3.3-70b-instruct", + "bcp_47": "zh", + "task": "translation", + "metric": "chrf", + "score": 0.5665464429871689, + "sentence_nr": 14.5 + }, + { + "model": "mistralai/mistral-small-24b-instruct-2501", + "bcp_47": "ar", + "task": "classification", + "metric": "accuracy", + "score": 0.7, + "sentence_nr": 14.5 + }, + { + "model": "mistralai/mistral-small-24b-instruct-2501", + "bcp_47": "ar", + "task": "language_modeling", + "metric": "chrf", + "score": 0.9318859252084998, + "sentence_nr": 14.5 + }, + { + "model": "mistralai/mistral-small-24b-instruct-2501", + "bcp_47": "ar", + "task": "translation", + "metric": "bleu", + "score": 0.2068354433755052, + "sentence_nr": 14.5 + }, + { + "model": "mistralai/mistral-small-24b-instruct-2501", + "bcp_47": "ar", + "task": "translation", + "metric": "chrf", + "score": 0.38571943918088597, + "sentence_nr": 14.5 + }, + { + "model": "mistralai/mistral-small-24b-instruct-2501", + "bcp_47": "bn", + "task": "classification", + "metric": "accuracy", + "score": 0.4, + "sentence_nr": 14.5 + }, + { + "model": "mistralai/mistral-small-24b-instruct-2501", + "bcp_47": "bn", + "task": "language_modeling", + "metric": "chrf", + "score": 0.8721745881216986, + "sentence_nr": 14.5 + }, + { + "model": "mistralai/mistral-small-24b-instruct-2501", + "bcp_47": "bn", + "task": "translation", + "metric": "bleu", + "score": 0.17813156872400582, + "sentence_nr": 14.5 + }, + { + "model": "mistralai/mistral-small-24b-instruct-2501", + "bcp_47": "bn", + "task": "translation", + "metric": "chrf", + "score": 0.34058339171576163, + "sentence_nr": 14.5 + }, + { + "model": "mistralai/mistral-small-24b-instruct-2501", + "bcp_47": "en", + "task": "classification", + "metric": "accuracy", + "score": 0.43333333333333335, + "sentence_nr": 14.5 + }, + { + "model": "mistralai/mistral-small-24b-instruct-2501", + "bcp_47": "en", + "task": "language_modeling", + "metric": "chrf", + "score": 0.7598862193678689, + "sentence_nr": 14.5 + }, + { + "model": "mistralai/mistral-small-24b-instruct-2501", + "bcp_47": "en", + "task": "translation", + "metric": "bleu", + "score": 0.39023213290403214, + "sentence_nr": 14.5 + }, + { + "model": "mistralai/mistral-small-24b-instruct-2501", + "bcp_47": "en", + "task": "translation", + "metric": "chrf", + "score": 0.5013108104875811, + "sentence_nr": 14.5 + }, + { + "model": "mistralai/mistral-small-24b-instruct-2501", + "bcp_47": "es", + "task": "classification", + "metric": "accuracy", + "score": 0.6333333333333333, + "sentence_nr": 14.5 + }, + { + "model": "mistralai/mistral-small-24b-instruct-2501", + "bcp_47": "es", + "task": "language_modeling", + "metric": "chrf", + "score": 0.9466716556334129, + "sentence_nr": 14.5 + }, + { + "model": "mistralai/mistral-small-24b-instruct-2501", + "bcp_47": "es", + "task": "translation", + "metric": "bleu", + "score": 0.27947534892496323, + "sentence_nr": 14.5 + }, + { + "model": "mistralai/mistral-small-24b-instruct-2501", + "bcp_47": "es", + "task": "translation", + "metric": "chrf", + "score": 0.43006530569343165, + "sentence_nr": 14.5 + }, + { + "model": "mistralai/mistral-small-24b-instruct-2501", + "bcp_47": "fr", + "task": "classification", + "metric": "accuracy", + "score": 0.7666666666666667, + "sentence_nr": 14.5 + }, + { + "model": "mistralai/mistral-small-24b-instruct-2501", + "bcp_47": "fr", + "task": "language_modeling", + "metric": "chrf", + "score": 0.9558889194048766, + "sentence_nr": 14.5 + }, + { + "model": "mistralai/mistral-small-24b-instruct-2501", + "bcp_47": "fr", + "task": "translation", + "metric": "bleu", + "score": 0.2750376678830284, + "sentence_nr": 14.5 + }, + { + "model": "mistralai/mistral-small-24b-instruct-2501", + "bcp_47": "fr", + "task": "translation", + "metric": "chrf", + "score": 0.441500491331595, + "sentence_nr": 14.5 + }, + { + "model": "mistralai/mistral-small-24b-instruct-2501", + "bcp_47": "hi", + "task": "classification", + "metric": "accuracy", + "score": 0.5, + "sentence_nr": 14.5 + }, + { + "model": "mistralai/mistral-small-24b-instruct-2501", + "bcp_47": "hi", + "task": "language_modeling", + "metric": "chrf", + "score": 0.890720660152386, + "sentence_nr": 14.5 + }, + { + "model": "mistralai/mistral-small-24b-instruct-2501", + "bcp_47": "hi", + "task": "translation", + "metric": "bleu", + "score": 0.21739461408317115, + "sentence_nr": 14.5 + }, + { + "model": "mistralai/mistral-small-24b-instruct-2501", + "bcp_47": "hi", + "task": "translation", + "metric": "chrf", + "score": 0.359020024214477, + "sentence_nr": 14.5 + }, + { + "model": "mistralai/mistral-small-24b-instruct-2501", + "bcp_47": "pa", + "task": "classification", + "metric": "accuracy", + "score": 0.3, + "sentence_nr": 14.5 + }, + { + "model": "mistralai/mistral-small-24b-instruct-2501", + "bcp_47": "pa", + "task": "language_modeling", + "metric": "chrf", + "score": 0.8922615537670865, + "sentence_nr": 14.5 + }, + { + "model": "mistralai/mistral-small-24b-instruct-2501", + "bcp_47": "pa", + "task": "translation", + "metric": "bleu", + "score": 0.21871159296535658, + "sentence_nr": 14.5 + }, + { + "model": "mistralai/mistral-small-24b-instruct-2501", + "bcp_47": "pa", + "task": "translation", + "metric": "chrf", + "score": 0.35241753637848183, + "sentence_nr": 14.5 + }, + { + "model": "mistralai/mistral-small-24b-instruct-2501", + "bcp_47": "pt", + "task": "classification", + "metric": "accuracy", + "score": 0.6, + "sentence_nr": 14.5 + }, + { + "model": "mistralai/mistral-small-24b-instruct-2501", + "bcp_47": "pt", + "task": "language_modeling", + "metric": "chrf", + "score": 0.9492522967960337, + "sentence_nr": 14.5 + }, + { + "model": "mistralai/mistral-small-24b-instruct-2501", + "bcp_47": "pt", + "task": "translation", + "metric": "bleu", + "score": 0.30258414492830743, + "sentence_nr": 14.5 + }, + { + "model": "mistralai/mistral-small-24b-instruct-2501", + "bcp_47": "pt", + "task": "translation", + "metric": "chrf", + "score": 0.4573560946306326, + "sentence_nr": 14.5 + }, + { + "model": "mistralai/mistral-small-24b-instruct-2501", + "bcp_47": "ur", + "task": "classification", + "metric": "accuracy", + "score": 0.6666666666666666, + "sentence_nr": 14.5 + }, + { + "model": "mistralai/mistral-small-24b-instruct-2501", + "bcp_47": "ur", + "task": "language_modeling", + "metric": "chrf", + "score": 0.9289246379251568, + "sentence_nr": 14.5 + }, + { + "model": "mistralai/mistral-small-24b-instruct-2501", + "bcp_47": "ur", + "task": "translation", + "metric": "bleu", + "score": 0.18142367436048182, + "sentence_nr": 14.5 + }, + { + "model": "mistralai/mistral-small-24b-instruct-2501", + "bcp_47": "ur", + "task": "translation", + "metric": "chrf", + "score": 0.34598666510470966, + "sentence_nr": 14.5 + }, + { + "model": "mistralai/mistral-small-24b-instruct-2501", + "bcp_47": "zh", + "task": "classification", + "metric": "accuracy", + "score": 0.6666666666666666, + "sentence_nr": 14.5 + }, + { + "model": "mistralai/mistral-small-24b-instruct-2501", + "bcp_47": "zh", + "task": "language_modeling", + "metric": "chrf", + "score": 0.9188930778144581, + "sentence_nr": 14.5 + }, + { + "model": "mistralai/mistral-small-24b-instruct-2501", + "bcp_47": "zh", + "task": "translation", + "metric": "bleu", + "score": 0.3631466653543813, + "sentence_nr": 14.5 + }, + { + "model": "mistralai/mistral-small-24b-instruct-2501", + "bcp_47": "zh", + "task": "translation", + "metric": "chrf", + "score": 0.5520065979059031, + "sentence_nr": 14.5 + }, + { + "model": "openai/gpt-4o-mini", + "bcp_47": "ar", + "task": "classification", + "metric": "accuracy", + "score": 0.6, + "sentence_nr": 14.5 + }, + { + "model": "openai/gpt-4o-mini", + "bcp_47": "ar", + "task": "language_modeling", + "metric": "chrf", + "score": 0.9489111124535548, + "sentence_nr": 14.5 + }, + { + "model": "openai/gpt-4o-mini", + "bcp_47": "ar", + "task": "translation", + "metric": "bleu", + "score": 0.26593690487060095, + "sentence_nr": 14.5 + }, + { + "model": "openai/gpt-4o-mini", + "bcp_47": "ar", + "task": "translation", + "metric": "chrf", + "score": 0.46048583874582116, + "sentence_nr": 14.5 + }, + { + "model": "openai/gpt-4o-mini", + "bcp_47": "bn", + "task": "classification", + "metric": "accuracy", + "score": 0.3333333333333333, + "sentence_nr": 14.5 + }, + { + "model": "openai/gpt-4o-mini", + "bcp_47": "bn", + "task": "language_modeling", + "metric": "chrf", + "score": 0.899742833244405, + "sentence_nr": 14.5 + }, + { + "model": "openai/gpt-4o-mini", + "bcp_47": "bn", + "task": "translation", + "metric": "bleu", + "score": 0.20957267610789626, + "sentence_nr": 14.5 + }, + { + "model": "openai/gpt-4o-mini", + "bcp_47": "bn", + "task": "translation", + "metric": "chrf", + "score": 0.3814341573965288, + "sentence_nr": 14.5 + }, + { + "model": "openai/gpt-4o-mini", + "bcp_47": "en", + "task": "classification", + "metric": "accuracy", + "score": 0.5666666666666667, + "sentence_nr": 14.5 + }, + { + "model": "openai/gpt-4o-mini", + "bcp_47": "en", + "task": "language_modeling", + "metric": "chrf", + "score": 0.9816685337276303, + "sentence_nr": 14.5 + }, + { + "model": "openai/gpt-4o-mini", + "bcp_47": "en", + "task": "translation", + "metric": "bleu", + "score": 0.40476391184425864, + "sentence_nr": 14.5 + }, + { + "model": "openai/gpt-4o-mini", + "bcp_47": "en", + "task": "translation", + "metric": "chrf", + "score": 0.5350771248567329, + "sentence_nr": 14.5 + }, + { + "model": "openai/gpt-4o-mini", + "bcp_47": "es", + "task": "classification", + "metric": "accuracy", + "score": 0.6, + "sentence_nr": 14.5 + }, + { + "model": "openai/gpt-4o-mini", + "bcp_47": "es", + "task": "language_modeling", + "metric": "chrf", + "score": 0.976774826379902, + "sentence_nr": 14.5 + }, + { + "model": "openai/gpt-4o-mini", + "bcp_47": "es", + "task": "translation", + "metric": "bleu", + "score": 0.30479108723403314, + "sentence_nr": 14.5 + }, + { + "model": "openai/gpt-4o-mini", + "bcp_47": "es", + "task": "translation", + "metric": "chrf", + "score": 0.4664322514490113, + "sentence_nr": 14.5 + }, + { + "model": "openai/gpt-4o-mini", + "bcp_47": "fr", + "task": "classification", + "metric": "accuracy", + "score": 0.6666666666666666, + "sentence_nr": 14.5 + }, + { + "model": "openai/gpt-4o-mini", + "bcp_47": "fr", + "task": "language_modeling", + "metric": "chrf", + "score": 0.9771465942743917, + "sentence_nr": 14.5 + }, + { + "model": "openai/gpt-4o-mini", + "bcp_47": "fr", + "task": "translation", + "metric": "bleu", + "score": 0.3330934985862475, + "sentence_nr": 14.5 + }, + { + "model": "openai/gpt-4o-mini", + "bcp_47": "fr", + "task": "translation", + "metric": "chrf", + "score": 0.48898780285384186, + "sentence_nr": 14.5 + }, + { + "model": "openai/gpt-4o-mini", + "bcp_47": "hi", + "task": "classification", + "metric": "accuracy", + "score": 0.5, + "sentence_nr": 14.5 + }, + { + "model": "openai/gpt-4o-mini", + "bcp_47": "hi", + "task": "language_modeling", + "metric": "chrf", + "score": 0.9371251285777896, + "sentence_nr": 14.5 + }, + { + "model": "openai/gpt-4o-mini", + "bcp_47": "hi", + "task": "translation", + "metric": "bleu", + "score": 0.3034809934459214, + "sentence_nr": 14.5 + }, + { + "model": "openai/gpt-4o-mini", + "bcp_47": "hi", + "task": "translation", + "metric": "chrf", + "score": 0.4682857313818616, + "sentence_nr": 14.5 + }, + { + "model": "openai/gpt-4o-mini", + "bcp_47": "pa", + "task": "classification", + "metric": "accuracy", + "score": 0.3, + "sentence_nr": 14.5 + }, + { + "model": "openai/gpt-4o-mini", + "bcp_47": "pa", + "task": "language_modeling", + "metric": "chrf", + "score": 0.8988042374730737, + "sentence_nr": 14.5 + }, + { + "model": "openai/gpt-4o-mini", + "bcp_47": "pa", + "task": "translation", + "metric": "bleu", + "score": 0.3171219784022306, + "sentence_nr": 14.5 + }, + { + "model": "openai/gpt-4o-mini", + "bcp_47": "pa", + "task": "translation", + "metric": "chrf", + "score": 0.46859907170069254, + "sentence_nr": 14.5 + }, + { + "model": "openai/gpt-4o-mini", + "bcp_47": "pt", + "task": "classification", + "metric": "accuracy", + "score": 0.6333333333333333, + "sentence_nr": 14.5 + }, + { + "model": "openai/gpt-4o-mini", + "bcp_47": "pt", + "task": "language_modeling", + "metric": "chrf", + "score": 0.9609959534386474, + "sentence_nr": 14.5 + }, + { + "model": "openai/gpt-4o-mini", + "bcp_47": "pt", + "task": "translation", + "metric": "bleu", + "score": 0.33037537825270835, + "sentence_nr": 14.5 + }, + { + "model": "openai/gpt-4o-mini", + "bcp_47": "pt", + "task": "translation", + "metric": "chrf", + "score": 0.48617141944202497, + "sentence_nr": 14.5 + }, + { + "model": "openai/gpt-4o-mini", + "bcp_47": "ur", + "task": "classification", + "metric": "accuracy", + "score": 0.43333333333333335, + "sentence_nr": 14.5 + }, + { + "model": "openai/gpt-4o-mini", + "bcp_47": "ur", + "task": "language_modeling", + "metric": "chrf", + "score": 0.9528711252548706, + "sentence_nr": 14.5 + }, + { + "model": "openai/gpt-4o-mini", + "bcp_47": "ur", + "task": "translation", + "metric": "bleu", + "score": 0.2565171122091569, + "sentence_nr": 14.5 + }, + { + "model": "openai/gpt-4o-mini", + "bcp_47": "ur", + "task": "translation", + "metric": "chrf", + "score": 0.43494042420563395, + "sentence_nr": 14.5 + }, + { + "model": "openai/gpt-4o-mini", + "bcp_47": "zh", + "task": "classification", + "metric": "accuracy", + "score": 0.4666666666666667, + "sentence_nr": 14.5 + }, + { + "model": "openai/gpt-4o-mini", + "bcp_47": "zh", + "task": "language_modeling", + "metric": "chrf", + "score": 0.9220222928852874, + "sentence_nr": 14.5 + }, + { + "model": "openai/gpt-4o-mini", + "bcp_47": "zh", + "task": "translation", + "metric": "bleu", + "score": 0.37010453186602793, + "sentence_nr": 14.5 + }, + { + "model": "openai/gpt-4o-mini", + "bcp_47": "zh", + "task": "translation", + "metric": "chrf", + "score": 0.5495542857606343, + "sentence_nr": 14.5 + } + ] +} \ No newline at end of file