diff --git "a/results.json" "b/results.json" --- "a/results.json" +++ "b/results.json" @@ -915,5 +915,13126 @@ "asr_wer": 0.20953788908863977, "asr_chrf": 84.56957135963033, "overall_score": 21.518011001013512 + }, + { + "language_name": "Russian", + "bcp_47": "ru", + "speakers": 195841151, + "scores": [], + "commonvoice_hours": 242.0, + "commonvoice_locale": "ru", + "population": { + "BG": 1602387, + "BY": 1137350, + "CA": 211087, + "CN": 13940, + "DE": 4809582, + "EE": 688027, + "FI": 45131, + "GE": 359730, + "IL": 954303, + "KG": 2147364, + "KZ": 13746168, + "LT": 2185168, + "LV": 714867, + "MD": 100935, + "MN": 4118, + "PL": 6890814, + "RU": 133218680, + "SJ": 1200, + "TJ": 1064840, + "TM": 663436, + "UA": 20204534, + "US": 798334, + "UZ": 4279156 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Swahili", + "bcp_47": "sw", + "speakers": 171610296, + "scores": [], + "commonvoice_hours": 411.0, + "commonvoice_locale": "sw", + "population": { + "BI": 6408, + "CD": 50890000, + "KE": 35328414, + "MZ": 9330, + "SO": 235142, + "TZ": 52697520, + "UG": 32439750, + "YT": 2716, + "ZA": 1016 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Indonesian", + "bcp_47": "id", + "speakers": 171207687, + "scores": [], + "commonvoice_hours": 33.0, + "commonvoice_locale": "id", + "population": { + "ID": 170896640, + "NL": 311047 + }, + "language_family": "Austronesian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "German", + "bcp_47": "de", + "speakers": 136350226, + "scores": [], + "commonvoice_hours": 1359.0, + "commonvoice_locale": "de", + "population": { + "AT": 8593666, + "BE": 2578554, + "BG": 557352, + "BR": 1778414, + "CA": 294014, + "CH": 6134913, + "CZ": 1605375, + "DE": 72945327, + "DK": 2758623, + "FI": 1002901, + "FR": 3392410, + "GB": 5918499, + "GR": 530355, + "HU": 1758929, + "IT": 998443, + "KZ": 1221882, + "LI": 39137, + "LT": 382404, + "LU": 395880, + "NA": 23671, + "NL": 12269084, + "PL": 7273637, + "PY": 208559, + "RO": 44736, + "SI": 883126, + "SK": 1196932, + "US": 1563403 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Japanese", + "bcp_47": "ja", + "speakers": 119729026, + "scores": [], + "commonvoice_hours": 222.0, + "commonvoice_locale": "ja", + "population": { + "BR": 444604, + "CA": 52772, + "JP": 119231650 + }, + "language_family": "Japonic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Telugu", + "bcp_47": "te", + "speakers": 95478480, + "scores": [], + "commonvoice_hours": 0.3, + "commonvoice_locale": "te", + "population": { + "IN": 95478480 + }, + "language_family": "Dravidian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Western Panjabi", + "bcp_47": "lah", + "speakers": 93433552, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "IN": 33152, + "PK": 93400400 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Marathi", + "bcp_47": "mr", + "speakers": 92826300, + "scores": [], + "commonvoice_hours": 20.0, + "commonvoice_locale": "mr", + "population": { + "IN": 92826300 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Javanese", + "bcp_47": "jv", + "speakers": 91180665, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "jv", + "population": { + "ID": 90788840, + "MY": 391825 + }, + "language_family": "Austronesian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Vietnamese", + "bcp_47": "vi", + "speakers": 86222962, + "scores": [], + "commonvoice_hours": 5.9, + "commonvoice_locale": "vi", + "population": { + "CA": 184701, + "CN": 6970, + "US": 1130973, + "VN": 84900318 + }, + "language_family": "Austroasiatic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Tamil", + "bcp_47": "ta", + "speakers": 85616159, + "scores": [], + "commonvoice_hours": 234.0, + "commonvoice_locale": "ta", + "population": { + "CA": 184701, + "GB": 2104355, + "IN": 78239310, + "LK": 3433380, + "MU": 34484, + "MY": 1371388, + "RE": 118138, + "SG": 130403 + }, + "language_family": "Dravidian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Persian", + "bcp_47": "fa", + "speakers": 84710459, + "scores": [], + "commonvoice_hours": 370.0, + "commonvoice_locale": "fa", + "population": { + "AE": 189850, + "AF": 18321900, + "CA": 245012, + "IQ": 338192, + "IR": 63692475, + "OM": 43849, + "PK": 1541107, + "QA": 268859, + "TJ": 69215 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Wu Chinese", + "bcp_47": "wuu", + "speakers": 83641200, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "CN": 83641200 + }, + "language_family": "Sino-Tibetan", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Turkish", + "bcp_47": "tr", + "speakers": 80360704, + "scores": [], + "commonvoice_hours": 127.0, + "commonvoice_locale": "tr", + "population": { + "BG": 766359, + "CA": 37694, + "CY": 291336, + "DE": 2003992, + "GB": 131522, + "GR": 127285, + "MK": 74409, + "NL": 207365, + "RO": 27694, + "TR": 76276275, + "UA": 184476, + "UZ": 232297 + }, + "language_family": "Turkic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Cantonese", + "bcp_47": "yue", + "speakers": 79654759, + "scores": [], + "commonvoice_hours": 203.0, + "commonvoice_locale": "yue", + "population": { + "CA": 640800, + "CN": 72489040, + "HK": 6524919 + }, + "language_family": "Sino-Tibetan", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Korean", + "bcp_47": "ko", + "speakers": 78357046, + "scores": [], + "commonvoice_hours": 1.7, + "commonvoice_locale": "ko", + "population": { + "BR": 44460, + "CA": 169623, + "CN": 2091030, + "JP": 652636, + "KP": 22566280, + "KR": 51835100, + "US": 997917 + }, + "language_family": "Koreanic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Italian", + "bcp_47": "it", + "speakers": 70247060, + "scores": [], + "commonvoice_hours": 362.0, + "commonvoice_locale": "it", + "population": { + "AT": 797350, + "AU": 483864, + "BR": 592805, + "CA": 343016, + "CH": 361372, + "DE": 5611179, + "FR": 1153419, + "GB": 131522, + "HR": 67644, + "IT": 59282565, + "MT": 256070, + "SI": 3995, + "SM": 30466, + "US": 1130973, + "VA": 820 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Filipino", + "bcp_47": "fil", + "speakers": 67471096, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "tl", + "population": { + "CA": 565412, + "PH": 65508600, + "US": 1397084 + }, + "language_family": "Austronesian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Egyptian Arabic", + "bcp_47": "arz", + "speakers": 66639360, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "EG": 66639360 + }, + "language_family": "Afro-Asiatic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Gujarati", + "bcp_47": "gu", + "speakers": 61721799, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "gu-IN", + "population": { + "CA": 135699, + "GB": 1907072, + "IN": 59674050, + "KE": 4978 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Thai", + "bcp_47": "th", + "speakers": 55181920, + "scores": [], + "commonvoice_hours": 172.0, + "commonvoice_locale": "th", + "population": { + "TH": 55181920 + }, + "language_family": "Tai-Kadai", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Pashto", + "bcp_47": "ps", + "speakers": 53542641, + "scores": [], + "commonvoice_hours": 79.0, + "commonvoice_locale": "ps", + "population": { + "AE": 289770, + "AF": 15756834, + "IR": 135877, + "PK": 37360160 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Kannada", + "bcp_47": "kn", + "speakers": 49065330, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "kn", + "population": { + "IN": 49065330 + }, + "language_family": "Dravidian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Nigerian Pidgin", + "bcp_47": "pcm", + "speakers": 44945880, + "scores": [], + "commonvoice_hours": 14.0, + "commonvoice_locale": "pcm", + "population": { + "NG": 44945880 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Malayalam", + "bcp_47": "ml", + "speakers": 43257484, + "scores": [], + "commonvoice_hours": 2.8, + "commonvoice_locale": "ml", + "population": { + "AE": 699446, + "BH": 49665, + "IL": 7981, + "IN": 42434880, + "MY": 48978, + "QA": 6599, + "SG": 9935 + }, + "language_family": "Dravidian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Odia", + "bcp_47": "or", + "speakers": 42434880, + "scores": [], + "commonvoice_hours": 2.8, + "commonvoice_locale": "or", + "population": { + "IN": 42434880 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Polish", + "bcp_47": "pl", + "speakers": 41077399, + "scores": [], + "commonvoice_hours": 174.0, + "commonvoice_locale": "pl", + "population": { + "CA": 173393, + "CZ": 52442, + "DE": 232463, + "GB": 2630444, + "IL": 130132, + "PL": 36751008, + "RO": 2769, + "SK": 50598, + "UA": 1054150 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Xiang Chinese", + "bcp_47": "hsn", + "speakers": 40426580, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "CN": 40426580 + }, + "language_family": "Sino-Tibetan", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Hausa", + "bcp_47": "ha", + "speakers": 40411882, + "scores": [], + "commonvoice_hours": 4.1, + "commonvoice_locale": "ha", + "population": { + "CM": 38843, + "GH": 252326, + "NE": 9336684, + "NG": 29963920, + "SD": 820109 + }, + "language_family": "Afro-Asiatic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Sindhi", + "bcp_47": "sd", + "speakers": 40329510, + "scores": [], + "commonvoice_hours": 0.4, + "commonvoice_locale": "sd", + "population": { + "IN": 5304360, + "PK": 35025150 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "North Levantine Arabic", + "bcp_47": "apc", + "speakers": 39031474, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "IL": 1474832, + "JO": 7141596, + "LB": 5469610, + "PS": 4191886, + "SY": 16488640, + "TR": 4264910 + }, + "language_family": "Afro-Asiatic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Malay", + "bcp_47": "ms", + "speakers": 38097307, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "ms", + "population": { + "BN": 455189, + "CC": 495, + "ID": 12283196, + "MY": 24489075, + "SG": 869352 + }, + "language_family": "Austronesian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Burmese", + "bcp_47": "my", + "speakers": 36559231, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "my", + "population": { + "BD": 341567, + "MM": 36217664 + }, + "language_family": "Sino-Tibetan", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Amharic", + "bcp_47": "am", + "speakers": 35728475, + "scores": [], + "commonvoice_hours": 1.8, + "commonvoice_locale": "am", + "population": { + "ET": 35677290, + "IL": 51185 + }, + "language_family": "Afro-Asiatic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Algerian Arabic", + "bcp_47": "arq", + "speakers": 35667507, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "DZ": 35667507 + }, + "language_family": "Afro-Asiatic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Oromo", + "bcp_47": "om", + "speakers": 34897121, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "om", + "population": { + "ET": 34596160, + "KE": 251581, + "SO": 49380 + }, + "language_family": "Afro-Asiatic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Bhojpuri", + "bcp_47": "bho", + "speakers": 32934797, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "IN": 30500070, + "MU": 372430, + "NP": 2062297 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Uzbek", + "bcp_47": "uz", + "speakers": 32792780, + "scores": [], + "commonvoice_hours": 100.0, + "commonvoice_locale": "uz", + "population": { + "AF": 1722259, + "CN": 5576, + "TM": 497577, + "TR": 1968, + "UZ": 30565400 + }, + "language_family": "Turkic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Azerbaijani", + "bcp_47": "az", + "speakers": 32446682, + "scores": [], + "commonvoice_hours": 0.5, + "commonvoice_locale": "az", + "population": { + "AM": 0, + "AZ": 10093536, + "IQ": 699709, + "IR": 20381592, + "RU": 131801, + "TR": 1140044 + }, + "language_family": "Turkic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Hakka Chinese", + "bcp_47": "hak", + "speakers": 32062460, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "CN": 32062460 + }, + "language_family": "Sino-Tibetan", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Sundanese", + "bcp_47": "su", + "speakers": 32043120, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "ID": 32043120 + }, + "language_family": "Austronesian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Dutch", + "bcp_47": "nl", + "speakers": 31765645, + "scores": [], + "commonvoice_hours": 114.0, + "commonvoice_locale": "nl", + "population": { + "AW": 115845, + "BE": 6446385, + "BQ": 1600, + "CA": 56541, + "CW": 12108, + "DE": 7214373, + "FR": 88203, + "NL": 17280400, + "SR": 548612, + "SX": 1578 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Moroccan Arabic", + "bcp_47": "ary", + "speakers": 30938679, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "MA": 30938679 + }, + "language_family": "Afro-Asiatic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Ukrainian", + "bcp_47": "uk", + "speakers": 29348975, + "scores": [], + "commonvoice_hours": 98.0, + "commonvoice_locale": "uk", + "population": { + "CA": 75388, + "MD": 471030, + "PL": 149301, + "RS": 0, + "SK": 103371, + "UA": 28549885 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Yoruba", + "bcp_47": "yo", + "speakers": 28685568, + "scores": [], + "commonvoice_hours": 6.0, + "commonvoice_locale": "yo", + "population": { + "BJ": 861928, + "NG": 27823640 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Saraiki", + "bcp_47": "skr", + "speakers": 28020120, + "scores": [], + "commonvoice_hours": 4.3, + "commonvoice_locale": "skr", + "population": { + "PK": 28020120 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Igbo", + "bcp_47": "ig", + "speakers": 27823640, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "ig", + "population": { + "NG": 27823640 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Min Nan Chinese", + "bcp_47": "nan", + "speakers": 26486380, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "CN": 26486380 + }, + "language_family": "Sino-Tibetan", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Cebuano", + "bcp_47": "ceb", + "speakers": 26203440, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "PH": 26203440 + }, + "language_family": "Austronesian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Awadhi", + "bcp_47": "awa", + "speakers": 25862924, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "IN": 25195710, + "NP": 667214 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Malagasy", + "bcp_47": "mg", + "speakers": 24260130, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "mg", + "population": { + "MG": 24260130 + }, + "language_family": "Austronesian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Gan Chinese", + "bcp_47": "gan", + "speakers": 23698340, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "CN": 23698340 + }, + "language_family": "Sino-Tibetan", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Romanian", + "bcp_47": "ro", + "speakers": 22187408, + "scores": [], + "commonvoice_hours": 21.0, + "commonvoice_locale": "ro", + "population": { + "CA": 101774, + "HU": 96741, + "IL": 320993, + "MD": 2119635, + "RO": 19172610, + "RS": 147256, + "UA": 228399 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Bavarian", + "bcp_47": "bar", + "speakers": 22043627, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "AT": 8416478, + "DE": 13627149 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Nepali", + "bcp_47": "ne", + "speakers": 20903374, + "scores": [], + "commonvoice_hours": 1.3, + "commonvoice_locale": "ne-NP", + "population": { + "BT": 132994, + "IN": 7426104, + "NP": 13344276 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Maithili", + "bcp_47": "mai", + "speakers": 19249149, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "mai", + "population": { + "IN": 15913080, + "NP": 3336069 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Assamese", + "bcp_47": "as", + "speakers": 17239170, + "scores": [], + "commonvoice_hours": 2.8, + "commonvoice_locale": "as", + "population": { + "IN": 17239170 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Nyanja", + "bcp_47": "ny", + "speakers": 17026781, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "ny", + "population": { + "MW": 13353858, + "MZ": 782553, + "ZM": 2613990, + "ZW": 276380 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Somali", + "bcp_47": "so", + "speakers": 16911645, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "so", + "population": { + "CA": 49002, + "DJ": 377940, + "ET": 6486780, + "GB": 131522, + "KE": 695863, + "SO": 9170538 + }, + "language_family": "Afro-Asiatic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Madurese", + "bcp_47": "mad", + "speakers": 16822638, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "ID": 16822638 + }, + "language_family": "Austronesian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Northeastern Thai", + "bcp_47": "tts", + "speakers": 16554576, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "TH": 16554576 + }, + "language_family": "Tai-Kadai", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Rangpuri", + "bcp_47": "rkt", + "speakers": 16274502, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "BD": 10572315, + "IN": 5702187 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Magahi", + "bcp_47": "mag", + "speakers": 15913080, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "IN": 15913080 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Haryanvi", + "bcp_47": "bgc", + "speakers": 15913080, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "IN": 15913080 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Marwari", + "bcp_47": "mwr", + "speakers": 15913080, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "IN": 15913080 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Serbian", + "bcp_47": "sr", + "speakers": 15602410, + "scores": [], + "commonvoice_hours": 7.5, + "commonvoice_locale": "sr", + "population": { + "BA": 767118, + "CA": 64080, + "ME": 640352, + "RO": 25563, + "RS": 13884096, + "RU": 4960, + "TR": 22965, + "XK": 193276 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Sinhala", + "bcp_47": "si", + "speakers": 15564656, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "si", + "population": { + "LK": 15564656 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Khmer", + "bcp_47": "km", + "speakers": 15065030, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "km", + "population": { + "KH": 15065030 + }, + "language_family": "Austroasiatic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Chhattisgarhi", + "bcp_47": "hne", + "speakers": 14586990, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "IN": 14586990 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Nigerian Fulfulde", + "bcp_47": "fuv", + "speakers": 14339876, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "NG": 14339876 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Zulu", + "bcp_47": "zu", + "speakers": 13973830, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "zu", + "population": { + "LS": 275706, + "MW": 69949, + "MZ": 1806, + "SZ": 75105, + "ZA": 13551264 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Kazakh", + "bcp_47": "kk", + "speakers": 13637392, + "scores": [], + "commonvoice_hours": 2.1, + "commonvoice_locale": "kk", + "population": { + "AF": 2015, + "CN": 1184917, + "IR": 2972, + "KZ": 12218816, + "MN": 228098, + "TR": 574 + }, + "language_family": "Turkic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Deccan", + "bcp_47": "dcc", + "speakers": 13128291, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "IN": 13128291 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Czech", + "bcp_47": "cs", + "speakers": 13045532, + "scores": [], + "commonvoice_hours": 74.0, + "commonvoice_locale": "cs", + "population": { + "CZ": 10488450, + "SK": 2557082 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Swedish", + "bcp_47": "sv", + "speakers": 12932871, + "scores": [], + "commonvoice_hours": 47.0, + "commonvoice_locale": "sv-SE", + "population": { + "AX": 25938, + "DK": 763023, + "FI": 2451535, + "SE": 9692375 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Hungarian", + "bcp_47": "hu", + "speakers": 12443430, + "scores": [], + "commonvoice_hours": 92.0, + "commonvoice_locale": "hu", + "population": { + "AT": 23035, + "CA": 49002, + "HU": 9771830, + "IL": 86755, + "RO": 1405991, + "RS": 336584, + "SI": 9252, + "SK": 598466, + "UA": 162515 + }, + "language_family": "Uralic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Greek", + "bcp_47": "el", + "speakers": 12292242, + "scores": [], + "commonvoice_hours": 20.0, + "commonvoice_locale": "el", + "population": { + "AL": 58417, + "CA": 124391, + "CY": 1203346, + "DE": 304607, + "EG": 63516, + "GR": 10501029, + "IT": 21841, + "RO": 4048, + "TR": 4019, + "UA": 7028 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Shona", + "bcp_47": "sn", + "speakers": 11782503, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "ZW": 11782503 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Low German", + "bcp_47": "nds", + "speakers": 11520008, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "DE": 9619164, + "NL": 1900844 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Akan", + "bcp_47": "ak", + "speakers": 11442678, + "scores": [], + "commonvoice_hours": 0.1, + "commonvoice_locale": "tw", + "population": { + "GH": 11442678 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Quechua", + "bcp_47": "qu", + "speakers": 11385851, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "BO": 3724768, + "EC": 2873833, + "PE": 4787250 + }, + "language_family": "Quechuan", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Central Kurdish", + "bcp_47": "ckb", + "speakers": 11086549, + "scores": [], + "commonvoice_hours": 135.0, + "commonvoice_locale": "ckb", + "population": { + "IQ": 7774540, + "IR": 3312009 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Kinyarwanda", + "bcp_47": "rw", + "speakers": 11083625, + "scores": [], + "commonvoice_hours": 2002.0, + "commonvoice_locale": "rw", + "population": { + "CD": 386764, + "RW": 9788548, + "UG": 908313 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Wolof", + "bcp_47": "wo", + "speakers": 11025494, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "wo", + "population": { + "MR": 10014, + "SN": 11015480 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Tunisian Arabic", + "bcp_47": "aeb", + "speakers": 10549080, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "TN": 10549080 + }, + "language_family": "Afro-Asiatic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Iloko", + "bcp_47": "ilo", + "speakers": 10481376, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "PH": 10481376 + }, + "language_family": "Austronesian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Xhosa", + "bcp_47": "xh", + "speakers": 10182944, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "xh", + "population": { + "LS": 19496, + "ZA": 10163448 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Tigrinya", + "bcp_47": "ti", + "speakers": 10145911, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "ti", + "population": { + "ER": 3648720, + "ET": 6486780, + "IL": 10411 + }, + "language_family": "Afro-Asiatic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Belarusian", + "bcp_47": "be", + "speakers": 10064517, + "scores": [], + "commonvoice_hours": 1804.0, + "commonvoice_locale": "be", + "population": { + "BY": 9477920, + "PL": 222037, + "UA": 364560 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Luba-Lulua", + "bcp_47": "lua", + "speakers": 9770880, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "CD": 9770880 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Tajik", + "bcp_47": "tg", + "speakers": 9644223, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "tg", + "population": { + "PK": 770553, + "TJ": 8873670 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Umbundu", + "bcp_47": "umb", + "speakers": 9431467, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "AO": 9431467 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Bambara", + "bcp_47": "bm", + "speakers": 9385632, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "bm", + "population": { + "ML": 9385632 + }, + "language_family": "Mande", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Afrikaans", + "bcp_47": "af", + "speakers": 9318845, + "scores": [], + "commonvoice_hours": 0.5, + "commonvoice_locale": "af", + "population": { + "BW": 6025, + "NA": 1972552, + "ZA": 7340268 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Hiligaynon", + "bcp_47": "hil", + "speakers": 9171204, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "hil", + "population": { + "PH": 9171204 + }, + "language_family": "Austronesian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Kikuyu", + "bcp_47": "ki", + "speakers": 9099743, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "ki", + "population": { + "KE": 9099743 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Haitian Creole", + "bcp_47": "ht", + "speakers": 8964918, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "ht", + "population": { + "HT": 8964918 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Catalan", + "bcp_47": "ca", + "speakers": 8679139, + "scores": [], + "commonvoice_hours": 2842.0, + "commonvoice_locale": "ca", + "population": { + "AD": 39270, + "ES": 8502686, + "FR": 115342, + "IT": 21841 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Hebrew", + "bcp_47": "he", + "speakers": 8675480, + "scores": [], + "commonvoice_hours": 1.1, + "commonvoice_locale": "he", + "population": { + "IL": 8675480 + }, + "language_family": "Afro-Asiatic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Sichuan Yi", + "bcp_47": "ii", + "speakers": 8364120, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "CN": 8364120 + }, + "language_family": "Sino-Tibetan", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Mossi", + "bcp_47": "mos", + "speakers": 8334160, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "mos", + "population": { + "BF": 8334160 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Baluchi", + "bcp_47": "bal", + "speakers": 8227887, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "bal", + "population": { + "AE": 229818, + "IR": 1698466, + "OM": 228577, + "PK": 6071026 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Sylheti", + "bcp_47": "syl", + "speakers": 8132550, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "BD": 8132550 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Kimbundu", + "bcp_47": "kmb", + "speakers": 8130575, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "AO": 8130575 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Uyghur", + "bcp_47": "ug", + "speakers": 8052967, + "scores": [], + "commonvoice_hours": 363.0, + "commonvoice_locale": "ug", + "population": { + "AF": 3005, + "CN": 7667110, + "KZ": 381838, + "MN": 1014 + }, + "language_family": "Turkic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Minangkabau", + "bcp_47": "min", + "speakers": 8010780, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "ID": 8010780 + }, + "language_family": "Austronesian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Swiss German", + "bcp_47": "gsw", + "speakers": 7956952, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "gsw", + "population": { + "CH": 5462594, + "DE": 1843673, + "FR": 617419, + "LI": 33266 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Bulgarian", + "bcp_47": "bg", + "speakers": 7878315, + "scores": [], + "commonvoice_hours": 16.0, + "commonvoice_locale": "bg", + "population": { + "BG": 6966900, + "GR": 28639, + "MD": 316263, + "RO": 6817, + "TR": 344474, + "UA": 215222 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Standard Moroccan Tamazight", + "bcp_47": "zgh", + "speakers": 7823574, + "scores": [], + "commonvoice_hours": 1.3, + "commonvoice_locale": "zgh", + "population": { + "MA": 7823574 + }, + "language_family": "Afro-Asiatic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Fula", + "bcp_47": "ff", + "speakers": 7788904, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "ff", + "population": { + "BF": 0, + "CM": 998820, + "GH": 0, + "GM": 0, + "GN": 3257124, + "GW": 4, + "LR": 0, + "MR": 228312, + "NE": 0, + "NG": 0, + "SL": 0, + "SN": 3304644 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Bosnian", + "bcp_47": "bs", + "speakers": 7594468, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "bs", + "population": { + "BA": 7594468 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Rundi", + "bcp_47": "rn", + "speakers": 7475454, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "rn", + "population": { + "BI": 7475454 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Kanauji", + "bcp_47": "bjj", + "speakers": 7426104, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "IN": 7426104 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Santali", + "bcp_47": "sat", + "speakers": 7293495, + "scores": [], + "commonvoice_hours": 0.5, + "commonvoice_locale": "sat", + "population": { + "IN": 7293495 + }, + "language_family": "Austroasiatic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Danish", + "bcp_47": "da", + "speakers": 7072056, + "scores": [], + "commonvoice_hours": 13.0, + "commonvoice_locale": "da", + "population": { + "DE": 1603194, + "DK": 5458551, + "GL": 8066, + "IS": 2245 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Turkmen", + "bcp_47": "tk", + "speakers": 6870838, + "scores": [], + "commonvoice_hours": 2.8, + "commonvoice_locale": "tk", + "population": { + "AF": 622945, + "IR": 2377852, + "TM": 3870041 + }, + "language_family": "Turkic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Kurdish", + "bcp_47": "ku", + "speakers": 6866757, + "scores": [], + "commonvoice_hours": 69.0, + "commonvoice_locale": "kmr", + "population": { + "AM": 99704, + "AZ": 24494, + "DE": 529054, + "GE": 35573, + "LB": 92983, + "SY": 1551872, + "TM": 22115, + "TR": 4510962 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Croatian", + "bcp_47": "hr", + "speakers": 6813164, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "hr", + "population": { + "AT": 106313, + "BA": 460271, + "CA": 45233, + "DE": 633262, + "HR": 4185472, + "HU": 31270, + "IT": 3495, + "RS": 65213, + "SI": 1282635 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Albanian", + "bcp_47": "sq", + "speakers": 6791906, + "scores": [], + "commonvoice_hours": 8.8, + "commonvoice_locale": "sq", + "population": { + "AL": 3074580, + "GR": 9971, + "ME": 48179, + "MK": 531492, + "RS": 1332312, + "TR": 17224, + "XK": 1778148 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Slovak", + "bcp_47": "sk", + "speakers": 6680269, + "scores": [], + "commonvoice_hours": 44.0, + "commonvoice_locale": "sk", + "population": { + "CZ": 1712400, + "HU": 11726, + "RS": 59603, + "SK": 4896540 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Dyula", + "bcp_47": "dyu", + "speakers": 6667328, + "scores": [], + "commonvoice_hours": 0.4, + "commonvoice_locale": "dyu", + "population": { + "BF": 6667328 + }, + "language_family": "Mande", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Northern Thai", + "bcp_47": "nod", + "speakers": 6621830, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "TH": 6621830 + }, + "language_family": "Tai-Kadai", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Mongolian", + "bcp_47": "mn", + "speakers": 6572846, + "scores": [], + "commonvoice_hours": 46.0, + "commonvoice_locale": "mn", + "population": { + "CN": 3624452, + "MN": 2946268, + "RU": 2126 + }, + "language_family": "Mongolic-Khitan", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Southern Sotho", + "bcp_47": "st", + "speakers": 6390567, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "st", + "population": { + "LS": 1929943, + "ZA": 4460624 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Krio", + "bcp_47": "kri", + "speakers": 6293684, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "SL": 6293684 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Tachelhit", + "bcp_47": "shi", + "speakers": 6187736, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "shi", + "population": { + "MA": 6187736 + }, + "language_family": "Afro-Asiatic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Tswana", + "bcp_47": "tn", + "speakers": 6113428, + "scores": [], + "commonvoice_hours": 4.2, + "commonvoice_locale": "tn", + "population": { + "BW": 1436683, + "NA": 14728, + "ZA": 4630015, + "ZW": 32002 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Mewati", + "bcp_47": "wtm", + "speakers": 6100014, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "IN": 6100014 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Luyia", + "bcp_47": "luy", + "speakers": 5888069, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "KE": 5888069 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Guarani", + "bcp_47": "gn", + "speakers": 5827107, + "scores": [], + "commonvoice_hours": 3.7, + "commonvoice_locale": "gn", + "population": { + "AR": 21375, + "BO": 52380, + "PY": 5753352 + }, + "language_family": "Tupian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Finnish", + "bcp_47": "fi", + "speakers": 5736842, + "scores": [], + "commonvoice_hours": 15.0, + "commonvoice_locale": "fi", + "population": { + "EE": 258010, + "FI": 5237370, + "RU": 17007, + "SE": 224455 + }, + "language_family": "Uralic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Ganda", + "bcp_47": "lg", + "speakers": 5622890, + "scores": [], + "commonvoice_hours": 437.0, + "commonvoice_locale": "lg", + "population": { + "UG": 5622890 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Betawi", + "bcp_47": "bew", + "speakers": 5607546, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "bew", + "population": { + "ID": 5607546 + }, + "language_family": "Austronesian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Kashmiri", + "bcp_47": "ks", + "speakers": 5598085, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "ks", + "population": { + "IN": 5436969, + "PK": 161116 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Southern Thai", + "bcp_47": "sou", + "speakers": 5518192, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "TH": 5518192 + }, + "language_family": "Tai-Kadai", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Norwegian Bokmål", + "bcp_47": "nb", + "speakers": 5468932, + "scores": [], + "commonvoice_hours": 0.1, + "commonvoice_locale": "nb-NO", + "population": { + "NO": 5467440, + "SJ": 1492 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Norwegian", + "bcp_47": "no", + "speakers": 5467440, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "NO": 5467440 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Bemba", + "bcp_47": "bem", + "speakers": 5402246, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "ZM": 5402246 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Armenian", + "bcp_47": "hy", + "speakers": 5317273, + "scores": [], + "commonvoice_hours": 31.0, + "commonvoice_locale": "hy-AM", + "population": { + "AM": 2960894, + "CY": 2787, + "GE": 279790, + "IR": 203816, + "LB": 284420, + "RU": 1190465, + "SY": 349171, + "TR": 45930 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Northern Sotho", + "bcp_47": "nso", + "speakers": 5307578, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "nso", + "population": { + "ZA": 5307578 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Luo (Kenya and Tanzania)", + "bcp_47": "luo", + "speakers": 5245734, + "scores": [], + "commonvoice_hours": 30.0, + "commonvoice_locale": "luo", + "population": { + "KE": 5245734 + }, + "language_family": "Nilotic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Tok Pisin", + "bcp_47": "tpi", + "speakers": 5154217, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "PG": 5154217 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Lao", + "bcp_47": "lo", + "speakers": 5138706, + "scores": [], + "commonvoice_hours": 0.2, + "commonvoice_locale": "lo", + "population": { + "LA": 5138706 + }, + "language_family": "Tai-Kadai", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Sukuma", + "bcp_47": "suk", + "speakers": 5094094, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "TZ": 5094094 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Konkani", + "bcp_47": "kok", + "speakers": 4906533, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "knn", + "population": { + "IN": 4906533 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Tsonga", + "bcp_47": "ts", + "speakers": 4880932, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "ts", + "population": { + "MZ": 2377758, + "SZ": 18776, + "ZA": 2484398 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Main-Franconian", + "bcp_47": "vmf", + "speakers": 4809582, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "DE": 4809582 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Balinese", + "bcp_47": "ban", + "speakers": 4806468, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "ID": 4806468 + }, + "language_family": "Austronesian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Ewe", + "bcp_47": "ee", + "speakers": 4690857, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "ee", + "population": { + "GH": 3227422, + "TG": 1463435 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Zhuang", + "bcp_47": "za", + "speakers": 4321462, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "CN": 4321462 + }, + "language_family": "Tai-Kadai", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Buginese", + "bcp_47": "bug", + "speakers": 4298211, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "ID": 4272416, + "MY": 25795 + }, + "language_family": "Austronesian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Mazanderani", + "bcp_47": "mzn", + "speakers": 4246165, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "IR": 4246165 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Goan Konkani", + "bcp_47": "gom", + "speakers": 4243488, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "gom", + "population": { + "IN": 4243488 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Kamba", + "bcp_47": "kam", + "speakers": 4068120, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "kam", + "population": { + "KE": 4068120 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Kalenjin", + "bcp_47": "kln", + "speakers": 4068120, + "scores": [], + "commonvoice_hours": 43.0, + "commonvoice_locale": "kln", + "population": { + "KE": 4068120 + }, + "language_family": "Nilotic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Banjar", + "bcp_47": "bjn", + "speakers": 4010288, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "ID": 4005390, + "MY": 4898 + }, + "language_family": "Austronesian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Northern Hindko", + "bcp_47": "hno", + "speakers": 3969517, + "scores": [], + "commonvoice_hours": 11.0, + "commonvoice_locale": "hno", + "population": { + "PK": 3969517 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Makhuwa", + "bcp_47": "vmw", + "speakers": 3912766, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "vmw", + "population": { + "MZ": 3912766 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Gilaki", + "bcp_47": "glk", + "speakers": 3906472, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "IR": 3906472 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Lombard", + "bcp_47": "lmo", + "speakers": 3901518, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "CH": 344564, + "IT": 3556954 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Zarma", + "bcp_47": "dje", + "speakers": 3871308, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "NE": 3871308 + }, + "language_family": "Songhay", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Ndau", + "bcp_47": "ndc", + "speakers": 3867046, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "MZ": 2979722, + "ZW": 887324 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Sidamo", + "bcp_47": "sid", + "speakers": 3783955, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "ET": 3783955 + }, + "language_family": "Afro-Asiatic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Achinese", + "bcp_47": "ace", + "speakers": 3738364, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "ace", + "population": { + "ID": 3738364 + }, + "language_family": "Austronesian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Shekhawati", + "bcp_47": "swv", + "speakers": 3713052, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "IN": 3713052 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Riffian", + "bcp_47": "rif", + "speakers": 3692411, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "rif", + "population": { + "MA": 3485046, + "NL": 207365 + }, + "language_family": "Afro-Asiatic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Shan", + "bcp_47": "shn", + "speakers": 3687984, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "shn", + "population": { + "MM": 3621766, + "TH": 66218 + }, + "language_family": "Tai-Kadai", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Lambadi", + "bcp_47": "lmn", + "speakers": 3580443, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "IN": 3580443 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Garhwali", + "bcp_47": "gbm", + "speakers": 3580443, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "IN": 3580443 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Georgian", + "bcp_47": "ka", + "speakers": 3543646, + "scores": [], + "commonvoice_hours": 158.0, + "commonvoice_locale": "ka", + "population": { + "GE": 3437420, + "IR": 60296, + "TR": 45930 + }, + "language_family": "Kartvelian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Galician", + "bcp_47": "gl", + "speakers": 3515530, + "scores": [], + "commonvoice_hours": 110.0, + "commonvoice_locale": "gl", + "population": { + "ES": 3501106, + "PT": 14424 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Lingala", + "bcp_47": "ln", + "speakers": 3514491, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "ln", + "population": { + "AO": 217899, + "CD": 3155180, + "CF": 14378, + "CG": 127034 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Mandingo", + "bcp_47": "man", + "speakers": 3511762, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "GM": 630460, + "GN": 2881302 + }, + "language_family": "Mande", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Central Atlas Tamazight", + "bcp_47": "tzm", + "speakers": 3485047, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "MA": 3485047 + }, + "language_family": "Afro-Asiatic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Pattani Malay", + "bcp_47": "mfa", + "speakers": 3448870, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "TH": 3448870 + }, + "language_family": "Austronesian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Tiv", + "bcp_47": "tiv", + "speakers": 3424448, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "NG": 3424448 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Kabyle", + "bcp_47": "kab", + "speakers": 3351886, + "scores": [], + "commonvoice_hours": 571.0, + "commonvoice_locale": "kab", + "population": { + "DZ": 3351886 + }, + "language_family": "Afro-Asiatic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Kyrgyz", + "bcp_47": "ky", + "speakers": 3338267, + "scores": [], + "commonvoice_hours": 39.0, + "commonvoice_locale": "ky", + "population": { + "CN": 473967, + "KG": 2863152, + "TR": 1148 + }, + "language_family": "Turkic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Bikol", + "bcp_47": "bik", + "speakers": 3275430, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "PH": 3275430 + }, + "language_family": "Austronesian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Fon", + "bcp_47": "fon", + "speakers": 3216150, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "BJ": 3216150 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Gondi", + "bcp_47": "gon", + "speakers": 3182616, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "IN": 3182616 + }, + "language_family": "Dravidian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Waray", + "bcp_47": "war", + "speakers": 3166927, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "CA": 678, + "PH": 3166249 + }, + "language_family": "Austronesian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Southern Kurdish", + "bcp_47": "sdh", + "speakers": 3142162, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "sdh", + "population": { + "IR": 3142162 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Brahui", + "bcp_47": "brh", + "speakers": 3035513, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "PK": 3035513 + }, + "language_family": "Dravidian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Baoulé", + "bcp_47": "bci", + "speakers": 3022921, + "scores": [], + "commonvoice_hours": 2.0, + "commonvoice_locale": "bci", + "population": { + "CI": 3022921 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Tibetan", + "bcp_47": "bo", + "speakers": 3006697, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "bo", + "population": { + "CN": 2788040, + "IN": 145870, + "NP": 72787 + }, + "language_family": "Sino-Tibetan", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Ibibio", + "bcp_47": "ibb", + "speakers": 2996392, + "scores": [], + "commonvoice_hours": 2.6, + "commonvoice_locale": "ibb", + "population": { + "NG": 2996392 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Efik", + "bcp_47": "efi", + "speakers": 2996392, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "NG": 2996392 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Sango", + "bcp_47": "sg", + "speakers": 2935521, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "CF": 2935521 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Kumaoni", + "bcp_47": "kfy", + "speakers": 2917398, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "IN": 2917398 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Aymara", + "bcp_47": "ay", + "speakers": 2838620, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "BO": 2327980, + "PE": 510640 + }, + "language_family": "Aymaran", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Nyankole", + "bcp_47": "nyn", + "speakers": 2724939, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "nyn", + "population": { + "UG": 2724939 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Jamaican Creole English", + "bcp_47": "jam", + "speakers": 2668142, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "JM": 2668142 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Dogri", + "bcp_47": "doi", + "speakers": 2652180, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "IN": 2652180 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Gusii", + "bcp_47": "guz", + "speakers": 2622867, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "KE": 2622867 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Sasak", + "bcp_47": "sas", + "speakers": 2590152, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "ID": 2590152 + }, + "language_family": "Austronesian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Kurukh", + "bcp_47": "kru", + "speakers": 2519571, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "IN": 2519571 + }, + "language_family": "Dravidian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Pampanga", + "bcp_47": "pam", + "speakers": 2511163, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "PH": 2511163 + }, + "language_family": "Austronesian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "West Albay Bikol", + "bcp_47": "fbl", + "speakers": 2511163, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "PH": 2511163 + }, + "language_family": "Austronesian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Lithuanian", + "bcp_47": "lt", + "speakers": 2488617, + "scores": [], + "commonvoice_hours": 25.0, + "commonvoice_locale": "lt", + "population": { + "GB": 131522, + "LT": 2349056, + "PL": 8039 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Beja", + "bcp_47": "bej", + "speakers": 2460326, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "SD": 2460326 + }, + "language_family": "Afro-Asiatic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Batak Toba", + "bcp_47": "bbc", + "speakers": 2456639, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "ID": 2456639 + }, + "language_family": "Austronesian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Sadri", + "bcp_47": "sck", + "speakers": 2386962, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "IN": 2386962 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Waddar", + "bcp_47": "wbq", + "speakers": 2386962, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "IN": 2386962 + }, + "language_family": "Dravidian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Luba-Katanga", + "bcp_47": "lu", + "speakers": 2340940, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "CD": 2340940 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Chiga", + "bcp_47": "cgg", + "speakers": 2335662, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "UG": 2335662 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Soga", + "bcp_47": "xog", + "speakers": 2292409, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "UG": 2292409 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Swati", + "bcp_47": "ss", + "speakers": 2212379, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "ss", + "population": { + "LS": 47264, + "SZ": 640598, + "ZA": 1524517 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Hazaragi", + "bcp_47": "haz", + "speakers": 2161984, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "AF": 2161984 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Meru", + "bcp_47": "mer", + "speakers": 2141116, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "KE": 2141116 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Kangri", + "bcp_47": "xnr", + "speakers": 2121744, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "IN": 2121744 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Afar", + "bcp_47": "aa", + "speakers": 2119663, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "aa", + "population": { + "DJ": 387158, + "ER": 218923, + "ET": 1513582 + }, + "language_family": "Afro-Asiatic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Teso", + "bcp_47": "teo", + "speakers": 2082973, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "KE": 396106, + "UG": 1686867 + }, + "language_family": "Nilotic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Lomwe", + "bcp_47": "ngl", + "speakers": 2046678, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "MZ": 2046678 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Occitan", + "bcp_47": "oc", + "speakers": 2040398, + "scores": [], + "commonvoice_hours": 1.8, + "commonvoice_locale": "oc", + "population": { + "ES": 4952, + "FR": 2035446 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Western Balochi", + "bcp_47": "bgn", + "speakers": 2037382, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "AF": 230856, + "IR": 475570, + "PK": 1330956 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Northern Luri", + "bcp_47": "lrc", + "speakers": 2020512, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "IQ": 237123, + "IR": 1783389 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Wagdi", + "bcp_47": "wbr", + "speakers": 1989135, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "IN": 1989135 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Tulu", + "bcp_47": "tcy", + "speakers": 1989135, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "IN": 1989135 + }, + "language_family": "Dravidian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Khandesi", + "bcp_47": "khn", + "speakers": 1989135, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "IN": 1989135 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Tatar", + "bcp_47": "tt", + "speakers": 1984108, + "scores": [], + "commonvoice_hours": 32.0, + "commonvoice_locale": "tt", + "population": { + "RU": 1984108 + }, + "language_family": "Turkic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Slovenian", + "bcp_47": "sl", + "speakers": 1973181, + "scores": [], + "commonvoice_hours": 17.0, + "commonvoice_locale": "sl", + "population": { + "AT": 32780, + "HU": 4984, + "IT": 106085, + "SI": 1829332 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Makasar", + "bcp_47": "mak", + "speakers": 1949290, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "ID": 1949290 + }, + "language_family": "Austronesian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Wolaytta", + "bcp_47": "wal", + "speakers": 1946034, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "ET": 1946034 + }, + "language_family": "Ta-Ne-Omotic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Nyamwezi", + "bcp_47": "nym", + "speakers": 1932242, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "TZ": 1932242 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Bodo", + "bcp_47": "brx", + "speakers": 1856526, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "IN": 1856526 + }, + "language_family": "Sino-Tibetan", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Lampung Api", + "bcp_47": "ljp", + "speakers": 1842479, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "ID": 1842479 + }, + "language_family": "Austronesian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Chuvash", + "bcp_47": "cv", + "speakers": 1842386, + "scores": [], + "commonvoice_hours": 27.0, + "commonvoice_locale": "cv", + "population": { + "RU": 1842386 + }, + "language_family": "Turkic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Bashkir", + "bcp_47": "ba", + "speakers": 1842386, + "scores": [], + "commonvoice_hours": 259.0, + "commonvoice_locale": "ba", + "population": { + "RU": 1842386 + }, + "language_family": "Turkic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Rohingya", + "bcp_47": "rhg", + "speakers": 1824082, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "BD": 862050, + "MM": 962032 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Mende", + "bcp_47": "men", + "speakers": 1813083, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "LR": 24352, + "SL": 1788731 + }, + "language_family": "Mande", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Tumbuka", + "bcp_47": "tum", + "speakers": 1780514, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "MW": 1780514 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Tamashek", + "bcp_47": "tmh", + "speakers": 1776965, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "ML": 410621, + "NE": 1366344 + }, + "language_family": "Afro-Asiatic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "North Ndebele", + "bcp_47": "nd", + "speakers": 1745556, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "nd", + "population": { + "ZW": 1745556 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Masai", + "bcp_47": "mas", + "speakers": 1734738, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "KE": 856446, + "TZ": 878292 + }, + "language_family": "Nilotic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Serer", + "bcp_47": "srr", + "speakers": 1731004, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "SN": 1731004 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Nimadi", + "bcp_47": "noe", + "speakers": 1723917, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "IN": 1723917 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Timne", + "bcp_47": "tem", + "speakers": 1722482, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "SL": 1722482 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Scots", + "bcp_47": "sco", + "speakers": 1644028, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "sco", + "population": { + "GB": 1644028 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Lango (Uganda)", + "bcp_47": "laj", + "speakers": 1643614, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "UG": 1643614 + }, + "language_family": "Nilotic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Domari", + "bcp_47": "rmt", + "speakers": 1613543, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "IR": 1613543 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Macedonian", + "bcp_47": "mk", + "speakers": 1608565, + "scores": [], + "commonvoice_hours": 18.0, + "commonvoice_locale": "mk", + "population": { + "AL": 14451, + "GR": 169714, + "MK": 1424400 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Acoli", + "bcp_47": "ach", + "speakers": 1600361, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "UG": 1600361 + }, + "language_family": "Nilotic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Central-Eastern Niger Fulfulde", + "bcp_47": "fuq", + "speakers": 1594068, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "NE": 1594068 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Bhili", + "bcp_47": "bhb", + "speakers": 1591308, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "IN": 1591308 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Pangasinan", + "bcp_47": "pag", + "speakers": 1528534, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "PH": 1528534 + }, + "language_family": "Austronesian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Kongo", + "bcp_47": "kg", + "speakers": 1526700, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "CD": 1526700 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Bini", + "bcp_47": "bin", + "speakers": 1519599, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "NG": 1519599 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Maasina Fulfulde", + "bcp_47": "ffm", + "speakers": 1505612, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "ML": 1505612 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Manipuri", + "bcp_47": "mni", + "speakers": 1476591, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "mni", + "population": { + "BD": 17892, + "IN": 1458699 + }, + "language_family": "Sino-Tibetan", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Abron", + "bcp_47": "abr", + "speakers": 1467010, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "GH": 1467010 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Makonde", + "bcp_47": "kde", + "speakers": 1463820, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "TZ": 1463820 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Gheg Albanian", + "bcp_47": "aln", + "speakers": 1430250, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "aln", + "population": { + "XK": 1430250 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Venda", + "bcp_47": "ve", + "speakers": 1391759, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "ve", + "population": { + "ZA": 1298663, + "ZW": 93096 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Sena", + "bcp_47": "seh", + "speakers": 1384517, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "MZ": 1384517 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Venetian", + "bcp_47": "vec", + "speakers": 1380829, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "vec", + "population": { + "BR": 508118, + "HR": 29594, + "IT": 811235, + "MX": 2444, + "SI": 29438 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Susu", + "bcp_47": "sus", + "speakers": 1378014, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "GN": 1378014 + }, + "language_family": "Mande", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Norwegian Nynorsk", + "bcp_47": "nn", + "speakers": 1366860, + "scores": [], + "commonvoice_hours": 1.5, + "commonvoice_locale": "nn-NO", + "population": { + "NO": 1366860 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Makhuwa-Meetto", + "bcp_47": "mgh", + "speakers": 1354419, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "MZ": 1354419 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Rajasthani", + "bcp_47": "raj", + "speakers": 1326090, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "IN": 1326090 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Ho", + "bcp_47": "hoc", + "speakers": 1312829, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "IN": 1312829 + }, + "language_family": "Austroasiatic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Maguindanaon", + "bcp_47": "mdh", + "speakers": 1310172, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "PH": 1310172 + }, + "language_family": "Austronesian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Mewari", + "bcp_47": "mtr", + "speakers": 1286307, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "IN": 1286307 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Bulu", + "bcp_47": "bum", + "speakers": 1276270, + "scores": [], + "commonvoice_hours": 9.5, + "commonvoice_locale": "bum", + "population": { + "CM": 1276270 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Masaaba", + "bcp_47": "myx", + "speakers": 1254337, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "UG": 1254337 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Mundari", + "bcp_47": "unr", + "speakers": 1252287, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "IN": 1246525, + "NP": 5762 + }, + "language_family": "Austroasiatic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Morisyen", + "bcp_47": "mfe", + "speakers": 1241433, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "MU": 1241433 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Irish", + "bcp_47": "ga", + "speakers": 1237487, + "scores": [], + "commonvoice_hours": 5.8, + "commonvoice_locale": "ga-IE", + "population": { + "GB": 98642, + "IE": 1138845 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Fur", + "bcp_47": "fvr", + "speakers": 1230163, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "SD": 1230163 + }, + "language_family": "Furan", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Rejang", + "bcp_47": "rej", + "speakers": 1228320, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "ID": 1228320 + }, + "language_family": "Austronesian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Bhilali", + "bcp_47": "bhi", + "speakers": 1220003, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "IN": 1220003 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Tausug", + "bcp_47": "tsg", + "speakers": 1200991, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "PH": 1200991 + }, + "language_family": "Austronesian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Kʼicheʼ", + "bcp_47": "quc", + "speakers": 1200731, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "quc", + "population": { + "GT": 1200731 + }, + "language_family": "Mayan", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Bakhtiari", + "bcp_47": "bqi", + "speakers": 1188926, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "IR": 1188926 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Kpelle", + "bcp_47": "kpe", + "speakers": 1186303, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "GN": 476041, + "LR": 710262 + }, + "language_family": "Mande", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Cebaara Senoufo", + "bcp_47": "sef", + "speakers": 1181687, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "CI": 1181687 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Northern Khmer", + "bcp_47": "kxm", + "speakers": 1172616, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "TH": 1172616 + }, + "language_family": "Austroasiatic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "West Flemish", + "bcp_47": "vls", + "speakers": 1172070, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "BE": 1172070 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Soninke", + "bcp_47": "snk", + "speakers": 1153651, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "snk", + "population": { + "ML": 1153651 + }, + "language_family": "Mande", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Zaza", + "bcp_47": "zza", + "speakers": 1148245, + "scores": [], + "commonvoice_hours": 1.8, + "commonvoice_locale": "zza", + "population": { + "TR": 1148245 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Latvian", + "bcp_47": "lv", + "speakers": 1147550, + "scores": [], + "commonvoice_hours": 260.0, + "commonvoice_locale": "lv", + "population": { + "LV": 1147550 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Dan", + "bcp_47": "dnj", + "speakers": 1099244, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "CI": 1099244 + }, + "language_family": "Mande", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Gorontalo", + "bcp_47": "gor", + "speakers": 1094807, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "ID": 1094807 + }, + "language_family": "Austronesian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Tigre", + "bcp_47": "tig", + "speakers": 1094616, + "scores": [], + "commonvoice_hours": 2.2, + "commonvoice_locale": "tig", + "population": { + "ER": 1094616 + }, + "language_family": "Afro-Asiatic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Basque", + "bcp_47": "eu", + "speakers": 1088519, + "scores": [], + "commonvoice_hours": 335.0, + "commonvoice_locale": "eu", + "population": { + "ES": 1000316, + "FR": 88203 + }, + "language_family": null, + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Hadothi", + "bcp_47": "hoj", + "speakers": 1087394, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "IN": 1087394 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Kabardian", + "bcp_47": "kbd", + "speakers": 1070873, + "scores": [], + "commonvoice_hours": 15.0, + "commonvoice_locale": "kbd", + "population": { + "RU": 439338, + "TR": 631535 + }, + "language_family": "Abkhaz-Adyge", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Khasi", + "bcp_47": "kha", + "speakers": 1060872, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "IN": 1060872 + }, + "language_family": "Austroasiatic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Sardinian", + "bcp_47": "sc", + "speakers": 1060846, + "scores": [], + "commonvoice_hours": 2.9, + "commonvoice_locale": "sc", + "population": { + "IT": 1060846 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Lozi", + "bcp_47": "loz", + "speakers": 1045596, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "ZM": 1045596 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Frafra", + "bcp_47": "gur", + "speakers": 1026907, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "GH": 1026907 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Najdi Arabic", + "bcp_47": "ars", + "speakers": 1025205, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "SA": 1025205 + }, + "language_family": "Afro-Asiatic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Ronga", + "bcp_47": "rng", + "speakers": 1023339, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "MZ": 1023339 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Southern Luri", + "bcp_47": "luz", + "speakers": 1019080, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "IR": 1019080 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Newari", + "bcp_47": "new", + "speakers": 1000821, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "new", + "population": { + "NP": 1000821 + }, + "language_family": "Sino-Tibetan", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Talysh", + "bcp_47": "tly", + "speakers": 1000168, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "AZ": 1000168 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Yiddish", + "bcp_47": "yi", + "speakers": 997214, + "scores": [], + "commonvoice_hours": 0.5, + "commonvoice_locale": "yi", + "population": { + "IL": 260264, + "SE": 2959, + "UA": 570998, + "US": 162993 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Bena", + "bcp_47": "bez", + "speakers": 995398, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "TZ": 995398 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Shambala", + "bcp_47": "ksb", + "speakers": 995398, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "TZ": 995398 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Kachhi", + "bcp_47": "kfr", + "speakers": 994568, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "IN": 994568 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Ngaju", + "bcp_47": "nij", + "speakers": 987996, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "ID": 987996 + }, + "language_family": "Austronesian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Kita Maninkakan", + "bcp_47": "mwk", + "speakers": 977670, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "ML": 977670 + }, + "language_family": "Mande", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Jumli", + "bcp_47": "jml", + "speakers": 970493, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "NP": 970493 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Central Okinawan", + "bcp_47": "ryu", + "speakers": 966404, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "JP": 966404 + }, + "language_family": "Japonic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Mon", + "bcp_47": "mnw", + "speakers": 966114, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "MM": 848852, + "TH": 117262 + }, + "language_family": "Austroasiatic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Chimborazo Highland Quichua", + "bcp_47": "qug", + "speakers": 963579, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "EC": 963579 + }, + "language_family": "Quechuan", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Kachin", + "bcp_47": "kac", + "speakers": 962032, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "MM": 962032 + }, + "language_family": "Sino-Tibetan", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Southern Hindko", + "bcp_47": "hnd", + "speakers": 957354, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "PK": 957354 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Limburgish", + "bcp_47": "li", + "speakers": 950422, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "NL": 950422 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Manyika", + "bcp_47": "mxc", + "speakers": 945510, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "ZW": 945510 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Chechen", + "bcp_47": "ce", + "speakers": 935365, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "RU": 935365 + }, + "language_family": "Nakh-Daghestanian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Kuanyama", + "bcp_47": "kj", + "speakers": 920524, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "NA": 920524 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "South Ndebele", + "bcp_47": "nr", + "speakers": 903418, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "nr", + "population": { + "ZA": 903418 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Welsh", + "bcp_47": "cy", + "speakers": 884910, + "scores": [], + "commonvoice_hours": 124.0, + "commonvoice_locale": "cy", + "population": { + "AR": 30016, + "GB": 854894 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Adangme", + "bcp_47": "ada", + "speakers": 880206, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "GH": 880206 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Estonian", + "bcp_47": "et", + "speakers": 878449, + "scores": [], + "commonvoice_hours": 58.0, + "commonvoice_locale": "et", + "population": { + "EE": 872320, + "FI": 6129 + }, + "language_family": "Uralic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Parsi-Dari", + "bcp_47": "prd", + "speakers": 864342, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "AF": 439726, + "IR": 424616 + }, + "language_family": "Bookkeeping", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Yucateco", + "bcp_47": "yua", + "speakers": 861955, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "MX": 861955 + }, + "language_family": "Mayan", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Ewondo", + "bcp_47": "ewo", + "speakers": 860095, + "scores": [], + "commonvoice_hours": 19.0, + "commonvoice_locale": "ewo", + "population": { + "CM": 860095 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Komering", + "bcp_47": "kge", + "speakers": 854483, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "ID": 854483 + }, + "language_family": "Austronesian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Tooro", + "bcp_47": "ttj", + "speakers": 821807, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "UG": 821807 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Garo", + "bcp_47": "grt", + "speakers": 821563, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "BD": 118735, + "IN": 702828 + }, + "language_family": "Sino-Tibetan", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Ga", + "bcp_47": "gaa", + "speakers": 821526, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "GH": 821526 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Mbunga", + "bcp_47": "mgy", + "speakers": 819739, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "TZ": 819739 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Tetum", + "bcp_47": "tet", + "speakers": 816395, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "TL": 816395 + }, + "language_family": "Austronesian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Iban", + "bcp_47": "iba", + "speakers": 816302, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "MY": 816302 + }, + "language_family": "Bookkeeping", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Embu", + "bcp_47": "ebu", + "speakers": 802918, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "KE": 802918 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Swabian", + "bcp_47": "swg", + "speakers": 801597, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "DE": 801597 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Hmong Njua", + "bcp_47": "hnj", + "speakers": 781687, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "AU": 2190, + "CN": 55761, + "FR": 128912, + "GF": 4788, + "LA": 223422, + "MM": 12450, + "SR": 2316, + "TH": 67598, + "US": 116424, + "VN": 167826 + }, + "language_family": "Hmong-Mien", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Kalanga", + "bcp_47": "kck", + "speakers": 770954, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "ZW": 770954 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Dotyali", + "bcp_47": "dty", + "speakers": 758198, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "NP": 758198 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Picard", + "bcp_47": "pcd", + "speakers": 746330, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "FR": 746330 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Western Frisian", + "bcp_47": "fy", + "speakers": 743057, + "scores": [], + "commonvoice_hours": 66.0, + "commonvoice_locale": "fy-NL", + "population": { + "NL": 743057 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Chakma", + "bcp_47": "ccp", + "speakers": 729137, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "BD": 357832, + "IN": 371305 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Yao", + "bcp_47": "yao", + "speakers": 722357, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "MZ": 722357 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Uab Meto", + "bcp_47": "aoz", + "speakers": 720970, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "ID": 720970 + }, + "language_family": "Austronesian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Capiznon", + "bcp_47": "cps", + "speakers": 720595, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "PH": 720595 + }, + "language_family": "Austronesian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Asu", + "bcp_47": "asa", + "speakers": 702634, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "TZ": 702634 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Tai Dam", + "bcp_47": "blt", + "speakers": 681177, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "VN": 681177 + }, + "language_family": "Tai-Kadai", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Walloon", + "bcp_47": "wa", + "speakers": 679801, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "BE": 679801 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Koyraboro Senni", + "bcp_47": "ses", + "speakers": 664816, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "ML": 664816 + }, + "language_family": "Songhay", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Bagheli", + "bcp_47": "bfy", + "speakers": 654424, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "IN": 490653, + "NP": 163771 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Asturian", + "bcp_47": "ast", + "speakers": 650205, + "scores": [], + "commonvoice_hours": 0.8, + "commonvoice_locale": "ast", + "population": { + "ES": 650205 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Laki", + "bcp_47": "lki", + "speakers": 645417, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "IR": 645417 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Munda", + "bcp_47": "unx", + "speakers": 636523, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "IN": 636523 + }, + "language_family": "Bookkeeping", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Lisu", + "bcp_47": "lis", + "speakers": 627309, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "CN": 627309 + }, + "language_family": "Sino-Tibetan", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "N’Ko", + "bcp_47": "nqo", + "speakers": 626370, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "nqo", + "population": { + "GN": 626370 + }, + "language_family": "Artificial Language", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Gronings", + "bcp_47": "gos", + "speakers": 622094, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "gos", + "population": { + "NL": 622094 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Mongo", + "bcp_47": "lol", + "speakers": 620858, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "CD": 620858 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Dangaura Tharu", + "bcp_47": "thl", + "speakers": 606558, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "NP": 606558 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Neapolitan", + "bcp_47": "nap", + "speakers": 605306, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "IT": 605306 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Nuer", + "bcp_47": "nus", + "speakers": 591427, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "SS": 591427 + }, + "language_family": "Nilotic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Breton", + "bcp_47": "br", + "speakers": 563140, + "scores": [], + "commonvoice_hours": 27.0, + "commonvoice_locale": "br", + "population": { + "FR": 563140 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Pijin", + "bcp_47": "pis", + "speakers": 561780, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "SB": 561780 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Réunion Creole French", + "bcp_47": "rcf", + "speakers": 559185, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "RE": 559185 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Avaric", + "bcp_47": "av", + "speakers": 552716, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "RU": 552716 + }, + "language_family": "Nakh-Daghestanian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Ndonga", + "bcp_47": "ng", + "speakers": 552315, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "NA": 552315 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Ossetic", + "bcp_47": "os", + "speakers": 541444, + "scores": [], + "commonvoice_hours": 0.7, + "commonvoice_locale": "os", + "population": { + "GE": 87934, + "RU": 453510 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Udmurt", + "bcp_47": "udm", + "speakers": 538544, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "udm", + "population": { + "RU": 538544 + }, + "language_family": "Uralic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Ligurian", + "bcp_47": "lij", + "speakers": 536663, + "scores": [], + "commonvoice_hours": 5.1, + "commonvoice_locale": "lij", + "population": { + "IT": 536663 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Kabuverdianu", + "bcp_47": "kea", + "speakers": 530762, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "CV": 530762 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Rusyn", + "bcp_47": "rue", + "speakers": 527075, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "UA": 527075 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Mari", + "bcp_47": "chm", + "speakers": 524371, + "scores": [], + "commonvoice_hours": 282.0, + "commonvoice_locale": "mhr", + "population": { + "RU": 524371 + }, + "language_family": "Uralic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Sicilian", + "bcp_47": "scn", + "speakers": 511702, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "scn", + "population": { + "IT": 511702 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Langi", + "bcp_47": "lag", + "speakers": 509409, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "TZ": 509409 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Balti", + "bcp_47": "bft", + "speakers": 502520, + "scores": [], + "commonvoice_hours": 18.0, + "commonvoice_locale": "bft", + "population": { + "IN": 82218, + "PK": 420302 + }, + "language_family": "Sino-Tibetan", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Eastern Huasteca Nahuatl", + "bcp_47": "nhe", + "speakers": 501735, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "nhe", + "population": { + "MX": 501735 + }, + "language_family": "Uto-Aztecan", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Western Huasteca Nahuatl", + "bcp_47": "nhw", + "speakers": 501735, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "MX": 501735 + }, + "language_family": "Uto-Aztecan", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Silesian", + "bcp_47": "szl", + "speakers": 497670, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "PL": 497670 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Kara-Kalpak", + "bcp_47": "kaa", + "speakers": 489046, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "kaa", + "population": { + "UZ": 489046 + }, + "language_family": "Turkic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Gujari", + "bcp_47": "gju", + "speakers": 467002, + "scores": [], + "commonvoice_hours": 11.0, + "commonvoice_locale": "gju", + "population": { + "PK": 467002 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Sirmauri", + "bcp_47": "srx", + "speakers": 464132, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "IN": 464132 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Maltese", + "bcp_47": "mt", + "speakers": 457267, + "scores": [], + "commonvoice_hours": 8.7, + "commonvoice_locale": "mt", + "population": { + "MT": 457267 + }, + "language_family": "Afro-Asiatic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Bantawa", + "bcp_47": "bap", + "speakers": 454918, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "NP": 454918 + }, + "language_family": "Sino-Tibetan", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Yakut", + "bcp_47": "sah", + "speakers": 453510, + "scores": [], + "commonvoice_hours": 8.5, + "commonvoice_locale": "sah", + "population": { + "RU": 453510 + }, + "language_family": "Turkic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Masalit", + "bcp_47": "mls", + "speakers": 451060, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "SD": 451060 + }, + "language_family": "Maban", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Jju", + "bcp_47": "kaj", + "speakers": 449459, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "NG": 449459 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Adyghe", + "bcp_47": "ady", + "speakers": 444583, + "scores": [], + "commonvoice_hours": 11.0, + "commonvoice_locale": "ady", + "population": { + "RU": 124715, + "TR": 319868 + }, + "language_family": "Abkhaz-Adyge", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Yemba", + "bcp_47": "ybb", + "speakers": 443920, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "CM": 443920 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Mingrelian", + "bcp_47": "xmf", + "speakers": 439670, + "scores": [], + "commonvoice_hours": 9.1, + "commonvoice_locale": "xmf", + "population": { + "GE": 439670 + }, + "language_family": "Kartvelian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Erzya", + "bcp_47": "myv", + "speakers": 439338, + "scores": [], + "commonvoice_hours": 3.8, + "commonvoice_locale": "myv", + "population": { + "RU": 439338 + }, + "language_family": "Uralic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Taita", + "bcp_47": "dav", + "speakers": 438929, + "scores": [], + "commonvoice_hours": 9.3, + "commonvoice_locale": "dav", + "population": { + "KE": 438929 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Central Mazahua", + "bcp_47": "maz", + "speakers": 437410, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "MX": 437410 + }, + "language_family": "Otomanguean", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Vunjo", + "bcp_47": "vun", + "speakers": 433291, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "TZ": 433291 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Rombo", + "bcp_47": "rof", + "speakers": 433291, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "TZ": 433291 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Machame", + "bcp_47": "jmc", + "speakers": 433291, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "TZ": 433291 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Khmu", + "bcp_47": "kjg", + "speakers": 431949, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "LA": 431949 + }, + "language_family": "Austroasiatic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Fang", + "bcp_47": "fan", + "speakers": 426451, + "scores": [], + "commonvoice_hours": 9.3, + "commonvoice_locale": "fan", + "population": { + "GQ": 426451 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Kinaray-a", + "bcp_47": "krj", + "speakers": 425806, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "PH": 425806 + }, + "language_family": "Austronesian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Kuy", + "bcp_47": "kdt", + "speakers": 421207, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "KH": 18620, + "LA": 71495, + "TH": 331092 + }, + "language_family": "Austroasiatic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Luxembourgish", + "bcp_47": "lb", + "speakers": 421015, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "lb", + "population": { + "LU": 421015 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Sranan Tongo", + "bcp_47": "srn", + "speakers": 414507, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "SR": 414507 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Jola-Fonyi", + "bcp_47": "dyo", + "speakers": 409146, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "SN": 409146 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Western Tamang", + "bcp_47": "tdg", + "speakers": 394263, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "NP": 394263 + }, + "language_family": "Sino-Tibetan", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Pontic", + "bcp_47": "pnt", + "speakers": 392463, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "GR": 392463 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Negeri Sembilan Malay", + "bcp_47": "zmi", + "speakers": 391825, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "MY": 391825 + }, + "language_family": "Austronesian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Ngiemboon", + "bcp_47": "nnh", + "speakers": 388430, + "scores": [], + "commonvoice_hours": 23.0, + "commonvoice_locale": "nnh", + "population": { + "CM": 388430 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Ghomala", + "bcp_47": "bbj", + "speakers": 388430, + "scores": [], + "commonvoice_hours": 13.0, + "commonvoice_locale": "bbj", + "population": { + "CM": 388430 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Divehi", + "bcp_47": "dv", + "speakers": 388044, + "scores": [], + "commonvoice_hours": 39.0, + "commonvoice_locale": "dv", + "population": { + "IN": 3978, + "MV": 384066 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Saurashtra", + "bcp_47": "saz", + "speakers": 384566, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "IN": 384566 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Fiji Hindi", + "bcp_47": "hif", + "speakers": 383749, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "FJ": 383749 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Nobiin", + "bcp_47": "fia", + "speakers": 378161, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "SD": 378161 + }, + "language_family": "Nubian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Balkan Gagauz Turkish", + "bcp_47": "bgx", + "speakers": 377280, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "TR": 377280 + }, + "language_family": "Turkic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Kerinci", + "bcp_47": "kvr", + "speakers": 373836, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "ID": 373836 + }, + "language_family": "Austronesian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Parkari Koli", + "bcp_47": "kvx", + "speakers": 373602, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "PK": 373602 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Dzongkha", + "bcp_47": "dz", + "speakers": 370341, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "BT": 367689, + "IN": 2652 + }, + "language_family": "Bookkeeping", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Pökoot", + "bcp_47": "pko", + "speakers": 369343, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "KE": 369343 + }, + "language_family": "Nilotic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Dargwa", + "bcp_47": "dar", + "speakers": 368477, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "dar", + "population": { + "RU": 368477 + }, + "language_family": "Nakh-Daghestanian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Limbu", + "bcp_47": "lif", + "speakers": 368085, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "IN": 34478, + "NP": 333607 + }, + "language_family": "Sino-Tibetan", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Fijian", + "bcp_47": "fj", + "speakers": 365030, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "FJ": 365030 + }, + "language_family": "Austronesian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Rana Tharu", + "bcp_47": "thr", + "speakers": 363935, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "NP": 363935 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Kom", + "bcp_47": "bkm", + "speakers": 360685, + "scores": [], + "commonvoice_hours": 13.0, + "commonvoice_locale": "bkm", + "population": { + "CM": 360685 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Icelandic", + "bcp_47": "is", + "speakers": 350734, + "scores": [], + "commonvoice_hours": 0.1, + "commonvoice_locale": "is", + "population": { + "IS": 350734 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Khowar", + "bcp_47": "khw", + "speakers": 350252, + "scores": [], + "commonvoice_hours": 18.0, + "commonvoice_locale": "khw", + "population": { + "PK": 350252 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Tolaki", + "bcp_47": "lbw", + "speakers": 347134, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "ID": 347134 + }, + "language_family": "Austronesian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Naxi", + "bcp_47": "nxq", + "speakers": 334565, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "CN": 334565 + }, + "language_family": "Sino-Tibetan", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Eastern Magar", + "bcp_47": "mgp", + "speakers": 333607, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "NP": 333607 + }, + "language_family": "Sino-Tibetan", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Bamun", + "bcp_47": "bax", + "speakers": 332940, + "scores": [], + "commonvoice_hours": 11.0, + "commonvoice_locale": "bax", + "population": { + "CM": 332940 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Basaa", + "bcp_47": "bas", + "speakers": 332940, + "scores": [], + "commonvoice_hours": 12.0, + "commonvoice_locale": "bas", + "population": { + "CM": 332940 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Koyra Chiini", + "bcp_47": "khq", + "speakers": 332408, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "ML": 332408 + }, + "language_family": "Songhay", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Indus Kohistani", + "bcp_47": "mvy", + "speakers": 326901, + "scores": [], + "commonvoice_hours": 23.0, + "commonvoice_locale": "mvy", + "population": { + "PK": 326901 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Gayo", + "bcp_47": "gay", + "speakers": 320431, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "ID": 320431 + }, + "language_family": "Austronesian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Ngazidja Comorian", + "bcp_47": "zdj", + "speakers": 313124, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "KM": 313124 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Buriat", + "bcp_47": "bua", + "speakers": 311788, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "bxr", + "population": { + "RU": 311788 + }, + "language_family": "Mongolic-Khitan", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Rinconada Bikol", + "bcp_47": "bto", + "speakers": 305707, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "PH": 305707 + }, + "language_family": "Austronesian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Medumba", + "bcp_47": "byv", + "speakers": 305195, + "scores": [], + "commonvoice_hours": 14.0, + "commonvoice_locale": "byv", + "population": { + "CM": 305195 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Ao Naga", + "bcp_47": "njo", + "speakers": 305001, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "IN": 305001 + }, + "language_family": "Sino-Tibetan", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Badaga", + "bcp_47": "bfq", + "speakers": 305001, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "IN": 305001 + }, + "language_family": "Dravidian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Kochila Tharu", + "bcp_47": "thq", + "speakers": 303279, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "NP": 303279 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Moksha", + "bcp_47": "mdf", + "speakers": 297616, + "scores": [], + "commonvoice_hours": 0.5, + "commonvoice_locale": "mdf", + "population": { + "RU": 297616 + }, + "language_family": "Uralic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Tae'", + "bcp_47": "rob", + "speakers": 293729, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "ID": 293729 + }, + "language_family": "Austronesian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Nzima", + "bcp_47": "nzi", + "speakers": 293402, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "GH": 293402 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Nama", + "bcp_47": "naq", + "speakers": 289308, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "NA": 289308 + }, + "language_family": "Khoe-Kwadi", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Ndzwani Comorian", + "bcp_47": "wni", + "speakers": 287736, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "KM": 287736 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Kumyk", + "bcp_47": "kum", + "speakers": 283444, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "RU": 283444 + }, + "language_family": "Turkic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Mundang", + "bcp_47": "mua", + "speakers": 277450, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "CM": 277450 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Mapuche", + "bcp_47": "arn", + "speakers": 272802, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "arn", + "population": { + "CL": 272802 + }, + "language_family": "Araucanian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Western Cham", + "bcp_47": "cja", + "speakers": 270832, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "KH": 270832 + }, + "language_family": "Austronesian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Bislama", + "bcp_47": "bi", + "speakers": 268500, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "VU": 268500 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Lü", + "bcp_47": "khb", + "speakers": 264864, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "CN": 264864 + }, + "language_family": "Tai-Kadai", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Tai Nüa", + "bcp_47": "tdd", + "speakers": 264864, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "CN": 264864 + }, + "language_family": "Tai-Kadai", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Wadiyara Koli", + "bcp_47": "kxp", + "speakers": 256851, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "PK": 256851 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Kachi Koli", + "bcp_47": "gjk", + "speakers": 256851, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "PK": 256851 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Lezghian", + "bcp_47": "lez", + "speakers": 255100, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "RU": 255100 + }, + "language_family": "Nakh-Daghestanian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Komi", + "bcp_47": "kv", + "speakers": 255100, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "kpv", + "population": { + "RU": 255100 + }, + "language_family": "Uralic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Samoan", + "bcp_47": "sm", + "speakers": 252717, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "AS": 48943, + "WS": 203774 + }, + "language_family": "Austronesian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Western Magar", + "bcp_47": "mrd", + "speakers": 251722, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "NP": 251722 + }, + "language_family": "Sino-Tibetan", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Samburu", + "bcp_47": "saq", + "speakers": 246228, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "KE": 246228 + }, + "language_family": "Nilotic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Crimean Tatar", + "bcp_47": "crh", + "speakers": 245968, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "crh", + "population": { + "UA": 245968 + }, + "language_family": "Turkic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Mandar", + "bcp_47": "mdr", + "speakers": 245664, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "ID": 245664 + }, + "language_family": "Austronesian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Sangir", + "bcp_47": "sxn", + "speakers": 245664, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "ID": 245664 + }, + "language_family": "Austronesian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Extremaduran", + "bcp_47": "ext", + "speakers": 245077, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "ES": 245077 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Central Huasteca Nahuatl", + "bcp_47": "nch", + "speakers": 244435, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "MX": 244435 + }, + "language_family": "Uto-Aztecan", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Zeelandic", + "bcp_47": "zea", + "speakers": 241926, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "NL": 241926 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Karachay-Balkar", + "bcp_47": "krc", + "speakers": 240927, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "krc", + "population": { + "RU": 240927 + }, + "language_family": "Turkic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Colognian", + "bcp_47": "ksh", + "speakers": 240479, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "DE": 240479 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Herero", + "bcp_47": "hz", + "speakers": 239336, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "NA": 239336 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Saafi-Saafi", + "bcp_47": "sav", + "speakers": 236046, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "SN": 236046 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Zaghawa", + "bcp_47": "zag", + "speakers": 232364, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "SD": 232364 + }, + "language_family": "Saharan", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Ingush", + "bcp_47": "inh", + "speakers": 226755, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "RU": 226755 + }, + "language_family": "Nakh-Daghestanian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Saho", + "bcp_47": "ssy", + "speakers": 218923, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "ER": 218923 + }, + "language_family": "Afro-Asiatic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Tomo Kan Dogon", + "bcp_47": "dtm", + "speakers": 215087, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "ML": 215087 + }, + "language_family": "Dogon", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Papiamento", + "bcp_47": "pap", + "speakers": 211640, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "pap-AW", + "population": { + "AW": 72851, + "BQ": 16200, + "CW": 122589 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Syriac", + "bcp_47": "syr", + "speakers": 210659, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "syr", + "population": { + "IQ": 194364, + "SY": 16295 + }, + "language_family": "Afro-Asiatic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Nyasa Tonga", + "bcp_47": "tog", + "speakers": 207727, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "MW": 207727 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Mafa", + "bcp_47": "maf", + "speakers": 205313, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "CM": 205313 + }, + "language_family": "Afro-Asiatic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Punu", + "bcp_47": "puu", + "speakers": 200782, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "GA": 200782 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Tyap", + "bcp_47": "kcg", + "speakers": 199046, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "NG": 199046 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Xaasongaxango", + "bcp_47": "kao", + "speakers": 195534, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "ML": 195534 + }, + "language_family": "Mande", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Tuvinian", + "bcp_47": "tyv", + "speakers": 184239, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "tyv", + "population": { + "RU": 184239 + }, + "language_family": "Turkic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Central Dusun", + "bcp_47": "dtp", + "speakers": 182852, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "MY": 182852 + }, + "language_family": "Austronesian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Riang (India)", + "bcp_47": "ria", + "speakers": 172392, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "IN": 172392 + }, + "language_family": "Sino-Tibetan", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Comorian", + "bcp_47": "swb", + "speakers": 170720, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "YT": 170720 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Bomu", + "bcp_47": "bmq", + "speakers": 168159, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "ML": 168159 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Latgalian", + "bcp_47": "ltg", + "speakers": 167429, + "scores": [], + "commonvoice_hours": 28.0, + "commonvoice_locale": "ltg", + "population": { + "LV": 167429 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Navajo", + "bcp_47": "nv", + "speakers": 166320, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "US": 166320 + }, + "language_family": "Athabaskan-Eyak-Tlingit", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Jenaama Bozo", + "bcp_47": "bze", + "speakers": 166204, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "ML": 166204 + }, + "language_family": "Mande", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Corsican", + "bcp_47": "co", + "speakers": 162836, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "co", + "population": { + "FR": 162836 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Bafut", + "bcp_47": "bfd", + "speakers": 158146, + "scores": [], + "commonvoice_hours": 11.0, + "commonvoice_locale": "bfd", + "population": { + "CM": 158146 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Sherpa", + "bcp_47": "xsr", + "speakers": 157705, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "NP": 157705 + }, + "language_family": "Sino-Tibetan", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Kirmanjki", + "bcp_47": "kiu", + "speakers": 155833, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "TR": 155833 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Hiri Motu", + "bcp_47": "ho", + "speakers": 152449, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "PG": 152449 + }, + "language_family": "Pidgin", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Kako", + "bcp_47": "kkj", + "speakers": 149823, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "CM": 149823 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Akoose", + "bcp_47": "bss", + "speakers": 149823, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "CM": 149823 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Selayar", + "bcp_47": "sly", + "speakers": 144194, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "ID": 144194 + }, + "language_family": "Austronesian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Māori", + "bcp_47": "mi", + "speakers": 137913, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "NZ": 137913 + }, + "language_family": "Austronesian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Rajbanshi", + "bcp_47": "rjs", + "speakers": 133443, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "NP": 133443 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Duala", + "bcp_47": "dua", + "speakers": 133176, + "scores": [], + "commonvoice_hours": 14.0, + "commonvoice_locale": "dua", + "population": { + "CM": 133176 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Wayuu", + "bcp_47": "guc", + "speakers": 132529, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "guc", + "population": { + "CO": 132529 + }, + "language_family": "Arawakan", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Vai", + "bcp_47": "vai", + "speakers": 131906, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "LR": 131906 + }, + "language_family": "Mande", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Eastern Tamang", + "bcp_47": "taj", + "speakers": 130410, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "NP": 130410 + }, + "language_family": "Sino-Tibetan", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Metaʼ", + "bcp_47": "mgo", + "speakers": 130401, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "CM": 130401 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Pennsylvania German", + "bcp_47": "pdc", + "speakers": 129729, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "US": 129729 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Rwa", + "bcp_47": "rwk", + "speakers": 128816, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "TZ": 128816 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Torwali", + "bcp_47": "trw", + "speakers": 123756, + "scores": [], + "commonvoice_hours": 18.0, + "commonvoice_locale": "trw", + "population": { + "PK": 123756 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Mandjak", + "bcp_47": "mfv", + "speakers": 121170, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "SN": 121170 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Tshangla", + "bcp_47": "tsj", + "speakers": 117348, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "BT": 117348 + }, + "language_family": "Sino-Tibetan", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Sangu", + "bcp_47": "sbp", + "speakers": 117106, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "TZ": 117106 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Karelian", + "bcp_47": "krl", + "speakers": 116212, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "RU": 116212 + }, + "language_family": "Uralic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Ladino", + "bcp_47": "lad", + "speakers": 112781, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "IL": 112781 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Ifè", + "bcp_47": "ife", + "speakers": 111910, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "TG": 111910 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Gagauz", + "bcp_47": "gag", + "speakers": 111028, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "MD": 111028 + }, + "language_family": "Turkic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Lak", + "bcp_47": "lbe", + "speakers": 110543, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "RU": 110543 + }, + "language_family": "Nakh-Daghestanian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Sassarese Sardinian", + "bcp_47": "sdc", + "speakers": 106085, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "IT": 106085 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Tongan", + "bcp_47": "to", + "speakers": 100790, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "TO": 100790 + }, + "language_family": "Austronesian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Balanta-Ganja", + "bcp_47": "bjt", + "speakers": 95992, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "SN": 95992 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Ngomba", + "bcp_47": "jgo", + "speakers": 94333, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "CM": 94333 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Seselwa Creole French", + "bcp_47": "crs", + "speakers": 94061, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "SC": 94061 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Abkhazian", + "bcp_47": "ab", + "speakers": 91953, + "scores": [], + "commonvoice_hours": 68.0, + "commonvoice_locale": "ab", + "population": { + "GE": 87934, + "TR": 4019 + }, + "language_family": "Abkhaz-Adyge", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Tahitian", + "bcp_47": "ty", + "speakers": 91488, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "ty", + "population": { + "PF": 91488 + }, + "language_family": "Austronesian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Inuktitut", + "bcp_47": "iu", + "speakers": 90466, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "CA": 90466 + }, + "language_family": "Eskimo-Aleut", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Plautdietsch", + "bcp_47": "pdt", + "speakers": 90466, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "CA": 90466 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Bishnupriya", + "bcp_47": "bpy", + "speakers": 90174, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "IN": 90174 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Bafia", + "bcp_47": "ksf", + "speakers": 88784, + "scores": [], + "commonvoice_hours": 20.0, + "commonvoice_locale": "ksf", + "population": { + "CM": 88784 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Gurung", + "bcp_47": "gvr", + "speakers": 87951, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "NP": 87951 + }, + "language_family": "Sino-Tibetan", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Eastern Cham", + "bcp_47": "cjm", + "speakers": 87862, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "VN": 87862 + }, + "language_family": "Austronesian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Western Lawa", + "bcp_47": "lcp", + "speakers": 87751, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "CN": 80853, + "TH": 6898 + }, + "language_family": "Austroasiatic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Mankanya", + "bcp_47": "knf", + "speakers": 83151, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "GW": 50105, + "SN": 33046 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Lepcha", + "bcp_47": "lep", + "speakers": 79743, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "BT": 30510, + "IN": 46413, + "NP": 2820 + }, + "language_family": "Sino-Tibetan", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Blin", + "bcp_47": "byn", + "speakers": 79056, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "ER": 79056 + }, + "language_family": "Afro-Asiatic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Bateri", + "bcp_47": "btv", + "speakers": 78843, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "IN": 34478, + "PK": 44365 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Kathoriya Tharu", + "bcp_47": "tkt", + "speakers": 72787, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "NP": 72787 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Scottish Gaelic", + "bcp_47": "gd", + "speakers": 72337, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "GB": 72337 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Faroese", + "bcp_47": "fo", + "speakers": 71351, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "fo", + "population": { + "DK": 22304, + "FO": 49047 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Võro", + "bcp_47": "vro", + "speakers": 70031, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "EE": 70031 + }, + "language_family": "Uralic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Kenyang", + "bcp_47": "ken", + "speakers": 69362, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "CM": 69362 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Gilbertese", + "bcp_47": "gil", + "speakers": 67078, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "KI": 67078 + }, + "language_family": "Austronesian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Bube", + "bcp_47": "bvb", + "speakers": 66058, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "GQ": 66058 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Mentawai", + "bcp_47": "mwv", + "speakers": 64086, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "ID": 64086 + }, + "language_family": "Austronesian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Arpitan", + "bcp_47": "frp", + "speakers": 63777, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "FR": 63777 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Komi-Permyak", + "bcp_47": "koi", + "speakers": 63775, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "RU": 63775 + }, + "language_family": "Uralic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Koro", + "bcp_47": "kfo", + "speakers": 63207, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "CI": 63207 + }, + "language_family": "Mande", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Marshallese", + "bcp_47": "mh", + "speakers": 56879, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "MH": 56879 + }, + "language_family": "Austronesian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Tornedalen Finnish", + "bcp_47": "fit", + "speakers": 56114, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "SE": 56114 + }, + "language_family": "Uralic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Kalaallisut", + "bcp_47": "kl", + "speakers": 55440, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "DK": 7043, + "GL": 48397 + }, + "language_family": "Eskimo-Aleut", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Braj", + "bcp_47": "bra", + "speakers": 54370, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "IN": 54370 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Guianese Creole French", + "bcp_47": "gcr", + "speakers": 51872, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "GF": 51872 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Northern Sami", + "bcp_47": "se", + "speakers": 51530, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "FI": 2006, + "NO": 15856, + "SE": 33668 + }, + "language_family": "Uralic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Anii", + "bcp_47": "blo", + "speakers": 51507, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "BJ": 38594, + "TG": 12913 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Kaingang", + "bcp_47": "kgp", + "speakers": 50812, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "BR": 50812 + }, + "language_family": "Nuclear-Macro-Je", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Kashubian", + "bcp_47": "csb", + "speakers": 49767, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "PL": 49767 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Koro Wachi", + "bcp_47": "bqv", + "speakers": 46718, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "CI": 46718 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Chamorro", + "bcp_47": "ch", + "speakers": 46325, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "GU": 37067, + "MP": 9258 + }, + "language_family": "Austronesian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Atsam", + "bcp_47": "cch", + "speakers": 44946, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "NG": 44946 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Bushi", + "bcp_47": "buc", + "speakers": 44620, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "YT": 44620 + }, + "language_family": "Austronesian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Romansh", + "bcp_47": "rm", + "speakers": 42020, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "CH": 42020 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Aghem", + "bcp_47": "agq", + "speakers": 38843, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "CM": 38843 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Kuvi", + "bcp_47": "kxv", + "speakers": 38457, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "IN": 38457 + }, + "language_family": "Dravidian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Noon", + "bcp_47": "snf", + "speakers": 37767, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "SN": 37767 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Friulian", + "bcp_47": "fur", + "speakers": 37442, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "IT": 37442 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Thulung", + "bcp_47": "tdh", + "speakers": 36393, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "NP": 36393 + }, + "language_family": "Sino-Tibetan", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Emilian", + "bcp_47": "egl", + "speakers": 31201, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "IT": 31201 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Chuukese", + "bcp_47": "chk", + "speakers": 30731, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "FM": 30731 + }, + "language_family": "Austronesian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Western Mari", + "bcp_47": "mrj", + "speakers": 29762, + "scores": [], + "commonvoice_hours": 34.0, + "commonvoice_locale": "mrj", + "population": { + "RU": 29762 + }, + "language_family": "Uralic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Hawaiian", + "bcp_47": "haw", + "speakers": 29605, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "US": 29605 + }, + "language_family": "Austronesian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Mru", + "bcp_47": "mro", + "speakers": 29277, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "BD": 29277 + }, + "language_family": "Sino-Tibetan", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Cajun French", + "bcp_47": "frc", + "speakers": 27942, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "US": 27942 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Nheengatu", + "bcp_47": "yrl", + "speakers": 26171, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "BR": 21172, + "CO": 2994, + "VE": 2005 + }, + "language_family": "Tupian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Aragonese", + "bcp_47": "an", + "speakers": 26008, + "scores": [], + "commonvoice_hours": 13.0, + "commonvoice_locale": "an", + "population": { + "ES": 26008 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Cherokee", + "bcp_47": "chr", + "speakers": 25613, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "US": 25613 + }, + "language_family": "Iroquoian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Sinte Romani", + "bcp_47": "rmo", + "speakers": 24372, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "CH": 24372 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Ojibwa", + "bcp_47": "oj", + "speakers": 23747, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "CA": 23747 + }, + "language_family": "Algic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Pohnpeian", + "bcp_47": "pon", + "speakers": 23560, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "FM": 23560 + }, + "language_family": "Austronesian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Laz", + "bcp_47": "lzz", + "speakers": 22965, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "lzz", + "population": { + "TR": 22965 + }, + "language_family": "Kartvelian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Muslim Tat", + "bcp_47": "ttt", + "speakers": 22453, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "AZ": 22453 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Central Yupik", + "bcp_47": "esu", + "speakers": 20956, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "esu", + "population": { + "US": 20956 + }, + "language_family": "Eskimo-Aleut", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Dakota", + "bcp_47": "dak", + "speakers": 20832, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "CA": 1206, + "US": 19626 + }, + "language_family": "Siouan", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Southern Altai", + "bcp_47": "alt", + "speakers": 19841, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "RU": 19841 + }, + "language_family": "Turkic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Amo", + "bcp_47": "amo", + "speakers": 18620, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "NG": 18620 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Guajajára", + "bcp_47": "gub", + "speakers": 17784, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "BR": 17784 + }, + "language_family": "Tupian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Hanunoo", + "bcp_47": "hnn", + "speakers": 17469, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "PH": 17469 + }, + "language_family": "Austronesian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Tsakhur", + "bcp_47": "tkr", + "speakers": 16329, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "AZ": 16329 + }, + "language_family": "Nakh-Daghestanian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Palauan", + "bcp_47": "pau", + "speakers": 16047, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "PW": 16047 + }, + "language_family": "Austronesian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Sanskrit", + "bcp_47": "sa", + "speakers": 15913, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "IN": 15913 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Bassari", + "bcp_47": "bsc", + "speakers": 15264, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "SN": 15264 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Oji-Cree", + "bcp_47": "ojs", + "speakers": 15078, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "CA": 15078 + }, + "language_family": "Algic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Khamti", + "bcp_47": "kht", + "speakers": 13527, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "IN": 9283, + "MM": 4244 + }, + "language_family": "Tai-Kadai", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Upper Sorbian", + "bcp_47": "hsb", + "speakers": 12826, + "scores": [], + "commonvoice_hours": 2.9, + "commonvoice_locale": "hsb", + "population": { + "DE": 12826 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Chipewyan", + "bcp_47": "chp", + "speakers": 12816, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "CA": 12816 + }, + "language_family": "Athabaskan-Eyak-Tlingit", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Innu-aimun", + "bcp_47": "moe", + "speakers": 12062, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "CA": 12062 + }, + "language_family": "Algic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Lower Silesian", + "bcp_47": "sli", + "speakers": 11868, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "PL": 11868 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Walser", + "bcp_47": "wae", + "speakers": 11377, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "CH": 10085, + "LI": 1292 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Choctaw", + "bcp_47": "cho", + "speakers": 10977, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "US": 10977 + }, + "language_family": "Muskogean", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Tagbanwa", + "bcp_47": "tbw", + "speakers": 10045, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "PH": 10045 + }, + "language_family": "Austronesian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Xavánte", + "bcp_47": "xav", + "speakers": 9951, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "BR": 9951 + }, + "language_family": "Nuclear-Macro-Je", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Tuvalu", + "bcp_47": "tvl", + "speakers": 9868, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "TV": 9868 + }, + "language_family": "Austronesian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Northern Frisian", + "bcp_47": "frr", + "speakers": 9619, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "DE": 9619 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Roviana", + "bcp_47": "rug", + "speakers": 9591, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "SB": 9591 + }, + "language_family": "Austronesian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Wallisian", + "bcp_47": "wls", + "speakers": 9512, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "WF": 9512 + }, + "language_family": "Austronesian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Tavringer Romani", + "bcp_47": "rmu", + "speakers": 9488, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "SE": 9488 + }, + "language_family": "Speech Register", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Cree", + "bcp_47": "cr", + "speakers": 9047, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "CA": 9047 + }, + "language_family": "Algic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Kwasio", + "bcp_47": "nmg", + "speakers": 8878, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "CM": 8878 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Lakota", + "bcp_47": "lkt", + "speakers": 8316, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "US": 8316 + }, + "language_family": "Siouan", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Kosraean", + "bcp_47": "kos", + "speakers": 7990, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "FM": 7990 + }, + "language_family": "Austronesian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Inupiaq", + "bcp_47": "ik", + "speakers": 7983, + "scores": [], + "commonvoice_hours": 2.6, + "commonvoice_locale": "ipk", + "population": { + "US": 7983 + }, + "language_family": "Eskimo-Aleut", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Zoroastrian Dari", + "bcp_47": "gbz", + "speakers": 7983, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "IR": 7983 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Tasawaq", + "bcp_47": "twq", + "speakers": 7970, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "NE": 7970 + }, + "language_family": "Songhay", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Buhid", + "bcp_47": "bku", + "speakers": 7970, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "PH": 7970 + }, + "language_family": "Austronesian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Mi'kmaw", + "bcp_47": "mic", + "speakers": 7916, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "CA": 7916 + }, + "language_family": "Algic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Hassaniyya", + "bcp_47": "mey", + "speakers": 7239, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "SN": 7239 + }, + "language_family": "Afro-Asiatic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Lower Sorbian", + "bcp_47": "dsb", + "speakers": 6974, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "dsb", + "population": { + "DE": 6974 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Nauru", + "bcp_47": "na", + "speakers": 6930, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "NR": 6930 + }, + "language_family": "Austronesian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Eastern Lawa", + "bcp_47": "lwl", + "speakers": 6898, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "TH": 6898 + }, + "language_family": "Austroasiatic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Yapese", + "bcp_47": "yap", + "speakers": 6556, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "FM": 6556 + }, + "language_family": "Austronesian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Atikamekw", + "bcp_47": "atj", + "speakers": 6408, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "CA": 6408 + }, + "language_family": "Algic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Piedmontese", + "bcp_47": "pms", + "speakers": 6178, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "IT": 6178 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Kalo Finnish Romani", + "bcp_47": "rmf", + "speakers": 5015, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "FI": 5015 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Siksiká", + "bcp_47": "bla", + "speakers": 4900, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "CA": 4900 + }, + "language_family": "Algic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "East Futuna", + "bcp_47": "fud", + "speakers": 4756, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "WF": 4756 + }, + "language_family": "Austronesian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Taroko", + "bcp_47": "trv", + "speakers": 4721, + "scores": [], + "commonvoice_hours": 4.7, + "commonvoice_locale": "trv", + "population": { + "TW": 4721 + }, + "language_family": "Austronesian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Plains Cree", + "bcp_47": "crk", + "speakers": 4146, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "CA": 4146 + }, + "language_family": "Algic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Safaliba", + "bcp_47": "saf", + "speakers": 4108, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "GH": 4108 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Muscogee", + "bcp_47": "mus", + "speakers": 3992, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "US": 3992 + }, + "language_family": "Muskogean", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Veps", + "bcp_47": "vep", + "speakers": 3543, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "RU": 3543 + }, + "language_family": "Uralic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Ménik", + "bcp_47": "tnr", + "speakers": 3305, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "SN": 3305 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Virgin Islands Creole English", + "bcp_47": "vic", + "speakers": 3113, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "SX": 3113 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Turoyo", + "bcp_47": "tru", + "speakers": 3035, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "TR": 3035 + }, + "language_family": "Afro-Asiatic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Ulithian", + "bcp_47": "uli", + "speakers": 2971, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "FM": 2971 + }, + "language_family": "Austronesian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Rotuman", + "bcp_47": "rtm", + "speakers": 2527, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "FJ": 2527 + }, + "language_family": "Austronesian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Warlpiri", + "bcp_47": "wbp", + "speakers": 2496, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "AU": 2496 + }, + "language_family": "Pama-Nyungan", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Yangben", + "bcp_47": "yav", + "speakers": 2303, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "CM": 2303 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Slave", + "bcp_47": "den", + "speakers": 2299, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "CA": 2299 + }, + "language_family": "Athabaskan-Eyak-Tlingit", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Dogrib", + "bcp_47": "dgr", + "speakers": 2111, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "CA": 2111 + }, + "language_family": "Athabaskan-Eyak-Tlingit", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Eastern Frisian", + "bcp_47": "frs", + "speakers": 2004, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "DE": 2004 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Cornish", + "bcp_47": "kw", + "speakers": 1973, + "scores": [], + "commonvoice_hours": 2.9, + "commonvoice_locale": "kw", + "population": { + "GB": 1973 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Swampy Cree", + "bcp_47": "csw", + "speakers": 1809, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "CA": 1809 + }, + "language_family": "Algic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Mohawk", + "bcp_47": "moh", + "speakers": 1772, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "CA": 1772 + }, + "language_family": "Iroquoian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Manx", + "bcp_47": "gv", + "speakers": 1719, + "scores": [], + "commonvoice_hours": 2.7, + "commonvoice_locale": "gv", + "population": { + "IM": 1719 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Lule Sami", + "bcp_47": "smj", + "speakers": 1530, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "SE": 1530 + }, + "language_family": "Uralic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Naskapi", + "bcp_47": "nsk", + "speakers": 1395, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "CA": 1395 + }, + "language_family": "Algic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Tokelau", + "bcp_47": "tkl", + "speakers": 1285, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "TK": 1285 + }, + "language_family": "Austronesian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Niuean", + "bcp_47": "niu", + "speakers": 1120, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "NU": 1120 + }, + "language_family": "Austronesian", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Saterland Frisian", + "bcp_47": "stq", + "speakers": 962, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "DE": 962 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Seri", + "bcp_47": "sei", + "speakers": 901, + "scores": [], + "commonvoice_hours": 1.0, + "commonvoice_locale": "sei", + "population": { + "MX": 901 + }, + "language_family": null, + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Chilcotin", + "bcp_47": "clc", + "speakers": 867, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "CA": 867 + }, + "language_family": "Athabaskan-Eyak-Tlingit", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Latin", + "bcp_47": "la", + "speakers": 820, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "VA": 820 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Halkomelem", + "bcp_47": "hur", + "speakers": 716, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "CA": 716 + }, + "language_family": "Salishan", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Michif", + "bcp_47": "crg", + "speakers": 678, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "CA": 678 + }, + "language_family": "Algic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Skolt Sami", + "bcp_47": "sms", + "speakers": 613, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "FI": 613 + }, + "language_family": "Uralic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Inari Sami", + "bcp_47": "smn", + "speakers": 613, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "FI": 613 + }, + "language_family": "Uralic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Lillooet", + "bcp_47": "lil", + "speakers": 528, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "CA": 528 + }, + "language_family": "Salishan", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Okanagan", + "bcp_47": "oka", + "speakers": 490, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "CA": 490 + }, + "language_family": "Salishan", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Maliseet-Passamaquoddy", + "bcp_47": "pqm", + "speakers": 490, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "CA": 490 + }, + "language_family": "Algic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Kwakʼwala", + "bcp_47": "kwk", + "speakers": 377, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "CA": 377 + }, + "language_family": "Wakashan", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Northern East Cree", + "bcp_47": "crl", + "speakers": 377, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "CA": 377 + }, + "language_family": "Algic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Gwichʼin", + "bcp_47": "gwi", + "speakers": 302, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "CA": 302 + }, + "language_family": "Athabaskan-Eyak-Tlingit", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Esperanto", + "bcp_47": "eo", + "speakers": 301, + "scores": [], + "commonvoice_hours": 1436.0, + "commonvoice_locale": "eo", + "population": { + "SM": 301 + }, + "language_family": "Artificial Language", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Southern Sami", + "bcp_47": "sma", + "speakers": 296, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "SE": 296 + }, + "language_family": "Uralic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Tsakonian", + "bcp_47": "tsd", + "speakers": 202, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "GR": 202 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Ingrian", + "bcp_47": "izh", + "speakers": 142, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "izh", + "population": { + "RU": 142 + }, + "language_family": "Uralic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Interlingua", + "bcp_47": "ia", + "speakers": 136, + "scores": [], + "commonvoice_hours": 14.0, + "commonvoice_locale": "ia", + "population": { + "FR": 136, + "SE": 0 + }, + "language_family": "Artificial Language", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Araona", + "bcp_47": "aro", + "speakers": 105, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "BO": 105 + }, + "language_family": "Pano-Tacanan", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Prussian", + "bcp_47": "prg", + "speakers": 38, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "PL": 38 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Interlingue", + "bcp_47": "ie", + "speakers": 1, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "ie", + "population": { + "EE": 1 + }, + "language_family": "Artificial Language", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Literary Chinese", + "bcp_47": "lzh", + "speakers": 0, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "CN": 0 + }, + "language_family": "Sino-Tibetan", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Ido", + "bcp_47": "io", + "speakers": 0, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "US": 0 + }, + "language_family": "Artificial Language", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Lojban", + "bcp_47": "jbo", + "speakers": 0, + "scores": [], + "commonvoice_hours": 0.0, + "commonvoice_locale": "jbo", + "population": { + "US": 0 + }, + "language_family": "Artificial Language", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Jutish", + "bcp_47": "jut", + "speakers": 0, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "DK": 0 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Votic", + "bcp_47": "vot", + "speakers": 0, + "scores": [], + "commonvoice_hours": 0.1, + "commonvoice_locale": "vot", + "population": { + "RU": 0 + }, + "language_family": "Uralic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Geez", + "bcp_47": "gez", + "speakers": 0, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "ET": 0 + }, + "language_family": "Afro-Asiatic", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Osage", + "bcp_47": "osa", + "speakers": 0, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "US": 0 + }, + "language_family": "Siouan", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Romagnol", + "bcp_47": "rgn", + "speakers": 0, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "IT": 0 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Church Slavic", + "bcp_47": "cu", + "speakers": 0, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "RU": 0 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Samogitian", + "bcp_47": "sgs", + "speakers": 0, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "LT": 0 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Obolo", + "bcp_47": "ann", + "speakers": 0, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "NG": 0 + }, + "language_family": "Atlantic-Congo", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Chickasaw", + "bcp_47": "cic", + "speakers": 0, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "US": 0 + }, + "language_family": "Muskogean", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Caddo", + "bcp_47": "cad", + "speakers": 0, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "US": 0 + }, + "language_family": "Caddoan", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null + }, + { + "language_name": "Palatine German", + "bcp_47": "pfl", + "speakers": 0, + "scores": [], + "commonvoice_hours": null, + "commonvoice_locale": null, + "population": { + "DE": 0 + }, + "language_family": "Indo-European", + "mt_bleu": null, + "mt_chrf": null, + "cls_acc": null, + "mlm_chrf": null, + "asr_wer": null, + "asr_chrf": null, + "overall_score": null } ] \ No newline at end of file