{ "model_table": [ { "rank": 1, "provider": "Google", "model": "Gemini 2.0 Flash 001", "hf_id": null, "creation_date": null, "size": null, "type": "Commercial", "license": null, "average": 0.72, "classification_accuracy": 0.87, "language_modeling_chrf": 0.96, "translation_bleu": 0.45, "translation_chrf": 0.58 }, { "rank": 2, "provider": "Google", "model": "Gemini 2.0 Flash Lite 001", "hf_id": null, "creation_date": null, "size": null, "type": "Commercial", "license": null, "average": 0.66, "classification_accuracy": 0.73, "language_modeling_chrf": 0.97, "translation_bleu": 0.4, "translation_chrf": 0.54 }, { "rank": 3, "provider": "Google", "model": "Gemma 3 27b It", "hf_id": "google/gemma-3-27b-it", "creation_date": "2025-03-01", "size": 27432406640.0, "type": "Open", "license": "Gemma", "average": 0.65, "classification_accuracy": 0.72, "language_modeling_chrf": 0.96, "translation_bleu": 0.37, "translation_chrf": 0.54 }, { "rank": 4, "provider": "Meta Llama", "model": "Llama 3.1 70b Instruct", "hf_id": "meta-llama/Llama-3.1-70B-Instruct", "creation_date": "2024-07-16", "size": 70553706496.0, "type": "Open", "license": "Llama3.1", "average": 0.62, "classification_accuracy": 0.57, "language_modeling_chrf": 0.92, "translation_bleu": 0.43, "translation_chrf": 0.57 }, { "rank": 5, "provider": "Amazon", "model": "Nova Micro V1", "hf_id": null, "creation_date": null, "size": null, "type": "Commercial", "license": null, "average": 0.61, "classification_accuracy": 0.52, "language_modeling_chrf": 0.94, "translation_bleu": 0.4, "translation_chrf": 0.56 }, { "rank": 6, "provider": "Meta Llama", "model": "Llama 3 70b Instruct", "hf_id": null, "creation_date": null, "size": null, "type": "Commercial", "license": null, "average": 0.61, "classification_accuracy": 0.8, "language_modeling_chrf": 0.95, "translation_bleu": 0.25, "translation_chrf": 0.43 }, { "rank": 7, "provider": "OpenAI", "model": "GPT 4o Mini", "hf_id": null, "creation_date": null, "size": null, "type": "Commercial", "license": null, "average": 0.6, "classification_accuracy": 0.52, "language_modeling_chrf": 0.95, "translation_bleu": 0.39, "translation_chrf": 0.55 }, { "rank": 8, "provider": "MistralAI", "model": "Mistral Small 24b Instruct 2501", "hf_id": "mistralai/Mistral-Small-24B-Instruct-2501", "creation_date": "2025-01-28", "size": 23572403200.0, "type": "Open", "license": "Apache 2.0", "average": 0.58, "classification_accuracy": 0.55, "language_modeling_chrf": 0.86, "translation_bleu": 0.38, "translation_chrf": 0.52 }, { "rank": 9, "provider": "Meta Llama", "model": "Llama 3.3 70b Instruct", "hf_id": "meta-llama/Llama-3.3-70B-Instruct", "creation_date": "2024-11-26", "size": 70553706496.0, "type": "Open", "license": "Llama3.3", "average": 0.56, "classification_accuracy": 0.5, "language_modeling_chrf": 0.94, "translation_bleu": 0.31, "translation_chrf": 0.48 }, { "rank": 10, "provider": "MistralAI", "model": "Mistral Nemo", "hf_id": null, "creation_date": null, "size": null, "type": "Commercial", "license": null, "average": 0.55, "classification_accuracy": 0.5, "language_modeling_chrf": 0.88, "translation_bleu": 0.32, "translation_chrf": 0.49 }, { "rank": 11, "provider": "Microsoft", "model": "Phi 4 Multimodal Instruct", "hf_id": "microsoft/Phi-4-multimodal-instruct", "creation_date": "2025-02-24", "size": 5574460384.0, "type": "Open", "license": "Mit", "average": 0.52, "classification_accuracy": 0.42, "language_modeling_chrf": 0.87, "translation_bleu": 0.32, "translation_chrf": 0.46 }, { "rank": 12, "provider": "Qwen", "model": "Qwq 32b", "hf_id": "Qwen/QwQ-32B", "creation_date": "2025-03-05", "size": 32763876352.0, "type": "Open", "license": "Apache 2.0", "average": 0.25, "classification_accuracy": 0.0, "language_modeling_chrf": 0.48, "translation_bleu": 0.21, "translation_chrf": 0.3 } ], "language_table": [ { "bcp_47": "en", "language_name": "English", "autonym": "English", "speakers": 1636485840, "family": "Indo-European", "average": 0.47, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.58, "language_modeling_chrf": 0.92, "translation_bleu": 0.37, "translation_chrf": 0.49 }, { "bcp_47": "zh", "language_name": "Chinese", "autonym": "中文", "speakers": 1304678914, "family": "Sino-Tibetan", "average": 0.46, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.55, "language_modeling_chrf": 0.86, "translation_bleu": 0.35, "translation_chrf": 0.53 }, { "bcp_47": "hi", "language_name": "Hindi", "autonym": "हिन्दी", "speakers": 546882144, "family": "Indo-European", "average": 0.46, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.53, "language_modeling_chrf": 0.95, "translation_bleu": 0.32, "translation_chrf": 0.49 }, { "bcp_47": "es", "language_name": "Spanish", "autonym": "Español", "speakers": 493528077, "family": "Indo-European", "average": 0.45, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.53, "language_modeling_chrf": 0.96, "translation_bleu": 0.28, "translation_chrf": 0.46 }, { "bcp_47": "ar", "language_name": "Arabic", "autonym": "العربية", "speakers": 351664197, "family": "Afro-Asiatic", "average": 0.42, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.43, "language_modeling_chrf": 0.93, "translation_bleu": 0.28, "translation_chrf": 0.47 }, { "bcp_47": "ur", "language_name": "Urdu", "autonym": "اردو", "speakers": 290790290, "family": "Indo-European", "average": 0.42, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.5, "language_modeling_chrf": 0.93, "translation_bleu": 0.24, "translation_chrf": 0.42 }, { "bcp_47": "fr", "language_name": "French", "autonym": "Français", "speakers": 278611507, "family": "Indo-European", "average": 0.46, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.53, "language_modeling_chrf": 0.98, "translation_bleu": 0.32, "translation_chrf": 0.49 }, { "bcp_47": "bn", "language_name": "Bangla", "autonym": "বাংলা", "speakers": 267193288, "family": "Indo-European", "average": 0.38, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.4, "language_modeling_chrf": 0.9, "translation_bleu": 0.2, "translation_chrf": 0.41 }, { "bcp_47": "pt", "language_name": "Portuguese", "autonym": "Português", "speakers": 237496885, "family": "Indo-European", "average": 0.46, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.5, "language_modeling_chrf": 0.97, "translation_bleu": 0.31, "translation_chrf": 0.49 }, { "bcp_47": "pa", "language_name": "Punjabi", "autonym": "ਪੰਜਾਬੀ", "speakers": 203571210, "family": "Indo-European", "average": 0.42, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.4, "language_modeling_chrf": 0.87, "translation_bleu": 0.34, "translation_chrf": 0.49 }, { "bcp_47": "ru", "language_name": "Russian", "autonym": "Русский", "speakers": 195841151, "family": "Indo-European", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "sw", "language_name": "Swahili", "autonym": "Kiswahili", "speakers": 171610296, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "id", "language_name": "Indonesian", "autonym": "Bahasa Indonesia", "speakers": 171207687, "family": "Austronesian", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "de", "language_name": "German", "autonym": "Deutsch", "speakers": 136350226, "family": "Indo-European", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "ja", "language_name": "Japanese", "autonym": "日本語", "speakers": 119729026, "family": "Japonic", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "te", "language_name": "Telugu", "autonym": "తెలుగు", "speakers": 95478480, "family": "Dravidian", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "lah", "language_name": "Western Panjabi", "autonym": "لہندا پنجابی", "speakers": 93433552, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "mr", "language_name": "Marathi", "autonym": "मराठी", "speakers": 92826300, "family": "Indo-European", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "jv", "language_name": "Javanese", "autonym": "Jawa", "speakers": 91180665, "family": "Austronesian", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "vi", "language_name": "Vietnamese", "autonym": "Tiếng Việt", "speakers": 86222962, "family": "Austroasiatic", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "ta", "language_name": "Tamil", "autonym": "தமிழ்", "speakers": 85616159, "family": "Dravidian", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "fa", "language_name": "Persian", "autonym": "فارسی", "speakers": 84710459, "family": "Indo-European", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "wuu", "language_name": "Wu Chinese", "autonym": "Wu Chinese", "speakers": 83641200, "family": "Sino-Tibetan", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "tr", "language_name": "Turkish", "autonym": "Türkçe", "speakers": 80360704, "family": "Turkic", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "yue", "language_name": "Cantonese", "autonym": "粵語", "speakers": 79654759, "family": "Sino-Tibetan", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "ko", "language_name": "Korean", "autonym": "한국어", "speakers": 78357046, "family": "Koreanic", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "it", "language_name": "Italian", "autonym": "Italiano", "speakers": 70247060, "family": "Indo-European", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "fil", "language_name": "Filipino", "autonym": "Filipino", "speakers": 67471096, "family": "Austronesian", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "arz", "language_name": "Egyptian Arabic", "autonym": "Egyptian Arabic", "speakers": 66639360, "family": "Afro-Asiatic", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "gu", "language_name": "Gujarati", "autonym": "ગુજરાતી", "speakers": 61721799, "family": "Indo-European", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "th", "language_name": "Thai", "autonym": "ไทย", "speakers": 55181920, "family": "Tai-Kadai", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "ps", "language_name": "Pashto", "autonym": "پښتو", "speakers": 53542641, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "kn", "language_name": "Kannada", "autonym": "ಕನ್ನಡ", "speakers": 49065330, "family": "Dravidian", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "pcm", "language_name": "Nigerian Pidgin", "autonym": "Naijíriá Píjin", "speakers": 44945880, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "ml", "language_name": "Malayalam", "autonym": "മലയാളം", "speakers": 43257484, "family": "Dravidian", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "or", "language_name": "Odia", "autonym": "ଓଡ଼ିଆ", "speakers": 42434880, "family": "Indo-European", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "pl", "language_name": "Polish", "autonym": "Polski", "speakers": 41077399, "family": "Indo-European", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "hsn", "language_name": "Xiang Chinese", "autonym": "Xiang Chinese", "speakers": 40426580, "family": "Sino-Tibetan", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "ha", "language_name": "Hausa", "autonym": "Hausa", "speakers": 40411882, "family": "Afro-Asiatic", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "sd", "language_name": "Sindhi", "autonym": "سنڌي", "speakers": 40329510, "family": "Indo-European", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "apc", "language_name": "North Levantine Arabic", "autonym": "العامية", "speakers": 39031474, "family": "Afro-Asiatic", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "ms", "language_name": "Malay", "autonym": "Bahasa Malaysia", "speakers": 38097307, "family": "Austronesian", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "my", "language_name": "Burmese", "autonym": "မြန်မာ", "speakers": 36559231, "family": "Sino-Tibetan", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "am", "language_name": "Amharic", "autonym": "አማርኛ", "speakers": 35728475, "family": "Afro-Asiatic", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "arq", "language_name": "Algerian Arabic", "autonym": "Algerian Arabic", "speakers": 35667507, "family": "Afro-Asiatic", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "om", "language_name": "Oromo", "autonym": "Oromoo", "speakers": 34897121, "family": "Afro-Asiatic", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "bho", "language_name": "Bhojpuri", "autonym": "भोजपुरी", "speakers": 32934797, "family": "Indo-European", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "uz", "language_name": "Uzbek", "autonym": "O‘Zbek", "speakers": 32792780, "family": "Turkic", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "az", "language_name": "Azerbaijani", "autonym": "Azərbaycan", "speakers": 32446682, "family": "Turkic", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "hak", "language_name": "Hakka Chinese", "autonym": "Hakka Chinese", "speakers": 32062460, "family": "Sino-Tibetan", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "su", "language_name": "Sundanese", "autonym": "Basa Sunda", "speakers": 32043120, "family": "Austronesian", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "nl", "language_name": "Dutch", "autonym": "Nederlands", "speakers": 31765645, "family": "Indo-European", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "ary", "language_name": "Moroccan Arabic", "autonym": "Moroccan Arabic", "speakers": 30938679, "family": "Afro-Asiatic", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "uk", "language_name": "Ukrainian", "autonym": "Українська", "speakers": 29348975, "family": "Indo-European", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "yo", "language_name": "Yoruba", "autonym": "Èdè Yorùbá", "speakers": 28685568, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "skr", "language_name": "Saraiki", "autonym": "سرائیکی", "speakers": 28020120, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "ig", "language_name": "Igbo", "autonym": "Igbo", "speakers": 27823640, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "nan", "language_name": "Min Nan Chinese", "autonym": "Min Nan Chinese", "speakers": 26486380, "family": "Sino-Tibetan", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "ceb", "language_name": "Cebuano", "autonym": "Cebuano", "speakers": 26203440, "family": "Austronesian", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "awa", "language_name": "Awadhi", "autonym": "Awadhi", "speakers": 25862924, "family": "Indo-European", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "mg", "language_name": "Malagasy", "autonym": "Malagasy", "speakers": 24260130, "family": "Austronesian", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "gan", "language_name": "Gan Chinese", "autonym": "Gan Chinese", "speakers": 23698340, "family": "Sino-Tibetan", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "ro", "language_name": "Romanian", "autonym": "Română", "speakers": 22187408, "family": "Indo-European", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "bar", "language_name": "Bavarian", "autonym": "Bavarian", "speakers": 22043627, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "ne", "language_name": "Nepali", "autonym": "नेपाली", "speakers": 20903374, "family": "Indo-European", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "mai", "language_name": "Maithili", "autonym": "मैथिली", "speakers": 19249149, "family": "Indo-European", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "as", "language_name": "Assamese", "autonym": "অসমীয়া", "speakers": 17239170, "family": "Indo-European", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "ny", "language_name": "Nyanja", "autonym": "Nyanja", "speakers": 17026781, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "so", "language_name": "Somali", "autonym": "Soomaali", "speakers": 16911645, "family": "Afro-Asiatic", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "mad", "language_name": "Madurese", "autonym": "Madurese", "speakers": 16822638, "family": "Austronesian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "tts", "language_name": "Northeastern Thai", "autonym": "Northeastern Thai", "speakers": 16554576, "family": "Tai-Kadai", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "rkt", "language_name": "Rangpuri", "autonym": "Rangpuri", "speakers": 16274502, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "mag", "language_name": "Magahi", "autonym": "Magahi", "speakers": 15913080, "family": "Indo-European", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "bgc", "language_name": "Haryanvi", "autonym": "हरियाणवी", "speakers": 15913080, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "mwr", "language_name": "Marwari", "autonym": "Marwari", "speakers": 15913080, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "sr", "language_name": "Serbian", "autonym": "Српски", "speakers": 15602410, "family": "Indo-European", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "si", "language_name": "Sinhala", "autonym": "සිංහල", "speakers": 15564656, "family": "Indo-European", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "km", "language_name": "Khmer", "autonym": "ខ្មែរ", "speakers": 15065030, "family": "Austroasiatic", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "hne", "language_name": "Chhattisgarhi", "autonym": "Chhattisgarhi", "speakers": 14586990, "family": "Indo-European", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "fuv", "language_name": "Nigerian Fulfulde", "autonym": "Nigerian Fulfulde", "speakers": 14339876, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "zu", "language_name": "Zulu", "autonym": "Isizulu", "speakers": 13973830, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "kk", "language_name": "Kazakh", "autonym": "Қазақ Тілі", "speakers": 13637392, "family": "Turkic", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "dcc", "language_name": "Deccan", "autonym": "Deccan", "speakers": 13128291, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "cs", "language_name": "Czech", "autonym": "Čeština", "speakers": 13045532, "family": "Indo-European", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "sv", "language_name": "Swedish", "autonym": "Svenska", "speakers": 12932871, "family": "Indo-European", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "hu", "language_name": "Hungarian", "autonym": "Magyar", "speakers": 12443430, "family": "Uralic", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "el", "language_name": "Greek", "autonym": "Ελληνικά", "speakers": 12292242, "family": "Indo-European", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "sn", "language_name": "Shona", "autonym": "Chishona", "speakers": 11782503, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "nds", "language_name": "Low German", "autonym": "Neddersass’Sch", "speakers": 11520008, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "ak", "language_name": "Akan", "autonym": "Akan", "speakers": 11442678, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "qu", "language_name": "Quechua", "autonym": "Runasimi", "speakers": 11385851, "family": "Quechuan", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "ckb", "language_name": "Central Kurdish", "autonym": "کوردیی ناوەندی", "speakers": 11086549, "family": "Indo-European", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "rw", "language_name": "Kinyarwanda", "autonym": "Kinyarwanda", "speakers": 11083625, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "wo", "language_name": "Wolof", "autonym": "Wolof", "speakers": 11025494, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "aeb", "language_name": "Tunisian Arabic", "autonym": "Tunisian Arabic", "speakers": 10549080, "family": "Afro-Asiatic", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "ilo", "language_name": "Iloko", "autonym": "Ilokano", "speakers": 10481376, "family": "Austronesian", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "xh", "language_name": "Xhosa", "autonym": "Isixhosa", "speakers": 10182944, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "ti", "language_name": "Tigrinya", "autonym": "ትግርኛ", "speakers": 10145911, "family": "Afro-Asiatic", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "be", "language_name": "Belarusian", "autonym": "Беларуская", "speakers": 10064517, "family": "Indo-European", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "lua", "language_name": "Luba-Lulua", "autonym": "Luba-Lulua", "speakers": 9770880, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "tg", "language_name": "Tajik", "autonym": "Тоҷикӣ", "speakers": 9644223, "family": "Indo-European", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "umb", "language_name": "Umbundu", "autonym": "Umbundu", "speakers": 9431467, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "bm", "language_name": "Bambara", "autonym": "Bamanakan", "speakers": 9385632, "family": "Mande", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "af", "language_name": "Afrikaans", "autonym": "Afrikaans", "speakers": 9318845, "family": "Indo-European", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "hil", "language_name": "Hiligaynon", "autonym": "Ilonggo", "speakers": 9171204, "family": "Austronesian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "ki", "language_name": "Kikuyu", "autonym": "Gikuyu", "speakers": 9099743, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "ht", "language_name": "Haitian Creole", "autonym": "Haitian Creole", "speakers": 8964918, "family": "Indo-European", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "ca", "language_name": "Catalan", "autonym": "Català", "speakers": 8679139, "family": "Indo-European", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "he", "language_name": "Hebrew", "autonym": "עברית", "speakers": 8675480, "family": "Afro-Asiatic", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "ii", "language_name": "Sichuan Yi", "autonym": "ꆈꌠꉙ", "speakers": 8364120, "family": "Sino-Tibetan", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "mos", "language_name": "Mossi", "autonym": "Mossi", "speakers": 8334160, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "bal", "language_name": "Baluchi", "autonym": "بلۆچی", "speakers": 8227887, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "syl", "language_name": "Sylheti", "autonym": "Sylheti", "speakers": 8132550, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "kmb", "language_name": "Kimbundu", "autonym": "Kimbundu", "speakers": 8130575, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "ug", "language_name": "Uyghur", "autonym": "ئۇيغۇرچە", "speakers": 8052967, "family": "Turkic", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "min", "language_name": "Minangkabau", "autonym": "Minangkabau", "speakers": 8010780, "family": "Austronesian", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "gsw", "language_name": "Swiss German", "autonym": "Schwiizertüütsch", "speakers": 7956952, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "bg", "language_name": "Bulgarian", "autonym": "Български", "speakers": 7878315, "family": "Indo-European", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "zgh", "language_name": "Standard Moroccan Tamazight", "autonym": "ⵜⴰⵎⴰⵣⵉⵖⵜ", "speakers": 7823574, "family": "Afro-Asiatic", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "ff", "language_name": "Fula", "autonym": "Pulaar", "speakers": 7788904, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "bs", "language_name": "Bosnian", "autonym": "Bosanski", "speakers": 7594468, "family": "Indo-European", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "rn", "language_name": "Rundi", "autonym": "Ikirundi", "speakers": 7475454, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "bjj", "language_name": "Kanauji", "autonym": "Kanauji", "speakers": 7426104, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "sat", "language_name": "Santali", "autonym": "ᱥᱟᱱᱛᱟᱲᱤ", "speakers": 7293495, "family": "Austroasiatic", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "da", "language_name": "Danish", "autonym": "Dansk", "speakers": 7072056, "family": "Indo-European", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "tk", "language_name": "Turkmen", "autonym": "Türkmen Dili", "speakers": 6870838, "family": "Turkic", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "ku", "language_name": "Kurdish", "autonym": "Kurdî (Kurmancî)", "speakers": 6866757, "family": "Indo-European", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "hr", "language_name": "Croatian", "autonym": "Hrvatski", "speakers": 6813164, "family": "Indo-European", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "sq", "language_name": "Albanian", "autonym": "Shqip", "speakers": 6791906, "family": "Indo-European", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "sk", "language_name": "Slovak", "autonym": "Slovenčina", "speakers": 6680269, "family": "Indo-European", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "dyu", "language_name": "Dyula", "autonym": "Dyula", "speakers": 6667328, "family": "Mande", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "nod", "language_name": "Northern Thai", "autonym": "Northern Thai", "speakers": 6621830, "family": "Tai-Kadai", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "mn", "language_name": "Mongolian", "autonym": "Монгол", "speakers": 6572846, "family": "Mongolic-Khitan", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "st", "language_name": "Southern Sotho", "autonym": "Sesotho", "speakers": 6390567, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "kri", "language_name": "Krio", "autonym": "Krio", "speakers": 6293684, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "shi", "language_name": "Tachelhit", "autonym": "ⵜⴰⵛⵍⵃⵉⵜ", "speakers": 6187736, "family": "Afro-Asiatic", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "tn", "language_name": "Tswana", "autonym": "Tswana", "speakers": 6113428, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "wtm", "language_name": "Mewati", "autonym": "Mewati", "speakers": 6100014, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "luy", "language_name": "Luyia", "autonym": "Luluhia", "speakers": 5888069, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "gn", "language_name": "Guarani", "autonym": "Avañe’Ẽ", "speakers": 5827107, "family": "Tupian", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "fi", "language_name": "Finnish", "autonym": "Suomi", "speakers": 5736842, "family": "Uralic", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "lg", "language_name": "Ganda", "autonym": "Luganda", "speakers": 5622890, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "bew", "language_name": "Betawi", "autonym": "Betawi", "speakers": 5607546, "family": "Austronesian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "ks", "language_name": "Kashmiri", "autonym": "کٲشُر", "speakers": 5598085, "family": "Indo-European", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "sou", "language_name": "Southern Thai", "autonym": "Southern Thai", "speakers": 5518192, "family": "Tai-Kadai", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "nb", "language_name": "Norwegian Bokmål", "autonym": "Norsk Bokmål", "speakers": 5468932, "family": "Indo-European", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "no", "language_name": "Norwegian", "autonym": "Norsk", "speakers": 5467440, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "bem", "language_name": "Bemba", "autonym": "Ichibemba", "speakers": 5402246, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "hy", "language_name": "Armenian", "autonym": "Հայերեն", "speakers": 5317273, "family": "Indo-European", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "nso", "language_name": "Northern Sotho", "autonym": "Northern Sotho", "speakers": 5307578, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "luo", "language_name": "Luo (Kenya and Tanzania)", "autonym": "Dholuo", "speakers": 5245734, "family": "Nilotic", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "tpi", "language_name": "Tok Pisin", "autonym": "Tok Pisin", "speakers": 5154217, "family": "Indo-European", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "lo", "language_name": "Lao", "autonym": "ລາວ", "speakers": 5138706, "family": "Tai-Kadai", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "suk", "language_name": "Sukuma", "autonym": "Sukuma", "speakers": 5094094, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "kok", "language_name": "Konkani", "autonym": "कोंकणी", "speakers": 4906533, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "ts", "language_name": "Tsonga", "autonym": "Tsonga", "speakers": 4880932, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "vmf", "language_name": "Main-Franconian", "autonym": "Main-Franconian", "speakers": 4809582, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "ban", "language_name": "Balinese", "autonym": "Balinese", "speakers": 4806468, "family": "Austronesian", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "ee", "language_name": "Ewe", "autonym": "Eʋegbe", "speakers": 4690857, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "za", "language_name": "Zhuang", "autonym": "Vahcuengh", "speakers": 4321462, "family": "Tai-Kadai", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "bug", "language_name": "Buginese", "autonym": "Buginese", "speakers": 4298211, "family": "Austronesian", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "mzn", "language_name": "Mazanderani", "autonym": "مازرونی", "speakers": 4246165, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "gom", "language_name": "Goan Konkani", "autonym": "Goan Konkani", "speakers": 4243488, "family": "Indo-European", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "kam", "language_name": "Kamba", "autonym": "Kikamba", "speakers": 4068120, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "kln", "language_name": "Kalenjin", "autonym": "Kalenjin", "speakers": 4068120, "family": "Nilotic", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "bjn", "language_name": "Banjar", "autonym": "Banjar", "speakers": 4010288, "family": "Austronesian", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "hno", "language_name": "Northern Hindko", "autonym": "Northern Hindko", "speakers": 3969517, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "vmw", "language_name": "Makhuwa", "autonym": "Emakhuwa", "speakers": 3912766, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "glk", "language_name": "Gilaki", "autonym": "Gilaki", "speakers": 3906472, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "lmo", "language_name": "Lombard", "autonym": "Lombard", "speakers": 3901518, "family": "Indo-European", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "dje", "language_name": "Zarma", "autonym": "Zarmaciine", "speakers": 3871308, "family": "Songhay", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "ndc", "language_name": "Ndau", "autonym": "Ndau", "speakers": 3867046, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "sid", "language_name": "Sidamo", "autonym": "Sidamo", "speakers": 3783955, "family": "Afro-Asiatic", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "ace", "language_name": "Achinese", "autonym": "Achinese", "speakers": 3738364, "family": "Austronesian", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "swv", "language_name": "Shekhawati", "autonym": "Shekhawati", "speakers": 3713052, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "rif", "language_name": "Riffian", "autonym": "Tarifit", "speakers": 3692411, "family": "Afro-Asiatic", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "shn", "language_name": "Shan", "autonym": "တႆး", "speakers": 3687984, "family": "Tai-Kadai", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "lmn", "language_name": "Lambadi", "autonym": "Lambadi", "speakers": 3580443, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "gbm", "language_name": "Garhwali", "autonym": "Garhwali", "speakers": 3580443, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "ka", "language_name": "Georgian", "autonym": "ქართული", "speakers": 3543646, "family": "Kartvelian", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "gl", "language_name": "Galician", "autonym": "Galego", "speakers": 3515530, "family": "Indo-European", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "ln", "language_name": "Lingala", "autonym": "Lingála", "speakers": 3514491, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "man", "language_name": "Mandingo", "autonym": "Mandingo", "speakers": 3511762, "family": "Mande", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "tzm", "language_name": "Central Atlas Tamazight", "autonym": "Tamaziɣt N Laṭlaṣ", "speakers": 3485047, "family": "Afro-Asiatic", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "mfa", "language_name": "Pattani Malay", "autonym": "Pattani Malay", "speakers": 3448870, "family": "Austronesian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "tiv", "language_name": "Tiv", "autonym": "Tiv", "speakers": 3424448, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "kab", "language_name": "Kabyle", "autonym": "Taqbaylit", "speakers": 3351886, "family": "Afro-Asiatic", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "ky", "language_name": "Kyrgyz", "autonym": "Кыргызча", "speakers": 3338267, "family": "Turkic", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "bik", "language_name": "Bikol", "autonym": "Bikol", "speakers": 3275430, "family": "Austronesian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "fon", "language_name": "Fon", "autonym": "Fon", "speakers": 3216150, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "gon", "language_name": "Gondi", "autonym": "Gondi", "speakers": 3182616, "family": "Dravidian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "war", "language_name": "Waray", "autonym": "Waray", "speakers": 3166927, "family": "Austronesian", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "sdh", "language_name": "Southern Kurdish", "autonym": "کوردی خوارگ", "speakers": 3142162, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "brh", "language_name": "Brahui", "autonym": "Brahui", "speakers": 3035513, "family": "Dravidian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "bci", "language_name": "Baoulé", "autonym": "Baoulé", "speakers": 3022921, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "bo", "language_name": "Tibetan", "autonym": "བོད་སྐད་", "speakers": 3006697, "family": "Sino-Tibetan", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "ibb", "language_name": "Ibibio", "autonym": "Ibibio", "speakers": 2996392, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "efi", "language_name": "Efik", "autonym": "Efik", "speakers": 2996392, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "sg", "language_name": "Sango", "autonym": "Sängö", "speakers": 2935521, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "kfy", "language_name": "Kumaoni", "autonym": "Kumaoni", "speakers": 2917398, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "ay", "language_name": "Aymara", "autonym": "Aymara", "speakers": 2838620, "family": "Aymaran", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "nyn", "language_name": "Nyankole", "autonym": "Runyankore", "speakers": 2724939, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "jam", "language_name": "Jamaican Creole English", "autonym": "Jamaican Creole English", "speakers": 2668142, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "doi", "language_name": "Dogri", "autonym": "डोगरी", "speakers": 2652180, "family": "Indo-European", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "guz", "language_name": "Gusii", "autonym": "Ekegusii", "speakers": 2622867, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "sas", "language_name": "Sasak", "autonym": "Sasak", "speakers": 2590152, "family": "Austronesian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "kru", "language_name": "Kurukh", "autonym": "Kurukh", "speakers": 2519571, "family": "Dravidian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "pam", "language_name": "Pampanga", "autonym": "Pampanga", "speakers": 2511163, "family": "Austronesian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "fbl", "language_name": "West Albay Bikol", "autonym": "West Albay Bikol", "speakers": 2511163, "family": "Austronesian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "lt", "language_name": "Lithuanian", "autonym": "Lietuvių", "speakers": 2488617, "family": "Indo-European", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "bej", "language_name": "Beja", "autonym": "Beja", "speakers": 2460326, "family": "Afro-Asiatic", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "bbc", "language_name": "Batak Toba", "autonym": "Batak Toba", "speakers": 2456639, "family": "Austronesian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "sck", "language_name": "Sadri", "autonym": "Sadri", "speakers": 2386962, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "wbq", "language_name": "Waddar", "autonym": "Waddar", "speakers": 2386962, "family": "Dravidian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "lu", "language_name": "Luba-Katanga", "autonym": "Tshiluba", "speakers": 2340940, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "cgg", "language_name": "Chiga", "autonym": "Rukiga", "speakers": 2335662, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "xog", "language_name": "Soga", "autonym": "Olusoga", "speakers": 2292409, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "ss", "language_name": "Swati", "autonym": "Siswati", "speakers": 2212379, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "haz", "language_name": "Hazaragi", "autonym": "Hazaragi", "speakers": 2161984, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "mer", "language_name": "Meru", "autonym": "Kĩmĩrũ", "speakers": 2141116, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "xnr", "language_name": "Kangri", "autonym": "कांगड़ी", "speakers": 2121744, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "aa", "language_name": "Afar", "autonym": "Afar", "speakers": 2119663, "family": "Afro-Asiatic", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "teo", "language_name": "Teso", "autonym": "Kiteso", "speakers": 2082973, "family": "Nilotic", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "ngl", "language_name": "Lomwe", "autonym": "Lomwe", "speakers": 2046678, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "oc", "language_name": "Occitan", "autonym": "Occitan", "speakers": 2040398, "family": "Indo-European", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "bgn", "language_name": "Western Balochi", "autonym": "بلوچی (رخشانی)", "speakers": 2037382, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "lrc", "language_name": "Northern Luri", "autonym": "لۊری شومالی", "speakers": 2020512, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "wbr", "language_name": "Wagdi", "autonym": "Wagdi", "speakers": 1989135, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "tcy", "language_name": "Tulu", "autonym": "Tulu", "speakers": 1989135, "family": "Dravidian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "khn", "language_name": "Khandesi", "autonym": "Khandesi", "speakers": 1989135, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "tt", "language_name": "Tatar", "autonym": "Татар", "speakers": 1984108, "family": "Turkic", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "sl", "language_name": "Slovenian", "autonym": "Slovenščina", "speakers": 1973181, "family": "Indo-European", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "mak", "language_name": "Makasar", "autonym": "Makasar", "speakers": 1949290, "family": "Austronesian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "wal", "language_name": "Wolaytta", "autonym": "Wolaytta", "speakers": 1946034, "family": "Ta-Ne-Omotic", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "nym", "language_name": "Nyamwezi", "autonym": "Nyamwezi", "speakers": 1932242, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "brx", "language_name": "Bodo", "autonym": "बर’", "speakers": 1856526, "family": "Sino-Tibetan", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "ljp", "language_name": "Lampung Api", "autonym": "Lampung Api", "speakers": 1842479, "family": "Austronesian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "cv", "language_name": "Chuvash", "autonym": "Чӑваш", "speakers": 1842386, "family": "Turkic", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "ba", "language_name": "Bashkir", "autonym": "Башҡорт Теле", "speakers": 1842386, "family": "Turkic", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "rhg", "language_name": "Rohingya", "autonym": "𐴌𐴗𐴥𐴝𐴙𐴚𐴒𐴙𐴝", "speakers": 1824082, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "men", "language_name": "Mende", "autonym": "Mende", "speakers": 1813083, "family": "Mande", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "tum", "language_name": "Tumbuka", "autonym": "Tumbuka", "speakers": 1780514, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "tmh", "language_name": "Tamashek", "autonym": "Tamashek", "speakers": 1776965, "family": "Afro-Asiatic", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "nd", "language_name": "North Ndebele", "autonym": "Isindebele", "speakers": 1745556, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "mas", "language_name": "Masai", "autonym": "Maa", "speakers": 1734738, "family": "Nilotic", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "srr", "language_name": "Serer", "autonym": "Serer", "speakers": 1731004, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "noe", "language_name": "Nimadi", "autonym": "Nimadi", "speakers": 1723917, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "tem", "language_name": "Timne", "autonym": "Timne", "speakers": 1722482, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "sco", "language_name": "Scots", "autonym": "Scots", "speakers": 1644028, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "laj", "language_name": "Lango (Uganda)", "autonym": "Lango (Uganda)", "speakers": 1643614, "family": "Nilotic", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "rmt", "language_name": "Domari", "autonym": "Domari", "speakers": 1613543, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "mk", "language_name": "Macedonian", "autonym": "Македонски", "speakers": 1608565, "family": "Indo-European", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "ach", "language_name": "Acoli", "autonym": "Acoli", "speakers": 1600361, "family": "Nilotic", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "fuq", "language_name": "Central-Eastern Niger Fulfulde", "autonym": "Central-Eastern Niger Fulfulde", "speakers": 1594068, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "bhb", "language_name": "Bhili", "autonym": "Bhili", "speakers": 1591308, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "pag", "language_name": "Pangasinan", "autonym": "Pangasinan", "speakers": 1528534, "family": "Austronesian", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "kg", "language_name": "Kongo", "autonym": "Kongo", "speakers": 1526700, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "bin", "language_name": "Bini", "autonym": "Bini", "speakers": 1519599, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "ffm", "language_name": "Maasina Fulfulde", "autonym": "Maasina Fulfulde", "speakers": 1505612, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "mni", "language_name": "Manipuri", "autonym": "মৈতৈলোন্", "speakers": 1476591, "family": "Sino-Tibetan", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "abr", "language_name": "Abron", "autonym": "Abron", "speakers": 1467010, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "kde", "language_name": "Makonde", "autonym": "Chimakonde", "speakers": 1463820, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "aln", "language_name": "Gheg Albanian", "autonym": "Gheg Albanian", "speakers": 1430250, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "ve", "language_name": "Venda", "autonym": "Tshivenḓa", "speakers": 1391759, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "seh", "language_name": "Sena", "autonym": "Sena", "speakers": 1384517, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "vec", "language_name": "Venetian", "autonym": "Veneto", "speakers": 1380829, "family": "Indo-European", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "sus", "language_name": "Susu", "autonym": "Susu", "speakers": 1378014, "family": "Mande", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "nn", "language_name": "Norwegian Nynorsk", "autonym": "Norsk Nynorsk", "speakers": 1366860, "family": "Indo-European", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "mgh", "language_name": "Makhuwa-Meetto", "autonym": "Makua", "speakers": 1354419, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "raj", "language_name": "Rajasthani", "autonym": "राजस्थानी", "speakers": 1326090, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "hoc", "language_name": "Ho", "autonym": "Ho", "speakers": 1312829, "family": "Austroasiatic", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "mdh", "language_name": "Maguindanaon", "autonym": "Maguindanaon", "speakers": 1310172, "family": "Austronesian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "mtr", "language_name": "Mewari", "autonym": "Mewari", "speakers": 1286307, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "bum", "language_name": "Bulu", "autonym": "Bulu", "speakers": 1276270, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "myx", "language_name": "Masaaba", "autonym": "Masaaba", "speakers": 1254337, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "unr", "language_name": "Mundari", "autonym": "Mundari", "speakers": 1252287, "family": "Austroasiatic", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "mfe", "language_name": "Morisyen", "autonym": "Kreol Morisien", "speakers": 1241433, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "ga", "language_name": "Irish", "autonym": "Gaeilge", "speakers": 1237487, "family": "Indo-European", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "fvr", "language_name": "Fur", "autonym": "Fur", "speakers": 1230163, "family": "Furan", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "rej", "language_name": "Rejang", "autonym": "Rejang", "speakers": 1228320, "family": "Austronesian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "bhi", "language_name": "Bhilali", "autonym": "Bhilali", "speakers": 1220003, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "tsg", "language_name": "Tausug", "autonym": "Tausug", "speakers": 1200991, "family": "Austronesian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "quc", "language_name": "Kʼicheʼ", "autonym": "KʼIcheʼ", "speakers": 1200731, "family": "Mayan", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "bqi", "language_name": "Bakhtiari", "autonym": "Bakhtiari", "speakers": 1188926, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "kpe", "language_name": "Kpelle", "autonym": "Kpɛlɛɛ", "speakers": 1186303, "family": "Mande", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "sef", "language_name": "Cebaara Senoufo", "autonym": "Cebaara Senoufo", "speakers": 1181687, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "kxm", "language_name": "Northern Khmer", "autonym": "Northern Khmer", "speakers": 1172616, "family": "Austroasiatic", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "vls", "language_name": "West Flemish", "autonym": "West Flemish", "speakers": 1172070, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "snk", "language_name": "Soninke", "autonym": "Soninke", "speakers": 1153651, "family": "Mande", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "zza", "language_name": "Zaza", "autonym": "Zaza", "speakers": 1148245, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "lv", "language_name": "Latvian", "autonym": "Latviešu", "speakers": 1147550, "family": "Indo-European", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "dnj", "language_name": "Dan", "autonym": "Dan", "speakers": 1099244, "family": "Mande", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "gor", "language_name": "Gorontalo", "autonym": "Gorontalo", "speakers": 1094807, "family": "Austronesian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "tig", "language_name": "Tigre", "autonym": "Tigre", "speakers": 1094616, "family": "Afro-Asiatic", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "eu", "language_name": "Basque", "autonym": "Euskara", "speakers": 1088519, "family": null, "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "hoj", "language_name": "Hadothi", "autonym": "Hadothi", "speakers": 1087394, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "kbd", "language_name": "Kabardian", "autonym": "Kabardian", "speakers": 1070873, "family": "Abkhaz-Adyge", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "kha", "language_name": "Khasi", "autonym": "Khasi", "speakers": 1060872, "family": "Austroasiatic", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "sc", "language_name": "Sardinian", "autonym": "Sardu", "speakers": 1060846, "family": "Indo-European", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "loz", "language_name": "Lozi", "autonym": "Lozi", "speakers": 1045596, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "gur", "language_name": "Frafra", "autonym": "Frafra", "speakers": 1026907, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "ars", "language_name": "Najdi Arabic", "autonym": "Najdi Arabic", "speakers": 1025205, "family": "Afro-Asiatic", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "rng", "language_name": "Ronga", "autonym": "Ronga", "speakers": 1023339, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "luz", "language_name": "Southern Luri", "autonym": "Southern Luri", "speakers": 1019080, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "new", "language_name": "Newari", "autonym": "Newari", "speakers": 1000821, "family": "Sino-Tibetan", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "tly", "language_name": "Talysh", "autonym": "Talysh", "speakers": 1000168, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "yi", "language_name": "Yiddish", "autonym": "ייִדיש", "speakers": 997214, "family": "Indo-European", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "bez", "language_name": "Bena", "autonym": "Hibena", "speakers": 995398, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "ksb", "language_name": "Shambala", "autonym": "Kishambaa", "speakers": 995398, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "kfr", "language_name": "Kachhi", "autonym": "Kachhi", "speakers": 994568, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "nij", "language_name": "Ngaju", "autonym": "Ngaju", "speakers": 987996, "family": "Austronesian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "mwk", "language_name": "Kita Maninkakan", "autonym": "Kita Maninkakan", "speakers": 977670, "family": "Mande", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "jml", "language_name": "Jumli", "autonym": "Jumli", "speakers": 970493, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "ryu", "language_name": "Central Okinawan", "autonym": "Central Okinawan", "speakers": 966404, "family": "Japonic", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "mnw", "language_name": "Mon", "autonym": "Mon", "speakers": 966114, "family": "Austroasiatic", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "qug", "language_name": "Chimborazo Highland Quichua", "autonym": "Chimborazo Highland Quichua", "speakers": 963579, "family": "Quechuan", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "kac", "language_name": "Kachin", "autonym": "Kachin", "speakers": 962032, "family": "Sino-Tibetan", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "hnd", "language_name": "Southern Hindko", "autonym": "Southern Hindko", "speakers": 957354, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "li", "language_name": "Limburgish", "autonym": "Limburgish", "speakers": 950422, "family": "Indo-European", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "mxc", "language_name": "Manyika", "autonym": "Manyika", "speakers": 945510, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "ce", "language_name": "Chechen", "autonym": "Нохчийн", "speakers": 935365, "family": "Nakh-Daghestanian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "kj", "language_name": "Kuanyama", "autonym": "Kuanyama", "speakers": 920524, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "nr", "language_name": "South Ndebele", "autonym": "South Ndebele", "speakers": 903418, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "cy", "language_name": "Welsh", "autonym": "Cymraeg", "speakers": 884910, "family": "Indo-European", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "ada", "language_name": "Adangme", "autonym": "Adangme", "speakers": 880206, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "et", "language_name": "Estonian", "autonym": "Eesti", "speakers": 878449, "family": "Uralic", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "prd", "language_name": "Parsi-Dari", "autonym": "Parsi-Dari", "speakers": 864342, "family": "Bookkeeping", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "yua", "language_name": "Yucateco", "autonym": "Yucateco", "speakers": 861955, "family": "Mayan", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "ewo", "language_name": "Ewondo", "autonym": "Ewondo", "speakers": 860095, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "kge", "language_name": "Komering", "autonym": "Komering", "speakers": 854483, "family": "Austronesian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "ttj", "language_name": "Tooro", "autonym": "Tooro", "speakers": 821807, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "grt", "language_name": "Garo", "autonym": "Garo", "speakers": 821563, "family": "Sino-Tibetan", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "gaa", "language_name": "Ga", "autonym": "Gã", "speakers": 821526, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "mgy", "language_name": "Mbunga", "autonym": "Mbunga", "speakers": 819739, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "tet", "language_name": "Tetum", "autonym": "Tetum", "speakers": 816395, "family": "Austronesian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "iba", "language_name": "Iban", "autonym": "Iban", "speakers": 816302, "family": "Bookkeeping", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "ebu", "language_name": "Embu", "autonym": "Kĩembu", "speakers": 802918, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "swg", "language_name": "Swabian", "autonym": "Swabian", "speakers": 801597, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "hnj", "language_name": "Hmong Njua", "autonym": "𞄀𞄄𞄰𞄩𞄍𞄜𞄰", "speakers": 781687, "family": "Hmong-Mien", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "kck", "language_name": "Kalanga", "autonym": "Kalanga", "speakers": 770954, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "dty", "language_name": "Dotyali", "autonym": "Dotyali", "speakers": 758198, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "pcd", "language_name": "Picard", "autonym": "Picard", "speakers": 746330, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "fy", "language_name": "Western Frisian", "autonym": "Frysk", "speakers": 743057, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "ccp", "language_name": "Chakma", "autonym": "𑄌𑄋𑄴𑄟𑄳𑄦", "speakers": 729137, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "yao", "language_name": "Yao", "autonym": "Yao", "speakers": 722357, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "aoz", "language_name": "Uab Meto", "autonym": "Uab Meto", "speakers": 720970, "family": "Austronesian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "cps", "language_name": "Capiznon", "autonym": "Capiznon", "speakers": 720595, "family": "Austronesian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "asa", "language_name": "Asu", "autonym": "Kipare", "speakers": 702634, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "blt", "language_name": "Tai Dam", "autonym": "ꪼꪕꪒꪾ", "speakers": 681177, "family": "Tai-Kadai", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "wa", "language_name": "Walloon", "autonym": "Walon", "speakers": 679801, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "ses", "language_name": "Koyraboro Senni", "autonym": "Koyraboro Senni", "speakers": 664816, "family": "Songhay", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "bfy", "language_name": "Bagheli", "autonym": "Bagheli", "speakers": 654424, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "ast", "language_name": "Asturian", "autonym": "Asturianu", "speakers": 650205, "family": "Indo-European", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "lki", "language_name": "Laki", "autonym": "Laki", "speakers": 645417, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "unx", "language_name": "Munda", "autonym": "Munda", "speakers": 636523, "family": "Bookkeeping", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "lis", "language_name": "Lisu", "autonym": "Lisu", "speakers": 627309, "family": "Sino-Tibetan", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "nqo", "language_name": "N’Ko", "autonym": "ߒߞߏ", "speakers": 626370, "family": "Artificial Language", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "gos", "language_name": "Gronings", "autonym": "Gronings", "speakers": 622094, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "lol", "language_name": "Mongo", "autonym": "Mongo", "speakers": 620858, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "thl", "language_name": "Dangaura Tharu", "autonym": "Dangaura Tharu", "speakers": 606558, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "nap", "language_name": "Neapolitan", "autonym": "Neapolitan", "speakers": 605306, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "nus", "language_name": "Nuer", "autonym": "Thok Nath", "speakers": 591427, "family": "Nilotic", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "br", "language_name": "Breton", "autonym": "Brezhoneg", "speakers": 563140, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "pis", "language_name": "Pijin", "autonym": "Pijin", "speakers": 561780, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "rcf", "language_name": "Réunion Creole French", "autonym": "Réunion Creole French", "speakers": 559185, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "av", "language_name": "Avaric", "autonym": "Avaric", "speakers": 552716, "family": "Nakh-Daghestanian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "ng", "language_name": "Ndonga", "autonym": "Ndonga", "speakers": 552315, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "os", "language_name": "Ossetic", "autonym": "Ирон", "speakers": 541444, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "udm", "language_name": "Udmurt", "autonym": "Udmurt", "speakers": 538544, "family": "Uralic", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "lij", "language_name": "Ligurian", "autonym": "Ligure", "speakers": 536663, "family": "Indo-European", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "kea", "language_name": "Kabuverdianu", "autonym": "Kabuverdianu", "speakers": 530762, "family": "Indo-European", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "rue", "language_name": "Rusyn", "autonym": "Rusyn", "speakers": 527075, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "chm", "language_name": "Mari", "autonym": "Mari", "speakers": 524371, "family": "Uralic", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "scn", "language_name": "Sicilian", "autonym": "Sicilianu", "speakers": 511702, "family": "Indo-European", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "lag", "language_name": "Langi", "autonym": "Kɨlaangi", "speakers": 509409, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "bft", "language_name": "Balti", "autonym": "Balti", "speakers": 502520, "family": "Sino-Tibetan", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "nhe", "language_name": "Eastern Huasteca Nahuatl", "autonym": "Eastern Huasteca Nahuatl", "speakers": 501735, "family": "Uto-Aztecan", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "nhw", "language_name": "Western Huasteca Nahuatl", "autonym": "Western Huasteca Nahuatl", "speakers": 501735, "family": "Uto-Aztecan", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "szl", "language_name": "Silesian", "autonym": "Ślōnski", "speakers": 497670, "family": "Indo-European", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "kaa", "language_name": "Kara-Kalpak", "autonym": "Kara-Kalpak", "speakers": 489046, "family": "Turkic", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "gju", "language_name": "Gujari", "autonym": "Gujari", "speakers": 467002, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "srx", "language_name": "Sirmauri", "autonym": "Sirmauri", "speakers": 464132, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "mt", "language_name": "Maltese", "autonym": "Malti", "speakers": 457267, "family": "Afro-Asiatic", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "bap", "language_name": "Bantawa", "autonym": "Bantawa", "speakers": 454918, "family": "Sino-Tibetan", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "sah", "language_name": "Yakut", "autonym": "Саха Тыла", "speakers": 453510, "family": "Turkic", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "mls", "language_name": "Masalit", "autonym": "Masalit", "speakers": 451060, "family": "Maban", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "kaj", "language_name": "Jju", "autonym": "Kaje", "speakers": 449459, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "ady", "language_name": "Adyghe", "autonym": "Adyghe", "speakers": 444583, "family": "Abkhaz-Adyge", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "ybb", "language_name": "Yemba", "autonym": "Yemba", "speakers": 443920, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "xmf", "language_name": "Mingrelian", "autonym": "Mingrelian", "speakers": 439670, "family": "Kartvelian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "myv", "language_name": "Erzya", "autonym": "Эрзянь Кель", "speakers": 439338, "family": "Uralic", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "dav", "language_name": "Taita", "autonym": "Kitaita", "speakers": 438929, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "maz", "language_name": "Central Mazahua", "autonym": "Central Mazahua", "speakers": 437410, "family": "Otomanguean", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "vun", "language_name": "Vunjo", "autonym": "Kyivunjo", "speakers": 433291, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "rof", "language_name": "Rombo", "autonym": "Kihorombo", "speakers": 433291, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "jmc", "language_name": "Machame", "autonym": "Kimachame", "speakers": 433291, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "kjg", "language_name": "Khmu", "autonym": "Khmu", "speakers": 431949, "family": "Austroasiatic", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "fan", "language_name": "Fang", "autonym": "Fang", "speakers": 426451, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "krj", "language_name": "Kinaray-a", "autonym": "Kinaray-A", "speakers": 425806, "family": "Austronesian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "kdt", "language_name": "Kuy", "autonym": "Kuy", "speakers": 421207, "family": "Austroasiatic", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "lb", "language_name": "Luxembourgish", "autonym": "Lëtzebuergesch", "speakers": 421015, "family": "Indo-European", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "srn", "language_name": "Sranan Tongo", "autonym": "Sranan Tongo", "speakers": 414507, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "dyo", "language_name": "Jola-Fonyi", "autonym": "Joola", "speakers": 409146, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "tdg", "language_name": "Western Tamang", "autonym": "Western Tamang", "speakers": 394263, "family": "Sino-Tibetan", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "pnt", "language_name": "Pontic", "autonym": "Pontic", "speakers": 392463, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "zmi", "language_name": "Negeri Sembilan Malay", "autonym": "Negeri Sembilan Malay", "speakers": 391825, "family": "Austronesian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "nnh", "language_name": "Ngiemboon", "autonym": "Shwóŋò Ngiembɔɔn", "speakers": 388430, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "bbj", "language_name": "Ghomala", "autonym": "Ghomala", "speakers": 388430, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "dv", "language_name": "Divehi", "autonym": "Divehi", "speakers": 388044, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "saz", "language_name": "Saurashtra", "autonym": "Saurashtra", "speakers": 384566, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "hif", "language_name": "Fiji Hindi", "autonym": "Fiji Hindi", "speakers": 383749, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "fia", "language_name": "Nobiin", "autonym": "Nobiin", "speakers": 378161, "family": "Nubian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "bgx", "language_name": "Balkan Gagauz Turkish", "autonym": "Balkan Gagauz Turkish", "speakers": 377280, "family": "Turkic", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "kvr", "language_name": "Kerinci", "autonym": "Kerinci", "speakers": 373836, "family": "Austronesian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "kvx", "language_name": "Parkari Koli", "autonym": "Parkari Koli", "speakers": 373602, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "dz", "language_name": "Dzongkha", "autonym": "རྫོང་ཁ", "speakers": 370341, "family": "Bookkeeping", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "pko", "language_name": "Pökoot", "autonym": "Pökoot", "speakers": 369343, "family": "Nilotic", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "dar", "language_name": "Dargwa", "autonym": "Dargwa", "speakers": 368477, "family": "Nakh-Daghestanian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "lif", "language_name": "Limbu", "autonym": "Limbu", "speakers": 368085, "family": "Sino-Tibetan", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "fj", "language_name": "Fijian", "autonym": "Fijian", "speakers": 365030, "family": "Austronesian", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "thr", "language_name": "Rana Tharu", "autonym": "Rana Tharu", "speakers": 363935, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "bkm", "language_name": "Kom", "autonym": "Kom", "speakers": 360685, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "is", "language_name": "Icelandic", "autonym": "Íslenska", "speakers": 350734, "family": "Indo-European", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "khw", "language_name": "Khowar", "autonym": "Khowar", "speakers": 350252, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "lbw", "language_name": "Tolaki", "autonym": "Tolaki", "speakers": 347134, "family": "Austronesian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "nxq", "language_name": "Naxi", "autonym": "Naxi", "speakers": 334565, "family": "Sino-Tibetan", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "mgp", "language_name": "Eastern Magar", "autonym": "Eastern Magar", "speakers": 333607, "family": "Sino-Tibetan", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "bax", "language_name": "Bamun", "autonym": "Bamun", "speakers": 332940, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "bas", "language_name": "Basaa", "autonym": "Ɓàsàa", "speakers": 332940, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "khq", "language_name": "Koyra Chiini", "autonym": "Koyra Ciini", "speakers": 332408, "family": "Songhay", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "mvy", "language_name": "Indus Kohistani", "autonym": "Indus Kohistani", "speakers": 326901, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "gay", "language_name": "Gayo", "autonym": "Gayo", "speakers": 320431, "family": "Austronesian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "zdj", "language_name": "Ngazidja Comorian", "autonym": "Ngazidja Comorian", "speakers": 313124, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "bua", "language_name": "Buriat", "autonym": "Buriat", "speakers": 311788, "family": "Mongolic-Khitan", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "bto", "language_name": "Rinconada Bikol", "autonym": "Rinconada Bikol", "speakers": 305707, "family": "Austronesian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "byv", "language_name": "Medumba", "autonym": "Medumba", "speakers": 305195, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "njo", "language_name": "Ao Naga", "autonym": "Ao Naga", "speakers": 305001, "family": "Sino-Tibetan", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "bfq", "language_name": "Badaga", "autonym": "Badaga", "speakers": 305001, "family": "Dravidian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "thq", "language_name": "Kochila Tharu", "autonym": "Kochila Tharu", "speakers": 303279, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "mdf", "language_name": "Moksha", "autonym": "Мокшень Кяль", "speakers": 297616, "family": "Uralic", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "rob", "language_name": "Tae'", "autonym": "Tae'", "speakers": 293729, "family": "Austronesian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "nzi", "language_name": "Nzima", "autonym": "Nzima", "speakers": 293402, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "naq", "language_name": "Nama", "autonym": "Khoekhoegowab", "speakers": 289308, "family": "Khoe-Kwadi", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "wni", "language_name": "Ndzwani Comorian", "autonym": "Ndzwani Comorian", "speakers": 287736, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "kum", "language_name": "Kumyk", "autonym": "Kumyk", "speakers": 283444, "family": "Turkic", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "mua", "language_name": "Mundang", "autonym": "Mundaŋ", "speakers": 277450, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "arn", "language_name": "Mapuche", "autonym": "Mapudungun", "speakers": 272802, "family": "Araucanian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "cja", "language_name": "Western Cham", "autonym": "Western Cham", "speakers": 270832, "family": "Austronesian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "bi", "language_name": "Bislama", "autonym": "Bislama", "speakers": 268500, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "khb", "language_name": "Lü", "autonym": "Lü", "speakers": 264864, "family": "Tai-Kadai", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "tdd", "language_name": "Tai Nüa", "autonym": "Tai Nüa", "speakers": 264864, "family": "Tai-Kadai", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "kxp", "language_name": "Wadiyara Koli", "autonym": "Wadiyara Koli", "speakers": 256851, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "gjk", "language_name": "Kachi Koli", "autonym": "Kachi Koli", "speakers": 256851, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "lez", "language_name": "Lezghian", "autonym": "Lezghian", "speakers": 255100, "family": "Nakh-Daghestanian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "kv", "language_name": "Komi", "autonym": "Komi", "speakers": 255100, "family": "Uralic", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "sm", "language_name": "Samoan", "autonym": "Samoan", "speakers": 252717, "family": "Austronesian", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "mrd", "language_name": "Western Magar", "autonym": "Western Magar", "speakers": 251722, "family": "Sino-Tibetan", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "saq", "language_name": "Samburu", "autonym": "Kisampur", "speakers": 246228, "family": "Nilotic", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "crh", "language_name": "Crimean Tatar", "autonym": "Crimean Tatar", "speakers": 245968, "family": "Turkic", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "mdr", "language_name": "Mandar", "autonym": "Mandar", "speakers": 245664, "family": "Austronesian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "sxn", "language_name": "Sangir", "autonym": "Sangir", "speakers": 245664, "family": "Austronesian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "ext", "language_name": "Extremaduran", "autonym": "Extremaduran", "speakers": 245077, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "nch", "language_name": "Central Huasteca Nahuatl", "autonym": "Central Huasteca Nahuatl", "speakers": 244435, "family": "Uto-Aztecan", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "zea", "language_name": "Zeelandic", "autonym": "Zeelandic", "speakers": 241926, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "krc", "language_name": "Karachay-Balkar", "autonym": "Karachay-Balkar", "speakers": 240927, "family": "Turkic", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "ksh", "language_name": "Colognian", "autonym": "Kölsch", "speakers": 240479, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "hz", "language_name": "Herero", "autonym": "Herero", "speakers": 239336, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "sav", "language_name": "Saafi-Saafi", "autonym": "Saafi-Saafi", "speakers": 236046, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "zag", "language_name": "Zaghawa", "autonym": "Zaghawa", "speakers": 232364, "family": "Saharan", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "inh", "language_name": "Ingush", "autonym": "Ingush", "speakers": 226755, "family": "Nakh-Daghestanian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "ssy", "language_name": "Saho", "autonym": "Saho", "speakers": 218923, "family": "Afro-Asiatic", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "dtm", "language_name": "Tomo Kan Dogon", "autonym": "Tomo Kan Dogon", "speakers": 215087, "family": "Dogon", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "pap", "language_name": "Papiamento", "autonym": "Papiamentu", "speakers": 211640, "family": "Indo-European", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "syr", "language_name": "Syriac", "autonym": "ܣܘܪܝܝܐ", "speakers": 210659, "family": "Afro-Asiatic", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "tog", "language_name": "Nyasa Tonga", "autonym": "Nyasa Tonga", "speakers": 207727, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "maf", "language_name": "Mafa", "autonym": "Mafa", "speakers": 205313, "family": "Afro-Asiatic", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "puu", "language_name": "Punu", "autonym": "Punu", "speakers": 200782, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "kcg", "language_name": "Tyap", "autonym": "Katab", "speakers": 199046, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "kao", "language_name": "Xaasongaxango", "autonym": "Xaasongaxango", "speakers": 195534, "family": "Mande", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "tyv", "language_name": "Tuvinian", "autonym": "Tuvinian", "speakers": 184239, "family": "Turkic", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "dtp", "language_name": "Central Dusun", "autonym": "Central Dusun", "speakers": 182852, "family": "Austronesian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "ria", "language_name": "Riang (India)", "autonym": "Riang (India)", "speakers": 172392, "family": "Sino-Tibetan", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "swb", "language_name": "Comorian", "autonym": "Comorian", "speakers": 170720, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "bmq", "language_name": "Bomu", "autonym": "Bomu", "speakers": 168159, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "ltg", "language_name": "Latgalian", "autonym": "Latgalian", "speakers": 167429, "family": "Indo-European", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "nv", "language_name": "Navajo", "autonym": "Diné Bizaad", "speakers": 166320, "family": "Athabaskan-Eyak-Tlingit", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "bze", "language_name": "Jenaama Bozo", "autonym": "Jenaama Bozo", "speakers": 166204, "family": "Mande", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "co", "language_name": "Corsican", "autonym": "Corsu", "speakers": 162836, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "bfd", "language_name": "Bafut", "autonym": "Bafut", "speakers": 158146, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "xsr", "language_name": "Sherpa", "autonym": "Sherpa", "speakers": 157705, "family": "Sino-Tibetan", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "kiu", "language_name": "Kirmanjki", "autonym": "Kirmanjki", "speakers": 155833, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "ho", "language_name": "Hiri Motu", "autonym": "Hiri Motu", "speakers": 152449, "family": "Pidgin", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "kkj", "language_name": "Kako", "autonym": "Kakɔ", "speakers": 149823, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "bss", "language_name": "Akoose", "autonym": "Akoose", "speakers": 149823, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "sly", "language_name": "Selayar", "autonym": "Selayar", "speakers": 144194, "family": "Austronesian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "mi", "language_name": "Māori", "autonym": "Māori", "speakers": 137913, "family": "Austronesian", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "rjs", "language_name": "Rajbanshi", "autonym": "Rajbanshi", "speakers": 133443, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "dua", "language_name": "Duala", "autonym": "Duálá", "speakers": 133176, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "guc", "language_name": "Wayuu", "autonym": "Wayuu", "speakers": 132529, "family": "Arawakan", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "vai", "language_name": "Vai", "autonym": "ꕙꔤ", "speakers": 131906, "family": "Mande", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "taj", "language_name": "Eastern Tamang", "autonym": "Eastern Tamang", "speakers": 130410, "family": "Sino-Tibetan", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "mgo", "language_name": "Metaʼ", "autonym": "Metaʼ", "speakers": 130401, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "pdc", "language_name": "Pennsylvania German", "autonym": "Pennsylvania German", "speakers": 129729, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "rwk", "language_name": "Rwa", "autonym": "Kiruwa", "speakers": 128816, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "trw", "language_name": "Torwali", "autonym": "توروالی", "speakers": 123756, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "mfv", "language_name": "Mandjak", "autonym": "Mandjak", "speakers": 121170, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "tsj", "language_name": "Tshangla", "autonym": "Tshangla", "speakers": 117348, "family": "Sino-Tibetan", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "sbp", "language_name": "Sangu", "autonym": "Ishisangu", "speakers": 117106, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "krl", "language_name": "Karelian", "autonym": "Karelian", "speakers": 116212, "family": "Uralic", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "lad", "language_name": "Ladino", "autonym": "Ladino", "speakers": 112781, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "ife", "language_name": "Ifè", "autonym": "Ifè", "speakers": 111910, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "gag", "language_name": "Gagauz", "autonym": "Gagauz", "speakers": 111028, "family": "Turkic", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "lbe", "language_name": "Lak", "autonym": "Lak", "speakers": 110543, "family": "Nakh-Daghestanian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "sdc", "language_name": "Sassarese Sardinian", "autonym": "Sassarese Sardinian", "speakers": 106085, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "to", "language_name": "Tongan", "autonym": "Lea Fakatonga", "speakers": 100790, "family": "Austronesian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "bjt", "language_name": "Balanta-Ganja", "autonym": "Balanta-Ganja", "speakers": 95992, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "jgo", "language_name": "Ngomba", "autonym": "Ndaꞌa", "speakers": 94333, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "crs", "language_name": "Seselwa Creole French", "autonym": "Seselwa Creole French", "speakers": 94061, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "ab", "language_name": "Abkhazian", "autonym": "Аԥсшәа", "speakers": 91953, "family": "Abkhaz-Adyge", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "ty", "language_name": "Tahitian", "autonym": "Tahitian", "speakers": 91488, "family": "Austronesian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "iu", "language_name": "Inuktitut", "autonym": "Inuktitut", "speakers": 90466, "family": "Eskimo-Aleut", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "pdt", "language_name": "Plautdietsch", "autonym": "Plautdietsch", "speakers": 90466, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "bpy", "language_name": "Bishnupriya", "autonym": "Bishnupriya", "speakers": 90174, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "ksf", "language_name": "Bafia", "autonym": "Rikpa", "speakers": 88784, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "gvr", "language_name": "Gurung", "autonym": "Gurung", "speakers": 87951, "family": "Sino-Tibetan", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "cjm", "language_name": "Eastern Cham", "autonym": "Eastern Cham", "speakers": 87862, "family": "Austronesian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "lcp", "language_name": "Western Lawa", "autonym": "Western Lawa", "speakers": 87751, "family": "Austroasiatic", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "knf", "language_name": "Mankanya", "autonym": "Mankanya", "speakers": 83151, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "lep", "language_name": "Lepcha", "autonym": "Lepcha", "speakers": 79743, "family": "Sino-Tibetan", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "byn", "language_name": "Blin", "autonym": "Blin", "speakers": 79056, "family": "Afro-Asiatic", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "btv", "language_name": "Bateri", "autonym": "Bateri", "speakers": 78843, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "tkt", "language_name": "Kathoriya Tharu", "autonym": "Kathoriya Tharu", "speakers": 72787, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "gd", "language_name": "Scottish Gaelic", "autonym": "Gàidhlig", "speakers": 72337, "family": "Indo-European", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "fo", "language_name": "Faroese", "autonym": "Føroyskt", "speakers": 71351, "family": "Indo-European", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "vro", "language_name": "Võro", "autonym": "Võro", "speakers": 70031, "family": "Uralic", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "ken", "language_name": "Kenyang", "autonym": "Kɛnyaŋ", "speakers": 69362, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "gil", "language_name": "Gilbertese", "autonym": "Gilbertese", "speakers": 67078, "family": "Austronesian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "bvb", "language_name": "Bube", "autonym": "Bube", "speakers": 66058, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "mwv", "language_name": "Mentawai", "autonym": "Mentawai", "speakers": 64086, "family": "Austronesian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "frp", "language_name": "Arpitan", "autonym": "Arpitan", "speakers": 63777, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "koi", "language_name": "Komi-Permyak", "autonym": "Komi-Permyak", "speakers": 63775, "family": "Uralic", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "kfo", "language_name": "Koro", "autonym": "Koro", "speakers": 63207, "family": "Mande", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "mh", "language_name": "Marshallese", "autonym": "Marshallese", "speakers": 56879, "family": "Austronesian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "fit", "language_name": "Tornedalen Finnish", "autonym": "Tornedalen Finnish", "speakers": 56114, "family": "Uralic", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "kl", "language_name": "Kalaallisut", "autonym": "Kalaallisut", "speakers": 55440, "family": "Eskimo-Aleut", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "bra", "language_name": "Braj", "autonym": "Braj", "speakers": 54370, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "gcr", "language_name": "Guianese Creole French", "autonym": "Guianese Creole French", "speakers": 51872, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "se", "language_name": "Northern Sami", "autonym": "Davvisámegiella", "speakers": 51530, "family": "Uralic", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "blo", "language_name": "Anii", "autonym": "Anii Kagɩja", "speakers": 51507, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "kgp", "language_name": "Kaingang", "autonym": "Kanhgág", "speakers": 50812, "family": "Nuclear-Macro-Je", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "csb", "language_name": "Kashubian", "autonym": "Kashubian", "speakers": 49767, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "bqv", "language_name": "Koro Wachi", "autonym": "Koro Wachi", "speakers": 46718, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "ch", "language_name": "Chamorro", "autonym": "Chamorro", "speakers": 46325, "family": "Austronesian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "cch", "language_name": "Atsam", "autonym": "Atsam", "speakers": 44946, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "buc", "language_name": "Bushi", "autonym": "Bushi", "speakers": 44620, "family": "Austronesian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "rm", "language_name": "Romansh", "autonym": "Rumantsch", "speakers": 42020, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "agq", "language_name": "Aghem", "autonym": "Aghem", "speakers": 38843, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "kxv", "language_name": "Kuvi", "autonym": "Kuvi", "speakers": 38457, "family": "Dravidian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "snf", "language_name": "Noon", "autonym": "Noon", "speakers": 37767, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "fur", "language_name": "Friulian", "autonym": "Furlan", "speakers": 37442, "family": "Indo-European", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "tdh", "language_name": "Thulung", "autonym": "Thulung", "speakers": 36393, "family": "Sino-Tibetan", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "egl", "language_name": "Emilian", "autonym": "Emilian", "speakers": 31201, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "chk", "language_name": "Chuukese", "autonym": "Chuukese", "speakers": 30731, "family": "Austronesian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "mrj", "language_name": "Western Mari", "autonym": "Western Mari", "speakers": 29762, "family": "Uralic", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "haw", "language_name": "Hawaiian", "autonym": "ʻŌlelo HawaiʻI", "speakers": 29605, "family": "Austronesian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "mro", "language_name": "Mru", "autonym": "Mru", "speakers": 29277, "family": "Sino-Tibetan", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "frc", "language_name": "Cajun French", "autonym": "Cajun French", "speakers": 27942, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "yrl", "language_name": "Nheengatu", "autonym": "Nheẽgatu", "speakers": 26171, "family": "Tupian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "an", "language_name": "Aragonese", "autonym": "Aragonés", "speakers": 26008, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "chr", "language_name": "Cherokee", "autonym": "Ꮳꮃꭹ", "speakers": 25613, "family": "Iroquoian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "rmo", "language_name": "Sinte Romani", "autonym": "Sinte Romani", "speakers": 24372, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "oj", "language_name": "Ojibwa", "autonym": "Ojibwa", "speakers": 23747, "family": "Algic", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "pon", "language_name": "Pohnpeian", "autonym": "Pohnpeian", "speakers": 23560, "family": "Austronesian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "lzz", "language_name": "Laz", "autonym": "Laz", "speakers": 22965, "family": "Kartvelian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "ttt", "language_name": "Muslim Tat", "autonym": "Muslim Tat", "speakers": 22453, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "esu", "language_name": "Central Yupik", "autonym": "Central Yupik", "speakers": 20956, "family": "Eskimo-Aleut", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "dak", "language_name": "Dakota", "autonym": "Dakota", "speakers": 20832, "family": "Siouan", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "alt", "language_name": "Southern Altai", "autonym": "Southern Altai", "speakers": 19841, "family": "Turkic", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "amo", "language_name": "Amo", "autonym": "Amo", "speakers": 18620, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "gub", "language_name": "Guajajára", "autonym": "Guajajára", "speakers": 17784, "family": "Tupian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "hnn", "language_name": "Hanunoo", "autonym": "Hanunoo", "speakers": 17469, "family": "Austronesian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "tkr", "language_name": "Tsakhur", "autonym": "Tsakhur", "speakers": 16329, "family": "Nakh-Daghestanian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "pau", "language_name": "Palauan", "autonym": "Palauan", "speakers": 16047, "family": "Austronesian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "sa", "language_name": "Sanskrit", "autonym": "संस्कृत भाषा", "speakers": 15913, "family": "Indo-European", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "bsc", "language_name": "Bassari", "autonym": "Bassari", "speakers": 15264, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "ojs", "language_name": "Oji-Cree", "autonym": "Oji-Cree", "speakers": 15078, "family": "Algic", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "kht", "language_name": "Khamti", "autonym": "Khamti", "speakers": 13527, "family": "Tai-Kadai", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "hsb", "language_name": "Upper Sorbian", "autonym": "Hornjoserbšćina", "speakers": 12826, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "chp", "language_name": "Chipewyan", "autonym": "Chipewyan", "speakers": 12816, "family": "Athabaskan-Eyak-Tlingit", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "moe", "language_name": "Innu-aimun", "autonym": "Innu-Aimun", "speakers": 12062, "family": "Algic", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "sli", "language_name": "Lower Silesian", "autonym": "Lower Silesian", "speakers": 11868, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "wae", "language_name": "Walser", "autonym": "Walser", "speakers": 11377, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "cho", "language_name": "Choctaw", "autonym": "Chahta", "speakers": 10977, "family": "Muskogean", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "tbw", "language_name": "Tagbanwa", "autonym": "Tagbanwa", "speakers": 10045, "family": "Austronesian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "xav", "language_name": "Xavánte", "autonym": "Xavánte", "speakers": 9951, "family": "Nuclear-Macro-Je", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "tvl", "language_name": "Tuvalu", "autonym": "Tuvalu", "speakers": 9868, "family": "Austronesian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "frr", "language_name": "Northern Frisian", "autonym": "Nordfriisk", "speakers": 9619, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "rug", "language_name": "Roviana", "autonym": "Roviana", "speakers": 9591, "family": "Austronesian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "wls", "language_name": "Wallisian", "autonym": "Wallisian", "speakers": 9512, "family": "Austronesian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "rmu", "language_name": "Tavringer Romani", "autonym": "Tavringer Romani", "speakers": 9488, "family": "Speech Register", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "cr", "language_name": "Cree", "autonym": "Cree", "speakers": 9047, "family": "Algic", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "nmg", "language_name": "Kwasio", "autonym": "Kwasio", "speakers": 8878, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "lkt", "language_name": "Lakota", "autonym": "LakȟólʼIyapi", "speakers": 8316, "family": "Siouan", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "kos", "language_name": "Kosraean", "autonym": "Kosraean", "speakers": 7990, "family": "Austronesian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "ik", "language_name": "Inupiaq", "autonym": "Inupiaq", "speakers": 7983, "family": "Eskimo-Aleut", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "gbz", "language_name": "Zoroastrian Dari", "autonym": "Zoroastrian Dari", "speakers": 7983, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "twq", "language_name": "Tasawaq", "autonym": "Tasawaq Senni", "speakers": 7970, "family": "Songhay", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "bku", "language_name": "Buhid", "autonym": "Buhid", "speakers": 7970, "family": "Austronesian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "mic", "language_name": "Mi'kmaw", "autonym": "LʼNuiʼSuti", "speakers": 7916, "family": "Algic", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "mey", "language_name": "Hassaniyya", "autonym": "Hassaniyya", "speakers": 7239, "family": "Afro-Asiatic", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "dsb", "language_name": "Lower Sorbian", "autonym": "Dolnoserbšćina", "speakers": 6974, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "na", "language_name": "Nauru", "autonym": "Nauru", "speakers": 6930, "family": "Austronesian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "lwl", "language_name": "Eastern Lawa", "autonym": "Eastern Lawa", "speakers": 6898, "family": "Austroasiatic", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "yap", "language_name": "Yapese", "autonym": "Yapese", "speakers": 6556, "family": "Austronesian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "atj", "language_name": "Atikamekw", "autonym": "Atikamekw", "speakers": 6408, "family": "Algic", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "pms", "language_name": "Piedmontese", "autonym": "Piedmontese", "speakers": 6178, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "rmf", "language_name": "Kalo Finnish Romani", "autonym": "Kalo Finnish Romani", "speakers": 5015, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "bla", "language_name": "Siksiká", "autonym": "Siksiká", "speakers": 4900, "family": "Algic", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "fud", "language_name": "East Futuna", "autonym": "East Futuna", "speakers": 4756, "family": "Austronesian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "trv", "language_name": "Taroko", "autonym": "Patas Taroko", "speakers": 4721, "family": "Austronesian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "crk", "language_name": "Plains Cree", "autonym": "Plains Cree", "speakers": 4146, "family": "Algic", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "saf", "language_name": "Safaliba", "autonym": "Safaliba", "speakers": 4108, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "mus", "language_name": "Muscogee", "autonym": "Mvskoke", "speakers": 3992, "family": "Muskogean", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "vep", "language_name": "Veps", "autonym": "Veps", "speakers": 3543, "family": "Uralic", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "tnr", "language_name": "Ménik", "autonym": "Ménik", "speakers": 3305, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "vic", "language_name": "Virgin Islands Creole English", "autonym": "Virgin Islands Creole English", "speakers": 3113, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "tru", "language_name": "Turoyo", "autonym": "Turoyo", "speakers": 3035, "family": "Afro-Asiatic", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "uli", "language_name": "Ulithian", "autonym": "Ulithian", "speakers": 2971, "family": "Austronesian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "rtm", "language_name": "Rotuman", "autonym": "Rotuman", "speakers": 2527, "family": "Austronesian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "wbp", "language_name": "Warlpiri", "autonym": "Warlpiri", "speakers": 2496, "family": "Pama-Nyungan", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "yav", "language_name": "Yangben", "autonym": "Nuasue", "speakers": 2303, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "den", "language_name": "Slave", "autonym": "Slave", "speakers": 2299, "family": "Athabaskan-Eyak-Tlingit", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "dgr", "language_name": "Dogrib", "autonym": "Dogrib", "speakers": 2111, "family": "Athabaskan-Eyak-Tlingit", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "frs", "language_name": "Eastern Frisian", "autonym": "Eastern Frisian", "speakers": 2004, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "kw", "language_name": "Cornish", "autonym": "Kernewek", "speakers": 1973, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "csw", "language_name": "Swampy Cree", "autonym": "ᓀᐦᐃᓇᐍᐏᐣ", "speakers": 1809, "family": "Algic", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "moh", "language_name": "Mohawk", "autonym": "KanienʼKéha", "speakers": 1772, "family": "Iroquoian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "gv", "language_name": "Manx", "autonym": "Gaelg", "speakers": 1719, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "smj", "language_name": "Lule Sami", "autonym": "Julevsámegiella", "speakers": 1530, "family": "Uralic", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "nsk", "language_name": "Naskapi", "autonym": "Naskapi", "speakers": 1395, "family": "Algic", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "tkl", "language_name": "Tokelau", "autonym": "Tokelau", "speakers": 1285, "family": "Austronesian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "niu", "language_name": "Niuean", "autonym": "Niuean", "speakers": 1120, "family": "Austronesian", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "stq", "language_name": "Saterland Frisian", "autonym": "Saterland Frisian", "speakers": 962, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "sei", "language_name": "Seri", "autonym": "Seri", "speakers": 901, "family": null, "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "clc", "language_name": "Chilcotin", "autonym": "Chilcotin", "speakers": 867, "family": "Athabaskan-Eyak-Tlingit", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "la", "language_name": "Latin", "autonym": "Lingua Latina", "speakers": 820, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "hur", "language_name": "Halkomelem", "autonym": "Halkomelem", "speakers": 716, "family": "Salishan", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "crg", "language_name": "Michif", "autonym": "Michif", "speakers": 678, "family": "Algic", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "sms", "language_name": "Skolt Sami", "autonym": "SääʹMǩiõll", "speakers": 613, "family": "Uralic", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "smn", "language_name": "Inari Sami", "autonym": "Anarâškielâ", "speakers": 613, "family": "Uralic", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "lil", "language_name": "Lillooet", "autonym": "Lillooet", "speakers": 528, "family": "Salishan", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "oka", "language_name": "Okanagan", "autonym": "Okanagan", "speakers": 490, "family": "Salishan", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "pqm", "language_name": "Maliseet-Passamaquoddy", "autonym": "Maliseet-Passamaquoddy", "speakers": 490, "family": "Algic", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "kwk", "language_name": "Kwakʼwala", "autonym": "KwakʼWala", "speakers": 377, "family": "Wakashan", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "crl", "language_name": "Northern East Cree", "autonym": "Northern East Cree", "speakers": 377, "family": "Algic", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "gwi", "language_name": "Gwichʼin", "autonym": "GwichʼIn", "speakers": 302, "family": "Athabaskan-Eyak-Tlingit", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "eo", "language_name": "Esperanto", "autonym": "Esperanto", "speakers": 301, "family": "Artificial Language", "average": 0.0, "in_benchmark": true, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "sma", "language_name": "Southern Sami", "autonym": "Åarjelsaemien Gïele", "speakers": 296, "family": "Uralic", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "tsd", "language_name": "Tsakonian", "autonym": "Tsakonian", "speakers": 202, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "izh", "language_name": "Ingrian", "autonym": "Ingrian", "speakers": 142, "family": "Uralic", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "ia", "language_name": "Interlingua", "autonym": "Interlingua", "speakers": 136, "family": "Artificial Language", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "aro", "language_name": "Araona", "autonym": "Araona", "speakers": 105, "family": "Pano-Tacanan", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "prg", "language_name": "Prussian", "autonym": "Prūsiskan", "speakers": 38, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "ie", "language_name": "Interlingue", "autonym": "Interlingue", "speakers": 1, "family": "Artificial Language", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "lzh", "language_name": "Literary Chinese", "autonym": "Literary Chinese", "speakers": 0, "family": "Sino-Tibetan", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "io", "language_name": "Ido", "autonym": "Ido", "speakers": 0, "family": "Artificial Language", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "jbo", "language_name": "Lojban", "autonym": "La .Lojban.", "speakers": 0, "family": "Artificial Language", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "jut", "language_name": "Jutish", "autonym": "Jutish", "speakers": 0, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "vot", "language_name": "Votic", "autonym": "Votic", "speakers": 0, "family": "Uralic", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "gez", "language_name": "Geez", "autonym": "Geez", "speakers": 0, "family": "Afro-Asiatic", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "osa", "language_name": "Osage", "autonym": "𐓏𐓘𐓻𐓘𐓻𐓟", "speakers": 0, "family": "Siouan", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "rgn", "language_name": "Romagnol", "autonym": "Romagnol", "speakers": 0, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "cu", "language_name": "Church Slavic", "autonym": "Church Slavic", "speakers": 0, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "sgs", "language_name": "Samogitian", "autonym": "Samogitian", "speakers": 0, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "ann", "language_name": "Obolo", "autonym": "Obolo", "speakers": 0, "family": "Atlantic-Congo", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "cic", "language_name": "Chickasaw", "autonym": "Chikashshanompaʼ", "speakers": 0, "family": "Muskogean", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "cad", "language_name": "Caddo", "autonym": "Caddo", "speakers": 0, "family": "Caddoan", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 }, { "bcp_47": "pfl", "language_name": "Palatine German", "autonym": "Palatine German", "speakers": 0, "family": "Indo-European", "average": 0.0, "in_benchmark": false, "NaN": 0.0, "classification_accuracy": 0.0, "language_modeling_chrf": 0.0, "translation_bleu": 0.0, "translation_chrf": 0.0 } ], "dataset_table": [ { "name": "FLORES+", "author": "Meta", "author_url": "https://ai.meta.com", "url": "https://huggingface.co/datasets/openlanguagedata/flores_plus", "n_languages": 200, "tasks": [ "translation", "classification", "language_modeling" ], "parallel": 1.0, "base": "FLORES", "implemented": 1.0 }, { "name": "FLEURS", "author": "Meta", "author_url": "https://ai.meta.com", "url": "https://huggingface.co/datasets/google/fleurs", "n_languages": 102, "tasks": [ "speech_recognition" ], "parallel": 1.0, "base": "FLORES", "implemented": 1.0 }, { "name": "CommonVoice", "author": "Mozilla", "author_url": "https://mozilla.ai", "url": "https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0", "n_languages": 124, "tasks": [ "speech_recognition" ], "parallel": null, "base": null, "implemented": null }, { "name": "MMMLU", "author": "OpenAI", "author_url": "https://openai.com", "url": "https://huggingface.co/datasets/openai/MMMLU", "n_languages": 14, "tasks": [ "question_answering" ], "parallel": 1.0, "base": "MMLU", "implemented": null }, { "name": "AfriMMLU", "author": "Masakhane", "author_url": "https://www.masakhane.io", "url": "https://huggingface.co/datasets/masakhane/afrimmlu", "n_languages": 17, "tasks": [ "question_answering" ], "parallel": 1.0, "base": "MMLU", "implemented": null }, { "name": "Okapi MMLU", "author": "Academic", "author_url": null, "url": "https://huggingface.co/datasets/jon-tow/okapi_mmlu", "n_languages": 16, "tasks": [ "question_answering" ], "parallel": 1.0, "base": "MMLU", "implemented": null }, { "name": "Global MMLU", "author": "Cohere", "author_url": "https://cohere.com", "url": "https://huggingface.co/datasets/CohereForAI/Global-MMLU", "n_languages": 42, "tasks": [ "question_answering" ], "parallel": 1.0, "base": "MMLU", "implemented": null }, { "name": "MGSM", "author": "Google", "author_url": "https://google.com", "url": "https://huggingface.co/datasets/juletxara/mgsm", "n_languages": 10, "tasks": [ "math" ], "parallel": 1.0, "base": "MGSM", "implemented": null }, { "name": "AfriMGSM", "author": "Masakhane", "author_url": "https://www.masakhane.io", "url": "https://huggingface.co/datasets/masakhane/afrimgsm", "n_languages": 18, "tasks": [ "math" ], "parallel": 1.0, "base": "MGSM", "implemented": null }, { "name": "Okapi ARC Challenge", "author": "Academic", "author_url": null, "url": "https://huggingface.co/datasets/jon-tow/okapi_arc_challenge", "n_languages": 31, "tasks": [ "question_answering" ], "parallel": 1.0, "base": "AI2 ARC", "implemented": null }, { "name": "Uhuru ARC Easy", "author": "Masakhane", "author_url": "https://www.masakhane.io", "url": "https://huggingface.co/datasets/masakhane/uhura-arc-easy", "n_languages": 6, "tasks": [ "question_answering" ], "parallel": 1.0, "base": "AI2 ARC", "implemented": null }, { "name": "Okapi TruthfulQA", "author": "Academic", "author_url": null, "url": "https://huggingface.co/datasets/jon-tow/okapi_truthfulqa/tree/main/data", "n_languages": 31, "tasks": [ "question_answering" ], "parallel": 1.0, "base": "TruthfulQA", "implemented": null }, { "name": "Uhura TruthfulQA", "author": "Masakhane", "author_url": "https://www.masakhane.io", "url": "https://huggingface.co/datasets/masakhane/uhura-truthfulqa", "n_languages": 6, "tasks": [ "question_answering" ], "parallel": 1.0, "base": "TruthfulQA", "implemented": null }, { "name": "XNLI", "author": "Meta", "author_url": "https://ai.meta.com", "url": "https://huggingface.co/datasets/facebook/xnli", "n_languages": 14, "tasks": [ "classification" ], "parallel": 1.0, "base": "XNLI", "implemented": null }, { "name": "AfriXNLI", "author": "Masakhane", "author_url": "https://www.masakhane.io", "url": "https://huggingface.co/datasets/masakhane/afrixnli", "n_languages": 18, "tasks": [ "classification" ], "parallel": 1.0, "base": "XNLI", "implemented": null }, { "name": "Okapi HellaSwag", "author": "Academic", "author_url": null, "url": "https://huggingface.co/datasets/jon-tow/okapi_hellaswag", "n_languages": 31, "tasks": [ "question_answering" ], "parallel": 1.0, "base": "HellaSwag", "implemented": null }, { "name": "WikiANN / PAN-X", "author": "Academic", "author_url": null, "url": "https://huggingface.co/datasets/unimelb-nlp/wikiann", "n_languages": 176, "tasks": [ "ner" ], "parallel": 0.0, "base": null, "implemented": null }, { "name": "MSVAMP", "author": "Microsoft", "author_url": "https://microsoft.com", "url": "https://huggingface.co/datasets/Mathoctopus/MSVAMP", "n_languages": 10, "tasks": [ "math" ], "parallel": 1.0, "base": null, "implemented": null }, { "name": "XLSUM", "author": "Academic", "author_url": null, "url": "https://huggingface.co/datasets/csebuetnlp/xlsum", "n_languages": 45, "tasks": [ "summarization" ], "parallel": 1.0, "base": null, "implemented": null }, { "name": "SEA-IFEVAL", "author": "AI Singapore", "author_url": "https://aisingapore.org", "url": "https://huggingface.co/datasets/aisingapore/instruction_following-ifeval", "n_languages": 7, "tasks": [ "instruction_following" ], "parallel": 1.0, "base": "IFEVAL", "implemented": null }, { "name": "XTREME", "author": "Google", "author_url": "https://google.com", "url": "https://huggingface.co/datasets/google/xtreme", "n_languages": 40, "tasks": [ "translation", "classification", "question_answering", "ner" ], "parallel": null, "base": null, "implemented": null }, { "name": "XGLUE", "author": "Microsoft", "author_url": "https://microsoft.com", "url": "https://huggingface.co/datasets/microsoft/xglue", "n_languages": 18, "tasks": [ "pos" ], "parallel": null, "base": "GLUE", "implemented": null }, { "name": "IndicGLUE", "author": "AI4Bharat", "author_url": "https://models.ai4bharat.org", "url": "https://huggingface.co/datasets/ai4bharat/indic_glue", "n_languages": 11, "tasks": [ "question_answering" ], "parallel": null, "base": "GLUE", "implemented": null }, { "name": "Opus Gnome", "author": "Helsinki NLP", "author_url": null, "url": "https://huggingface.co/datasets/Helsinki-NLP/opus_gnome", "n_languages": 187, "tasks": [ "translation" ], "parallel": 1.0, "base": null, "implemented": null }, { "name": "Opus Paracrawl", "author": "Helsinki NLP", "author_url": null, "url": "https://huggingface.co/datasets/Helsinki-NLP/opus_paracrawl", "n_languages": 43, "tasks": [ "translation" ], "parallel": 0.0, "base": null, "implemented": null }, { "name": "CCAligned", "author": "Meta", "author_url": "https://ai.meta.com", "url": "https://huggingface.co/datasets/ahelk/ccaligned_multilingual", "n_languages": 137, "tasks": [ "translation" ], "parallel": 0.0, "base": null, "implemented": null }, { "name": "OPUS Collection", "author": "Helsinki NLP", "author_url": null, "url": "https://opus.nlpl.eu", "n_languages": 747, "tasks": [ "translation" ], "parallel": 0.0, "base": null, "implemented": null }, { "name": "MasakhaNER", "author": "Masakhane", "author_url": "https://www.masakhane.io", "url": "https://huggingface.co/datasets/masakhane/masakhaner", "n_languages": 10, "tasks": [ "ner" ], "parallel": null, "base": null, "implemented": null }, { "name": "Multilingual Sentiments", "author": "Academic", "author_url": null, "url": "https://huggingface.co/datasets/tyqiangz/multilingual-sentiments", "n_languages": 12, "tasks": [ "sentiment_analysis" ], "parallel": null, "base": null, "implemented": null }, { "name": "CulturaX", "author": "Academic", "author_url": null, "url": "https://huggingface.co/datasets/uonlp/CulturaX", "n_languages": 167, "tasks": [ "language_modeling" ], "parallel": 0.0, "base": null, "implemented": null }, { "name": "Tülu 3 SFT Mixture", "author": "AllenAI", "author_url": "https://allenai.org", "url": "https://huggingface.co/datasets/allenai/tulu-3-sft-mixture", "n_languages": 70, "tasks": [ "instruction_following" ], "parallel": 0.0, "base": null, "implemented": null }, { "name": "xP3", "author": "BigScience", "author_url": "https://bigscience.huggingface.co", "url": "https://huggingface.co/datasets/bigscience/xP3", "n_languages": 46, "tasks": [ "instruction_following" ], "parallel": 0.0, "base": null, "implemented": null }, { "name": "Aya", "author": "Cohere", "author_url": "https://cohere.com", "url": "https://huggingface.co/datasets/CohereForAI/aya_dataset", "n_languages": 65, "tasks": [ "instruction_following" ], "parallel": null, "base": null, "implemented": null }, { "name": "Lanfrica", "author": "Lanfrica", "author_url": "https://lanfrica.com", "url": "https://lanfrica.com/records?language=yor&task=machine%20translation", "n_languages": 2200, "tasks": [ "datasets" ], "parallel": null, "base": null, "implemented": null }, { "name": "HuggingFace Languages", "author": "HuggingFace", "author_url": "https://huggingface.co", "url": "https://huggingface.co/languages", "n_languages": 4680, "tasks": [ "datasets", "models" ], "parallel": null, "base": null, "implemented": null }, { "name": "HuggingFace Multilingual Datasets", "author": "HuggingFace", "author_url": "https://huggingface.co", "url": "https://huggingface.co/datasets?other=multilinguality:multilingual", "n_languages": 2012, "tasks": [ "datasets" ], "parallel": 0.0, "base": null, "implemented": null } ], "countries": { "AC": { "score": 0.47, "languages": [ { "name": "English", "bcp_47": "en", "population": 931, "score": 0.47 } ] }, "AE": { "score": 0.39591834659201586, "languages": [ { "name": "English", "bcp_47": "en", "population": 4996040, "score": 0.47 }, { "name": "Arabic", "bcp_47": "ar", "population": 7793822, "score": 0.42 }, { "name": "Persian", "bcp_47": "fa", "population": 189850, "score": 0.0 }, { "name": "Pashto", "bcp_47": "ps", "population": 289770, "score": 0.0 }, { "name": "Malayalam", "bcp_47": "ml", "population": 699446, "score": 0.0 }, { "name": "Baluchi", "bcp_47": "bal", "population": 229818, "score": 0.0 } ] }, "AG": { "score": 0.4698173362013836, "languages": [ { "name": "English", "bcp_47": "en", "population": 84434, "score": 0.47 }, { "name": "Portuguese", "bcp_47": "pt", "population": 1571, "score": 0.46 } ] }, "AI": { "score": 0.47, "languages": [ { "name": "English", "bcp_47": "en", "population": 17186, "score": 0.47 } ] }, "AQ": { "score": 0.47, "languages": [ { "name": "English", "bcp_47": "en", "population": 300, "score": 0.47 } ] }, "AR": { "score": 0.45083230214508235, "languages": [ { "name": "English", "bcp_47": "en", "population": 3183537, "score": 0.47 }, { "name": "Spanish", "bcp_47": "es", "population": 45479100, "score": 0.45 }, { "name": "Guarani", "bcp_47": "gn", "population": 21375, "score": 0.0 }, { "name": "Welsh", "bcp_47": "cy", "population": 30016, "score": 0.0 } ] }, "AS": { "score": 0.23260142212865204, "languages": [ { "name": "English", "bcp_47": "en", "population": 47954, "score": 0.47 }, { "name": "Samoan", "bcp_47": "sm", "population": 48943, "score": 0.0 } ] }, "AT": { "score": 0.13725900574384256, "languages": [ { "name": "English", "bcp_47": "en", "population": 6467398, "score": 0.47 }, { "name": "French", "bcp_47": "fr", "population": 974540, "score": 0.46 }, { "name": "German", "bcp_47": "de", "population": 8593666, "score": 0.0 }, { "name": "Italian", "bcp_47": "it", "population": 797350, "score": 0.0 }, { "name": "Bavarian", "bcp_47": "bar", "population": 8416478, "score": 0.0 }, { "name": "Hungarian", "bcp_47": "hu", "population": 23035, "score": 0.0 }, { "name": "Croatian", "bcp_47": "hr", "population": 106313, "score": 0.0 }, { "name": "Slovenian", "bcp_47": "sl", "population": 32780, "score": 0.0 } ] }, "AU": { "score": 0.46077520536342514, "languages": [ { "name": "English", "bcp_47": "en", "population": 24447840, "score": 0.47 }, { "name": "Chinese", "bcp_47": "zh", "population": 534796, "score": 0.46 }, { "name": "Italian", "bcp_47": "it", "population": 483864, "score": 0.0 }, { "name": "Hmong Njua", "bcp_47": "hnj", "population": 2190, "score": 0.0 }, { "name": "Warlpiri", "bcp_47": "wbp", "population": 2496, "score": 0.0 } ] }, "AW": { "score": 0.0073216055759017535, "languages": [ { "name": "English", "bcp_47": "en", "population": 2986, "score": 0.47 }, { "name": "Dutch", "bcp_47": "nl", "population": 115845, "score": 0.0 }, { "name": "Papiamento", "bcp_47": "pap", "population": 72851, "score": 0.0 } ] }, "BA": { "score": 0.07690910954274856, "languages": [ { "name": "English", "bcp_47": "en", "population": 1726016, "score": 0.47 }, { "name": "Serbian", "bcp_47": "sr", "population": 767118, "score": 0.0 }, { "name": "Bosnian", "bcp_47": "bs", "population": 7594468, "score": 0.0 }, { "name": "Croatian", "bcp_47": "hr", "population": 460271, "score": 0.0 } ] }, "BB": { "score": 0.4699999999999999, "languages": [ { "name": "English", "bcp_47": "en", "population": 294560, "score": 0.47 } ] }, "BD": { "score": 0.3554705133359761, "languages": [ { "name": "English", "bcp_47": "en", "population": 29277180, "score": 0.47 }, { "name": "Bangla", "bcp_47": "bn", "population": 159397980, "score": 0.38 }, { "name": "Burmese", "bcp_47": "my", "population": 341567, "score": 0.0 }, { "name": "Rangpuri", "bcp_47": "rkt", "population": 10572315, "score": 0.0 }, { "name": "Sylheti", "bcp_47": "syl", "population": 8132550, "score": 0.0 }, { "name": "Rohingya", "bcp_47": "rhg", "population": 862050, "score": 0.0 }, { "name": "Manipuri", "bcp_47": "mni", "population": 17892, "score": 0.0 }, { "name": "Garo", "bcp_47": "grt", "population": 118735, "score": 0.0 }, { "name": "Chakma", "bcp_47": "ccp", "population": 357832, "score": 0.0 }, { "name": "Mru", "bcp_47": "mro", "population": 29277, "score": 0.0 } ] }, "BE": { "score": 0.23819809898359195, "languages": [ { "name": "English", "bcp_47": "en", "population": 6915213, "score": 0.47 }, { "name": "French", "bcp_47": "fr", "population": 4453866, "score": 0.46 }, { "name": "German", "bcp_47": "de", "population": 2578554, "score": 0.0 }, { "name": "Dutch", "bcp_47": "nl", "population": 6446385, "score": 0.0 }, { "name": "West Flemish", "bcp_47": "vls", "population": 1172070, "score": 0.0 }, { "name": "Walloon", "bcp_47": "wa", "population": 679801, "score": 0.0 } ] }, "BG": { "score": 0.07035928143712575, "languages": [ { "name": "English", "bcp_47": "en", "population": 1741725, "score": 0.47 }, { "name": "Russian", "bcp_47": "ru", "population": 1602387, "score": 0.0 }, { "name": "German", "bcp_47": "de", "population": 557352, "score": 0.0 }, { "name": "Turkish", "bcp_47": "tr", "population": 766359, "score": 0.0 }, { "name": "Bulgarian", "bcp_47": "bg", "population": 6966900, "score": 0.0 } ] }, "BI": { "score": 0.22246807623977216, "languages": [ { "name": "English", "bcp_47": "en", "population": 6289, "score": 0.47 }, { "name": "French", "bcp_47": "fr", "population": 7000822, "score": 0.46 }, { "name": "Swahili", "bcp_47": "sw", "population": 6408, "score": 0.0 }, { "name": "Rundi", "bcp_47": "rn", "population": 7475454, "score": 0.0 } ] }, "BM": { "score": 0.47, "languages": [ { "name": "English", "bcp_47": "en", "population": 66010, "score": 0.47 } ] }, "BN": { "score": 0.05292700193318268, "languages": [ { "name": "English", "bcp_47": "en", "population": 7896, "score": 0.47 }, { "name": "Chinese", "bcp_47": "zh", "population": 51093, "score": 0.46 }, { "name": "Malay", "bcp_47": "ms", "population": 455189, "score": 0.0 } ] }, "BR": { "score": 0.45330626204700775, "languages": [ { "name": "English", "bcp_47": "en", "population": 16937280, "score": 0.47 }, { "name": "Spanish", "bcp_47": "es", "population": 76218, "score": 0.45 }, { "name": "Portuguese", "bcp_47": "pt", "population": 192661560, "score": 0.46 }, { "name": "German", "bcp_47": "de", "population": 1778414, "score": 0.0 }, { "name": "Japanese", "bcp_47": "ja", "population": 444604, "score": 0.0 }, { "name": "Korean", "bcp_47": "ko", "population": 44460, "score": 0.0 }, { "name": "Italian", "bcp_47": "it", "population": 592805, "score": 0.0 }, { "name": "Venetian", "bcp_47": "vec", "population": 508118, "score": 0.0 }, { "name": "Kaingang", "bcp_47": "kgp", "population": 50812, "score": 0.0 }, { "name": "Nheengatu", "bcp_47": "yrl", "population": 21172, "score": 0.0 }, { "name": "Guajajára", "bcp_47": "gub", "population": 17784, "score": 0.0 }, { "name": "Xavánte", "bcp_47": "xav", "population": 9951, "score": 0.0 } ] }, "BS": { "score": 0.47, "languages": [ { "name": "English", "bcp_47": "en", "population": 337721, "score": 0.47 } ] }, "BT": { "score": 0.05505863086648988, "languages": [ { "name": "English", "bcp_47": "en", "population": 86055, "score": 0.47 }, { "name": "Nepali", "bcp_47": "ne", "population": 132994, "score": 0.0 }, { "name": "Dzongkha", "bcp_47": "dz", "population": 367689, "score": 0.0 }, { "name": "Tshangla", "bcp_47": "tsj", "population": 117348, "score": 0.0 }, { "name": "Lepcha", "bcp_47": "lep", "population": 30510, "score": 0.0 } ] }, "BV": { "score": 0.47, "languages": [ { "name": "English", "bcp_47": "en", "population": 1, "score": 0.47 } ] }, "BW": { "score": 0.26574054482622333, "languages": [ { "name": "English", "bcp_47": "en", "population": 1876956, "score": 0.47 }, { "name": "Afrikaans", "bcp_47": "af", "population": 6025, "score": 0.0 }, { "name": "Tswana", "bcp_47": "tn", "population": 1436683, "score": 0.0 } ] }, "BZ": { "score": 0.4656250134412544, "languages": [ { "name": "English", "bcp_47": "en", "population": 399598, "score": 0.47 }, { "name": "Spanish", "bcp_47": "es", "population": 111887, "score": 0.45 } ] }, "CA": { "score": 0.4280483033489603, "languages": [ { "name": "English", "bcp_47": "en", "population": 32416926, "score": 0.47 }, { "name": "Chinese", "bcp_47": "zh", "population": 678494, "score": 0.46 }, { "name": "Hindi", "bcp_47": "hi", "population": 188470, "score": 0.46 }, { "name": "Spanish", "bcp_47": "es", "population": 603106, "score": 0.45 }, { "name": "Arabic", "bcp_47": "ar", "population": 565412, "score": 0.42 }, { "name": "Urdu", "bcp_47": "ur", "population": 286475, "score": 0.42 }, { "name": "French", "bcp_47": "fr", "population": 11308230, "score": 0.46 }, { "name": "Bangla", "bcp_47": "bn", "population": 90466, "score": 0.38 }, { "name": "Portuguese", "bcp_47": "pt", "population": 229934, "score": 0.46 }, { "name": "Punjabi", "bcp_47": "pa", "population": 603106, "score": 0.42 }, { "name": "Russian", "bcp_47": "ru", "population": 211087, "score": 0.0 }, { "name": "German", "bcp_47": "de", "population": 294014, "score": 0.0 }, { "name": "Japanese", "bcp_47": "ja", "population": 52772, "score": 0.0 }, { "name": "Vietnamese", "bcp_47": "vi", "population": 184701, "score": 0.0 }, { "name": "Tamil", "bcp_47": "ta", "population": 184701, "score": 0.0 }, { "name": "Persian", "bcp_47": "fa", "population": 245012, "score": 0.0 }, { "name": "Turkish", "bcp_47": "tr", "population": 37694, "score": 0.0 }, { "name": "Cantonese", "bcp_47": "yue", "population": 640800, "score": 0.0 }, { "name": "Korean", "bcp_47": "ko", "population": 169623, "score": 0.0 }, { "name": "Italian", "bcp_47": "it", "population": 343016, "score": 0.0 }, { "name": "Filipino", "bcp_47": "fil", "population": 565412, "score": 0.0 }, { "name": "Gujarati", "bcp_47": "gu", "population": 135699, "score": 0.0 }, { "name": "Polish", "bcp_47": "pl", "population": 173393, "score": 0.0 }, { "name": "Dutch", "bcp_47": "nl", "population": 56541, "score": 0.0 }, { "name": "Ukrainian", "bcp_47": "uk", "population": 75388, "score": 0.0 }, { "name": "Romanian", "bcp_47": "ro", "population": 101774, "score": 0.0 }, { "name": "Somali", "bcp_47": "so", "population": 49002, "score": 0.0 }, { "name": "Serbian", "bcp_47": "sr", "population": 64080, "score": 0.0 }, { "name": "Hungarian", "bcp_47": "hu", "population": 49002, "score": 0.0 }, { "name": "Greek", "bcp_47": "el", "population": 124391, "score": 0.0 }, { "name": "Croatian", "bcp_47": "hr", "population": 45233, "score": 0.0 }, { "name": "Waray", "bcp_47": "war", "population": 678, "score": 0.0 }, { "name": "Inuktitut", "bcp_47": "iu", "population": 90466, "score": 0.0 }, { "name": "Plautdietsch", "bcp_47": "pdt", "population": 90466, "score": 0.0 }, { "name": "Ojibwa", "bcp_47": "oj", "population": 23747, "score": 0.0 }, { "name": "Dakota", "bcp_47": "dak", "population": 1206, "score": 0.0 }, { "name": "Oji-Cree", "bcp_47": "ojs", "population": 15078, "score": 0.0 }, { "name": "Chipewyan", "bcp_47": "chp", "population": 12816, "score": 0.0 }, { "name": "Innu-aimun", "bcp_47": "moe", "population": 12062, "score": 0.0 }, { "name": "Cree", "bcp_47": "cr", "population": 9047, "score": 0.0 }, { "name": "Mi'kmaw", "bcp_47": "mic", "population": 7916, "score": 0.0 }, { "name": "Atikamekw", "bcp_47": "atj", "population": 6408, "score": 0.0 }, { "name": "Siksiká", "bcp_47": "bla", "population": 4900, "score": 0.0 }, { "name": "Plains Cree", "bcp_47": "crk", "population": 4146, "score": 0.0 }, { "name": "Slave", "bcp_47": "den", "population": 2299, "score": 0.0 }, { "name": "Dogrib", "bcp_47": "dgr", "population": 2111, "score": 0.0 }, { "name": "Swampy Cree", "bcp_47": "csw", "population": 1809, "score": 0.0 }, { "name": "Mohawk", "bcp_47": "moh", "population": 1772, "score": 0.0 }, { "name": "Naskapi", "bcp_47": "nsk", "population": 1395, "score": 0.0 }, { "name": "Chilcotin", "bcp_47": "clc", "population": 867, "score": 0.0 }, { "name": "Halkomelem", "bcp_47": "hur", "population": 716, "score": 0.0 }, { "name": "Michif", "bcp_47": "crg", "population": 678, "score": 0.0 }, { "name": "Lillooet", "bcp_47": "lil", "population": 528, "score": 0.0 }, { "name": "Okanagan", "bcp_47": "oka", "population": 490, "score": 0.0 }, { "name": "Maliseet-Passamaquoddy", "bcp_47": "pqm", "population": 490, "score": 0.0 }, { "name": "Kwakʼwala", "bcp_47": "kwk", "population": 377, "score": 0.0 }, { "name": "Northern East Cree", "bcp_47": "crl", "population": 377, "score": 0.0 }, { "name": "Gwichʼin", "bcp_47": "gwi", "population": 302, "score": 0.0 } ] }, "CC": { "score": 0.07964765100671141, "languages": [ { "name": "English", "bcp_47": "en", "population": 101, "score": 0.47 }, { "name": "Malay", "bcp_47": "ms", "population": 495, "score": 0.0 } ] }, "CH": { "score": 0.17143224232353874, "languages": [ { "name": "English", "bcp_47": "en", "population": 5126434, "score": 0.47 }, { "name": "French", "bcp_47": "fr", "population": 1764838, "score": 0.46 }, { "name": "Portuguese", "bcp_47": "pt", "population": 285736, "score": 0.46 }, { "name": "German", "bcp_47": "de", "population": 6134913, "score": 0.0 }, { "name": "Italian", "bcp_47": "it", "population": 361372, "score": 0.0 }, { "name": "Swiss German", "bcp_47": "gsw", "population": 5462594, "score": 0.0 }, { "name": "Lombard", "bcp_47": "lmo", "population": 344564, "score": 0.0 }, { "name": "Romansh", "bcp_47": "rm", "population": 42020, "score": 0.0 }, { "name": "Sinte Romani", "bcp_47": "rmo", "population": 24372, "score": 0.0 }, { "name": "Walser", "bcp_47": "wae", "population": 10085, "score": 0.0 } ] }, "CK": { "score": 0.47, "languages": [ { "name": "English", "bcp_47": "en", "population": 8574, "score": 0.47 } ] }, "CL": { "score": 0.44555045871559634, "languages": [ { "name": "English", "bcp_47": "en", "population": 1727746, "score": 0.47 }, { "name": "Spanish", "bcp_47": "es", "population": 17823064, "score": 0.45 }, { "name": "Mapuche", "bcp_47": "arn", "population": 272802, "score": 0.0 } ] }, "CM": { "score": 0.3722156934094152, "languages": [ { "name": "English", "bcp_47": "en", "population": 10543100, "score": 0.47 }, { "name": "Arabic", "bcp_47": "ar", "population": 108206, "score": 0.42 }, { "name": "French", "bcp_47": "fr", "population": 18866600, "score": 0.46 }, { "name": "Hausa", "bcp_47": "ha", "population": 38843, "score": 0.0 }, { "name": "Fula", "bcp_47": "ff", "population": 998820, "score": 0.0 }, { "name": "Bulu", "bcp_47": "bum", "population": 1276270, "score": 0.0 }, { "name": "Ewondo", "bcp_47": "ewo", "population": 860095, "score": 0.0 }, { "name": "Yemba", "bcp_47": "ybb", "population": 443920, "score": 0.0 }, { "name": "Ngiemboon", "bcp_47": "nnh", "population": 388430, "score": 0.0 }, { "name": "Ghomala", "bcp_47": "bbj", "population": 388430, "score": 0.0 }, { "name": "Kom", "bcp_47": "bkm", "population": 360685, "score": 0.0 }, { "name": "Bamun", "bcp_47": "bax", "population": 332940, "score": 0.0 }, { "name": "Basaa", "bcp_47": "bas", "population": 332940, "score": 0.0 }, { "name": "Medumba", "bcp_47": "byv", "population": 305195, "score": 0.0 }, { "name": "Mundang", "bcp_47": "mua", "population": 277450, "score": 0.0 }, { "name": "Mafa", "bcp_47": "maf", "population": 205313, "score": 0.0 }, { "name": "Bafut", "bcp_47": "bfd", "population": 158146, "score": 0.0 }, { "name": "Kako", "bcp_47": "kkj", "population": 149823, "score": 0.0 }, { "name": "Akoose", "bcp_47": "bss", "population": 149823, "score": 0.0 }, { "name": "Duala", "bcp_47": "dua", "population": 133176, "score": 0.0 }, { "name": "Metaʼ", "bcp_47": "mgo", "population": 130401, "score": 0.0 }, { "name": "Ngomba", "bcp_47": "jgo", "population": 94333, "score": 0.0 }, { "name": "Bafia", "bcp_47": "ksf", "population": 88784, "score": 0.0 }, { "name": "Kenyang", "bcp_47": "ken", "population": 69362, "score": 0.0 }, { "name": "Aghem", "bcp_47": "agq", "population": 38843, "score": 0.0 }, { "name": "Kwasio", "bcp_47": "nmg", "population": 8878, "score": 0.0 }, { "name": "Yangben", "bcp_47": "yav", "population": 2303, "score": 0.0 } ] }, "CN": { "score": 0.36863417321148484, "languages": [ { "name": "English", "bcp_47": "en", "population": 62731, "score": 0.47 }, { "name": "Chinese", "bcp_47": "zh", "population": 1254618000, "score": 0.46 }, { "name": "Russian", "bcp_47": "ru", "population": 13940, "score": 0.0 }, { "name": "Vietnamese", "bcp_47": "vi", "population": 6970, "score": 0.0 }, { "name": "Wu Chinese", "bcp_47": "wuu", "population": 83641200, "score": 0.0 }, { "name": "Cantonese", "bcp_47": "yue", "population": 72489040, "score": 0.0 }, { "name": "Korean", "bcp_47": "ko", "population": 2091030, "score": 0.0 }, { "name": "Xiang Chinese", "bcp_47": "hsn", "population": 40426580, "score": 0.0 }, { "name": "Uzbek", "bcp_47": "uz", "population": 5576, "score": 0.0 }, { "name": "Hakka Chinese", "bcp_47": "hak", "population": 32062460, "score": 0.0 }, { "name": "Min Nan Chinese", "bcp_47": "nan", "population": 26486380, "score": 0.0 }, { "name": "Gan Chinese", "bcp_47": "gan", "population": 23698340, "score": 0.0 }, { "name": "Kazakh", "bcp_47": "kk", "population": 1184917, "score": 0.0 }, { "name": "Sichuan Yi", "bcp_47": "ii", "population": 8364120, "score": 0.0 }, { "name": "Uyghur", "bcp_47": "ug", "population": 7667110, "score": 0.0 }, { "name": "Mongolian", "bcp_47": "mn", "population": 3624452, "score": 0.0 }, { "name": "Zhuang", "bcp_47": "za", "population": 4321462, "score": 0.0 }, { "name": "Kyrgyz", "bcp_47": "ky", "population": 473967, "score": 0.0 }, { "name": "Tibetan", "bcp_47": "bo", "population": 2788040, "score": 0.0 }, { "name": "Hmong Njua", "bcp_47": "hnj", "population": 55761, "score": 0.0 }, { "name": "Lisu", "bcp_47": "lis", "population": 627309, "score": 0.0 }, { "name": "Naxi", "bcp_47": "nxq", "population": 334565, "score": 0.0 }, { "name": "Lü", "bcp_47": "khb", "population": 264864, "score": 0.0 }, { "name": "Tai Nüa", "bcp_47": "tdd", "population": 264864, "score": 0.0 }, { "name": "Western Lawa", "bcp_47": "lcp", "population": 80853, "score": 0.0 }, { "name": "Literary Chinese", "bcp_47": "lzh", "population": 0, "score": 0.0 } ] }, "CP": { "score": 0.47, "languages": [ { "name": "English", "bcp_47": "en", "population": 1, "score": 0.47 } ] }, "CQ": { "score": 0.47, "languages": [ { "name": "English", "bcp_47": "en", "population": 482, "score": 0.47 } ] }, "CX": { "score": 0.47, "languages": [ { "name": "English", "bcp_47": "en", "population": 1389, "score": 0.47 } ] }, "CY": { "score": 0.18945142670615586, "languages": [ { "name": "English", "bcp_47": "en", "population": 924676, "score": 0.47 }, { "name": "Arabic", "bcp_47": "ar", "population": 1267, "score": 0.42 }, { "name": "French", "bcp_47": "fr", "population": 88668, "score": 0.46 }, { "name": "Turkish", "bcp_47": "tr", "population": 291336, "score": 0.0 }, { "name": "Greek", "bcp_47": "el", "population": 1203346, "score": 0.0 }, { "name": "Armenian", "bcp_47": "hy", "population": 2787, "score": 0.0 } ] }, "CZ": { "score": 0.08109144475315826, "languages": [ { "name": "English", "bcp_47": "en", "population": 2889675, "score": 0.47 }, { "name": "German", "bcp_47": "de", "population": 1605375, "score": 0.0 }, { "name": "Polish", "bcp_47": "pl", "population": 52442, "score": 0.0 }, { "name": "Czech", "bcp_47": "cs", "population": 10488450, "score": 0.0 }, { "name": "Slovak", "bcp_47": "sk", "population": 1712400, "score": 0.0 } ] }, "DE": { "score": 0.16673407486802613, "languages": [ { "name": "English", "bcp_47": "en", "population": 51302208, "score": 0.47 }, { "name": "Spanish", "bcp_47": "es", "population": 4809582, "score": 0.45 }, { "name": "French", "bcp_47": "fr", "population": 14428746, "score": 0.46 }, { "name": "Russian", "bcp_47": "ru", "population": 4809582, "score": 0.0 }, { "name": "German", "bcp_47": "de", "population": 72945327, "score": 0.0 }, { "name": "Turkish", "bcp_47": "tr", "population": 2003992, "score": 0.0 }, { "name": "Italian", "bcp_47": "it", "population": 5611179, "score": 0.0 }, { "name": "Polish", "bcp_47": "pl", "population": 232463, "score": 0.0 }, { "name": "Dutch", "bcp_47": "nl", "population": 7214373, "score": 0.0 }, { "name": "Bavarian", "bcp_47": "bar", "population": 13627149, "score": 0.0 }, { "name": "Greek", "bcp_47": "el", "population": 304607, "score": 0.0 }, { "name": "Low German", "bcp_47": "nds", "population": 9619164, "score": 0.0 }, { "name": "Swiss German", "bcp_47": "gsw", "population": 1843673, "score": 0.0 }, { "name": "Danish", "bcp_47": "da", "population": 1603194, "score": 0.0 }, { "name": "Kurdish", "bcp_47": "ku", "population": 529054, "score": 0.0 }, { "name": "Croatian", "bcp_47": "hr", "population": 633262, "score": 0.0 }, { "name": "Main-Franconian", "bcp_47": "vmf", "population": 4809582, "score": 0.0 }, { "name": "Swabian", "bcp_47": "swg", "population": 801597, "score": 0.0 }, { "name": "Colognian", "bcp_47": "ksh", "population": 240479, "score": 0.0 }, { "name": "Upper Sorbian", "bcp_47": "hsb", "population": 12826, "score": 0.0 }, { "name": "Northern Frisian", "bcp_47": "frr", "population": 9619, "score": 0.0 }, { "name": "Lower Sorbian", "bcp_47": "dsb", "population": 6974, "score": 0.0 }, { "name": "Eastern Frisian", "bcp_47": "frs", "population": 2004, "score": 0.0 }, { "name": "Saterland Frisian", "bcp_47": "stq", "population": 962, "score": 0.0 }, { "name": "Palatine German", "bcp_47": "pfl", "population": 0, "score": 0.0 } ] }, "DG": { "score": 0.47, "languages": [ { "name": "English", "bcp_47": "en", "population": 495, "score": 0.47 } ] }, "DK": { "score": 0.1687682799969866, "languages": [ { "name": "English", "bcp_47": "en", "population": 5047693, "score": 0.47 }, { "name": "German", "bcp_47": "de", "population": 2758623, "score": 0.0 }, { "name": "Swedish", "bcp_47": "sv", "population": 763023, "score": 0.0 }, { "name": "Danish", "bcp_47": "da", "population": 5458551, "score": 0.0 }, { "name": "Faroese", "bcp_47": "fo", "population": 22304, "score": 0.0 }, { "name": "Kalaallisut", "bcp_47": "kl", "population": 7043, "score": 0.0 }, { "name": "Jutish", "bcp_47": "jut", "population": 0, "score": 0.0 } ] }, "DM": { "score": 0.47000000000000003, "languages": [ { "name": "English", "bcp_47": "en", "population": 69788, "score": 0.47 } ] }, "DO": { "score": 0.45001946876617066, "languages": [ { "name": "English", "bcp_47": "en", "population": 7980, "score": 0.47 }, { "name": "Spanish", "bcp_47": "es", "population": 8189766, "score": 0.45 } ] }, "DZ": { "score": 0.2271637127514295, "languages": [ { "name": "English", "bcp_47": "en", "population": 3008103, "score": 0.47 }, { "name": "Arabic", "bcp_47": "ar", "population": 31799946, "score": 0.42 }, { "name": "French", "bcp_47": "fr", "population": 8594580, "score": 0.46 }, { "name": "Algerian Arabic", "bcp_47": "arq", "population": 35667507, "score": 0.0 }, { "name": "Kabyle", "bcp_47": "kab", "population": 3351886, "score": 0.0 } ] }, "EE": { "score": 0.1153657311566433, "languages": [ { "name": "English", "bcp_47": "en", "population": 614310, "score": 0.47 }, { "name": "Russian", "bcp_47": "ru", "population": 688027, "score": 0.0 }, { "name": "Finnish", "bcp_47": "fi", "population": 258010, "score": 0.0 }, { "name": "Estonian", "bcp_47": "et", "population": 872320, "score": 0.0 }, { "name": "Võro", "bcp_47": "vro", "population": 70031, "score": 0.0 }, { "name": "Interlingue", "bcp_47": "ie", "population": 1, "score": 0.0 } ] }, "EG": { "score": 0.28970118200899325, "languages": [ { "name": "English", "bcp_47": "en", "population": 36443400, "score": 0.47 }, { "name": "Arabic", "bcp_47": "ar", "population": 97876560, "score": 0.42 }, { "name": "Egyptian Arabic", "bcp_47": "arz", "population": 66639360, "score": 0.0 }, { "name": "Greek", "bcp_47": "el", "population": 63516, "score": 0.0 } ] }, "ER": { "score": 0.1980585154915333, "languages": [ { "name": "English", "bcp_47": "en", "population": 3587908, "score": 0.47 }, { "name": "Arabic", "bcp_47": "ar", "population": 297979, "score": 0.42 }, { "name": "Tigrinya", "bcp_47": "ti", "population": 3648720, "score": 0.0 }, { "name": "Afar", "bcp_47": "aa", "population": 218923, "score": 0.0 }, { "name": "Tigre", "bcp_47": "tig", "population": 1094616, "score": 0.0 }, { "name": "Saho", "bcp_47": "ssy", "population": 218923, "score": 0.0 }, { "name": "Blin", "bcp_47": "byn", "population": 79056, "score": 0.0 } ] }, "ES": { "score": 0.37009809252734244, "languages": [ { "name": "English", "bcp_47": "en", "population": 12003792, "score": 0.47 }, { "name": "Spanish", "bcp_47": "es", "population": 49515642, "score": 0.45 }, { "name": "Catalan", "bcp_47": "ca", "population": 8502686, "score": 0.0 }, { "name": "Galician", "bcp_47": "gl", "population": 3501106, "score": 0.0 }, { "name": "Occitan", "bcp_47": "oc", "population": 4952, "score": 0.0 }, { "name": "Basque", "bcp_47": "eu", "population": 1000316, "score": 0.0 }, { "name": "Asturian", "bcp_47": "ast", "population": 650205, "score": 0.0 }, { "name": "Extremaduran", "bcp_47": "ext", "population": 245077, "score": 0.0 }, { "name": "Aragonese", "bcp_47": "an", "population": 26008, "score": 0.0 } ] }, "ET": { "score": 0.15951065509076556, "languages": [ { "name": "English", "bcp_47": "en", "population": 46488590, "score": 0.47 }, { "name": "Amharic", "bcp_47": "am", "population": 35677290, "score": 0.0 }, { "name": "Oromo", "bcp_47": "om", "population": 34596160, "score": 0.0 }, { "name": "Somali", "bcp_47": "so", "population": 6486780, "score": 0.0 }, { "name": "Tigrinya", "bcp_47": "ti", "population": 6486780, "score": 0.0 }, { "name": "Sidamo", "bcp_47": "sid", "population": 3783955, "score": 0.0 }, { "name": "Afar", "bcp_47": "aa", "population": 1513582, "score": 0.0 }, { "name": "Wolaytta", "bcp_47": "wal", "population": 1946034, "score": 0.0 }, { "name": "Geez", "bcp_47": "gez", "population": 0, "score": 0.0 } ] }, "FI": { "score": 0.14489049029987158, "languages": [ { "name": "English", "bcp_47": "en", "population": 3900169, "score": 0.47 }, { "name": "Russian", "bcp_47": "ru", "population": 45131, "score": 0.0 }, { "name": "German", "bcp_47": "de", "population": 1002901, "score": 0.0 }, { "name": "Swedish", "bcp_47": "sv", "population": 2451535, "score": 0.0 }, { "name": "Finnish", "bcp_47": "fi", "population": 5237370, "score": 0.0 }, { "name": "Estonian", "bcp_47": "et", "population": 6129, "score": 0.0 }, { "name": "Northern Sami", "bcp_47": "se", "population": 2006, "score": 0.0 }, { "name": "Kalo Finnish Romani", "bcp_47": "rmf", "population": 5015, "score": 0.0 }, { "name": "Skolt Sami", "bcp_47": "sms", "population": 613, "score": 0.0 }, { "name": "Inari Sami", "bcp_47": "smn", "population": 613, "score": 0.0 } ] }, "FJ": { "score": 0.2951391687808469, "languages": [ { "name": "English", "bcp_47": "en", "population": 879816, "score": 0.47 }, { "name": "Hindi", "bcp_47": "hi", "population": 411829, "score": 0.46 }, { "name": "Fiji Hindi", "bcp_47": "hif", "population": 383749, "score": 0.0 }, { "name": "Fijian", "bcp_47": "fj", "population": 365030, "score": 0.0 }, { "name": "Rotuman", "bcp_47": "rtm", "population": 2527, "score": 0.0 } ] }, "FK": { "score": 0.47, "languages": [ { "name": "English", "bcp_47": "en", "population": 2814, "score": 0.47 } ] }, "FM": { "score": 0.2107792806285859, "languages": [ { "name": "English", "bcp_47": "en", "population": 58389, "score": 0.47 }, { "name": "Chuukese", "bcp_47": "chk", "population": 30731, "score": 0.0 }, { "name": "Pohnpeian", "bcp_47": "pon", "population": 23560, "score": 0.0 }, { "name": "Kosraean", "bcp_47": "kos", "population": 7990, "score": 0.0 }, { "name": "Yapese", "bcp_47": "yap", "population": 6556, "score": 0.0 }, { "name": "Ulithian", "bcp_47": "uli", "population": 2971, "score": 0.0 } ] }, "FR": { "score": 0.4241282220594123, "languages": [ { "name": "English", "bcp_47": "en", "population": 26460798, "score": 0.47 }, { "name": "Spanish", "bcp_47": "es", "population": 8820266, "score": 0.45 }, { "name": "French", "bcp_47": "fr", "population": 67169718, "score": 0.46 }, { "name": "Portuguese", "bcp_47": "pt", "population": 882027, "score": 0.46 }, { "name": "German", "bcp_47": "de", "population": 3392410, "score": 0.0 }, { "name": "Italian", "bcp_47": "it", "population": 1153419, "score": 0.0 }, { "name": "Dutch", "bcp_47": "nl", "population": 88203, "score": 0.0 }, { "name": "Catalan", "bcp_47": "ca", "population": 115342, "score": 0.0 }, { "name": "Swiss German", "bcp_47": "gsw", "population": 617419, "score": 0.0 }, { "name": "Occitan", "bcp_47": "oc", "population": 2035446, "score": 0.0 }, { "name": "Basque", "bcp_47": "eu", "population": 88203, "score": 0.0 }, { "name": "Hmong Njua", "bcp_47": "hnj", "population": 128912, "score": 0.0 }, { "name": "Picard", "bcp_47": "pcd", "population": 746330, "score": 0.0 }, { "name": "Breton", "bcp_47": "br", "population": 563140, "score": 0.0 }, { "name": "Corsican", "bcp_47": "co", "population": 162836, "score": 0.0 }, { "name": "Arpitan", "bcp_47": "frp", "population": 63777, "score": 0.0 }, { "name": "Interlingua", "bcp_47": "ia", "population": 136, "score": 0.0 } ] }, "GB": { "score": 0.3951929468077104, "languages": [ { "name": "English", "bcp_47": "en", "population": 64445878, "score": 0.47 }, { "name": "Chinese", "bcp_47": "zh", "population": 197283, "score": 0.46 }, { "name": "Spanish", "bcp_47": "es", "population": 5260888, "score": 0.45 }, { "name": "Arabic", "bcp_47": "ar", "population": 197283, "score": 0.42 }, { "name": "Urdu", "bcp_47": "ur", "population": 2301638, "score": 0.42 }, { "name": "French", "bcp_47": "fr", "population": 15125053, "score": 0.46 }, { "name": "Bangla", "bcp_47": "bn", "population": 263044, "score": 0.38 }, { "name": "Portuguese", "bcp_47": "pt", "population": 131522, "score": 0.46 }, { "name": "Punjabi", "bcp_47": "pa", "population": 2367400, "score": 0.42 }, { "name": "German", "bcp_47": "de", "population": 5918499, "score": 0.0 }, { "name": "Tamil", "bcp_47": "ta", "population": 2104355, "score": 0.0 }, { "name": "Turkish", "bcp_47": "tr", "population": 131522, "score": 0.0 }, { "name": "Italian", "bcp_47": "it", "population": 131522, "score": 0.0 }, { "name": "Gujarati", "bcp_47": "gu", "population": 1907072, "score": 0.0 }, { "name": "Polish", "bcp_47": "pl", "population": 2630444, "score": 0.0 }, { "name": "Somali", "bcp_47": "so", "population": 131522, "score": 0.0 }, { "name": "Lithuanian", "bcp_47": "lt", "population": 131522, "score": 0.0 }, { "name": "Scots", "bcp_47": "sco", "population": 1644028, "score": 0.0 }, { "name": "Irish", "bcp_47": "ga", "population": 98642, "score": 0.0 }, { "name": "Welsh", "bcp_47": "cy", "population": 854894, "score": 0.0 }, { "name": "Scottish Gaelic", "bcp_47": "gd", "population": 72337, "score": 0.0 }, { "name": "Cornish", "bcp_47": "kw", "population": 1973, "score": 0.0 } ] }, "GD": { "score": 0.47, "languages": [ { "name": "English", "bcp_47": "en", "population": 108570, "score": 0.47 } ] }, "GG": { "score": 0.47, "languages": [ { "name": "English", "bcp_47": "en", "population": 67052, "score": 0.47 } ] }, "GH": { "score": 0.11322182754078493, "languages": [ { "name": "English", "bcp_47": "en", "population": 6161442, "score": 0.47 }, { "name": "Hausa", "bcp_47": "ha", "population": 252326, "score": 0.0 }, { "name": "Akan", "bcp_47": "ak", "population": 11442678, "score": 0.0 }, { "name": "Fula", "bcp_47": "ff", "population": 0, "score": 0.0 }, { "name": "Ewe", "bcp_47": "ee", "population": 3227422, "score": 0.0 }, { "name": "Abron", "bcp_47": "abr", "population": 1467010, "score": 0.0 }, { "name": "Frafra", "bcp_47": "gur", "population": 1026907, "score": 0.0 }, { "name": "Adangme", "bcp_47": "ada", "population": 880206, "score": 0.0 }, { "name": "Ga", "bcp_47": "gaa", "population": 821526, "score": 0.0 }, { "name": "Nzima", "bcp_47": "nzi", "population": 293402, "score": 0.0 }, { "name": "Safaliba", "bcp_47": "saf", "population": 4108, "score": 0.0 } ] }, "GI": { "score": 0.46230789234169806, "languages": [ { "name": "English", "bcp_47": "en", "population": 23665, "score": 0.47 }, { "name": "Spanish", "bcp_47": "es", "population": 14790, "score": 0.45 } ] }, "GM": { "score": 0.27246376811594203, "languages": [ { "name": "English", "bcp_47": "en", "population": 869600, "score": 0.47 }, { "name": "Fula", "bcp_47": "ff", "population": 0, "score": 0.0 }, { "name": "Mandingo", "bcp_47": "man", "population": 630460, "score": 0.0 } ] }, "GR": { "score": 0.16451496911429414, "languages": [ { "name": "English", "bcp_47": "en", "population": 5409621, "score": 0.47 }, { "name": "French", "bcp_47": "fr", "population": 954639, "score": 0.46 }, { "name": "German", "bcp_47": "de", "population": 530355, "score": 0.0 }, { "name": "Turkish", "bcp_47": "tr", "population": 127285, "score": 0.0 }, { "name": "Greek", "bcp_47": "el", "population": 10501029, "score": 0.0 }, { "name": "Bulgarian", "bcp_47": "bg", "population": 28639, "score": 0.0 }, { "name": "Albanian", "bcp_47": "sq", "population": 9971, "score": 0.0 }, { "name": "Macedonian", "bcp_47": "mk", "population": 169714, "score": 0.0 }, { "name": "Pontic", "bcp_47": "pnt", "population": 392463, "score": 0.0 }, { "name": "Tsakonian", "bcp_47": "tsd", "population": 202, "score": 0.0 } ] }, "GS": { "score": 0.4699999999999999, "languages": [ { "name": "English", "bcp_47": "en", "population": 20, "score": 0.47 } ] }, "GU": { "score": 0.37849481059730655, "languages": [ { "name": "English", "bcp_47": "en", "population": 153321, "score": 0.47 }, { "name": "Chamorro", "bcp_47": "ch", "population": 37067, "score": 0.0 } ] }, "GY": { "score": 0.47000000000000003, "languages": [ { "name": "English", "bcp_47": "en", "population": 750204, "score": 0.47 } ] }, "HK": { "score": 0.29033194917916566, "languages": [ { "name": "English", "bcp_47": "en", "population": 3697454, "score": 0.47 }, { "name": "Chinese", "bcp_47": "zh", "population": 7249910, "score": 0.46 }, { "name": "Cantonese", "bcp_47": "yue", "population": 6524919, "score": 0.0 } ] }, "HM": { "score": 0.47, "languages": [ { "name": "English", "bcp_47": "en", "population": 1, "score": 0.47 } ] }, "HN": { "score": 0.45011218630076477, "languages": [ { "name": "English", "bcp_47": "en", "population": 40635, "score": 0.47 }, { "name": "Spanish", "bcp_47": "es", "population": 7203565, "score": 0.45 } ] }, "HR": { "score": 0.15322692258543336, "languages": [ { "name": "English", "bcp_47": "en", "population": 2071598, "score": 0.47 }, { "name": "Italian", "bcp_47": "it", "population": 67644, "score": 0.0 }, { "name": "Croatian", "bcp_47": "hr", "population": 4185472, "score": 0.0 }, { "name": "Venetian", "bcp_47": "vec", "population": 29594, "score": 0.0 } ] }, "HU": { "score": 0.07565921456157332, "languages": [ { "name": "English", "bcp_47": "en", "population": 1954366, "score": 0.47 }, { "name": "French", "bcp_47": "fr", "population": 293155, "score": 0.46 }, { "name": "German", "bcp_47": "de", "population": 1758929, "score": 0.0 }, { "name": "Romanian", "bcp_47": "ro", "population": 96741, "score": 0.0 }, { "name": "Hungarian", "bcp_47": "hu", "population": 9771830, "score": 0.0 }, { "name": "Croatian", "bcp_47": "hr", "population": 31270, "score": 0.0 }, { "name": "Slovak", "bcp_47": "sk", "population": 11726, "score": 0.0 }, { "name": "Slovenian", "bcp_47": "sl", "population": 4984, "score": 0.0 } ] }, "IE": { "score": 0.3932846989826846, "languages": [ { "name": "English", "bcp_47": "en", "population": 5073039, "score": 0.47 }, { "name": "French", "bcp_47": "fr", "population": 880017, "score": 0.46 }, { "name": "Irish", "bcp_47": "ga", "population": 1138845, "score": 0.0 } ] }, "IL": { "score": 0.19791078395296563, "languages": [ { "name": "English", "bcp_47": "en", "population": 7374158, "score": 0.47 }, { "name": "Arabic", "bcp_47": "ar", "population": 1735096, "score": 0.42 }, { "name": "Russian", "bcp_47": "ru", "population": 954303, "score": 0.0 }, { "name": "Malayalam", "bcp_47": "ml", "population": 7981, "score": 0.0 }, { "name": "Polish", "bcp_47": "pl", "population": 130132, "score": 0.0 }, { "name": "North Levantine Arabic", "bcp_47": "apc", "population": 1474832, "score": 0.0 }, { "name": "Amharic", "bcp_47": "am", "population": 51185, "score": 0.0 }, { "name": "Romanian", "bcp_47": "ro", "population": 320993, "score": 0.0 }, { "name": "Hungarian", "bcp_47": "hu", "population": 86755, "score": 0.0 }, { "name": "Tigrinya", "bcp_47": "ti", "population": 10411, "score": 0.0 }, { "name": "Hebrew", "bcp_47": "he", "population": 8675480, "score": 0.0 }, { "name": "Yiddish", "bcp_47": "yi", "population": 260264, "score": 0.0 }, { "name": "Ladino", "bcp_47": "lad", "population": 112781, "score": 0.0 } ] }, "IM": { "score": 0.4612389121429656, "languages": [ { "name": "English", "bcp_47": "en", "population": 90499, "score": 0.47 }, { "name": "Manx", "bcp_47": "gv", "population": 1719, "score": 0.0 } ] }, "IN": { "score": 0.26031158182809067, "languages": [ { "name": "English", "bcp_47": "en", "population": 251957100, "score": 0.47 }, { "name": "Hindi", "bcp_47": "hi", "population": 545022990, "score": 0.46 }, { "name": "Urdu", "bcp_47": "ur", "population": 66304500, "score": 0.42 }, { "name": "Bangla", "bcp_47": "bn", "population": 107413290, "score": 0.38 }, { "name": "Punjabi", "bcp_47": "pa", "population": 37130520, "score": 0.42 }, { "name": "Telugu", "bcp_47": "te", "population": 95478480, "score": 0.0 }, { "name": "Western Panjabi", "bcp_47": "lah", "population": 33152, "score": 0.0 }, { "name": "Marathi", "bcp_47": "mr", "population": 92826300, "score": 0.0 }, { "name": "Tamil", "bcp_47": "ta", "population": 78239310, "score": 0.0 }, { "name": "Gujarati", "bcp_47": "gu", "population": 59674050, "score": 0.0 }, { "name": "Kannada", "bcp_47": "kn", "population": 49065330, "score": 0.0 }, { "name": "Malayalam", "bcp_47": "ml", "population": 42434880, "score": 0.0 }, { "name": "Odia", "bcp_47": "or", "population": 42434880, "score": 0.0 }, { "name": "Sindhi", "bcp_47": "sd", "population": 5304360, "score": 0.0 }, { "name": "Bhojpuri", "bcp_47": "bho", "population": 30500070, "score": 0.0 }, { "name": "Awadhi", "bcp_47": "awa", "population": 25195710, "score": 0.0 }, { "name": "Nepali", "bcp_47": "ne", "population": 7426104, "score": 0.0 }, { "name": "Maithili", "bcp_47": "mai", "population": 15913080, "score": 0.0 }, { "name": "Assamese", "bcp_47": "as", "population": 17239170, "score": 0.0 }, { "name": "Rangpuri", "bcp_47": "rkt", "population": 5702187, "score": 0.0 }, { "name": "Magahi", "bcp_47": "mag", "population": 15913080, "score": 0.0 }, { "name": "Haryanvi", "bcp_47": "bgc", "population": 15913080, "score": 0.0 }, { "name": "Marwari", "bcp_47": "mwr", "population": 15913080, "score": 0.0 }, { "name": "Chhattisgarhi", "bcp_47": "hne", "population": 14586990, "score": 0.0 }, { "name": "Deccan", "bcp_47": "dcc", "population": 13128291, "score": 0.0 }, { "name": "Kanauji", "bcp_47": "bjj", "population": 7426104, "score": 0.0 }, { "name": "Santali", "bcp_47": "sat", "population": 7293495, "score": 0.0 }, { "name": "Mewati", "bcp_47": "wtm", "population": 6100014, "score": 0.0 }, { "name": "Kashmiri", "bcp_47": "ks", "population": 5436969, "score": 0.0 }, { "name": "Konkani", "bcp_47": "kok", "population": 4906533, "score": 0.0 }, { "name": "Goan Konkani", "bcp_47": "gom", "population": 4243488, "score": 0.0 }, { "name": "Shekhawati", "bcp_47": "swv", "population": 3713052, "score": 0.0 }, { "name": "Lambadi", "bcp_47": "lmn", "population": 3580443, "score": 0.0 }, { "name": "Garhwali", "bcp_47": "gbm", "population": 3580443, "score": 0.0 }, { "name": "Gondi", "bcp_47": "gon", "population": 3182616, "score": 0.0 }, { "name": "Tibetan", "bcp_47": "bo", "population": 145870, "score": 0.0 }, { "name": "Kumaoni", "bcp_47": "kfy", "population": 2917398, "score": 0.0 }, { "name": "Dogri", "bcp_47": "doi", "population": 2652180, "score": 0.0 }, { "name": "Kurukh", "bcp_47": "kru", "population": 2519571, "score": 0.0 }, { "name": "Sadri", "bcp_47": "sck", "population": 2386962, "score": 0.0 }, { "name": "Waddar", "bcp_47": "wbq", "population": 2386962, "score": 0.0 }, { "name": "Kangri", "bcp_47": "xnr", "population": 2121744, "score": 0.0 }, { "name": "Wagdi", "bcp_47": "wbr", "population": 1989135, "score": 0.0 }, { "name": "Tulu", "bcp_47": "tcy", "population": 1989135, "score": 0.0 }, { "name": "Khandesi", "bcp_47": "khn", "population": 1989135, "score": 0.0 }, { "name": "Bodo", "bcp_47": "brx", "population": 1856526, "score": 0.0 }, { "name": "Nimadi", "bcp_47": "noe", "population": 1723917, "score": 0.0 }, { "name": "Bhili", "bcp_47": "bhb", "population": 1591308, "score": 0.0 }, { "name": "Manipuri", "bcp_47": "mni", "population": 1458699, "score": 0.0 }, { "name": "Rajasthani", "bcp_47": "raj", "population": 1326090, "score": 0.0 }, { "name": "Ho", "bcp_47": "hoc", "population": 1312829, "score": 0.0 }, { "name": "Mewari", "bcp_47": "mtr", "population": 1286307, "score": 0.0 }, { "name": "Mundari", "bcp_47": "unr", "population": 1246525, "score": 0.0 }, { "name": "Bhilali", "bcp_47": "bhi", "population": 1220003, "score": 0.0 }, { "name": "Hadothi", "bcp_47": "hoj", "population": 1087394, "score": 0.0 }, { "name": "Khasi", "bcp_47": "kha", "population": 1060872, "score": 0.0 }, { "name": "Kachhi", "bcp_47": "kfr", "population": 994568, "score": 0.0 }, { "name": "Garo", "bcp_47": "grt", "population": 702828, "score": 0.0 }, { "name": "Chakma", "bcp_47": "ccp", "population": 371305, "score": 0.0 }, { "name": "Bagheli", "bcp_47": "bfy", "population": 490653, "score": 0.0 }, { "name": "Munda", "bcp_47": "unx", "population": 636523, "score": 0.0 }, { "name": "Balti", "bcp_47": "bft", "population": 82218, "score": 0.0 }, { "name": "Sirmauri", "bcp_47": "srx", "population": 464132, "score": 0.0 }, { "name": "Divehi", "bcp_47": "dv", "population": 3978, "score": 0.0 }, { "name": "Saurashtra", "bcp_47": "saz", "population": 384566, "score": 0.0 }, { "name": "Dzongkha", "bcp_47": "dz", "population": 2652, "score": 0.0 }, { "name": "Limbu", "bcp_47": "lif", "population": 34478, "score": 0.0 }, { "name": "Ao Naga", "bcp_47": "njo", "population": 305001, "score": 0.0 }, { "name": "Badaga", "bcp_47": "bfq", "population": 305001, "score": 0.0 }, { "name": "Riang (India)", "bcp_47": "ria", "population": 172392, "score": 0.0 }, { "name": "Bishnupriya", "bcp_47": "bpy", "population": 90174, "score": 0.0 }, { "name": "Lepcha", "bcp_47": "lep", "population": 46413, "score": 0.0 }, { "name": "Bateri", "bcp_47": "btv", "population": 34478, "score": 0.0 }, { "name": "Braj", "bcp_47": "bra", "population": 54370, "score": 0.0 }, { "name": "Kuvi", "bcp_47": "kxv", "population": 38457, "score": 0.0 }, { "name": "Sanskrit", "bcp_47": "sa", "population": 15913, "score": 0.0 }, { "name": "Khamti", "bcp_47": "kht", "population": 9283, "score": 0.0 } ] }, "IO": { "score": 0.47, "languages": [ { "name": "English", "bcp_47": "en", "population": 3500, "score": 0.47 } ] }, "IQ": { "score": 0.35502445223850776, "languages": [ { "name": "English", "bcp_47": "en", "population": 13605445, "score": 0.47 }, { "name": "Arabic", "bcp_47": "ar", "population": 26433436, "score": 0.42 }, { "name": "Persian", "bcp_47": "fa", "population": 338192, "score": 0.0 }, { "name": "Azerbaijani", "bcp_47": "az", "population": 699709, "score": 0.0 }, { "name": "Central Kurdish", "bcp_47": "ckb", "population": 7774540, "score": 0.0 }, { "name": "Northern Luri", "bcp_47": "lrc", "population": 237123, "score": 0.0 }, { "name": "Syriac", "bcp_47": "syr", "population": 194364, "score": 0.0 } ] }, "IT": { "score": 0.12688064203402252, "languages": [ { "name": "English", "bcp_47": "en", "population": 21216918, "score": 0.47 }, { "name": "French", "bcp_47": "fr", "population": 3931370, "score": 0.46 }, { "name": "German", "bcp_47": "de", "population": 998443, "score": 0.0 }, { "name": "Italian", "bcp_47": "it", "population": 59282565, "score": 0.0 }, { "name": "Greek", "bcp_47": "el", "population": 21841, "score": 0.0 }, { "name": "Catalan", "bcp_47": "ca", "population": 21841, "score": 0.0 }, { "name": "Croatian", "bcp_47": "hr", "population": 3495, "score": 0.0 }, { "name": "Lombard", "bcp_47": "lmo", "population": 3556954, "score": 0.0 }, { "name": "Slovenian", "bcp_47": "sl", "population": 106085, "score": 0.0 }, { "name": "Venetian", "bcp_47": "vec", "population": 811235, "score": 0.0 }, { "name": "Sardinian", "bcp_47": "sc", "population": 1060846, "score": 0.0 }, { "name": "Neapolitan", "bcp_47": "nap", "population": 605306, "score": 0.0 }, { "name": "Ligurian", "bcp_47": "lij", "population": 536663, "score": 0.0 }, { "name": "Sicilian", "bcp_47": "scn", "population": 511702, "score": 0.0 }, { "name": "Sassarese Sardinian", "bcp_47": "sdc", "population": 106085, "score": 0.0 }, { "name": "Friulian", "bcp_47": "fur", "population": 37442, "score": 0.0 }, { "name": "Emilian", "bcp_47": "egl", "population": 31201, "score": 0.0 }, { "name": "Piedmontese", "bcp_47": "pms", "population": 6178, "score": 0.0 }, { "name": "Romagnol", "bcp_47": "rgn", "population": 0, "score": 0.0 } ] }, "JE": { "score": 0.47000000000000003, "languages": [ { "name": "English", "bcp_47": "en", "population": 96019, "score": 0.47 } ] }, "JM": { "score": 0.2386528447990708, "languages": [ { "name": "English", "bcp_47": "en", "population": 2752399, "score": 0.47 }, { "name": "Jamaican Creole English", "bcp_47": "jam", "population": 2668142, "score": 0.0 } ] }, "JO": { "score": 0.29928909952606636, "languages": [ { "name": "English", "bcp_47": "en", "population": 4869270, "score": 0.47 }, { "name": "Arabic", "bcp_47": "ar", "population": 10820600, "score": 0.42 }, { "name": "North Levantine Arabic", "bcp_47": "apc", "population": 7141596, "score": 0.0 } ] }, "KE": { "score": 0.057955683710036364, "languages": [ { "name": "English", "bcp_47": "en", "population": 10170301, "score": 0.47 }, { "name": "Arabic", "bcp_47": "ar", "population": 24623, "score": 0.42 }, { "name": "Punjabi", "bcp_47": "pa", "population": 10170, "score": 0.42 }, { "name": "Swahili", "bcp_47": "sw", "population": 35328414, "score": 0.0 }, { "name": "Gujarati", "bcp_47": "gu", "population": 4978, "score": 0.0 }, { "name": "Oromo", "bcp_47": "om", "population": 251581, "score": 0.0 }, { "name": "Somali", "bcp_47": "so", "population": 695863, "score": 0.0 }, { "name": "Kikuyu", "bcp_47": "ki", "population": 9099743, "score": 0.0 }, { "name": "Luyia", "bcp_47": "luy", "population": 5888069, "score": 0.0 }, { "name": "Luo (Kenya and Tanzania)", "bcp_47": "luo", "population": 5245734, "score": 0.0 }, { "name": "Kamba", "bcp_47": "kam", "population": 4068120, "score": 0.0 }, { "name": "Kalenjin", "bcp_47": "kln", "population": 4068120, "score": 0.0 }, { "name": "Gusii", "bcp_47": "guz", "population": 2622867, "score": 0.0 }, { "name": "Meru", "bcp_47": "mer", "population": 2141116, "score": 0.0 }, { "name": "Teso", "bcp_47": "teo", "population": 396106, "score": 0.0 }, { "name": "Masai", "bcp_47": "mas", "population": 856446, "score": 0.0 }, { "name": "Embu", "bcp_47": "ebu", "population": 802918, "score": 0.0 }, { "name": "Taita", "bcp_47": "dav", "population": 438929, "score": 0.0 }, { "name": "Pökoot", "bcp_47": "pko", "population": 369343, "score": 0.0 }, { "name": "Samburu", "bcp_47": "saq", "population": 246228, "score": 0.0 } ] }, "KI": { "score": 0.29374934311302925, "languages": [ { "name": "English", "bcp_47": "en", "population": 111796, "score": 0.47 }, { "name": "Gilbertese", "bcp_47": "gil", "population": 67078, "score": 0.0 } ] }, "KN": { "score": 0.47, "languages": [ { "name": "English", "bcp_47": "en", "population": 52745, "score": 0.47 } ] }, "KY": { "score": 0.47, "languages": [ { "name": "English", "bcp_47": "en", "population": 60705, "score": 0.47 } ] }, "KZ": { "score": 0.0442283557549302, "languages": [ { "name": "English", "bcp_47": "en", "population": 2863785, "score": 0.47 }, { "name": "Russian", "bcp_47": "ru", "population": 13746168, "score": 0.0 }, { "name": "German", "bcp_47": "de", "population": 1221882, "score": 0.0 }, { "name": "Kazakh", "bcp_47": "kk", "population": 12218816, "score": 0.0 }, { "name": "Uyghur", "bcp_47": "ug", "population": 381838, "score": 0.0 } ] }, "LB": { "score": 0.236164974261225, "languages": [ { "name": "English", "bcp_47": "en", "population": 2187844, "score": 0.47 }, { "name": "Arabic", "bcp_47": "ar", "population": 4703865, "score": 0.42 }, { "name": "French", "bcp_47": "fr", "population": 20238, "score": 0.46 }, { "name": "North Levantine Arabic", "bcp_47": "apc", "population": 5469610, "score": 0.0 }, { "name": "Kurdish", "bcp_47": "ku", "population": 92983, "score": 0.0 }, { "name": "Armenian", "bcp_47": "hy", "population": 284420, "score": 0.0 } ] }, "LC": { "score": 0.47000000000000003, "languages": [ { "name": "English", "bcp_47": "en", "population": 149838, "score": 0.47 } ] }, "LK": { "score": 0.05053763440860214, "languages": [ { "name": "English", "bcp_47": "en", "population": 2288920, "score": 0.47 }, { "name": "Tamil", "bcp_47": "ta", "population": 3433380, "score": 0.0 }, { "name": "Sinhala", "bcp_47": "si", "population": 15564656, "score": 0.0 } ] }, "LR": { "score": 0.3897881418272767, "languages": [ { "name": "English", "bcp_47": "en", "population": 4210839, "score": 0.47 }, { "name": "Fula", "bcp_47": "ff", "population": 0, "score": 0.0 }, { "name": "Mende", "bcp_47": "men", "population": 24352, "score": 0.0 }, { "name": "Kpelle", "bcp_47": "kpe", "population": 710262, "score": 0.0 }, { "name": "Vai", "bcp_47": "vai", "population": 131906, "score": 0.0 } ] }, "LS": { "score": 0.08912144167455979, "languages": [ { "name": "English", "bcp_47": "en", "population": 531719, "score": 0.47 }, { "name": "Zulu", "bcp_47": "zu", "population": 275706, "score": 0.0 }, { "name": "Xhosa", "bcp_47": "xh", "population": 19496, "score": 0.0 }, { "name": "Southern Sotho", "bcp_47": "st", "population": 1929943, "score": 0.0 }, { "name": "Swati", "bcp_47": "ss", "population": 47264, "score": 0.0 } ] }, "LT": { "score": 0.08192661853903119, "languages": [ { "name": "English", "bcp_47": "en", "population": 1037955, "score": 0.47 }, { "name": "Russian", "bcp_47": "ru", "population": 2185168, "score": 0.0 }, { "name": "German", "bcp_47": "de", "population": 382404, "score": 0.0 }, { "name": "Lithuanian", "bcp_47": "lt", "population": 2349056, "score": 0.0 }, { "name": "Samogitian", "bcp_47": "sgs", "population": 0, "score": 0.0 } ] }, "LU": { "score": 0.255017252012643, "languages": [ { "name": "English", "bcp_47": "en", "population": 351893, "score": 0.47 }, { "name": "French", "bcp_47": "fr", "population": 546691, "score": 0.46 }, { "name": "Portuguese", "bcp_47": "pt", "population": 100541, "score": 0.46 }, { "name": "German", "bcp_47": "de", "population": 395880, "score": 0.0 }, { "name": "Luxembourgish", "bcp_47": "lb", "population": 421015, "score": 0.0 } ] }, "LV": { "score": 0.14048091124242368, "languages": [ { "name": "English", "bcp_47": "en", "population": 865366, "score": 0.47 }, { "name": "Russian", "bcp_47": "ru", "population": 714867, "score": 0.0 }, { "name": "Latvian", "bcp_47": "lv", "population": 1147550, "score": 0.0 }, { "name": "Latgalian", "bcp_47": "ltg", "population": 167429, "score": 0.0 } ] }, "MA": { "score": 0.1728843489070226, "languages": [ { "name": "English", "bcp_47": "en", "population": 4978638, "score": 0.47 }, { "name": "Spanish", "bcp_47": "es", "population": 23115, "score": 0.45 }, { "name": "Arabic", "bcp_47": "ar", "population": 22048254, "score": 0.42 }, { "name": "French", "bcp_47": "fr", "population": 7112340, "score": 0.46 }, { "name": "Moroccan Arabic", "bcp_47": "ary", "population": 30938679, "score": 0.0 }, { "name": "Standard Moroccan Tamazight", "bcp_47": "zgh", "population": 7823574, "score": 0.0 }, { "name": "Tachelhit", "bcp_47": "shi", "population": 6187736, "score": 0.0 }, { "name": "Riffian", "bcp_47": "rif", "population": 3485046, "score": 0.0 }, { "name": "Central Atlas Tamazight", "bcp_47": "tzm", "population": 3485047, "score": 0.0 } ] }, "MG": { "score": 0.22711864406779658, "languages": [ { "name": "English", "bcp_47": "en", "population": 4852026, "score": 0.47 }, { "name": "French", "bcp_47": "fr", "population": 18599433, "score": 0.46 }, { "name": "Malagasy", "bcp_47": "mg", "population": 24260130, "score": 0.0 } ] }, "MH": { "score": 0.2633143913036755, "languages": [ { "name": "English", "bcp_47": "en", "population": 72463, "score": 0.47 }, { "name": "Marshallese", "bcp_47": "mh", "population": 56879, "score": 0.0 } ] }, "MO": { "score": 0.46020852883372587, "languages": [ { "name": "English", "bcp_47": "en", "population": 14133, "score": 0.47 }, { "name": "Chinese", "bcp_47": "zh", "population": 632892, "score": 0.46 }, { "name": "Portuguese", "bcp_47": "pt", "population": 30723, "score": 0.46 } ] }, "MP": { "score": 0.39643436802596876, "languages": [ { "name": "English", "bcp_47": "en", "population": 49890, "score": 0.47 }, { "name": "Chamorro", "bcp_47": "ch", "population": 9258, "score": 0.0 } ] }, "MS": { "score": 0.47000000000000003, "languages": [ { "name": "English", "bcp_47": "en", "population": 3492, "score": 0.47 } ] }, "MT": { "score": 0.18203906242629914, "languages": [ { "name": "English", "bcp_47": "en", "population": 402395, "score": 0.47 }, { "name": "French", "bcp_47": "fr", "population": 50299, "score": 0.46 }, { "name": "Italian", "bcp_47": "it", "population": 256070, "score": 0.0 }, { "name": "Maltese", "bcp_47": "mt", "population": 457267, "score": 0.0 } ] }, "MU": { "score": 0.18730089040118697, "languages": [ { "name": "English", "bcp_47": "en", "population": 993146, "score": 0.47 }, { "name": "Urdu", "bcp_47": "ur", "population": 71727, "score": 0.42 }, { "name": "French", "bcp_47": "fr", "population": 41381, "score": 0.46 }, { "name": "Tamil", "bcp_47": "ta", "population": 34484, "score": 0.0 }, { "name": "Bhojpuri", "bcp_47": "bho", "population": 372430, "score": 0.0 }, { "name": "Morisyen", "bcp_47": "mfe", "population": 1241433, "score": 0.0 } ] }, "MV": { "score": 0.20375720139116277, "languages": [ { "name": "English", "bcp_47": "en", "population": 293928, "score": 0.47 }, { "name": "Divehi", "bcp_47": "dv", "population": 384066, "score": 0.0 } ] }, "MW": { "score": 0.21818583638561564, "languages": [ { "name": "English", "bcp_47": "en", "population": 13353858, "score": 0.47 }, { "name": "Nyanja", "bcp_47": "ny", "population": 13353858, "score": 0.0 }, { "name": "Zulu", "bcp_47": "zu", "population": 69949, "score": 0.0 }, { "name": "Tumbuka", "bcp_47": "tum", "population": 1780514, "score": 0.0 }, { "name": "Nyasa Tonga", "bcp_47": "tog", "population": 207727, "score": 0.0 } ] }, "MX": { "score": 0.4435481398281213, "languages": [ { "name": "English", "bcp_47": "en", "population": 16724500, "score": 0.47 }, { "name": "Spanish", "bcp_47": "es", "population": 106779500, "score": 0.45 }, { "name": "Venetian", "bcp_47": "vec", "population": 2444, "score": 0.0 }, { "name": "Yucateco", "bcp_47": "yua", "population": 861955, "score": 0.0 }, { "name": "Eastern Huasteca Nahuatl", "bcp_47": "nhe", "population": 501735, "score": 0.0 }, { "name": "Western Huasteca Nahuatl", "bcp_47": "nhw", "population": 501735, "score": 0.0 }, { "name": "Central Mazahua", "bcp_47": "maz", "population": 437410, "score": 0.0 }, { "name": "Central Huasteca Nahuatl", "bcp_47": "nch", "population": 244435, "score": 0.0 }, { "name": "Seri", "bcp_47": "sei", "population": 901, "score": 0.0 } ] }, "MY": { "score": 0.1439334800637596, "languages": [ { "name": "English", "bcp_47": "en", "population": 6856941, "score": 0.47 }, { "name": "Chinese", "bcp_47": "zh", "population": 5550857, "score": 0.46 }, { "name": "Javanese", "bcp_47": "jv", "population": 391825, "score": 0.0 }, { "name": "Tamil", "bcp_47": "ta", "population": 1371388, "score": 0.0 }, { "name": "Malayalam", "bcp_47": "ml", "population": 48978, "score": 0.0 }, { "name": "Malay", "bcp_47": "ms", "population": 24489075, "score": 0.0 }, { "name": "Buginese", "bcp_47": "bug", "population": 25795, "score": 0.0 }, { "name": "Banjar", "bcp_47": "bjn", "population": 4898, "score": 0.0 }, { "name": "Iban", "bcp_47": "iba", "population": 816302, "score": 0.0 }, { "name": "Negeri Sembilan Malay", "bcp_47": "zmi", "population": 391825, "score": 0.0 }, { "name": "Central Dusun", "bcp_47": "dtp", "population": 182852, "score": 0.0 } ] }, "NA": { "score": 0.020619217407487452, "languages": [ { "name": "English", "bcp_47": "en", "population": 184105, "score": 0.47 }, { "name": "German", "bcp_47": "de", "population": 23671, "score": 0.0 }, { "name": "Afrikaans", "bcp_47": "af", "population": 1972552, "score": 0.0 }, { "name": "Tswana", "bcp_47": "tn", "population": 14728, "score": 0.0 }, { "name": "Kuanyama", "bcp_47": "kj", "population": 920524, "score": 0.0 }, { "name": "Ndonga", "bcp_47": "ng", "population": 552315, "score": 0.0 }, { "name": "Nama", "bcp_47": "naq", "population": 289308, "score": 0.0 }, { "name": "Herero", "bcp_47": "hz", "population": 239336, "score": 0.0 } ] }, "NF": { "score": 0.47, "languages": [ { "name": "English", "bcp_47": "en", "population": 1678, "score": 0.47 } ] }, "NG": { "score": 0.19759994365435074, "languages": [ { "name": "English", "bcp_47": "en", "population": 113434840, "score": 0.47 }, { "name": "Arabic", "bcp_47": "ar", "population": 151960, "score": 0.42 }, { "name": "Nigerian Pidgin", "bcp_47": "pcm", "population": 44945880, "score": 0.0 }, { "name": "Hausa", "bcp_47": "ha", "population": 29963920, "score": 0.0 }, { "name": "Yoruba", "bcp_47": "yo", "population": 27823640, "score": 0.0 }, { "name": "Igbo", "bcp_47": "ig", "population": 27823640, "score": 0.0 }, { "name": "Nigerian Fulfulde", "bcp_47": "fuv", "population": 14339876, "score": 0.0 }, { "name": "Fula", "bcp_47": "ff", "population": 0, "score": 0.0 }, { "name": "Tiv", "bcp_47": "tiv", "population": 3424448, "score": 0.0 }, { "name": "Ibibio", "bcp_47": "ibb", "population": 2996392, "score": 0.0 }, { "name": "Efik", "bcp_47": "efi", "population": 2996392, "score": 0.0 }, { "name": "Bini", "bcp_47": "bin", "population": 1519599, "score": 0.0 }, { "name": "Jju", "bcp_47": "kaj", "population": 449459, "score": 0.0 }, { "name": "Tyap", "bcp_47": "kcg", "population": 199046, "score": 0.0 }, { "name": "Atsam", "bcp_47": "cch", "population": 44946, "score": 0.0 }, { "name": "Amo", "bcp_47": "amo", "population": 18620, "score": 0.0 }, { "name": "Obolo", "bcp_47": "ann", "population": 0, "score": 0.0 } ] }, "NL": { "score": 0.17387499999999997, "languages": [ { "name": "English", "bcp_47": "en", "population": 15552360, "score": 0.47 }, { "name": "French", "bcp_47": "fr", "population": 5011316, "score": 0.46 }, { "name": "Indonesian", "bcp_47": "id", "population": 311047, "score": 0.0 }, { "name": "German", "bcp_47": "de", "population": 12269084, "score": 0.0 }, { "name": "Turkish", "bcp_47": "tr", "population": 207365, "score": 0.0 }, { "name": "Dutch", "bcp_47": "nl", "population": 17280400, "score": 0.0 }, { "name": "Low German", "bcp_47": "nds", "population": 1900844, "score": 0.0 }, { "name": "Riffian", "bcp_47": "rif", "population": 207365, "score": 0.0 }, { "name": "Limburgish", "bcp_47": "li", "population": 950422, "score": 0.0 }, { "name": "Western Frisian", "bcp_47": "fy", "population": 743057, "score": 0.0 }, { "name": "Gronings", "bcp_47": "gos", "population": 622094, "score": 0.0 }, { "name": "Zeelandic", "bcp_47": "zea", "population": 241926, "score": 0.0 } ] }, "NP": { "score": 0.018334010922876218, "languages": [ { "name": "English", "bcp_47": "en", "population": 909837, "score": 0.47 }, { "name": "Hindi", "bcp_47": "hi", "population": 127377, "score": 0.46 }, { "name": "Bangla", "bcp_47": "bn", "population": 28508, "score": 0.38 }, { "name": "Bhojpuri", "bcp_47": "bho", "population": 2062297, "score": 0.0 }, { "name": "Awadhi", "bcp_47": "awa", "population": 667214, "score": 0.0 }, { "name": "Nepali", "bcp_47": "ne", "population": 13344276, "score": 0.0 }, { "name": "Maithili", "bcp_47": "mai", "population": 3336069, "score": 0.0 }, { "name": "Tibetan", "bcp_47": "bo", "population": 72787, "score": 0.0 }, { "name": "Mundari", "bcp_47": "unr", "population": 5762, "score": 0.0 }, { "name": "Newari", "bcp_47": "new", "population": 1000821, "score": 0.0 }, { "name": "Jumli", "bcp_47": "jml", "population": 970493, "score": 0.0 }, { "name": "Dotyali", "bcp_47": "dty", "population": 758198, "score": 0.0 }, { "name": "Bagheli", "bcp_47": "bfy", "population": 163771, "score": 0.0 }, { "name": "Dangaura Tharu", "bcp_47": "thl", "population": 606558, "score": 0.0 }, { "name": "Bantawa", "bcp_47": "bap", "population": 454918, "score": 0.0 }, { "name": "Western Tamang", "bcp_47": "tdg", "population": 394263, "score": 0.0 }, { "name": "Limbu", "bcp_47": "lif", "population": 333607, "score": 0.0 }, { "name": "Rana Tharu", "bcp_47": "thr", "population": 363935, "score": 0.0 }, { "name": "Eastern Magar", "bcp_47": "mgp", "population": 333607, "score": 0.0 }, { "name": "Kochila Tharu", "bcp_47": "thq", "population": 303279, "score": 0.0 }, { "name": "Western Magar", "bcp_47": "mrd", "population": 251722, "score": 0.0 }, { "name": "Sherpa", "bcp_47": "xsr", "population": 157705, "score": 0.0 }, { "name": "Rajbanshi", "bcp_47": "rjs", "population": 133443, "score": 0.0 }, { "name": "Eastern Tamang", "bcp_47": "taj", "population": 130410, "score": 0.0 }, { "name": "Gurung", "bcp_47": "gvr", "population": 87951, "score": 0.0 }, { "name": "Lepcha", "bcp_47": "lep", "population": 2820, "score": 0.0 }, { "name": "Kathoriya Tharu", "bcp_47": "tkt", "population": 72787, "score": 0.0 }, { "name": "Thulung", "bcp_47": "tdh", "population": 36393, "score": 0.0 } ] }, "NR": { "score": 0.2699324324324324, "languages": [ { "name": "English", "bcp_47": "en", "population": 9350, "score": 0.47 }, { "name": "Nauru", "bcp_47": "na", "population": 6930, "score": 0.0 } ] }, "NU": { "score": 0.235, "languages": [ { "name": "English", "bcp_47": "en", "population": 1120, "score": 0.47 }, { "name": "Niuean", "bcp_47": "niu", "population": 1120, "score": 0.0 } ] }, "NZ": { "score": 0.45694448388813996, "languages": [ { "name": "English", "bcp_47": "en", "population": 4826970, "score": 0.47 }, { "name": "Māori", "bcp_47": "mi", "population": 137913, "score": 0.0 } ] }, "PA": { "score": 0.4533854469232938, "languages": [ { "name": "English", "bcp_47": "en", "population": 545171, "score": 0.47 }, { "name": "Chinese", "bcp_47": "zh", "population": 5841, "score": 0.46 }, { "name": "Spanish", "bcp_47": "es", "population": 2686915, "score": 0.45 } ] }, "PG": { "score": 0.19090169012205813, "languages": [ { "name": "English", "bcp_47": "en", "population": 3629730, "score": 0.47 }, { "name": "Tok Pisin", "bcp_47": "tpi", "population": 5154217, "score": 0.0 }, { "name": "Hiri Motu", "bcp_47": "ho", "population": 152449, "score": 0.0 } ] }, "PH": { "score": 0.2080044997553085, "languages": [ { "name": "English", "bcp_47": "en", "population": 69875840, "score": 0.47 }, { "name": "Chinese", "bcp_47": "zh", "population": 797021, "score": 0.46 }, { "name": "Spanish", "bcp_47": "es", "population": 33846110, "score": 0.45 }, { "name": "Filipino", "bcp_47": "fil", "population": 65508600, "score": 0.0 }, { "name": "Cebuano", "bcp_47": "ceb", "population": 26203440, "score": 0.0 }, { "name": "Iloko", "bcp_47": "ilo", "population": 10481376, "score": 0.0 }, { "name": "Hiligaynon", "bcp_47": "hil", "population": 9171204, "score": 0.0 }, { "name": "Bikol", "bcp_47": "bik", "population": 3275430, "score": 0.0 }, { "name": "Waray", "bcp_47": "war", "population": 3166249, "score": 0.0 }, { "name": "Pampanga", "bcp_47": "pam", "population": 2511163, "score": 0.0 }, { "name": "West Albay Bikol", "bcp_47": "fbl", "population": 2511163, "score": 0.0 }, { "name": "Pangasinan", "bcp_47": "pag", "population": 1528534, "score": 0.0 }, { "name": "Maguindanaon", "bcp_47": "mdh", "population": 1310172, "score": 0.0 }, { "name": "Tausug", "bcp_47": "tsg", "population": 1200991, "score": 0.0 }, { "name": "Capiznon", "bcp_47": "cps", "population": 720595, "score": 0.0 }, { "name": "Kinaray-a", "bcp_47": "krj", "population": 425806, "score": 0.0 }, { "name": "Rinconada Bikol", "bcp_47": "bto", "population": 305707, "score": 0.0 }, { "name": "Hanunoo", "bcp_47": "hnn", "population": 17469, "score": 0.0 }, { "name": "Tagbanwa", "bcp_47": "tbw", "population": 10045, "score": 0.0 }, { "name": "Buhid", "bcp_47": "bku", "population": 7970, "score": 0.0 } ] }, "PK": { "score": 0.30251563862393366, "languages": [ { "name": "English", "bcp_47": "en", "population": 116750500, "score": 0.47 }, { "name": "Urdu", "bcp_47": "ur", "population": 221825950, "score": 0.42 }, { "name": "Punjabi", "bcp_47": "pa", "population": 163450700, "score": 0.42 }, { "name": "Western Panjabi", "bcp_47": "lah", "population": 93400400, "score": 0.0 }, { "name": "Persian", "bcp_47": "fa", "population": 1541107, "score": 0.0 }, { "name": "Pashto", "bcp_47": "ps", "population": 37360160, "score": 0.0 }, { "name": "Sindhi", "bcp_47": "sd", "population": 35025150, "score": 0.0 }, { "name": "Saraiki", "bcp_47": "skr", "population": 28020120, "score": 0.0 }, { "name": "Tajik", "bcp_47": "tg", "population": 770553, "score": 0.0 }, { "name": "Baluchi", "bcp_47": "bal", "population": 6071026, "score": 0.0 }, { "name": "Kashmiri", "bcp_47": "ks", "population": 161116, "score": 0.0 }, { "name": "Northern Hindko", "bcp_47": "hno", "population": 3969517, "score": 0.0 }, { "name": "Brahui", "bcp_47": "brh", "population": 3035513, "score": 0.0 }, { "name": "Western Balochi", "bcp_47": "bgn", "population": 1330956, "score": 0.0 }, { "name": "Southern Hindko", "bcp_47": "hnd", "population": 957354, "score": 0.0 }, { "name": "Balti", "bcp_47": "bft", "population": 420302, "score": 0.0 }, { "name": "Gujari", "bcp_47": "gju", "population": 467002, "score": 0.0 }, { "name": "Parkari Koli", "bcp_47": "kvx", "population": 373602, "score": 0.0 }, { "name": "Khowar", "bcp_47": "khw", "population": 350252, "score": 0.0 }, { "name": "Indus Kohistani", "bcp_47": "mvy", "population": 326901, "score": 0.0 }, { "name": "Wadiyara Koli", "bcp_47": "kxp", "population": 256851, "score": 0.0 }, { "name": "Kachi Koli", "bcp_47": "gjk", "population": 256851, "score": 0.0 }, { "name": "Torwali", "bcp_47": "trw", "population": 123756, "score": 0.0 }, { "name": "Bateri", "bcp_47": "btv", "population": 44365, "score": 0.0 } ] }, "PL": { "score": 0.09207365219510223, "languages": [ { "name": "English", "bcp_47": "en", "population": 12633159, "score": 0.47 }, { "name": "Russian", "bcp_47": "ru", "population": 6890814, "score": 0.0 }, { "name": "German", "bcp_47": "de", "population": 7273637, "score": 0.0 }, { "name": "Polish", "bcp_47": "pl", "population": 36751008, "score": 0.0 }, { "name": "Ukrainian", "bcp_47": "uk", "population": 149301, "score": 0.0 }, { "name": "Belarusian", "bcp_47": "be", "population": 222037, "score": 0.0 }, { "name": "Lithuanian", "bcp_47": "lt", "population": 8039, "score": 0.0 }, { "name": "Silesian", "bcp_47": "szl", "population": 497670, "score": 0.0 }, { "name": "Kashubian", "bcp_47": "csb", "population": 49767, "score": 0.0 }, { "name": "Lower Silesian", "bcp_47": "sli", "population": 11868, "score": 0.0 }, { "name": "Prussian", "bcp_47": "prg", "population": 38, "score": 0.0 } ] }, "PM": { "score": 0.46035150375939854, "languages": [ { "name": "English", "bcp_47": "en", "population": 187, "score": 0.47 }, { "name": "French", "bcp_47": "fr", "population": 5133, "score": 0.46 } ] }, "PN": { "score": 0.4699999999999999, "languages": [ { "name": "English", "bcp_47": "en", "population": 46, "score": 0.47 } ] }, "PR": { "score": 0.4572058813018271, "languages": [ { "name": "English", "bcp_47": "en", "population": 1562644, "score": 0.47 }, { "name": "Spanish", "bcp_47": "es", "population": 2774491, "score": 0.45 } ] }, "PT": { "score": 0.4607128325652157, "languages": [ { "name": "English", "bcp_47": "en", "population": 2781729, "score": 0.47 }, { "name": "Spanish", "bcp_47": "es", "population": 1030270, "score": 0.45 }, { "name": "French", "bcp_47": "fr", "population": 1545405, "score": 0.46 }, { "name": "Portuguese", "bcp_47": "pt", "population": 9890592, "score": 0.46 }, { "name": "Galician", "bcp_47": "gl", "population": 14424, "score": 0.0 } ] }, "PW": { "score": 0.04945299431247909, "languages": [ { "name": "English", "bcp_47": "en", "population": 1887, "score": 0.47 }, { "name": "Palauan", "bcp_47": "pau", "population": 16047, "score": 0.0 } ] }, "RO": { "score": 0.17334519793826225, "languages": [ { "name": "English", "bcp_47": "en", "population": 6603899, "score": 0.47 }, { "name": "Spanish", "bcp_47": "es", "population": 2130290, "score": 0.45 }, { "name": "French", "bcp_47": "fr", "population": 3621493, "score": 0.46 }, { "name": "German", "bcp_47": "de", "population": 44736, "score": 0.0 }, { "name": "Turkish", "bcp_47": "tr", "population": 27694, "score": 0.0 }, { "name": "Polish", "bcp_47": "pl", "population": 2769, "score": 0.0 }, { "name": "Romanian", "bcp_47": "ro", "population": 19172610, "score": 0.0 }, { "name": "Serbian", "bcp_47": "sr", "population": 25563, "score": 0.0 }, { "name": "Hungarian", "bcp_47": "hu", "population": 1405991, "score": 0.0 }, { "name": "Greek", "bcp_47": "el", "population": 4048, "score": 0.0 }, { "name": "Bulgarian", "bcp_47": "bg", "population": 6817, "score": 0.0 } ] }, "RW": { "score": 0.07670541959715828, "languages": [ { "name": "English", "bcp_47": "en", "population": 1906860, "score": 0.47 }, { "name": "French", "bcp_47": "fr", "population": 2288, "score": 0.46 }, { "name": "Kinyarwanda", "bcp_47": "rw", "population": 9788548, "score": 0.0 } ] }, "SB": { "score": 0.25627042630612157, "languages": [ { "name": "English", "bcp_47": "en", "population": 685097, "score": 0.47 }, { "name": "Pijin", "bcp_47": "pis", "population": 561780, "score": 0.0 }, { "name": "Roviana", "bcp_47": "rug", "population": 9591, "score": 0.0 } ] }, "SC": { "score": 0.23194000733562617, "languages": [ { "name": "English", "bcp_47": "en", "population": 36473, "score": 0.47 }, { "name": "French", "bcp_47": "fr", "population": 57589, "score": 0.46 }, { "name": "Seselwa Creole French", "bcp_47": "crs", "population": 94061, "score": 0.0 } ] }, "SD": { "score": 0.40445504435404195, "languages": [ { "name": "English", "bcp_47": "en", "population": 27792576, "score": 0.47 }, { "name": "Arabic", "bcp_47": "ar", "population": 27792576, "score": 0.42 }, { "name": "Hausa", "bcp_47": "ha", "population": 820109, "score": 0.0 }, { "name": "Beja", "bcp_47": "bej", "population": 2460326, "score": 0.0 }, { "name": "Fur", "bcp_47": "fvr", "population": 1230163, "score": 0.0 }, { "name": "Masalit", "bcp_47": "mls", "population": 451060, "score": 0.0 }, { "name": "Nobiin", "bcp_47": "fia", "population": 378161, "score": 0.0 }, { "name": "Zaghawa", "bcp_47": "zag", "population": 232364, "score": 0.0 } ] }, "SE": { "score": 0.21941169569516628, "languages": [ { "name": "English", "bcp_47": "en", "population": 8774150, "score": 0.47 }, { "name": "Swedish", "bcp_47": "sv", "population": 9692375, "score": 0.0 }, { "name": "Finnish", "bcp_47": "fi", "population": 224455, "score": 0.0 }, { "name": "Yiddish", "bcp_47": "yi", "population": 2959, "score": 0.0 }, { "name": "Tornedalen Finnish", "bcp_47": "fit", "population": 56114, "score": 0.0 }, { "name": "Northern Sami", "bcp_47": "se", "population": 33668, "score": 0.0 }, { "name": "Tavringer Romani", "bcp_47": "rmu", "population": 9488, "score": 0.0 }, { "name": "Lule Sami", "bcp_47": "smj", "population": 1530, "score": 0.0 }, { "name": "Southern Sami", "bcp_47": "sma", "population": 296, "score": 0.0 }, { "name": "Interlingua", "bcp_47": "ia", "population": 0, "score": 0.0 } ] }, "SG": { "score": 0.42483238543445395, "languages": [ { "name": "English", "bcp_47": "en", "population": 5774984, "score": 0.47 }, { "name": "Chinese", "bcp_47": "zh", "population": 4781438, "score": 0.46 }, { "name": "Punjabi", "bcp_47": "pa", "population": 9314, "score": 0.42 }, { "name": "Tamil", "bcp_47": "ta", "population": 130403, "score": 0.0 }, { "name": "Malayalam", "bcp_47": "ml", "population": 9935, "score": 0.0 }, { "name": "Malay", "bcp_47": "ms", "population": 869352, "score": 0.0 } ] }, "SH": { "score": 0.47, "languages": [ { "name": "English", "bcp_47": "en", "population": 5425, "score": 0.47 } ] }, "SI": { "score": 0.11046483765124727, "languages": [ { "name": "English", "bcp_47": "en", "population": 1240581, "score": 0.47 }, { "name": "German", "bcp_47": "de", "population": 883126, "score": 0.0 }, { "name": "Italian", "bcp_47": "it", "population": 3995, "score": 0.0 }, { "name": "Hungarian", "bcp_47": "hu", "population": 9252, "score": 0.0 }, { "name": "Croatian", "bcp_47": "hr", "population": 1282635, "score": 0.0 }, { "name": "Slovenian", "bcp_47": "sl", "population": 1829332, "score": 0.0 }, { "name": "Venetian", "bcp_47": "vec", "population": 29438, "score": 0.0 } ] }, "SK": { "score": 0.06145953818542007, "languages": [ { "name": "English", "bcp_47": "en", "population": 1414556, "score": 0.47 }, { "name": "German", "bcp_47": "de", "population": 1196932, "score": 0.0 }, { "name": "Polish", "bcp_47": "pl", "population": 50598, "score": 0.0 }, { "name": "Ukrainian", "bcp_47": "uk", "population": 103371, "score": 0.0 }, { "name": "Czech", "bcp_47": "cs", "population": 2557082, "score": 0.0 }, { "name": "Hungarian", "bcp_47": "hu", "population": 598466, "score": 0.0 }, { "name": "Slovak", "bcp_47": "sk", "population": 4896540, "score": 0.0 } ] }, "SL": { "score": 0.08989072161019854, "languages": [ { "name": "English", "bcp_47": "en", "population": 2318726, "score": 0.47 }, { "name": "Fula", "bcp_47": "ff", "population": 0, "score": 0.0 }, { "name": "Krio", "bcp_47": "kri", "population": 6293684, "score": 0.0 }, { "name": "Mende", "bcp_47": "men", "population": 1788731, "score": 0.0 }, { "name": "Timne", "bcp_47": "tem", "population": 1722482, "score": 0.0 } ] }, "SS": { "score": 0.4031879322739386, "languages": [ { "name": "English", "bcp_47": "en", "population": 2851524, "score": 0.47 }, { "name": "Arabic", "bcp_47": "ar", "population": 2851524, "score": 0.42 }, { "name": "Nuer", "bcp_47": "nus", "population": 591427, "score": 0.0 } ] }, "SX": { "score": 0.41148919399949146, "languages": [ { "name": "English", "bcp_47": "en", "population": 29816, "score": 0.47 }, { "name": "Spanish", "bcp_47": "es", "population": 4823, "score": 0.45 }, { "name": "Dutch", "bcp_47": "nl", "population": 1578, "score": 0.0 }, { "name": "Virgin Islands Creole English", "bcp_47": "vic", "population": 3113, "score": 0.0 } ] }, "SZ": { "score": 0.2566553218261588, "languages": [ { "name": "English", "bcp_47": "en", "population": 883584, "score": 0.47 }, { "name": "Zulu", "bcp_47": "zu", "population": 75105, "score": 0.0 }, { "name": "Tsonga", "bcp_47": "ts", "population": 18776, "score": 0.0 }, { "name": "Swati", "bcp_47": "ss", "population": 640598, "score": 0.0 } ] }, "TA": { "score": 0.47, "languages": [ { "name": "English", "bcp_47": "en", "population": 272, "score": 0.47 } ] }, "TC": { "score": 0.47, "languages": [ { "name": "English", "bcp_47": "en", "population": 54807, "score": 0.47 } ] }, "TH": { "score": 0.0855764589364112, "languages": [ { "name": "English", "bcp_47": "en", "population": 18623898, "score": 0.47 }, { "name": "Chinese", "bcp_47": "zh", "population": 1241593, "score": 0.46 }, { "name": "Thai", "bcp_47": "th", "population": 55181920, "score": 0.0 }, { "name": "Northeastern Thai", "bcp_47": "tts", "population": 16554576, "score": 0.0 }, { "name": "Northern Thai", "bcp_47": "nod", "population": 6621830, "score": 0.0 }, { "name": "Southern Thai", "bcp_47": "sou", "population": 5518192, "score": 0.0 }, { "name": "Shan", "bcp_47": "shn", "population": 66218, "score": 0.0 }, { "name": "Pattani Malay", "bcp_47": "mfa", "population": 3448870, "score": 0.0 }, { "name": "Northern Khmer", "bcp_47": "kxm", "population": 1172616, "score": 0.0 }, { "name": "Mon", "bcp_47": "mnw", "population": 117262, "score": 0.0 }, { "name": "Hmong Njua", "bcp_47": "hnj", "population": 67598, "score": 0.0 }, { "name": "Kuy", "bcp_47": "kdt", "population": 331092, "score": 0.0 }, { "name": "Western Lawa", "bcp_47": "lcp", "population": 6898, "score": 0.0 }, { "name": "Eastern Lawa", "bcp_47": "lwl", "population": 6898, "score": 0.0 } ] }, "TK": { "score": 0.235, "languages": [ { "name": "English", "bcp_47": "en", "population": 1285, "score": 0.47 }, { "name": "Tokelau", "bcp_47": "tkl", "population": 1285, "score": 0.0 } ] }, "TO": { "score": 0.10699318758285631, "languages": [ { "name": "English", "bcp_47": "en", "population": 29707, "score": 0.47 }, { "name": "Tongan", "bcp_47": "to", "population": 100790, "score": 0.0 } ] }, "TR": { "score": 0.06502802610982708, "languages": [ { "name": "English", "bcp_47": "en", "population": 13942975, "score": 0.47 }, { "name": "Arabic", "bcp_47": "ar", "population": 459298, "score": 0.42 }, { "name": "Turkish", "bcp_47": "tr", "population": 76276275, "score": 0.0 }, { "name": "North Levantine Arabic", "bcp_47": "apc", "population": 4264910, "score": 0.0 }, { "name": "Uzbek", "bcp_47": "uz", "population": 1968, "score": 0.0 }, { "name": "Azerbaijani", "bcp_47": "az", "population": 1140044, "score": 0.0 }, { "name": "Serbian", "bcp_47": "sr", "population": 22965, "score": 0.0 }, { "name": "Kazakh", "bcp_47": "kk", "population": 574, "score": 0.0 }, { "name": "Greek", "bcp_47": "el", "population": 4019, "score": 0.0 }, { "name": "Bulgarian", "bcp_47": "bg", "population": 344474, "score": 0.0 }, { "name": "Kurdish", "bcp_47": "ku", "population": 4510962, "score": 0.0 }, { "name": "Albanian", "bcp_47": "sq", "population": 17224, "score": 0.0 }, { "name": "Armenian", "bcp_47": "hy", "population": 45930, "score": 0.0 }, { "name": "Georgian", "bcp_47": "ka", "population": 45930, "score": 0.0 }, { "name": "Kyrgyz", "bcp_47": "ky", "population": 1148, "score": 0.0 }, { "name": "Zaza", "bcp_47": "zza", "population": 1148245, "score": 0.0 }, { "name": "Kabardian", "bcp_47": "kbd", "population": 631535, "score": 0.0 }, { "name": "Adyghe", "bcp_47": "ady", "population": 319868, "score": 0.0 }, { "name": "Balkan Gagauz Turkish", "bcp_47": "bgx", "population": 377280, "score": 0.0 }, { "name": "Kirmanjki", "bcp_47": "kiu", "population": 155833, "score": 0.0 }, { "name": "Abkhazian", "bcp_47": "ab", "population": 4019, "score": 0.0 }, { "name": "Laz", "bcp_47": "lzz", "population": 22965, "score": 0.0 }, { "name": "Turoyo", "bcp_47": "tru", "population": 3035, "score": 0.0 } ] }, "TT": { "score": 0.4699230225360422, "languages": [ { "name": "English", "bcp_47": "en", "population": 1063735, "score": 0.47 }, { "name": "Spanish", "bcp_47": "es", "population": 4110, "score": 0.45 } ] }, "TV": { "score": 0.04582220596305103, "languages": [ { "name": "English", "bcp_47": "en", "population": 1066, "score": 0.47 }, { "name": "Tuvalu", "bcp_47": "tvl", "population": 9868, "score": 0.0 } ] }, "TZ": { "score": 0.17576282848459832, "languages": [ { "name": "English", "bcp_47": "en", "population": 40401432, "score": 0.47 }, { "name": "Swahili", "bcp_47": "sw", "population": 52697520, "score": 0.0 }, { "name": "Sukuma", "bcp_47": "suk", "population": 5094094, "score": 0.0 }, { "name": "Nyamwezi", "bcp_47": "nym", "population": 1932242, "score": 0.0 }, { "name": "Masai", "bcp_47": "mas", "population": 878292, "score": 0.0 }, { "name": "Makonde", "bcp_47": "kde", "population": 1463820, "score": 0.0 }, { "name": "Bena", "bcp_47": "bez", "population": 995398, "score": 0.0 }, { "name": "Shambala", "bcp_47": "ksb", "population": 995398, "score": 0.0 }, { "name": "Mbunga", "bcp_47": "mgy", "population": 819739, "score": 0.0 }, { "name": "Asu", "bcp_47": "asa", "population": 702634, "score": 0.0 }, { "name": "Langi", "bcp_47": "lag", "population": 509409, "score": 0.0 }, { "name": "Vunjo", "bcp_47": "vun", "population": 433291, "score": 0.0 }, { "name": "Rombo", "bcp_47": "rof", "population": 433291, "score": 0.0 }, { "name": "Machame", "bcp_47": "jmc", "population": 433291, "score": 0.0 }, { "name": "Rwa", "bcp_47": "rwk", "population": 128816, "score": 0.0 }, { "name": "Sangu", "bcp_47": "sbp", "population": 117106, "score": 0.0 } ] }, "UG": { "score": 0.014428243049412084, "languages": [ { "name": "English", "bcp_47": "en", "population": 1686867, "score": 0.47 }, { "name": "Hindi", "bcp_47": "hi", "population": 2206, "score": 0.46 }, { "name": "Swahili", "bcp_47": "sw", "population": 32439750, "score": 0.0 }, { "name": "Kinyarwanda", "bcp_47": "rw", "population": 908313, "score": 0.0 }, { "name": "Ganda", "bcp_47": "lg", "population": 5622890, "score": 0.0 }, { "name": "Nyankole", "bcp_47": "nyn", "population": 2724939, "score": 0.0 }, { "name": "Chiga", "bcp_47": "cgg", "population": 2335662, "score": 0.0 }, { "name": "Soga", "bcp_47": "xog", "population": 2292409, "score": 0.0 }, { "name": "Teso", "bcp_47": "teo", "population": 1686867, "score": 0.0 }, { "name": "Lango (Uganda)", "bcp_47": "laj", "population": 1643614, "score": 0.0 }, { "name": "Acoli", "bcp_47": "ach", "population": 1600361, "score": 0.0 }, { "name": "Masaaba", "bcp_47": "myx", "population": 1254337, "score": 0.0 }, { "name": "Tooro", "bcp_47": "ttj", "population": 821807, "score": 0.0 } ] }, "UM": { "score": 0.4699999999999999, "languages": [ { "name": "English", "bcp_47": "en", "population": 316, "score": 0.47 } ] }, "US": { "score": 0.45809839699094473, "languages": [ { "name": "English", "bcp_47": "en", "population": 319333440, "score": 0.47 }, { "name": "Chinese", "bcp_47": "zh", "population": 2295209, "score": 0.46 }, { "name": "Spanish", "bcp_47": "es", "population": 31933344, "score": 0.45 }, { "name": "French", "bcp_47": "fr", "population": 1862778, "score": 0.46 }, { "name": "Russian", "bcp_47": "ru", "population": 798334, "score": 0.0 }, { "name": "German", "bcp_47": "de", "population": 1563403, "score": 0.0 }, { "name": "Vietnamese", "bcp_47": "vi", "population": 1130973, "score": 0.0 }, { "name": "Korean", "bcp_47": "ko", "population": 997917, "score": 0.0 }, { "name": "Italian", "bcp_47": "it", "population": 1130973, "score": 0.0 }, { "name": "Filipino", "bcp_47": "fil", "population": 1397084, "score": 0.0 }, { "name": "Yiddish", "bcp_47": "yi", "population": 162993, "score": 0.0 }, { "name": "Hmong Njua", "bcp_47": "hnj", "population": 116424, "score": 0.0 }, { "name": "Navajo", "bcp_47": "nv", "population": 166320, "score": 0.0 }, { "name": "Pennsylvania German", "bcp_47": "pdc", "population": 129729, "score": 0.0 }, { "name": "Hawaiian", "bcp_47": "haw", "population": 29605, "score": 0.0 }, { "name": "Cajun French", "bcp_47": "frc", "population": 27942, "score": 0.0 }, { "name": "Cherokee", "bcp_47": "chr", "population": 25613, "score": 0.0 }, { "name": "Central Yupik", "bcp_47": "esu", "population": 20956, "score": 0.0 }, { "name": "Dakota", "bcp_47": "dak", "population": 19626, "score": 0.0 }, { "name": "Choctaw", "bcp_47": "cho", "population": 10977, "score": 0.0 }, { "name": "Lakota", "bcp_47": "lkt", "population": 8316, "score": 0.0 }, { "name": "Inupiaq", "bcp_47": "ik", "population": 7983, "score": 0.0 }, { "name": "Muscogee", "bcp_47": "mus", "population": 3992, "score": 0.0 }, { "name": "Ido", "bcp_47": "io", "population": 0, "score": 0.0 }, { "name": "Lojban", "bcp_47": "jbo", "population": 0, "score": 0.0 }, { "name": "Osage", "bcp_47": "osa", "population": 0, "score": 0.0 }, { "name": "Chickasaw", "bcp_47": "cic", "population": 0, "score": 0.0 }, { "name": "Caddo", "bcp_47": "cad", "population": 0, "score": 0.0 } ] }, "VC": { "score": 0.47, "languages": [ { "name": "English", "bcp_47": "en", "population": 97334, "score": 0.47 } ] }, "VG": { "score": 0.47, "languages": [ { "name": "English", "bcp_47": "en", "population": 36633, "score": 0.47 } ] }, "VI": { "score": 0.47000000000000003, "languages": [ { "name": "English", "bcp_47": "en", "population": 79676, "score": 0.47 } ] }, "VU": { "score": 0.27807137424430545, "languages": [ { "name": "English", "bcp_47": "en", "population": 247616, "score": 0.47 }, { "name": "French", "bcp_47": "fr", "population": 149166, "score": 0.46 }, { "name": "Bislama", "bcp_47": "bi", "population": 268500, "score": 0.0 } ] }, "WS": { "score": 0.00966643114975511, "languages": [ { "name": "English", "bcp_47": "en", "population": 4279, "score": 0.47 }, { "name": "Samoan", "bcp_47": "sm", "population": 203774, "score": 0.0 } ] }, "YE": { "score": 0.4254216867469879, "languages": [ { "name": "English", "bcp_47": "en", "population": 2689596, "score": 0.47 }, { "name": "Arabic", "bcp_47": "ar", "population": 22114456, "score": 0.42 } ] }, "ZA": { "score": 0.12441587427910845, "languages": [ { "name": "English", "bcp_47": "en", "population": 17503716, "score": 0.47 }, { "name": "Hindi", "bcp_47": "hi", "population": 1129272, "score": 0.46 }, { "name": "Swahili", "bcp_47": "sw", "population": 1016, "score": 0.0 }, { "name": "Zulu", "bcp_47": "zu", "population": 13551264, "score": 0.0 }, { "name": "Xhosa", "bcp_47": "xh", "population": 10163448, "score": 0.0 }, { "name": "Afrikaans", "bcp_47": "af", "population": 7340268, "score": 0.0 }, { "name": "Southern Sotho", "bcp_47": "st", "population": 4460624, "score": 0.0 }, { "name": "Tswana", "bcp_47": "tn", "population": 4630015, "score": 0.0 }, { "name": "Northern Sotho", "bcp_47": "nso", "population": 5307578, "score": 0.0 }, { "name": "Tsonga", "bcp_47": "ts", "population": 2484398, "score": 0.0 }, { "name": "Swati", "bcp_47": "ss", "population": 1524517, "score": 0.0 }, { "name": "Venda", "bcp_47": "ve", "population": 1298663, "score": 0.0 }, { "name": "South Ndebele", "bcp_47": "nr", "population": 903418, "score": 0.0 } ] }, "ZM": { "score": 0.11058823529411763, "languages": [ { "name": "English", "bcp_47": "en", "population": 2788256, "score": 0.47 }, { "name": "Nyanja", "bcp_47": "ny", "population": 2613990, "score": 0.0 }, { "name": "Bemba", "bcp_47": "bem", "population": 5402246, "score": 0.0 }, { "name": "Lozi", "bcp_47": "loz", "population": 1045596, "score": 0.0 } ] }, "ZW": { "score": 0.12681485053220737, "languages": [ { "name": "English", "bcp_47": "en", "population": 6109446, "score": 0.47 }, { "name": "Nyanja", "bcp_47": "ny", "population": 276380, "score": 0.0 }, { "name": "Shona", "bcp_47": "sn", "population": 11782503, "score": 0.0 }, { "name": "Tswana", "bcp_47": "tn", "population": 32002, "score": 0.0 }, { "name": "Ndau", "bcp_47": "ndc", "population": 887324, "score": 0.0 }, { "name": "North Ndebele", "bcp_47": "nd", "population": 1745556, "score": 0.0 }, { "name": "Venda", "bcp_47": "ve", "population": 93096, "score": 0.0 }, { "name": "Manyika", "bcp_47": "mxc", "population": 945510, "score": 0.0 }, { "name": "Kalanga", "bcp_47": "kck", "population": 770954, "score": 0.0 } ] }, "GF": { "score": 0.33892599990709343, "languages": [ { "name": "Chinese", "bcp_47": "zh", "population": 4988, "score": 0.46 }, { "name": "French", "bcp_47": "fr", "population": 153622, "score": 0.46 }, { "name": "Hmong Njua", "bcp_47": "hnj", "population": 4788, "score": 0.0 }, { "name": "Guianese Creole French", "bcp_47": "gcr", "population": 51872, "score": 0.0 } ] }, "ID": { "score": 0.0030419341755196384, "languages": [ { "name": "Chinese", "bcp_47": "zh", "population": 2456639, "score": 0.46 }, { "name": "Indonesian", "bcp_47": "id", "population": 170896640, "score": 0.0 }, { "name": "Javanese", "bcp_47": "jv", "population": 90788840, "score": 0.0 }, { "name": "Malay", "bcp_47": "ms", "population": 12283196, "score": 0.0 }, { "name": "Sundanese", "bcp_47": "su", "population": 32043120, "score": 0.0 }, { "name": "Madurese", "bcp_47": "mad", "population": 16822638, "score": 0.0 }, { "name": "Minangkabau", "bcp_47": "min", "population": 8010780, "score": 0.0 }, { "name": "Betawi", "bcp_47": "bew", "population": 5607546, "score": 0.0 }, { "name": "Balinese", "bcp_47": "ban", "population": 4806468, "score": 0.0 }, { "name": "Buginese", "bcp_47": "bug", "population": 4272416, "score": 0.0 }, { "name": "Banjar", "bcp_47": "bjn", "population": 4005390, "score": 0.0 }, { "name": "Achinese", "bcp_47": "ace", "population": 3738364, "score": 0.0 }, { "name": "Sasak", "bcp_47": "sas", "population": 2590152, "score": 0.0 }, { "name": "Batak Toba", "bcp_47": "bbc", "population": 2456639, "score": 0.0 }, { "name": "Makasar", "bcp_47": "mak", "population": 1949290, "score": 0.0 }, { "name": "Lampung Api", "bcp_47": "ljp", "population": 1842479, "score": 0.0 }, { "name": "Rejang", "bcp_47": "rej", "population": 1228320, "score": 0.0 }, { "name": "Gorontalo", "bcp_47": "gor", "population": 1094807, "score": 0.0 }, { "name": "Ngaju", "bcp_47": "nij", "population": 987996, "score": 0.0 }, { "name": "Komering", "bcp_47": "kge", "population": 854483, "score": 0.0 }, { "name": "Uab Meto", "bcp_47": "aoz", "population": 720970, "score": 0.0 }, { "name": "Kerinci", "bcp_47": "kvr", "population": 373836, "score": 0.0 }, { "name": "Tolaki", "bcp_47": "lbw", "population": 347134, "score": 0.0 }, { "name": "Gayo", "bcp_47": "gay", "population": 320431, "score": 0.0 }, { "name": "Tae'", "bcp_47": "rob", "population": 293729, "score": 0.0 }, { "name": "Mandar", "bcp_47": "mdr", "population": 245664, "score": 0.0 }, { "name": "Sangir", "bcp_47": "sxn", "population": 245664, "score": 0.0 }, { "name": "Selayar", "bcp_47": "sly", "population": 144194, "score": 0.0 }, { "name": "Mentawai", "bcp_47": "mwv", "population": 64086, "score": 0.0 } ] }, "MN": { "score": 0.00632843339485398, "languages": [ { "name": "Chinese", "bcp_47": "zh", "population": 44352, "score": 0.46 }, { "name": "Russian", "bcp_47": "ru", "population": 4118, "score": 0.0 }, { "name": "Kazakh", "bcp_47": "kk", "population": 228098, "score": 0.0 }, { "name": "Uyghur", "bcp_47": "ug", "population": 1014, "score": 0.0 }, { "name": "Mongolian", "bcp_47": "mn", "population": 2946268, "score": 0.0 } ] }, "PF": { "score": 0.3171135805738615, "languages": [ { "name": "Chinese", "bcp_47": "zh", "population": 23019, "score": 0.46 }, { "name": "French", "bcp_47": "fr", "population": 180024, "score": 0.46 }, { "name": "Tahitian", "bcp_47": "ty", "population": 91488, "score": 0.0 } ] }, "SR": { "score": 0.003172691176168042, "languages": [ { "name": "Chinese", "bcp_47": "zh", "population": 6705, "score": 0.46 }, { "name": "Dutch", "bcp_47": "nl", "population": 548612, "score": 0.0 }, { "name": "Hmong Njua", "bcp_47": "hnj", "population": 2316, "score": 0.0 }, { "name": "Sranan Tongo", "bcp_47": "srn", "population": 414507, "score": 0.0 } ] }, "TW": { "score": 0.45990317007579645, "languages": [ { "name": "Chinese", "bcp_47": "zh", "population": 22422850, "score": 0.46 }, { "name": "Taroko", "bcp_47": "trv", "population": 4721, "score": 0.0 } ] }, "VN": { "score": 0.005746798518511479, "languages": [ { "name": "Chinese", "bcp_47": "zh", "population": 1085934, "score": 0.46 }, { "name": "Vietnamese", "bcp_47": "vi", "population": 84900318, "score": 0.0 }, { "name": "Hmong Njua", "bcp_47": "hnj", "population": 167826, "score": 0.0 }, { "name": "Tai Dam", "bcp_47": "blt", "population": 681177, "score": 0.0 }, { "name": "Eastern Cham", "bcp_47": "cjm", "population": 87862, "score": 0.0 } ] }, "AD": { "score": 0.2246305418719212, "languages": [ { "name": "Spanish", "bcp_47": "es", "population": 33110, "score": 0.45 }, { "name": "French", "bcp_47": "fr", "population": 5775, "score": 0.46 }, { "name": "Catalan", "bcp_47": "ca", "population": 39270, "score": 0.0 } ] }, "BO": { "score": 0.24195487707764574, "languages": [ { "name": "Spanish", "bcp_47": "es", "population": 7100339, "score": 0.45 }, { "name": "Quechua", "bcp_47": "qu", "population": 3724768, "score": 0.0 }, { "name": "Guarani", "bcp_47": "gn", "population": 52380, "score": 0.0 }, { "name": "Aymara", "bcp_47": "ay", "population": 2327980, "score": 0.0 }, { "name": "Araona", "bcp_47": "aro", "population": 105, "score": 0.0 } ] }, "CO": { "score": 0.4486679880632671, "languages": [ { "name": "Spanish", "bcp_47": "es", "population": 45648864, "score": 0.45 }, { "name": "Wayuu", "bcp_47": "guc", "population": 132529, "score": 0.0 }, { "name": "Nheengatu", "bcp_47": "yrl", "population": 2994, "score": 0.0 } ] }, "CR": { "score": 0.45, "languages": [ { "name": "Spanish", "bcp_47": "es", "population": 4843090, "score": 0.45 } ] }, "CU": { "score": 0.45, "languages": [ { "name": "Spanish", "bcp_47": "es", "population": 11059100, "score": 0.45 } ] }, "CW": { "score": 0.01842639268626111, "languages": [ { "name": "Spanish", "bcp_47": "es", "population": 5751, "score": 0.45 }, { "name": "Dutch", "bcp_47": "nl", "population": 12108, "score": 0.0 }, { "name": "Papiamento", "bcp_47": "pap", "population": 122589, "score": 0.0 } ] }, "EA": { "score": 0.45, "languages": [ { "name": "Spanish", "bcp_47": "es", "population": 147000, "score": 0.45 } ] }, "EC": { "score": 0.36394271816229906, "languages": [ { "name": "Spanish", "bcp_47": "es", "population": 16228704, "score": 0.45 }, { "name": "Quechua", "bcp_47": "qu", "population": 2873833, "score": 0.0 }, { "name": "Chimborazo Highland Quichua", "bcp_47": "qug", "population": 963579, "score": 0.0 } ] }, "GQ": { "score": 0.2792374044214109, "languages": [ { "name": "Spanish", "bcp_47": "es", "population": 727475, "score": 0.45 }, { "name": "French", "bcp_47": "fr", "population": 73584, "score": 0.46 }, { "name": "Portuguese", "bcp_47": "pt", "population": 1, "score": 0.46 }, { "name": "Fang", "bcp_47": "fan", "population": 426451, "score": 0.0 }, { "name": "Bube", "bcp_47": "bvb", "population": 66058, "score": 0.0 } ] }, "GT": { "score": 0.4185, "languages": [ { "name": "Spanish", "bcp_47": "es", "population": 15952569, "score": 0.45 }, { "name": "Kʼicheʼ", "bcp_47": "quc", "population": 1200731, "score": 0.0 } ] }, "IC": { "score": 0.45, "languages": [ { "name": "Spanish", "bcp_47": "es", "population": 2056618, "score": 0.45 } ] }, "NI": { "score": 0.45, "languages": [ { "name": "Spanish", "bcp_47": "es", "population": 4838683, "score": 0.45 } ] }, "PE": { "score": 0.3666294642857143, "languages": [ { "name": "Spanish", "bcp_47": "es", "population": 23297950, "score": 0.45 }, { "name": "Quechua", "bcp_47": "qu", "population": 4787250, "score": 0.0 }, { "name": "Aymara", "bcp_47": "ay", "population": 510640, "score": 0.0 } ] }, "PY": { "score": 0.016724733105137318, "languages": [ { "name": "Spanish", "bcp_47": "es", "population": 230134, "score": 0.45 }, { "name": "German", "bcp_47": "de", "population": 208559, "score": 0.0 }, { "name": "Guarani", "bcp_47": "gn", "population": 5753352, "score": 0.0 } ] }, "SV": { "score": 0.45000000000000007, "languages": [ { "name": "Spanish", "bcp_47": "es", "population": 5768179, "score": 0.45 } ] }, "UY": { "score": 0.45000000000000007, "languages": [ { "name": "Spanish", "bcp_47": "es", "population": 2981097, "score": 0.45 } ] }, "VE": { "score": 0.4499615909817796, "languages": [ { "name": "Spanish", "bcp_47": "es", "population": 23488572, "score": 0.45 }, { "name": "Nheengatu", "bcp_47": "yrl", "population": 2005, "score": 0.0 } ] }, "BH": { "score": 0.4046511627906977, "languages": [ { "name": "Arabic", "bcp_47": "ar", "population": 1309350, "score": 0.42 }, { "name": "Malayalam", "bcp_47": "ml", "population": 49665, "score": 0.0 } ] }, "DJ": { "score": 0.04363652160028553, "languages": [ { "name": "Arabic", "bcp_47": "ar", "population": 67292, "score": 0.42 }, { "name": "French", "bcp_47": "fr", "population": 19358, "score": 0.46 }, { "name": "Somali", "bcp_47": "so", "population": 377940, "score": 0.0 }, { "name": "Afar", "bcp_47": "aa", "population": 387158, "score": 0.0 } ] }, "EH": { "score": 0.42, "languages": [ { "name": "Arabic", "bcp_47": "ar", "population": 652271, "score": 0.42 } ] }, "IR": { "score": 0.00636827269940037, "languages": [ { "name": "Arabic", "bcp_47": "ar", "population": 1698466, "score": 0.42 }, { "name": "Persian", "bcp_47": "fa", "population": 63692475, "score": 0.0 }, { "name": "Pashto", "bcp_47": "ps", "population": 135877, "score": 0.0 }, { "name": "Azerbaijani", "bcp_47": "az", "population": 20381592, "score": 0.0 }, { "name": "Kazakh", "bcp_47": "kk", "population": 2972, "score": 0.0 }, { "name": "Central Kurdish", "bcp_47": "ckb", "population": 3312009, "score": 0.0 }, { "name": "Baluchi", "bcp_47": "bal", "population": 1698466, "score": 0.0 }, { "name": "Turkmen", "bcp_47": "tk", "population": 2377852, "score": 0.0 }, { "name": "Armenian", "bcp_47": "hy", "population": 203816, "score": 0.0 }, { "name": "Mazanderani", "bcp_47": "mzn", "population": 4246165, "score": 0.0 }, { "name": "Gilaki", "bcp_47": "glk", "population": 3906472, "score": 0.0 }, { "name": "Georgian", "bcp_47": "ka", "population": 60296, "score": 0.0 }, { "name": "Southern Kurdish", "bcp_47": "sdh", "population": 3142162, "score": 0.0 }, { "name": "Western Balochi", "bcp_47": "bgn", "population": 475570, "score": 0.0 }, { "name": "Northern Luri", "bcp_47": "lrc", "population": 1783389, "score": 0.0 }, { "name": "Domari", "bcp_47": "rmt", "population": 1613543, "score": 0.0 }, { "name": "Bakhtiari", "bcp_47": "bqi", "population": 1188926, "score": 0.0 }, { "name": "Southern Luri", "bcp_47": "luz", "population": 1019080, "score": 0.0 }, { "name": "Parsi-Dari", "bcp_47": "prd", "population": 424616, "score": 0.0 }, { "name": "Laki", "bcp_47": "lki", "population": 645417, "score": 0.0 }, { "name": "Zoroastrian Dari", "bcp_47": "gbz", "population": 7983, "score": 0.0 } ] }, "KM": { "score": 0.27709828190644586, "languages": [ { "name": "Arabic", "bcp_47": "ar", "population": 558545, "score": 0.42 }, { "name": "French", "bcp_47": "fr", "population": 473917, "score": 0.46 }, { "name": "Ngazidja Comorian", "bcp_47": "zdj", "population": 313124, "score": 0.0 }, { "name": "Ndzwani Comorian", "bcp_47": "wni", "population": 287736, "score": 0.0 } ] }, "KW": { "score": 0.42, "languages": [ { "name": "Arabic", "bcp_47": "ar", "population": 2993710, "score": 0.42 } ] }, "LY": { "score": 0.42, "languages": [ { "name": "Arabic", "bcp_47": "ar", "population": 5099000, "score": 0.42 } ] }, "ML": { "score": 0.17298209200310574, "languages": [ { "name": "Arabic", "bcp_47": "ar", "population": 175981, "score": 0.42 }, { "name": "French", "bcp_47": "fr", "population": 8994564, "score": 0.46 }, { "name": "Bambara", "bcp_47": "bm", "population": 9385632, "score": 0.0 }, { "name": "Tamashek", "bcp_47": "tmh", "population": 410621, "score": 0.0 }, { "name": "Maasina Fulfulde", "bcp_47": "ffm", "population": 1505612, "score": 0.0 }, { "name": "Soninke", "bcp_47": "snk", "population": 1153651, "score": 0.0 }, { "name": "Kita Maninkakan", "bcp_47": "mwk", "population": 977670, "score": 0.0 }, { "name": "Koyraboro Senni", "bcp_47": "ses", "population": 664816, "score": 0.0 }, { "name": "Koyra Chiini", "bcp_47": "khq", "population": 332408, "score": 0.0 }, { "name": "Tomo Kan Dogon", "bcp_47": "dtm", "population": 215087, "score": 0.0 }, { "name": "Xaasongaxango", "bcp_47": "kao", "population": 195534, "score": 0.0 }, { "name": "Bomu", "bcp_47": "bmq", "population": 168159, "score": 0.0 }, { "name": "Jenaama Bozo", "bcp_47": "bze", "population": 166204, "score": 0.0 } ] }, "MR": { "score": 0.4031496171525996, "languages": [ { "name": "Arabic", "bcp_47": "ar", "population": 3404658, "score": 0.42 }, { "name": "French", "bcp_47": "fr", "population": 680932, "score": 0.46 }, { "name": "Wolof", "bcp_47": "wo", "population": 10014, "score": 0.0 }, { "name": "Fula", "bcp_47": "ff", "population": 228312, "score": 0.0 } ] }, "NE": { "score": 0.13395381465163778, "languages": [ { "name": "Arabic", "bcp_47": "ar", "population": 47822, "score": 0.42 }, { "name": "French", "bcp_47": "fr", "population": 6603996, "score": 0.46 }, { "name": "Hausa", "bcp_47": "ha", "population": 9336684, "score": 0.0 }, { "name": "Fula", "bcp_47": "ff", "population": 0, "score": 0.0 }, { "name": "Zarma", "bcp_47": "dje", "population": 3871308, "score": 0.0 }, { "name": "Tamashek", "bcp_47": "tmh", "population": 1366344, "score": 0.0 }, { "name": "Central-Eastern Niger Fulfulde", "bcp_47": "fuq", "population": 1594068, "score": 0.0 }, { "name": "Tasawaq", "bcp_47": "twq", "population": 7970, "score": 0.0 } ] }, "OM": { "score": 0.3917550122860191, "languages": [ { "name": "Arabic", "bcp_47": "ar", "population": 3778520, "score": 0.42 }, { "name": "Persian", "bcp_47": "fa", "population": 43849, "score": 0.0 }, { "name": "Baluchi", "bcp_47": "bal", "population": 228577, "score": 0.0 } ] }, "PS": { "score": 0.22459893546675047, "languages": [ { "name": "Arabic", "bcp_47": "ar", "population": 4818260, "score": 0.42 }, { "name": "North Levantine Arabic", "bcp_47": "apc", "population": 4191886, "score": 0.0 } ] }, "QA": { "score": 0.37279344564910033, "languages": [ { "name": "Arabic", "bcp_47": "ar", "population": 2175311, "score": 0.42 }, { "name": "Persian", "bcp_47": "fa", "population": 268859, "score": 0.0 }, { "name": "Malayalam", "bcp_47": "ml", "population": 6599, "score": 0.0 } ] }, "SA": { "score": 0.4077669902912621, "languages": [ { "name": "Arabic", "bcp_47": "ar", "population": 34173500, "score": 0.42 }, { "name": "Najdi Arabic", "bcp_47": "ars", "population": 1025205, "score": 0.0 } ] }, "SO": { "score": 0.12480335438670982, "languages": [ { "name": "Arabic", "bcp_47": "ar", "population": 3997414, "score": 0.42 }, { "name": "Swahili", "bcp_47": "sw", "population": 235142, "score": 0.0 }, { "name": "Oromo", "bcp_47": "om", "population": 49380, "score": 0.0 }, { "name": "Somali", "bcp_47": "so", "population": 9170538, "score": 0.0 } ] }, "SY": { "score": 0.20086954810836308, "languages": [ { "name": "Arabic", "bcp_47": "ar", "population": 15518720, "score": 0.42 }, { "name": "French", "bcp_47": "fr", "population": 1144506, "score": 0.46 }, { "name": "North Levantine Arabic", "bcp_47": "apc", "population": 16488640, "score": 0.0 }, { "name": "Kurdish", "bcp_47": "ku", "population": 1551872, "score": 0.0 }, { "name": "Armenian", "bcp_47": "hy", "population": 349171, "score": 0.0 }, { "name": "Syriac", "bcp_47": "syr", "population": 16295, "score": 0.0 } ] }, "TD": { "score": 0.4441860465116279, "languages": [ { "name": "Arabic", "bcp_47": "ar", "population": 2869158, "score": 0.42 }, { "name": "French", "bcp_47": "fr", "population": 4388124, "score": 0.46 } ] }, "TJ": { "score": 4.095636386779862e-05, "languages": [ { "name": "Arabic", "bcp_47": "ar", "population": 976, "score": 0.42 }, { "name": "Russian", "bcp_47": "ru", "population": 1064840, "score": 0.0 }, { "name": "Persian", "bcp_47": "fa", "population": 69215, "score": 0.0 }, { "name": "Tajik", "bcp_47": "tg", "population": 8873670, "score": 0.0 } ] }, "TN": { "score": 0.28283464566929134, "languages": [ { "name": "Arabic", "bcp_47": "ar", "population": 10549080, "score": 0.42 }, { "name": "French", "bcp_47": "fr", "population": 8673688, "score": 0.46 }, { "name": "Tunisian Arabic", "bcp_47": "aeb", "population": 10549080, "score": 0.0 } ] }, "BF": { "score": 0.1076595744680851, "languages": [ { "name": "French", "bcp_47": "fr", "population": 4583788, "score": 0.46 }, { "name": "Mossi", "bcp_47": "mos", "population": 8334160, "score": 0.0 }, { "name": "Fula", "bcp_47": "ff", "population": 0, "score": 0.0 }, { "name": "Dyula", "bcp_47": "dyu", "population": 6667328, "score": 0.0 } ] }, "BJ": { "score": 0.24029850746268658, "languages": [ { "name": "French", "bcp_47": "fr", "population": 4502610, "score": 0.46 }, { "name": "Yoruba", "bcp_47": "yo", "population": 861928, "score": 0.0 }, { "name": "Fon", "bcp_47": "fon", "population": 3216150, "score": 0.0 }, { "name": "Anii", "bcp_47": "blo", "population": 38594, "score": 0.0 } ] }, "BL": { "score": 0.46, "languages": [ { "name": "French", "bcp_47": "fr", "population": 6837, "score": 0.46 } ] }, "CD": { "score": 0.024519567961845984, "languages": [ { "name": "French", "bcp_47": "fr", "population": 3867640, "score": 0.46 }, { "name": "Swahili", "bcp_47": "sw", "population": 50890000, "score": 0.0 }, { "name": "Kinyarwanda", "bcp_47": "rw", "population": 386764, "score": 0.0 }, { "name": "Luba-Lulua", "bcp_47": "lua", "population": 9770880, "score": 0.0 }, { "name": "Lingala", "bcp_47": "ln", "population": 3155180, "score": 0.0 }, { "name": "Luba-Katanga", "bcp_47": "lu", "population": 2340940, "score": 0.0 }, { "name": "Kongo", "bcp_47": "kg", "population": 1526700, "score": 0.0 }, { "name": "Mongo", "bcp_47": "lol", "population": 620858, "score": 0.0 } ] }, "CF": { "score": 0.22943811316779433, "languages": [ { "name": "French", "bcp_47": "fr", "population": 2935521, "score": 0.46 }, { "name": "Lingala", "bcp_47": "ln", "population": 14378, "score": 0.0 }, { "name": "Sango", "bcp_47": "sg", "population": 2935521, "score": 0.0 } ] }, "CG": { "score": 0.4472221914876915, "languages": [ { "name": "French", "bcp_47": "fr", "population": 4446179, "score": 0.46 }, { "name": "Lingala", "bcp_47": "ln", "population": 127034, "score": 0.0 } ] }, "CI": { "score": 0.32809315344736595, "languages": [ { "name": "French", "bcp_47": "fr", "population": 13465739, "score": 0.46 }, { "name": "Baoulé", "bcp_47": "bci", "population": 3022921, "score": 0.0 }, { "name": "Cebaara Senoufo", "bcp_47": "sef", "population": 1181687, "score": 0.0 }, { "name": "Dan", "bcp_47": "dnj", "population": 1099244, "score": 0.0 }, { "name": "Koro", "bcp_47": "kfo", "population": 63207, "score": 0.0 }, { "name": "Koro Wachi", "bcp_47": "bqv", "population": 46718, "score": 0.0 } ] }, "GA": { "score": 0.4024999642024461, "languages": [ { "name": "French", "bcp_47": "fr", "population": 1405473, "score": 0.46 }, { "name": "Punu", "bcp_47": "puu", "population": 200782, "score": 0.0 } ] }, "GN": { "score": 0.13640082022253552, "languages": [ { "name": "French", "bcp_47": "fr", "population": 3632946, "score": 0.46 }, { "name": "Fula", "bcp_47": "ff", "population": 3257124, "score": 0.0 }, { "name": "Mandingo", "bcp_47": "man", "population": 2881302, "score": 0.0 }, { "name": "Susu", "bcp_47": "sus", "population": 1378014, "score": 0.0 }, { "name": "Kpelle", "bcp_47": "kpe", "population": 476041, "score": 0.0 }, { "name": "N’Ko", "bcp_47": "nqo", "population": 626370, "score": 0.0 } ] }, "GP": { "score": 0.46, "languages": [ { "name": "French", "bcp_47": "fr", "population": 407498, "score": 0.46 } ] }, "HT": { "score": 0.025227556257943377, "languages": [ { "name": "French", "bcp_47": "fr", "population": 520187, "score": 0.46 }, { "name": "Haitian Creole", "bcp_47": "ht", "population": 8964918, "score": 0.0 } ] }, "MC": { "score": 0.4600000000000001, "languages": [ { "name": "French", "bcp_47": "fr", "population": 38610, "score": 0.46 } ] }, "MF": { "score": 0.46, "languages": [ { "name": "French", "bcp_47": "fr", "population": 32556, "score": 0.46 } ] }, "MQ": { "score": 0.4600000000000001, "languages": [ { "name": "French", "bcp_47": "fr", "population": 427408, "score": 0.46 } ] }, "NC": { "score": 0.46, "languages": [ { "name": "French", "bcp_47": "fr", "population": 278409, "score": 0.46 } ] }, "RE": { "score": 0.23394276750687273, "languages": [ { "name": "French", "bcp_47": "fr", "population": 700950, "score": 0.46 }, { "name": "Tamil", "bcp_47": "ta", "population": 118138, "score": 0.0 }, { "name": "Réunion Creole French", "bcp_47": "rcf", "population": 559185, "score": 0.0 } ] }, "SN": { "score": 0.1219628328989918, "languages": [ { "name": "French", "bcp_47": "fr", "population": 6137196, "score": 0.46 }, { "name": "Wolof", "bcp_47": "wo", "population": 11015480, "score": 0.0 }, { "name": "Fula", "bcp_47": "ff", "population": 3304644, "score": 0.0 }, { "name": "Serer", "bcp_47": "srr", "population": 1731004, "score": 0.0 }, { "name": "Jola-Fonyi", "bcp_47": "dyo", "population": 409146, "score": 0.0 }, { "name": "Saafi-Saafi", "bcp_47": "sav", "population": 236046, "score": 0.0 }, { "name": "Mandjak", "bcp_47": "mfv", "population": 121170, "score": 0.0 }, { "name": "Balanta-Ganja", "bcp_47": "bjt", "population": 95992, "score": 0.0 }, { "name": "Mankanya", "bcp_47": "knf", "population": 33046, "score": 0.0 }, { "name": "Noon", "bcp_47": "snf", "population": 37767, "score": 0.0 }, { "name": "Bassari", "bcp_47": "bsc", "population": 15264, "score": 0.0 }, { "name": "Hassaniyya", "bcp_47": "mey", "population": 7239, "score": 0.0 }, { "name": "Ménik", "bcp_47": "tnr", "population": 3305, "score": 0.0 } ] }, "TF": { "score": 0.46, "languages": [ { "name": "French", "bcp_47": "fr", "population": 140, "score": 0.46 } ] }, "TG": { "score": 0.353178050842427, "languages": [ { "name": "French", "bcp_47": "fr", "population": 5251148, "score": 0.46 }, { "name": "Ewe", "bcp_47": "ee", "population": 1463435, "score": 0.0 }, { "name": "Ifè", "bcp_47": "ife", "population": 111910, "score": 0.0 }, { "name": "Anii", "bcp_47": "blo", "population": 12913, "score": 0.0 } ] }, "WF": { "score": 0.16000548496206235, "languages": [ { "name": "French", "bcp_47": "fr", "population": 7610, "score": 0.46 }, { "name": "Wallisian", "bcp_47": "wls", "population": 9512, "score": 0.0 }, { "name": "East Futuna", "bcp_47": "fud", "population": 4756, "score": 0.0 } ] }, "YT": { "score": 0.15478158205430934, "languages": [ { "name": "French", "bcp_47": "fr", "population": 110580, "score": 0.46 }, { "name": "Swahili", "bcp_47": "sw", "population": 2716, "score": 0.0 }, { "name": "Comorian", "bcp_47": "swb", "population": 170720, "score": 0.0 }, { "name": "Bushi", "bcp_47": "buc", "population": 44620, "score": 0.0 } ] }, "AO": { "score": 0.2533081311690543, "languages": [ { "name": "Portuguese", "bcp_47": "pt", "population": 21789941, "score": 0.46 }, { "name": "Umbundu", "bcp_47": "umb", "population": 9431467, "score": 0.0 }, { "name": "Kimbundu", "bcp_47": "kmb", "population": 8130575, "score": 0.0 }, { "name": "Lingala", "bcp_47": "ln", "population": 217899, "score": 0.0 } ] }, "CV": { "score": 0.20934137957939955, "languages": [ { "name": "Portuguese", "bcp_47": "pt", "population": 443274, "score": 0.46 }, { "name": "Kabuverdianu", "bcp_47": "kea", "population": 530762, "score": 0.0 } ] }, "GW": { "score": 0.4483420821976837, "languages": [ { "name": "Portuguese", "bcp_47": "pt", "population": 1927100, "score": 0.46 }, { "name": "Fula", "bcp_47": "ff", "population": 4, "score": 0.0 }, { "name": "Mankanya", "bcp_47": "knf", "population": 50105, "score": 0.0 } ] }, "MZ": { "score": 0.1512107791359021, "languages": [ { "name": "Portuguese", "bcp_47": "pt", "population": 8126514, "score": 0.46 }, { "name": "Swahili", "bcp_47": "sw", "population": 9330, "score": 0.0 }, { "name": "Nyanja", "bcp_47": "ny", "population": 782553, "score": 0.0 }, { "name": "Zulu", "bcp_47": "zu", "population": 1806, "score": 0.0 }, { "name": "Tsonga", "bcp_47": "ts", "population": 2377758, "score": 0.0 }, { "name": "Makhuwa", "bcp_47": "vmw", "population": 3912766, "score": 0.0 }, { "name": "Ndau", "bcp_47": "ndc", "population": 2979722, "score": 0.0 }, { "name": "Lomwe", "bcp_47": "ngl", "population": 2046678, "score": 0.0 }, { "name": "Sena", "bcp_47": "seh", "population": 1384517, "score": 0.0 }, { "name": "Makhuwa-Meetto", "bcp_47": "mgh", "population": 1354419, "score": 0.0 }, { "name": "Ronga", "bcp_47": "rng", "population": 1023339, "score": 0.0 }, { "name": "Yao", "bcp_47": "yao", "population": 722357, "score": 0.0 } ] }, "ST": { "score": 0.45999999999999996, "languages": [ { "name": "Portuguese", "bcp_47": "pt", "population": 179454, "score": 0.46 } ] }, "TL": { "score": 0.23, "languages": [ { "name": "Portuguese", "bcp_47": "pt", "population": 816395, "score": 0.46 }, { "name": "Tetum", "bcp_47": "tet", "population": 816395, "score": 0.0 } ] }, "BY": { "score": 0.0, "languages": [ { "name": "Russian", "bcp_47": "ru", "population": 1137350, "score": 0.0 }, { "name": "Belarusian", "bcp_47": "be", "population": 9477920, "score": 0.0 } ] }, "GE": { "score": 0.0, "languages": [ { "name": "Russian", "bcp_47": "ru", "population": 359730, "score": 0.0 }, { "name": "Kurdish", "bcp_47": "ku", "population": 35573, "score": 0.0 }, { "name": "Armenian", "bcp_47": "hy", "population": 279790, "score": 0.0 }, { "name": "Georgian", "bcp_47": "ka", "population": 3437420, "score": 0.0 }, { "name": "Ossetic", "bcp_47": "os", "population": 87934, "score": 0.0 }, { "name": "Mingrelian", "bcp_47": "xmf", "population": 439670, "score": 0.0 }, { "name": "Abkhazian", "bcp_47": "ab", "population": 87934, "score": 0.0 } ] }, "KG": { "score": 0.0, "languages": [ { "name": "Russian", "bcp_47": "ru", "population": 2147364, "score": 0.0 }, { "name": "Kyrgyz", "bcp_47": "ky", "population": 2863152, "score": 0.0 } ] }, "MD": { "score": 0.0, "languages": [ { "name": "Russian", "bcp_47": "ru", "population": 100935, "score": 0.0 }, { "name": "Ukrainian", "bcp_47": "uk", "population": 471030, "score": 0.0 }, { "name": "Romanian", "bcp_47": "ro", "population": 2119635, "score": 0.0 }, { "name": "Bulgarian", "bcp_47": "bg", "population": 316263, "score": 0.0 }, { "name": "Gagauz", "bcp_47": "gag", "population": 111028, "score": 0.0 } ] }, "RU": { "score": 0.0, "languages": [ { "name": "Russian", "bcp_47": "ru", "population": 133218680, "score": 0.0 }, { "name": "Azerbaijani", "bcp_47": "az", "population": 131801, "score": 0.0 }, { "name": "Serbian", "bcp_47": "sr", "population": 4960, "score": 0.0 }, { "name": "Mongolian", "bcp_47": "mn", "population": 2126, "score": 0.0 }, { "name": "Finnish", "bcp_47": "fi", "population": 17007, "score": 0.0 }, { "name": "Armenian", "bcp_47": "hy", "population": 1190465, "score": 0.0 }, { "name": "Tatar", "bcp_47": "tt", "population": 1984108, "score": 0.0 }, { "name": "Chuvash", "bcp_47": "cv", "population": 1842386, "score": 0.0 }, { "name": "Bashkir", "bcp_47": "ba", "population": 1842386, "score": 0.0 }, { "name": "Kabardian", "bcp_47": "kbd", "population": 439338, "score": 0.0 }, { "name": "Chechen", "bcp_47": "ce", "population": 935365, "score": 0.0 }, { "name": "Avaric", "bcp_47": "av", "population": 552716, "score": 0.0 }, { "name": "Ossetic", "bcp_47": "os", "population": 453510, "score": 0.0 }, { "name": "Udmurt", "bcp_47": "udm", "population": 538544, "score": 0.0 }, { "name": "Mari", "bcp_47": "chm", "population": 524371, "score": 0.0 }, { "name": "Yakut", "bcp_47": "sah", "population": 453510, "score": 0.0 }, { "name": "Adyghe", "bcp_47": "ady", "population": 124715, "score": 0.0 }, { "name": "Erzya", "bcp_47": "myv", "population": 439338, "score": 0.0 }, { "name": "Dargwa", "bcp_47": "dar", "population": 368477, "score": 0.0 }, { "name": "Buriat", "bcp_47": "bua", "population": 311788, "score": 0.0 }, { "name": "Moksha", "bcp_47": "mdf", "population": 297616, "score": 0.0 }, { "name": "Kumyk", "bcp_47": "kum", "population": 283444, "score": 0.0 }, { "name": "Lezghian", "bcp_47": "lez", "population": 255100, "score": 0.0 }, { "name": "Komi", "bcp_47": "kv", "population": 255100, "score": 0.0 }, { "name": "Karachay-Balkar", "bcp_47": "krc", "population": 240927, "score": 0.0 }, { "name": "Ingush", "bcp_47": "inh", "population": 226755, "score": 0.0 }, { "name": "Tuvinian", "bcp_47": "tyv", "population": 184239, "score": 0.0 }, { "name": "Karelian", "bcp_47": "krl", "population": 116212, "score": 0.0 }, { "name": "Lak", "bcp_47": "lbe", "population": 110543, "score": 0.0 }, { "name": "Komi-Permyak", "bcp_47": "koi", "population": 63775, "score": 0.0 }, { "name": "Western Mari", "bcp_47": "mrj", "population": 29762, "score": 0.0 }, { "name": "Southern Altai", "bcp_47": "alt", "population": 19841, "score": 0.0 }, { "name": "Veps", "bcp_47": "vep", "population": 3543, "score": 0.0 }, { "name": "Ingrian", "bcp_47": "izh", "population": 142, "score": 0.0 }, { "name": "Votic", "bcp_47": "vot", "population": 0, "score": 0.0 }, { "name": "Church Slavic", "bcp_47": "cu", "population": 0, "score": 0.0 } ] }, "SJ": { "score": 0.0, "languages": [ { "name": "Russian", "bcp_47": "ru", "population": 1200, "score": 0.0 }, { "name": "Norwegian Bokmål", "bcp_47": "nb", "population": 1492, "score": 0.0 } ] }, "TM": { "score": 0.0, "languages": [ { "name": "Russian", "bcp_47": "ru", "population": 663436, "score": 0.0 }, { "name": "Uzbek", "bcp_47": "uz", "population": 497577, "score": 0.0 }, { "name": "Turkmen", "bcp_47": "tk", "population": 3870041, "score": 0.0 }, { "name": "Kurdish", "bcp_47": "ku", "population": 22115, "score": 0.0 } ] }, "UA": { "score": 0.0, "languages": [ { "name": "Russian", "bcp_47": "ru", "population": 20204534, "score": 0.0 }, { "name": "Turkish", "bcp_47": "tr", "population": 184476, "score": 0.0 }, { "name": "Polish", "bcp_47": "pl", "population": 1054150, "score": 0.0 }, { "name": "Ukrainian", "bcp_47": "uk", "population": 28549885, "score": 0.0 }, { "name": "Romanian", "bcp_47": "ro", "population": 228399, "score": 0.0 }, { "name": "Hungarian", "bcp_47": "hu", "population": 162515, "score": 0.0 }, { "name": "Greek", "bcp_47": "el", "population": 7028, "score": 0.0 }, { "name": "Belarusian", "bcp_47": "be", "population": 364560, "score": 0.0 }, { "name": "Bulgarian", "bcp_47": "bg", "population": 215222, "score": 0.0 }, { "name": "Yiddish", "bcp_47": "yi", "population": 570998, "score": 0.0 }, { "name": "Rusyn", "bcp_47": "rue", "population": 527075, "score": 0.0 }, { "name": "Crimean Tatar", "bcp_47": "crh", "population": 245968, "score": 0.0 } ] }, "UZ": { "score": 0.0, "languages": [ { "name": "Russian", "bcp_47": "ru", "population": 4279156, "score": 0.0 }, { "name": "Turkish", "bcp_47": "tr", "population": 232297, "score": 0.0 }, { "name": "Uzbek", "bcp_47": "uz", "population": 30565400, "score": 0.0 }, { "name": "Kara-Kalpak", "bcp_47": "kaa", "population": 489046, "score": 0.0 } ] }, "LI": { "score": 0.0, "languages": [ { "name": "German", "bcp_47": "de", "population": 39137, "score": 0.0 }, { "name": "Swiss German", "bcp_47": "gsw", "population": 33266, "score": 0.0 }, { "name": "Walser", "bcp_47": "wae", "population": 1292, "score": 0.0 } ] }, "JP": { "score": 0.0, "languages": [ { "name": "Japanese", "bcp_47": "ja", "population": 119231650, "score": 0.0 }, { "name": "Korean", "bcp_47": "ko", "population": 652636, "score": 0.0 }, { "name": "Central Okinawan", "bcp_47": "ryu", "population": 966404, "score": 0.0 } ] }, "AF": { "score": 0.0, "languages": [ { "name": "Persian", "bcp_47": "fa", "population": 18321900, "score": 0.0 }, { "name": "Pashto", "bcp_47": "ps", "population": 15756834, "score": 0.0 }, { "name": "Uzbek", "bcp_47": "uz", "population": 1722259, "score": 0.0 }, { "name": "Kazakh", "bcp_47": "kk", "population": 2015, "score": 0.0 }, { "name": "Uyghur", "bcp_47": "ug", "population": 3005, "score": 0.0 }, { "name": "Turkmen", "bcp_47": "tk", "population": 622945, "score": 0.0 }, { "name": "Hazaragi", "bcp_47": "haz", "population": 2161984, "score": 0.0 }, { "name": "Western Balochi", "bcp_47": "bgn", "population": 230856, "score": 0.0 }, { "name": "Parsi-Dari", "bcp_47": "prd", "population": 439726, "score": 0.0 } ] }, "MK": { "score": 0.0, "languages": [ { "name": "Turkish", "bcp_47": "tr", "population": 74409, "score": 0.0 }, { "name": "Albanian", "bcp_47": "sq", "population": 531492, "score": 0.0 }, { "name": "Macedonian", "bcp_47": "mk", "population": 1424400, "score": 0.0 } ] }, "KP": { "score": 0.0, "languages": [ { "name": "Korean", "bcp_47": "ko", "population": 22566280, "score": 0.0 } ] }, "KR": { "score": 0.0, "languages": [ { "name": "Korean", "bcp_47": "ko", "population": 51835100, "score": 0.0 } ] }, "SM": { "score": 0.0, "languages": [ { "name": "Italian", "bcp_47": "it", "population": 30466, "score": 0.0 }, { "name": "Esperanto", "bcp_47": "eo", "population": 301, "score": 0.0 } ] }, "VA": { "score": 0.0, "languages": [ { "name": "Italian", "bcp_47": "it", "population": 820, "score": 0.0 }, { "name": "Latin", "bcp_47": "la", "population": 820, "score": 0.0 } ] }, "MM": { "score": 0.0, "languages": [ { "name": "Burmese", "bcp_47": "my", "population": 36217664, "score": 0.0 }, { "name": "Shan", "bcp_47": "shn", "population": 3621766, "score": 0.0 }, { "name": "Rohingya", "bcp_47": "rhg", "population": 962032, "score": 0.0 }, { "name": "Mon", "bcp_47": "mnw", "population": 848852, "score": 0.0 }, { "name": "Kachin", "bcp_47": "kac", "population": 962032, "score": 0.0 }, { "name": "Hmong Njua", "bcp_47": "hnj", "population": 12450, "score": 0.0 }, { "name": "Khamti", "bcp_47": "kht", "population": 4244, "score": 0.0 } ] }, "AM": { "score": 0.0, "languages": [ { "name": "Azerbaijani", "bcp_47": "az", "population": 0, "score": 0.0 }, { "name": "Kurdish", "bcp_47": "ku", "population": 99704, "score": 0.0 }, { "name": "Armenian", "bcp_47": "hy", "population": 2960894, "score": 0.0 } ] }, "AZ": { "score": 0.0, "languages": [ { "name": "Azerbaijani", "bcp_47": "az", "population": 10093536, "score": 0.0 }, { "name": "Kurdish", "bcp_47": "ku", "population": 24494, "score": 0.0 }, { "name": "Talysh", "bcp_47": "tly", "population": 1000168, "score": 0.0 }, { "name": "Muslim Tat", "bcp_47": "ttt", "population": 22453, "score": 0.0 }, { "name": "Tsakhur", "bcp_47": "tkr", "population": 16329, "score": 0.0 } ] }, "BQ": { "score": 0.0, "languages": [ { "name": "Dutch", "bcp_47": "nl", "population": 1600, "score": 0.0 }, { "name": "Papiamento", "bcp_47": "pap", "population": 16200, "score": 0.0 } ] }, "RS": { "score": 0.0, "languages": [ { "name": "Ukrainian", "bcp_47": "uk", "population": 0, "score": 0.0 }, { "name": "Romanian", "bcp_47": "ro", "population": 147256, "score": 0.0 }, { "name": "Serbian", "bcp_47": "sr", "population": 13884096, "score": 0.0 }, { "name": "Hungarian", "bcp_47": "hu", "population": 336584, "score": 0.0 }, { "name": "Croatian", "bcp_47": "hr", "population": 65213, "score": 0.0 }, { "name": "Albanian", "bcp_47": "sq", "population": 1332312, "score": 0.0 }, { "name": "Slovak", "bcp_47": "sk", "population": 59603, "score": 0.0 } ] }, "ME": { "score": 0.0, "languages": [ { "name": "Serbian", "bcp_47": "sr", "population": 640352, "score": 0.0 }, { "name": "Albanian", "bcp_47": "sq", "population": 48179, "score": 0.0 } ] }, "XK": { "score": 0.0, "languages": [ { "name": "Serbian", "bcp_47": "sr", "population": 193276, "score": 0.0 }, { "name": "Albanian", "bcp_47": "sq", "population": 1778148, "score": 0.0 }, { "name": "Gheg Albanian", "bcp_47": "aln", "population": 1430250, "score": 0.0 } ] }, "KH": { "score": 0.0, "languages": [ { "name": "Khmer", "bcp_47": "km", "population": 15065030, "score": 0.0 }, { "name": "Kuy", "bcp_47": "kdt", "population": 18620, "score": 0.0 }, { "name": "Western Cham", "bcp_47": "cja", "population": 270832, "score": 0.0 } ] }, "AX": { "score": 0.0, "languages": [ { "name": "Swedish", "bcp_47": "sv", "population": 25938, "score": 0.0 } ] }, "AL": { "score": 0.0, "languages": [ { "name": "Greek", "bcp_47": "el", "population": 58417, "score": 0.0 }, { "name": "Albanian", "bcp_47": "sq", "population": 3074580, "score": 0.0 }, { "name": "Macedonian", "bcp_47": "mk", "population": 14451, "score": 0.0 } ] }, "GL": { "score": 0.0, "languages": [ { "name": "Danish", "bcp_47": "da", "population": 8066, "score": 0.0 }, { "name": "Kalaallisut", "bcp_47": "kl", "population": 48397, "score": 0.0 } ] }, "IS": { "score": 0.0, "languages": [ { "name": "Danish", "bcp_47": "da", "population": 2245, "score": 0.0 }, { "name": "Icelandic", "bcp_47": "is", "population": 350734, "score": 0.0 } ] }, "NO": { "score": 0.0, "languages": [ { "name": "Norwegian Bokmål", "bcp_47": "nb", "population": 5467440, "score": 0.0 }, { "name": "Norwegian", "bcp_47": "no", "population": 5467440, "score": 0.0 }, { "name": "Norwegian Nynorsk", "bcp_47": "nn", "population": 1366860, "score": 0.0 }, { "name": "Northern Sami", "bcp_47": "se", "population": 15856, "score": 0.0 } ] }, "LA": { "score": 0.0, "languages": [ { "name": "Lao", "bcp_47": "lo", "population": 5138706, "score": 0.0 }, { "name": "Hmong Njua", "bcp_47": "hnj", "population": 223422, "score": 0.0 }, { "name": "Khmu", "bcp_47": "kjg", "population": 431949, "score": 0.0 }, { "name": "Kuy", "bcp_47": "kdt", "population": 71495, "score": 0.0 } ] }, "FO": { "score": 0.0, "languages": [ { "name": "Faroese", "bcp_47": "fo", "population": 49047, "score": 0.0 } ] } } }