diff --git "a/frontend/public/results.json" "b/frontend/public/results.json" deleted file mode 100644--- "a/frontend/public/results.json" +++ /dev/null @@ -1,20200 +0,0 @@ -{ - "model_table": [ - { - "rank": 1, - "provider": "Google", - "model": "Gemini 2.0 Flash 001", - "hf_id": null, - "creation_date": null, - "size": null, - "type": "Commercial", - "license": null, - "average": 0.72, - "classification_accuracy": 0.87, - "language_modeling_chrf": 0.96, - "translation_bleu": 0.45, - "translation_chrf": 0.58 - }, - { - "rank": 2, - "provider": "Google", - "model": "Gemini 2.0 Flash Lite 001", - "hf_id": null, - "creation_date": null, - "size": null, - "type": "Commercial", - "license": null, - "average": 0.66, - "classification_accuracy": 0.73, - "language_modeling_chrf": 0.96, - "translation_bleu": 0.4, - "translation_chrf": 0.54 - }, - { - "rank": 3, - "provider": "Google", - "model": "Gemma 3 27b It", - "hf_id": "google/gemma-3-27b-it", - "creation_date": "2025-03-01", - "size": 27432406640.0, - "type": "Open", - "license": "Gemma", - "average": 0.64, - "classification_accuracy": 0.72, - "language_modeling_chrf": 0.94, - "translation_bleu": 0.37, - "translation_chrf": 0.54 - }, - { - "rank": 4, - "provider": "Meta Llama", - "model": "Llama 3.1 70b Instruct", - "hf_id": "meta-llama/Llama-3.1-70B-Instruct", - "creation_date": "2024-07-16", - "size": 70553706496.0, - "type": "Open", - "license": "Llama3.1", - "average": 0.63, - "classification_accuracy": 0.57, - "language_modeling_chrf": 0.95, - "translation_bleu": 0.43, - "translation_chrf": 0.57 - }, - { - "rank": 5, - "provider": "Meta Llama", - "model": "Llama 3 70b Instruct", - "hf_id": null, - "creation_date": null, - "size": null, - "type": "Commercial", - "license": null, - "average": 0.61, - "classification_accuracy": 0.8, - "language_modeling_chrf": 0.96, - "translation_bleu": 0.25, - "translation_chrf": 0.43 - }, - { - "rank": 6, - "provider": "Amazon", - "model": "Nova Micro V1", - "hf_id": null, - "creation_date": null, - "size": null, - "type": "Commercial", - "license": null, - "average": 0.6, - "classification_accuracy": 0.52, - "language_modeling_chrf": 0.94, - "translation_bleu": 0.4, - "translation_chrf": 0.56 - }, - { - "rank": 7, - "provider": "OpenAI", - "model": "GPT 4o Mini", - "hf_id": null, - "creation_date": null, - "size": null, - "type": "Commercial", - "license": null, - "average": 0.6, - "classification_accuracy": 0.52, - "language_modeling_chrf": 0.96, - "translation_bleu": 0.39, - "translation_chrf": 0.55 - }, - { - "rank": 8, - "provider": "MistralAI", - "model": "Mistral Small 24b Instruct 2501", - "hf_id": "mistralai/Mistral-Small-24B-Instruct-2501", - "creation_date": "2025-01-28", - "size": 23572403200.0, - "type": "Open", - "license": "Apache 2.0", - "average": 0.58, - "classification_accuracy": 0.55, - "language_modeling_chrf": 0.88, - "translation_bleu": 0.38, - "translation_chrf": 0.52 - }, - { - "rank": 9, - "provider": "Meta Llama", - "model": "Llama 3.3 70b Instruct", - "hf_id": "meta-llama/Llama-3.3-70B-Instruct", - "creation_date": "2024-11-26", - "size": 70553706496.0, - "type": "Open", - "license": "Llama3.3", - "average": 0.55, - "classification_accuracy": 0.51, - "language_modeling_chrf": 0.94, - "translation_bleu": 0.28, - "translation_chrf": 0.46 - }, - { - "rank": 10, - "provider": "MistralAI", - "model": "Mistral Nemo", - "hf_id": null, - "creation_date": null, - "size": null, - "type": "Commercial", - "license": null, - "average": 0.54, - "classification_accuracy": 0.5, - "language_modeling_chrf": 0.86, - "translation_bleu": 0.32, - "translation_chrf": 0.49 - }, - { - "rank": 11, - "provider": "Microsoft", - "model": "Phi 4 Multimodal Instruct", - "hf_id": "microsoft/Phi-4-multimodal-instruct", - "creation_date": "2025-02-24", - "size": 5574460384.0, - "type": "Open", - "license": "Mit", - "average": 0.52, - "classification_accuracy": 0.42, - "language_modeling_chrf": 0.88, - "translation_bleu": 0.32, - "translation_chrf": 0.46 - }, - { - "rank": 12, - "provider": "Qwen", - "model": "Qwq 32b", - "hf_id": "Qwen/QwQ-32B", - "creation_date": "2025-03-05", - "size": 32763876352.0, - "type": "Open", - "license": "Apache 2.0", - "average": 0.25, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.47, - "translation_bleu": 0.21, - "translation_chrf": 0.3 - } - ], - "language_table": [ - { - "bcp_47": "en", - "language_name": "English", - "autonym": "English", - "speakers": 1636485840, - "family": "Indo-European", - "average": 0.47, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.58, - "language_modeling_chrf": 0.92, - "translation_bleu": 0.37, - "translation_chrf": 0.49 - }, - { - "bcp_47": "zh", - "language_name": "Chinese", - "autonym": "中文", - "speakers": 1304678914, - "family": "Sino-Tibetan", - "average": 0.46, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.55, - "language_modeling_chrf": 0.86, - "translation_bleu": 0.35, - "translation_chrf": 0.53 - }, - { - "bcp_47": "hi", - "language_name": "Hindi", - "autonym": "हिन्दी", - "speakers": 546882144, - "family": "Indo-European", - "average": 0.46, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.53, - "language_modeling_chrf": 0.94, - "translation_bleu": 0.32, - "translation_chrf": 0.49 - }, - { - "bcp_47": "es", - "language_name": "Spanish", - "autonym": "Español", - "speakers": 493528077, - "family": "Indo-European", - "average": 0.45, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.53, - "language_modeling_chrf": 0.96, - "translation_bleu": 0.28, - "translation_chrf": 0.46 - }, - { - "bcp_47": "ar", - "language_name": "Arabic", - "autonym": "العربية", - "speakers": 351664197, - "family": "Afro-Asiatic", - "average": 0.42, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.43, - "language_modeling_chrf": 0.94, - "translation_bleu": 0.28, - "translation_chrf": 0.47 - }, - { - "bcp_47": "ur", - "language_name": "Urdu", - "autonym": "اردو", - "speakers": 290790290, - "family": "Indo-European", - "average": 0.42, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.5, - "language_modeling_chrf": 0.92, - "translation_bleu": 0.24, - "translation_chrf": 0.42 - }, - { - "bcp_47": "fr", - "language_name": "French", - "autonym": "Français", - "speakers": 278611507, - "family": "Indo-European", - "average": 0.46, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.53, - "language_modeling_chrf": 0.98, - "translation_bleu": 0.32, - "translation_chrf": 0.49 - }, - { - "bcp_47": "bn", - "language_name": "Bangla", - "autonym": "বাংলা", - "speakers": 267193288, - "family": "Indo-European", - "average": 0.38, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.4, - "language_modeling_chrf": 0.91, - "translation_bleu": 0.2, - "translation_chrf": 0.41 - }, - { - "bcp_47": "pt", - "language_name": "Portuguese", - "autonym": "Português", - "speakers": 237496885, - "family": "Indo-European", - "average": 0.45, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.5, - "language_modeling_chrf": 0.96, - "translation_bleu": 0.31, - "translation_chrf": 0.49 - }, - { - "bcp_47": "pa", - "language_name": "Punjabi", - "autonym": "ਪੰਜਾਬੀ", - "speakers": 203571210, - "family": "Indo-European", - "average": 0.43, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.4, - "language_modeling_chrf": 0.9, - "translation_bleu": 0.34, - "translation_chrf": 0.49 - }, - { - "bcp_47": "ru", - "language_name": "Russian", - "autonym": "Русский", - "speakers": 195841151, - "family": "Indo-European", - "average": 0.45, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.57, - "language_modeling_chrf": 0.97, - "translation_bleu": 0.26, - "translation_chrf": 0.45 - }, - { - "bcp_47": "sw", - "language_name": "Swahili", - "autonym": "Kiswahili", - "speakers": 171610296, - "family": "Atlantic-Congo", - "average": 0.45, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.57, - "language_modeling_chrf": 0.94, - "translation_bleu": 0.3, - "translation_chrf": 0.47 - }, - { - "bcp_47": "id", - "language_name": "Indonesian", - "autonym": "Bahasa Indonesia", - "speakers": 171207687, - "family": "Austronesian", - "average": 0.47, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.63, - "language_modeling_chrf": 0.96, - "translation_bleu": 0.29, - "translation_chrf": 0.47 - }, - { - "bcp_47": "de", - "language_name": "German", - "autonym": "Deutsch", - "speakers": 136350226, - "family": "Indo-European", - "average": 0.49, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.67, - "language_modeling_chrf": 0.96, - "translation_bleu": 0.32, - "translation_chrf": 0.5 - }, - { - "bcp_47": "ja", - "language_name": "Japanese", - "autonym": "日本語", - "speakers": 119729026, - "family": "Japonic", - "average": 0.46, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.63, - "language_modeling_chrf": 0.94, - "translation_bleu": 0.27, - "translation_chrf": 0.44 - }, - { - "bcp_47": "te", - "language_name": "Telugu", - "autonym": "తెలుగు", - "speakers": 95478480, - "family": "Dravidian", - "average": 0.41, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.37, - "language_modeling_chrf": 0.95, - "translation_bleu": 0.28, - "translation_chrf": 0.47 - }, - { - "bcp_47": "lah", - "language_name": "Western Panjabi", - "autonym": "لہندا پنجابی", - "speakers": 93433552, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "mr", - "language_name": "Marathi", - "autonym": "मराठी", - "speakers": 92826300, - "family": "Indo-European", - "average": 0.45, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.63, - "language_modeling_chrf": 0.94, - "translation_bleu": 0.25, - "translation_chrf": 0.42 - }, - { - "bcp_47": "jv", - "language_name": "Javanese", - "autonym": "Jawa", - "speakers": 91180665, - "family": "Austronesian", - "average": 0.41, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.47, - "language_modeling_chrf": 0.93, - "translation_bleu": 0.24, - "translation_chrf": 0.42 - }, - { - "bcp_47": "vi", - "language_name": "Vietnamese", - "autonym": "Tiếng Việt", - "speakers": 86222962, - "family": "Austroasiatic", - "average": 0.45, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.6, - "language_modeling_chrf": 0.96, - "translation_bleu": 0.26, - "translation_chrf": 0.44 - }, - { - "bcp_47": "ta", - "language_name": "Tamil", - "autonym": "தமிழ்", - "speakers": 85616159, - "family": "Dravidian", - "average": 0.41, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.43, - "language_modeling_chrf": 0.96, - "translation_bleu": 0.25, - "translation_chrf": 0.42 - }, - { - "bcp_47": "fa", - "language_name": "Persian", - "autonym": "فارسی", - "speakers": 84710459, - "family": "Indo-European", - "average": 0.41, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.4, - "language_modeling_chrf": 0.94, - "translation_bleu": 0.26, - "translation_chrf": 0.45 - }, - { - "bcp_47": "wuu", - "language_name": "Wu Chinese", - "autonym": "Wu Chinese", - "speakers": 83641200, - "family": "Sino-Tibetan", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "tr", - "language_name": "Turkish", - "autonym": "Türkçe", - "speakers": 80360704, - "family": "Turkic", - "average": 0.44, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.53, - "language_modeling_chrf": 0.94, - "translation_bleu": 0.28, - "translation_chrf": 0.45 - }, - { - "bcp_47": "yue", - "language_name": "Cantonese", - "autonym": "粵語", - "speakers": 79654759, - "family": "Sino-Tibetan", - "average": 0.39, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.43, - "language_modeling_chrf": 0.9, - "translation_bleu": 0.23, - "translation_chrf": 0.41 - }, - { - "bcp_47": "ko", - "language_name": "Korean", - "autonym": "한국어", - "speakers": 78357046, - "family": "Koreanic", - "average": 0.41, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.53, - "language_modeling_chrf": 0.94, - "translation_bleu": 0.2, - "translation_chrf": 0.4 - }, - { - "bcp_47": "it", - "language_name": "Italian", - "autonym": "Italiano", - "speakers": 70247060, - "family": "Indo-European", - "average": 0.47, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.67, - "language_modeling_chrf": 0.94, - "translation_bleu": 0.28, - "translation_chrf": 0.47 - }, - { - "bcp_47": "fil", - "language_name": "Filipino", - "autonym": "Filipino", - "speakers": 67471096, - "family": "Austronesian", - "average": 0.42, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.43, - "language_modeling_chrf": 0.94, - "translation_bleu": 0.29, - "translation_chrf": 0.45 - }, - { - "bcp_47": "arz", - "language_name": "Egyptian Arabic", - "autonym": "Egyptian Arabic", - "speakers": 66639360, - "family": "Afro-Asiatic", - "average": 0.38, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.4, - "language_modeling_chrf": 0.93, - "translation_bleu": 0.2, - "translation_chrf": 0.39 - }, - { - "bcp_47": "gu", - "language_name": "Gujarati", - "autonym": "ગુજરાતી", - "speakers": 61721799, - "family": "Indo-European", - "average": 0.42, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.43, - "language_modeling_chrf": 0.94, - "translation_bleu": 0.26, - "translation_chrf": 0.44 - }, - { - "bcp_47": "th", - "language_name": "Thai", - "autonym": "ไทย", - "speakers": 55181920, - "family": "Tai-Kadai", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "ps", - "language_name": "Pashto", - "autonym": "پښتو", - "speakers": 53542641, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "kn", - "language_name": "Kannada", - "autonym": "ಕನ್ನಡ", - "speakers": 49065330, - "family": "Dravidian", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "pcm", - "language_name": "Nigerian Pidgin", - "autonym": "Naijíriá Píjin", - "speakers": 44945880, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "ml", - "language_name": "Malayalam", - "autonym": "മലയാളം", - "speakers": 43257484, - "family": "Dravidian", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "or", - "language_name": "Odia", - "autonym": "ଓଡ଼ିଆ", - "speakers": 42434880, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "pl", - "language_name": "Polish", - "autonym": "Polski", - "speakers": 41077399, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "hsn", - "language_name": "Xiang Chinese", - "autonym": "Xiang Chinese", - "speakers": 40426580, - "family": "Sino-Tibetan", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "ha", - "language_name": "Hausa", - "autonym": "Hausa", - "speakers": 40411882, - "family": "Afro-Asiatic", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "sd", - "language_name": "Sindhi", - "autonym": "سنڌي", - "speakers": 40329510, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "apc", - "language_name": "North Levantine Arabic", - "autonym": "العامية", - "speakers": 39031474, - "family": "Afro-Asiatic", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "ms", - "language_name": "Malay", - "autonym": "Bahasa Malaysia", - "speakers": 38097307, - "family": "Austronesian", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "my", - "language_name": "Burmese", - "autonym": "မြန်မာ", - "speakers": 36559231, - "family": "Sino-Tibetan", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "am", - "language_name": "Amharic", - "autonym": "አማርኛ", - "speakers": 35728475, - "family": "Afro-Asiatic", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "arq", - "language_name": "Algerian Arabic", - "autonym": "Algerian Arabic", - "speakers": 35667507, - "family": "Afro-Asiatic", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "om", - "language_name": "Oromo", - "autonym": "Oromoo", - "speakers": 34897121, - "family": "Afro-Asiatic", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "bho", - "language_name": "Bhojpuri", - "autonym": "भोजपुरी", - "speakers": 32934797, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "uz", - "language_name": "Uzbek", - "autonym": "O‘Zbek", - "speakers": 32792780, - "family": "Turkic", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "az", - "language_name": "Azerbaijani", - "autonym": "Azərbaycan", - "speakers": 32446682, - "family": "Turkic", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "hak", - "language_name": "Hakka Chinese", - "autonym": "Hakka Chinese", - "speakers": 32062460, - "family": "Sino-Tibetan", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "su", - "language_name": "Sundanese", - "autonym": "Basa Sunda", - "speakers": 32043120, - "family": "Austronesian", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "nl", - "language_name": "Dutch", - "autonym": "Nederlands", - "speakers": 31765645, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "ary", - "language_name": "Moroccan Arabic", - "autonym": "Moroccan Arabic", - "speakers": 30938679, - "family": "Afro-Asiatic", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "uk", - "language_name": "Ukrainian", - "autonym": "Українська", - "speakers": 29348975, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "yo", - "language_name": "Yoruba", - "autonym": "Èdè Yorùbá", - "speakers": 28685568, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "skr", - "language_name": "Saraiki", - "autonym": "سرائیکی", - "speakers": 28020120, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "ig", - "language_name": "Igbo", - "autonym": "Igbo", - "speakers": 27823640, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "nan", - "language_name": "Min Nan Chinese", - "autonym": "Min Nan Chinese", - "speakers": 26486380, - "family": "Sino-Tibetan", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "ceb", - "language_name": "Cebuano", - "autonym": "Cebuano", - "speakers": 26203440, - "family": "Austronesian", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "awa", - "language_name": "Awadhi", - "autonym": "Awadhi", - "speakers": 25862924, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "mg", - "language_name": "Malagasy", - "autonym": "Malagasy", - "speakers": 24260130, - "family": "Austronesian", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "gan", - "language_name": "Gan Chinese", - "autonym": "Gan Chinese", - "speakers": 23698340, - "family": "Sino-Tibetan", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "ro", - "language_name": "Romanian", - "autonym": "Română", - "speakers": 22187408, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "bar", - "language_name": "Bavarian", - "autonym": "Bavarian", - "speakers": 22043627, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "ne", - "language_name": "Nepali", - "autonym": "नेपाली", - "speakers": 20903374, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "mai", - "language_name": "Maithili", - "autonym": "मैथिली", - "speakers": 19249149, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "as", - "language_name": "Assamese", - "autonym": "অসমীয়া", - "speakers": 17239170, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "ny", - "language_name": "Nyanja", - "autonym": "Nyanja", - "speakers": 17026781, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "so", - "language_name": "Somali", - "autonym": "Soomaali", - "speakers": 16911645, - "family": "Afro-Asiatic", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "mad", - "language_name": "Madurese", - "autonym": "Madurese", - "speakers": 16822638, - "family": "Austronesian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "tts", - "language_name": "Northeastern Thai", - "autonym": "Northeastern Thai", - "speakers": 16554576, - "family": "Tai-Kadai", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "rkt", - "language_name": "Rangpuri", - "autonym": "Rangpuri", - "speakers": 16274502, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "mag", - "language_name": "Magahi", - "autonym": "Magahi", - "speakers": 15913080, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "bgc", - "language_name": "Haryanvi", - "autonym": "हरियाणवी", - "speakers": 15913080, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "mwr", - "language_name": "Marwari", - "autonym": "Marwari", - "speakers": 15913080, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "sr", - "language_name": "Serbian", - "autonym": "Српски", - "speakers": 15602410, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "si", - "language_name": "Sinhala", - "autonym": "සිංහල", - "speakers": 15564656, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "km", - "language_name": "Khmer", - "autonym": "ខ្មែរ", - "speakers": 15065030, - "family": "Austroasiatic", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "hne", - "language_name": "Chhattisgarhi", - "autonym": "Chhattisgarhi", - "speakers": 14586990, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "fuv", - "language_name": "Nigerian Fulfulde", - "autonym": "Nigerian Fulfulde", - "speakers": 14339876, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "zu", - "language_name": "Zulu", - "autonym": "Isizulu", - "speakers": 13973830, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "kk", - "language_name": "Kazakh", - "autonym": "Қазақ Тілі", - "speakers": 13637392, - "family": "Turkic", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "dcc", - "language_name": "Deccan", - "autonym": "Deccan", - "speakers": 13128291, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "cs", - "language_name": "Czech", - "autonym": "Čeština", - "speakers": 13045532, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "sv", - "language_name": "Swedish", - "autonym": "Svenska", - "speakers": 12932871, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "hu", - "language_name": "Hungarian", - "autonym": "Magyar", - "speakers": 12443430, - "family": "Uralic", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "el", - "language_name": "Greek", - "autonym": "Ελληνικά", - "speakers": 12292242, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "sn", - "language_name": "Shona", - "autonym": "Chishona", - "speakers": 11782503, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "nds", - "language_name": "Low German", - "autonym": "Neddersass’Sch", - "speakers": 11520008, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "ak", - "language_name": "Akan", - "autonym": "Akan", - "speakers": 11442678, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "qu", - "language_name": "Quechua", - "autonym": "Runasimi", - "speakers": 11385851, - "family": "Quechuan", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "ckb", - "language_name": "Central Kurdish", - "autonym": "کوردیی ناوەندی", - "speakers": 11086549, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "rw", - "language_name": "Kinyarwanda", - "autonym": "Kinyarwanda", - "speakers": 11083625, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "wo", - "language_name": "Wolof", - "autonym": "Wolof", - "speakers": 11025494, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "aeb", - "language_name": "Tunisian Arabic", - "autonym": "Tunisian Arabic", - "speakers": 10549080, - "family": "Afro-Asiatic", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "ilo", - "language_name": "Iloko", - "autonym": "Ilokano", - "speakers": 10481376, - "family": "Austronesian", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "xh", - "language_name": "Xhosa", - "autonym": "Isixhosa", - "speakers": 10182944, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "ti", - "language_name": "Tigrinya", - "autonym": "ትግርኛ", - "speakers": 10145911, - "family": "Afro-Asiatic", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "be", - "language_name": "Belarusian", - "autonym": "Беларуская", - "speakers": 10064517, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "lua", - "language_name": "Luba-Lulua", - "autonym": "Luba-Lulua", - "speakers": 9770880, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "tg", - "language_name": "Tajik", - "autonym": "Тоҷикӣ", - "speakers": 9644223, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "umb", - "language_name": "Umbundu", - "autonym": "Umbundu", - "speakers": 9431467, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "bm", - "language_name": "Bambara", - "autonym": "Bamanakan", - "speakers": 9385632, - "family": "Mande", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "af", - "language_name": "Afrikaans", - "autonym": "Afrikaans", - "speakers": 9318845, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "hil", - "language_name": "Hiligaynon", - "autonym": "Ilonggo", - "speakers": 9171204, - "family": "Austronesian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "ki", - "language_name": "Kikuyu", - "autonym": "Gikuyu", - "speakers": 9099743, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "ht", - "language_name": "Haitian Creole", - "autonym": "Haitian Creole", - "speakers": 8964918, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "ca", - "language_name": "Catalan", - "autonym": "Català", - "speakers": 8679139, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "he", - "language_name": "Hebrew", - "autonym": "עברית", - "speakers": 8675480, - "family": "Afro-Asiatic", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "ii", - "language_name": "Sichuan Yi", - "autonym": "ꆈꌠꉙ", - "speakers": 8364120, - "family": "Sino-Tibetan", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "mos", - "language_name": "Mossi", - "autonym": "Mossi", - "speakers": 8334160, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "bal", - "language_name": "Baluchi", - "autonym": "بلۆچی", - "speakers": 8227887, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "syl", - "language_name": "Sylheti", - "autonym": "Sylheti", - "speakers": 8132550, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "kmb", - "language_name": "Kimbundu", - "autonym": "Kimbundu", - "speakers": 8130575, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "ug", - "language_name": "Uyghur", - "autonym": "ئۇيغۇرچە", - "speakers": 8052967, - "family": "Turkic", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "min", - "language_name": "Minangkabau", - "autonym": "Minangkabau", - "speakers": 8010780, - "family": "Austronesian", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "gsw", - "language_name": "Swiss German", - "autonym": "Schwiizertüütsch", - "speakers": 7956952, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "bg", - "language_name": "Bulgarian", - "autonym": "Български", - "speakers": 7878315, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "zgh", - "language_name": "Standard Moroccan Tamazight", - "autonym": "ⵜⴰⵎⴰⵣⵉⵖⵜ", - "speakers": 7823574, - "family": "Afro-Asiatic", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "ff", - "language_name": "Fula", - "autonym": "Pulaar", - "speakers": 7788904, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "bs", - "language_name": "Bosnian", - "autonym": "Bosanski", - "speakers": 7594468, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "rn", - "language_name": "Rundi", - "autonym": "Ikirundi", - "speakers": 7475454, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "bjj", - "language_name": "Kanauji", - "autonym": "Kanauji", - "speakers": 7426104, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "sat", - "language_name": "Santali", - "autonym": "ᱥᱟᱱᱛᱟᱲᱤ", - "speakers": 7293495, - "family": "Austroasiatic", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "da", - "language_name": "Danish", - "autonym": "Dansk", - "speakers": 7072056, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "tk", - "language_name": "Turkmen", - "autonym": "Türkmen Dili", - "speakers": 6870838, - "family": "Turkic", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "ku", - "language_name": "Kurdish", - "autonym": "Kurdî (Kurmancî)", - "speakers": 6866757, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "hr", - "language_name": "Croatian", - "autonym": "Hrvatski", - "speakers": 6813164, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "sq", - "language_name": "Albanian", - "autonym": "Shqip", - "speakers": 6791906, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "sk", - "language_name": "Slovak", - "autonym": "Slovenčina", - "speakers": 6680269, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "dyu", - "language_name": "Dyula", - "autonym": "Dyula", - "speakers": 6667328, - "family": "Mande", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "nod", - "language_name": "Northern Thai", - "autonym": "Northern Thai", - "speakers": 6621830, - "family": "Tai-Kadai", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "mn", - "language_name": "Mongolian", - "autonym": "Монгол", - "speakers": 6572846, - "family": "Mongolic-Khitan", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "st", - "language_name": "Southern Sotho", - "autonym": "Sesotho", - "speakers": 6390567, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "kri", - "language_name": "Krio", - "autonym": "Krio", - "speakers": 6293684, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "shi", - "language_name": "Tachelhit", - "autonym": "ⵜⴰⵛⵍⵃⵉⵜ", - "speakers": 6187736, - "family": "Afro-Asiatic", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "tn", - "language_name": "Tswana", - "autonym": "Tswana", - "speakers": 6113428, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "wtm", - "language_name": "Mewati", - "autonym": "Mewati", - "speakers": 6100014, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "luy", - "language_name": "Luyia", - "autonym": "Luluhia", - "speakers": 5888069, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "gn", - "language_name": "Guarani", - "autonym": "Avañe’Ẽ", - "speakers": 5827107, - "family": "Tupian", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "fi", - "language_name": "Finnish", - "autonym": "Suomi", - "speakers": 5736842, - "family": "Uralic", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "lg", - "language_name": "Ganda", - "autonym": "Luganda", - "speakers": 5622890, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "bew", - "language_name": "Betawi", - "autonym": "Betawi", - "speakers": 5607546, - "family": "Austronesian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "ks", - "language_name": "Kashmiri", - "autonym": "کٲشُر", - "speakers": 5598085, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "sou", - "language_name": "Southern Thai", - "autonym": "Southern Thai", - "speakers": 5518192, - "family": "Tai-Kadai", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "nb", - "language_name": "Norwegian Bokmål", - "autonym": "Norsk Bokmål", - "speakers": 5468932, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "no", - "language_name": "Norwegian", - "autonym": "Norsk", - "speakers": 5467440, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "bem", - "language_name": "Bemba", - "autonym": "Ichibemba", - "speakers": 5402246, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "hy", - "language_name": "Armenian", - "autonym": "Հայերեն", - "speakers": 5317273, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "nso", - "language_name": "Northern Sotho", - "autonym": "Northern Sotho", - "speakers": 5307578, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "luo", - "language_name": "Luo (Kenya and Tanzania)", - "autonym": "Dholuo", - "speakers": 5245734, - "family": "Nilotic", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "tpi", - "language_name": "Tok Pisin", - "autonym": "Tok Pisin", - "speakers": 5154217, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "lo", - "language_name": "Lao", - "autonym": "ລາວ", - "speakers": 5138706, - "family": "Tai-Kadai", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "suk", - "language_name": "Sukuma", - "autonym": "Sukuma", - "speakers": 5094094, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "kok", - "language_name": "Konkani", - "autonym": "कोंकणी", - "speakers": 4906533, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "ts", - "language_name": "Tsonga", - "autonym": "Tsonga", - "speakers": 4880932, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "vmf", - "language_name": "Main-Franconian", - "autonym": "Main-Franconian", - "speakers": 4809582, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "ban", - "language_name": "Balinese", - "autonym": "Balinese", - "speakers": 4806468, - "family": "Austronesian", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "ee", - "language_name": "Ewe", - "autonym": "Eʋegbe", - "speakers": 4690857, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "za", - "language_name": "Zhuang", - "autonym": "Vahcuengh", - "speakers": 4321462, - "family": "Tai-Kadai", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "bug", - "language_name": "Buginese", - "autonym": "Buginese", - "speakers": 4298211, - "family": "Austronesian", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "mzn", - "language_name": "Mazanderani", - "autonym": "مازرونی", - "speakers": 4246165, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "gom", - "language_name": "Goan Konkani", - "autonym": "Goan Konkani", - "speakers": 4243488, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "kam", - "language_name": "Kamba", - "autonym": "Kikamba", - "speakers": 4068120, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "kln", - "language_name": "Kalenjin", - "autonym": "Kalenjin", - "speakers": 4068120, - "family": "Nilotic", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "bjn", - "language_name": "Banjar", - "autonym": "Banjar", - "speakers": 4010288, - "family": "Austronesian", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "hno", - "language_name": "Northern Hindko", - "autonym": "Northern Hindko", - "speakers": 3969517, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "vmw", - "language_name": "Makhuwa", - "autonym": "Emakhuwa", - "speakers": 3912766, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "glk", - "language_name": "Gilaki", - "autonym": "Gilaki", - "speakers": 3906472, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "lmo", - "language_name": "Lombard", - "autonym": "Lombard", - "speakers": 3901518, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "dje", - "language_name": "Zarma", - "autonym": "Zarmaciine", - "speakers": 3871308, - "family": "Songhay", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "ndc", - "language_name": "Ndau", - "autonym": "Ndau", - "speakers": 3867046, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "sid", - "language_name": "Sidamo", - "autonym": "Sidamo", - "speakers": 3783955, - "family": "Afro-Asiatic", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "ace", - "language_name": "Achinese", - "autonym": "Achinese", - "speakers": 3738364, - "family": "Austronesian", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "swv", - "language_name": "Shekhawati", - "autonym": "Shekhawati", - "speakers": 3713052, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "rif", - "language_name": "Riffian", - "autonym": "Tarifit", - "speakers": 3692411, - "family": "Afro-Asiatic", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "shn", - "language_name": "Shan", - "autonym": "တႆး", - "speakers": 3687984, - "family": "Tai-Kadai", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "lmn", - "language_name": "Lambadi", - "autonym": "Lambadi", - "speakers": 3580443, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "gbm", - "language_name": "Garhwali", - "autonym": "Garhwali", - "speakers": 3580443, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "ka", - "language_name": "Georgian", - "autonym": "ქართული", - "speakers": 3543646, - "family": "Kartvelian", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "gl", - "language_name": "Galician", - "autonym": "Galego", - "speakers": 3515530, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "ln", - "language_name": "Lingala", - "autonym": "Lingála", - "speakers": 3514491, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "man", - "language_name": "Mandingo", - "autonym": "Mandingo", - "speakers": 3511762, - "family": "Mande", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "tzm", - "language_name": "Central Atlas Tamazight", - "autonym": "Tamaziɣt N Laṭlaṣ", - "speakers": 3485047, - "family": "Afro-Asiatic", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "mfa", - "language_name": "Pattani Malay", - "autonym": "Pattani Malay", - "speakers": 3448870, - "family": "Austronesian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "tiv", - "language_name": "Tiv", - "autonym": "Tiv", - "speakers": 3424448, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "kab", - "language_name": "Kabyle", - "autonym": "Taqbaylit", - "speakers": 3351886, - "family": "Afro-Asiatic", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "ky", - "language_name": "Kyrgyz", - "autonym": "Кыргызча", - "speakers": 3338267, - "family": "Turkic", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "bik", - "language_name": "Bikol", - "autonym": "Bikol", - "speakers": 3275430, - "family": "Austronesian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "fon", - "language_name": "Fon", - "autonym": "Fon", - "speakers": 3216150, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "gon", - "language_name": "Gondi", - "autonym": "Gondi", - "speakers": 3182616, - "family": "Dravidian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "war", - "language_name": "Waray", - "autonym": "Waray", - "speakers": 3166927, - "family": "Austronesian", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "sdh", - "language_name": "Southern Kurdish", - "autonym": "کوردی خوارگ", - "speakers": 3142162, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "brh", - "language_name": "Brahui", - "autonym": "Brahui", - "speakers": 3035513, - "family": "Dravidian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "bci", - "language_name": "Baoulé", - "autonym": "Baoulé", - "speakers": 3022921, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "bo", - "language_name": "Tibetan", - "autonym": "བོད་སྐད་", - "speakers": 3006697, - "family": "Sino-Tibetan", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "ibb", - "language_name": "Ibibio", - "autonym": "Ibibio", - "speakers": 2996392, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "efi", - "language_name": "Efik", - "autonym": "Efik", - "speakers": 2996392, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "sg", - "language_name": "Sango", - "autonym": "Sängö", - "speakers": 2935521, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "kfy", - "language_name": "Kumaoni", - "autonym": "Kumaoni", - "speakers": 2917398, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "ay", - "language_name": "Aymara", - "autonym": "Aymara", - "speakers": 2838620, - "family": "Aymaran", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "nyn", - "language_name": "Nyankole", - "autonym": "Runyankore", - "speakers": 2724939, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "jam", - "language_name": "Jamaican Creole English", - "autonym": "Jamaican Creole English", - "speakers": 2668142, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "doi", - "language_name": "Dogri", - "autonym": "डोगरी", - "speakers": 2652180, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "guz", - "language_name": "Gusii", - "autonym": "Ekegusii", - "speakers": 2622867, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "sas", - "language_name": "Sasak", - "autonym": "Sasak", - "speakers": 2590152, - "family": "Austronesian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "kru", - "language_name": "Kurukh", - "autonym": "Kurukh", - "speakers": 2519571, - "family": "Dravidian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "pam", - "language_name": "Pampanga", - "autonym": "Pampanga", - "speakers": 2511163, - "family": "Austronesian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "fbl", - "language_name": "West Albay Bikol", - "autonym": "West Albay Bikol", - "speakers": 2511163, - "family": "Austronesian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "lt", - "language_name": "Lithuanian", - "autonym": "Lietuvių", - "speakers": 2488617, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "bej", - "language_name": "Beja", - "autonym": "Beja", - "speakers": 2460326, - "family": "Afro-Asiatic", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "bbc", - "language_name": "Batak Toba", - "autonym": "Batak Toba", - "speakers": 2456639, - "family": "Austronesian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "sck", - "language_name": "Sadri", - "autonym": "Sadri", - "speakers": 2386962, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "wbq", - "language_name": "Waddar", - "autonym": "Waddar", - "speakers": 2386962, - "family": "Dravidian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "lu", - "language_name": "Luba-Katanga", - "autonym": "Tshiluba", - "speakers": 2340940, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "cgg", - "language_name": "Chiga", - "autonym": "Rukiga", - "speakers": 2335662, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "xog", - "language_name": "Soga", - "autonym": "Olusoga", - "speakers": 2292409, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "ss", - "language_name": "Swati", - "autonym": "Siswati", - "speakers": 2212379, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "haz", - "language_name": "Hazaragi", - "autonym": "Hazaragi", - "speakers": 2161984, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "mer", - "language_name": "Meru", - "autonym": "Kĩmĩrũ", - "speakers": 2141116, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "xnr", - "language_name": "Kangri", - "autonym": "कांगड़ी", - "speakers": 2121744, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "aa", - "language_name": "Afar", - "autonym": "Afar", - "speakers": 2119663, - "family": "Afro-Asiatic", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "teo", - "language_name": "Teso", - "autonym": "Kiteso", - "speakers": 2082973, - "family": "Nilotic", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "ngl", - "language_name": "Lomwe", - "autonym": "Lomwe", - "speakers": 2046678, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "oc", - "language_name": "Occitan", - "autonym": "Occitan", - "speakers": 2040398, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "bgn", - "language_name": "Western Balochi", - "autonym": "بلوچی (رخشانی)", - "speakers": 2037382, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "lrc", - "language_name": "Northern Luri", - "autonym": "لۊری شومالی", - "speakers": 2020512, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "wbr", - "language_name": "Wagdi", - "autonym": "Wagdi", - "speakers": 1989135, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "tcy", - "language_name": "Tulu", - "autonym": "Tulu", - "speakers": 1989135, - "family": "Dravidian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "khn", - "language_name": "Khandesi", - "autonym": "Khandesi", - "speakers": 1989135, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "tt", - "language_name": "Tatar", - "autonym": "Татар", - "speakers": 1984108, - "family": "Turkic", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "sl", - "language_name": "Slovenian", - "autonym": "Slovenščina", - "speakers": 1973181, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "mak", - "language_name": "Makasar", - "autonym": "Makasar", - "speakers": 1949290, - "family": "Austronesian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "wal", - "language_name": "Wolaytta", - "autonym": "Wolaytta", - "speakers": 1946034, - "family": "Ta-Ne-Omotic", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "nym", - "language_name": "Nyamwezi", - "autonym": "Nyamwezi", - "speakers": 1932242, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "brx", - "language_name": "Bodo", - "autonym": "बर’", - "speakers": 1856526, - "family": "Sino-Tibetan", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "ljp", - "language_name": "Lampung Api", - "autonym": "Lampung Api", - "speakers": 1842479, - "family": "Austronesian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "cv", - "language_name": "Chuvash", - "autonym": "Чӑваш", - "speakers": 1842386, - "family": "Turkic", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "ba", - "language_name": "Bashkir", - "autonym": "Башҡорт Теле", - "speakers": 1842386, - "family": "Turkic", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "rhg", - "language_name": "Rohingya", - "autonym": "𐴌𐴗𐴥𐴝𐴙𐴚𐴒𐴙𐴝", - "speakers": 1824082, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "men", - "language_name": "Mende", - "autonym": "Mende", - "speakers": 1813083, - "family": "Mande", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "tum", - "language_name": "Tumbuka", - "autonym": "Tumbuka", - "speakers": 1780514, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "tmh", - "language_name": "Tamashek", - "autonym": "Tamashek", - "speakers": 1776965, - "family": "Afro-Asiatic", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "nd", - "language_name": "North Ndebele", - "autonym": "Isindebele", - "speakers": 1745556, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "mas", - "language_name": "Masai", - "autonym": "Maa", - "speakers": 1734738, - "family": "Nilotic", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "srr", - "language_name": "Serer", - "autonym": "Serer", - "speakers": 1731004, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "noe", - "language_name": "Nimadi", - "autonym": "Nimadi", - "speakers": 1723917, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "tem", - "language_name": "Timne", - "autonym": "Timne", - "speakers": 1722482, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "sco", - "language_name": "Scots", - "autonym": "Scots", - "speakers": 1644028, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "laj", - "language_name": "Lango (Uganda)", - "autonym": "Lango (Uganda)", - "speakers": 1643614, - "family": "Nilotic", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "rmt", - "language_name": "Domari", - "autonym": "Domari", - "speakers": 1613543, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "mk", - "language_name": "Macedonian", - "autonym": "Македонски", - "speakers": 1608565, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "ach", - "language_name": "Acoli", - "autonym": "Acoli", - "speakers": 1600361, - "family": "Nilotic", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "fuq", - "language_name": "Central-Eastern Niger Fulfulde", - "autonym": "Central-Eastern Niger Fulfulde", - "speakers": 1594068, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "bhb", - "language_name": "Bhili", - "autonym": "Bhili", - "speakers": 1591308, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "pag", - "language_name": "Pangasinan", - "autonym": "Pangasinan", - "speakers": 1528534, - "family": "Austronesian", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "kg", - "language_name": "Kongo", - "autonym": "Kongo", - "speakers": 1526700, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "bin", - "language_name": "Bini", - "autonym": "Bini", - "speakers": 1519599, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "ffm", - "language_name": "Maasina Fulfulde", - "autonym": "Maasina Fulfulde", - "speakers": 1505612, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "mni", - "language_name": "Manipuri", - "autonym": "মৈতৈলোন্", - "speakers": 1476591, - "family": "Sino-Tibetan", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "abr", - "language_name": "Abron", - "autonym": "Abron", - "speakers": 1467010, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "kde", - "language_name": "Makonde", - "autonym": "Chimakonde", - "speakers": 1463820, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "aln", - "language_name": "Gheg Albanian", - "autonym": "Gheg Albanian", - "speakers": 1430250, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "ve", - "language_name": "Venda", - "autonym": "Tshivenḓa", - "speakers": 1391759, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "seh", - "language_name": "Sena", - "autonym": "Sena", - "speakers": 1384517, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "vec", - "language_name": "Venetian", - "autonym": "Veneto", - "speakers": 1380829, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "sus", - "language_name": "Susu", - "autonym": "Susu", - "speakers": 1378014, - "family": "Mande", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "nn", - "language_name": "Norwegian Nynorsk", - "autonym": "Norsk Nynorsk", - "speakers": 1366860, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "mgh", - "language_name": "Makhuwa-Meetto", - "autonym": "Makua", - "speakers": 1354419, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "raj", - "language_name": "Rajasthani", - "autonym": "राजस्थानी", - "speakers": 1326090, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "hoc", - "language_name": "Ho", - "autonym": "Ho", - "speakers": 1312829, - "family": "Austroasiatic", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "mdh", - "language_name": "Maguindanaon", - "autonym": "Maguindanaon", - "speakers": 1310172, - "family": "Austronesian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "mtr", - "language_name": "Mewari", - "autonym": "Mewari", - "speakers": 1286307, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "bum", - "language_name": "Bulu", - "autonym": "Bulu", - "speakers": 1276270, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "myx", - "language_name": "Masaaba", - "autonym": "Masaaba", - "speakers": 1254337, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "unr", - "language_name": "Mundari", - "autonym": "Mundari", - "speakers": 1252287, - "family": "Austroasiatic", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "mfe", - "language_name": "Morisyen", - "autonym": "Kreol Morisien", - "speakers": 1241433, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "ga", - "language_name": "Irish", - "autonym": "Gaeilge", - "speakers": 1237487, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "fvr", - "language_name": "Fur", - "autonym": "Fur", - "speakers": 1230163, - "family": "Furan", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "rej", - "language_name": "Rejang", - "autonym": "Rejang", - "speakers": 1228320, - "family": "Austronesian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "bhi", - "language_name": "Bhilali", - "autonym": "Bhilali", - "speakers": 1220003, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "tsg", - "language_name": "Tausug", - "autonym": "Tausug", - "speakers": 1200991, - "family": "Austronesian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "quc", - "language_name": "Kʼicheʼ", - "autonym": "KʼIcheʼ", - "speakers": 1200731, - "family": "Mayan", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "bqi", - "language_name": "Bakhtiari", - "autonym": "Bakhtiari", - "speakers": 1188926, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "kpe", - "language_name": "Kpelle", - "autonym": "Kpɛlɛɛ", - "speakers": 1186303, - "family": "Mande", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "sef", - "language_name": "Cebaara Senoufo", - "autonym": "Cebaara Senoufo", - "speakers": 1181687, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "kxm", - "language_name": "Northern Khmer", - "autonym": "Northern Khmer", - "speakers": 1172616, - "family": "Austroasiatic", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "vls", - "language_name": "West Flemish", - "autonym": "West Flemish", - "speakers": 1172070, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "snk", - "language_name": "Soninke", - "autonym": "Soninke", - "speakers": 1153651, - "family": "Mande", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "zza", - "language_name": "Zaza", - "autonym": "Zaza", - "speakers": 1148245, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "lv", - "language_name": "Latvian", - "autonym": "Latviešu", - "speakers": 1147550, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "dnj", - "language_name": "Dan", - "autonym": "Dan", - "speakers": 1099244, - "family": "Mande", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "gor", - "language_name": "Gorontalo", - "autonym": "Gorontalo", - "speakers": 1094807, - "family": "Austronesian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "tig", - "language_name": "Tigre", - "autonym": "Tigre", - "speakers": 1094616, - "family": "Afro-Asiatic", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "eu", - "language_name": "Basque", - "autonym": "Euskara", - "speakers": 1088519, - "family": null, - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "hoj", - "language_name": "Hadothi", - "autonym": "Hadothi", - "speakers": 1087394, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "kbd", - "language_name": "Kabardian", - "autonym": "Kabardian", - "speakers": 1070873, - "family": "Abkhaz-Adyge", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "kha", - "language_name": "Khasi", - "autonym": "Khasi", - "speakers": 1060872, - "family": "Austroasiatic", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "sc", - "language_name": "Sardinian", - "autonym": "Sardu", - "speakers": 1060846, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "loz", - "language_name": "Lozi", - "autonym": "Lozi", - "speakers": 1045596, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "gur", - "language_name": "Frafra", - "autonym": "Frafra", - "speakers": 1026907, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "ars", - "language_name": "Najdi Arabic", - "autonym": "Najdi Arabic", - "speakers": 1025205, - "family": "Afro-Asiatic", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "rng", - "language_name": "Ronga", - "autonym": "Ronga", - "speakers": 1023339, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "luz", - "language_name": "Southern Luri", - "autonym": "Southern Luri", - "speakers": 1019080, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "new", - "language_name": "Newari", - "autonym": "Newari", - "speakers": 1000821, - "family": "Sino-Tibetan", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "tly", - "language_name": "Talysh", - "autonym": "Talysh", - "speakers": 1000168, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "yi", - "language_name": "Yiddish", - "autonym": "ייִדיש", - "speakers": 997214, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "bez", - "language_name": "Bena", - "autonym": "Hibena", - "speakers": 995398, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "ksb", - "language_name": "Shambala", - "autonym": "Kishambaa", - "speakers": 995398, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "kfr", - "language_name": "Kachhi", - "autonym": "Kachhi", - "speakers": 994568, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "nij", - "language_name": "Ngaju", - "autonym": "Ngaju", - "speakers": 987996, - "family": "Austronesian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "mwk", - "language_name": "Kita Maninkakan", - "autonym": "Kita Maninkakan", - "speakers": 977670, - "family": "Mande", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "jml", - "language_name": "Jumli", - "autonym": "Jumli", - "speakers": 970493, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "ryu", - "language_name": "Central Okinawan", - "autonym": "Central Okinawan", - "speakers": 966404, - "family": "Japonic", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "mnw", - "language_name": "Mon", - "autonym": "Mon", - "speakers": 966114, - "family": "Austroasiatic", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "qug", - "language_name": "Chimborazo Highland Quichua", - "autonym": "Chimborazo Highland Quichua", - "speakers": 963579, - "family": "Quechuan", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "kac", - "language_name": "Kachin", - "autonym": "Kachin", - "speakers": 962032, - "family": "Sino-Tibetan", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "hnd", - "language_name": "Southern Hindko", - "autonym": "Southern Hindko", - "speakers": 957354, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "li", - "language_name": "Limburgish", - "autonym": "Limburgish", - "speakers": 950422, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "mxc", - "language_name": "Manyika", - "autonym": "Manyika", - "speakers": 945510, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "ce", - "language_name": "Chechen", - "autonym": "Нохчийн", - "speakers": 935365, - "family": "Nakh-Daghestanian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "kj", - "language_name": "Kuanyama", - "autonym": "Kuanyama", - "speakers": 920524, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "nr", - "language_name": "South Ndebele", - "autonym": "South Ndebele", - "speakers": 903418, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "cy", - "language_name": "Welsh", - "autonym": "Cymraeg", - "speakers": 884910, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "ada", - "language_name": "Adangme", - "autonym": "Adangme", - "speakers": 880206, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "et", - "language_name": "Estonian", - "autonym": "Eesti", - "speakers": 878449, - "family": "Uralic", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "prd", - "language_name": "Parsi-Dari", - "autonym": "Parsi-Dari", - "speakers": 864342, - "family": "Bookkeeping", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "yua", - "language_name": "Yucateco", - "autonym": "Yucateco", - "speakers": 861955, - "family": "Mayan", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "ewo", - "language_name": "Ewondo", - "autonym": "Ewondo", - "speakers": 860095, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "kge", - "language_name": "Komering", - "autonym": "Komering", - "speakers": 854483, - "family": "Austronesian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "ttj", - "language_name": "Tooro", - "autonym": "Tooro", - "speakers": 821807, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "grt", - "language_name": "Garo", - "autonym": "Garo", - "speakers": 821563, - "family": "Sino-Tibetan", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "gaa", - "language_name": "Ga", - "autonym": "Gã", - "speakers": 821526, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "mgy", - "language_name": "Mbunga", - "autonym": "Mbunga", - "speakers": 819739, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "tet", - "language_name": "Tetum", - "autonym": "Tetum", - "speakers": 816395, - "family": "Austronesian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "iba", - "language_name": "Iban", - "autonym": "Iban", - "speakers": 816302, - "family": "Bookkeeping", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "ebu", - "language_name": "Embu", - "autonym": "Kĩembu", - "speakers": 802918, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "swg", - "language_name": "Swabian", - "autonym": "Swabian", - "speakers": 801597, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "hnj", - "language_name": "Hmong Njua", - "autonym": "𞄀𞄄𞄰𞄩𞄍𞄜𞄰", - "speakers": 781687, - "family": "Hmong-Mien", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "kck", - "language_name": "Kalanga", - "autonym": "Kalanga", - "speakers": 770954, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "dty", - "language_name": "Dotyali", - "autonym": "Dotyali", - "speakers": 758198, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "pcd", - "language_name": "Picard", - "autonym": "Picard", - "speakers": 746330, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "fy", - "language_name": "Western Frisian", - "autonym": "Frysk", - "speakers": 743057, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "ccp", - "language_name": "Chakma", - "autonym": "𑄌𑄋𑄴𑄟𑄳𑄦", - "speakers": 729137, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "yao", - "language_name": "Yao", - "autonym": "Yao", - "speakers": 722357, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "aoz", - "language_name": "Uab Meto", - "autonym": "Uab Meto", - "speakers": 720970, - "family": "Austronesian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "cps", - "language_name": "Capiznon", - "autonym": "Capiznon", - "speakers": 720595, - "family": "Austronesian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "asa", - "language_name": "Asu", - "autonym": "Kipare", - "speakers": 702634, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "blt", - "language_name": "Tai Dam", - "autonym": "ꪼꪕꪒꪾ", - "speakers": 681177, - "family": "Tai-Kadai", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "wa", - "language_name": "Walloon", - "autonym": "Walon", - "speakers": 679801, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "ses", - "language_name": "Koyraboro Senni", - "autonym": "Koyraboro Senni", - "speakers": 664816, - "family": "Songhay", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "bfy", - "language_name": "Bagheli", - "autonym": "Bagheli", - "speakers": 654424, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "ast", - "language_name": "Asturian", - "autonym": "Asturianu", - "speakers": 650205, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "lki", - "language_name": "Laki", - "autonym": "Laki", - "speakers": 645417, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "unx", - "language_name": "Munda", - "autonym": "Munda", - "speakers": 636523, - "family": "Bookkeeping", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "lis", - "language_name": "Lisu", - "autonym": "Lisu", - "speakers": 627309, - "family": "Sino-Tibetan", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "nqo", - "language_name": "N’Ko", - "autonym": "ߒߞߏ", - "speakers": 626370, - "family": "Artificial Language", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "gos", - "language_name": "Gronings", - "autonym": "Gronings", - "speakers": 622094, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "lol", - "language_name": "Mongo", - "autonym": "Mongo", - "speakers": 620858, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "thl", - "language_name": "Dangaura Tharu", - "autonym": "Dangaura Tharu", - "speakers": 606558, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "nap", - "language_name": "Neapolitan", - "autonym": "Neapolitan", - "speakers": 605306, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "nus", - "language_name": "Nuer", - "autonym": "Thok Nath", - "speakers": 591427, - "family": "Nilotic", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "br", - "language_name": "Breton", - "autonym": "Brezhoneg", - "speakers": 563140, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "pis", - "language_name": "Pijin", - "autonym": "Pijin", - "speakers": 561780, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "rcf", - "language_name": "Réunion Creole French", - "autonym": "Réunion Creole French", - "speakers": 559185, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "av", - "language_name": "Avaric", - "autonym": "Avaric", - "speakers": 552716, - "family": "Nakh-Daghestanian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "ng", - "language_name": "Ndonga", - "autonym": "Ndonga", - "speakers": 552315, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "os", - "language_name": "Ossetic", - "autonym": "Ирон", - "speakers": 541444, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "udm", - "language_name": "Udmurt", - "autonym": "Udmurt", - "speakers": 538544, - "family": "Uralic", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "lij", - "language_name": "Ligurian", - "autonym": "Ligure", - "speakers": 536663, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "kea", - "language_name": "Kabuverdianu", - "autonym": "Kabuverdianu", - "speakers": 530762, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "rue", - "language_name": "Rusyn", - "autonym": "Rusyn", - "speakers": 527075, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "chm", - "language_name": "Mari", - "autonym": "Mari", - "speakers": 524371, - "family": "Uralic", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "scn", - "language_name": "Sicilian", - "autonym": "Sicilianu", - "speakers": 511702, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "lag", - "language_name": "Langi", - "autonym": "Kɨlaangi", - "speakers": 509409, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "bft", - "language_name": "Balti", - "autonym": "Balti", - "speakers": 502520, - "family": "Sino-Tibetan", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "nhe", - "language_name": "Eastern Huasteca Nahuatl", - "autonym": "Eastern Huasteca Nahuatl", - "speakers": 501735, - "family": "Uto-Aztecan", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "nhw", - "language_name": "Western Huasteca Nahuatl", - "autonym": "Western Huasteca Nahuatl", - "speakers": 501735, - "family": "Uto-Aztecan", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "szl", - "language_name": "Silesian", - "autonym": "Ślōnski", - "speakers": 497670, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "kaa", - "language_name": "Kara-Kalpak", - "autonym": "Kara-Kalpak", - "speakers": 489046, - "family": "Turkic", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "gju", - "language_name": "Gujari", - "autonym": "Gujari", - "speakers": 467002, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "srx", - "language_name": "Sirmauri", - "autonym": "Sirmauri", - "speakers": 464132, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "mt", - "language_name": "Maltese", - "autonym": "Malti", - "speakers": 457267, - "family": "Afro-Asiatic", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "bap", - "language_name": "Bantawa", - "autonym": "Bantawa", - "speakers": 454918, - "family": "Sino-Tibetan", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "sah", - "language_name": "Yakut", - "autonym": "Саха Тыла", - "speakers": 453510, - "family": "Turkic", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "mls", - "language_name": "Masalit", - "autonym": "Masalit", - "speakers": 451060, - "family": "Maban", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "kaj", - "language_name": "Jju", - "autonym": "Kaje", - "speakers": 449459, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "ady", - "language_name": "Adyghe", - "autonym": "Adyghe", - "speakers": 444583, - "family": "Abkhaz-Adyge", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "ybb", - "language_name": "Yemba", - "autonym": "Yemba", - "speakers": 443920, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "xmf", - "language_name": "Mingrelian", - "autonym": "Mingrelian", - "speakers": 439670, - "family": "Kartvelian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "myv", - "language_name": "Erzya", - "autonym": "Эрзянь Кель", - "speakers": 439338, - "family": "Uralic", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "dav", - "language_name": "Taita", - "autonym": "Kitaita", - "speakers": 438929, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "maz", - "language_name": "Central Mazahua", - "autonym": "Central Mazahua", - "speakers": 437410, - "family": "Otomanguean", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "vun", - "language_name": "Vunjo", - "autonym": "Kyivunjo", - "speakers": 433291, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "rof", - "language_name": "Rombo", - "autonym": "Kihorombo", - "speakers": 433291, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "jmc", - "language_name": "Machame", - "autonym": "Kimachame", - "speakers": 433291, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "kjg", - "language_name": "Khmu", - "autonym": "Khmu", - "speakers": 431949, - "family": "Austroasiatic", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "fan", - "language_name": "Fang", - "autonym": "Fang", - "speakers": 426451, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "krj", - "language_name": "Kinaray-a", - "autonym": "Kinaray-A", - "speakers": 425806, - "family": "Austronesian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "kdt", - "language_name": "Kuy", - "autonym": "Kuy", - "speakers": 421207, - "family": "Austroasiatic", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "lb", - "language_name": "Luxembourgish", - "autonym": "Lëtzebuergesch", - "speakers": 421015, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "srn", - "language_name": "Sranan Tongo", - "autonym": "Sranan Tongo", - "speakers": 414507, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "dyo", - "language_name": "Jola-Fonyi", - "autonym": "Joola", - "speakers": 409146, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "tdg", - "language_name": "Western Tamang", - "autonym": "Western Tamang", - "speakers": 394263, - "family": "Sino-Tibetan", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "pnt", - "language_name": "Pontic", - "autonym": "Pontic", - "speakers": 392463, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "zmi", - "language_name": "Negeri Sembilan Malay", - "autonym": "Negeri Sembilan Malay", - "speakers": 391825, - "family": "Austronesian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "nnh", - "language_name": "Ngiemboon", - "autonym": "Shwóŋò Ngiembɔɔn", - "speakers": 388430, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "bbj", - "language_name": "Ghomala", - "autonym": "Ghomala", - "speakers": 388430, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "dv", - "language_name": "Divehi", - "autonym": "Divehi", - "speakers": 388044, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "saz", - "language_name": "Saurashtra", - "autonym": "Saurashtra", - "speakers": 384566, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "hif", - "language_name": "Fiji Hindi", - "autonym": "Fiji Hindi", - "speakers": 383749, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "fia", - "language_name": "Nobiin", - "autonym": "Nobiin", - "speakers": 378161, - "family": "Nubian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "bgx", - "language_name": "Balkan Gagauz Turkish", - "autonym": "Balkan Gagauz Turkish", - "speakers": 377280, - "family": "Turkic", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "kvr", - "language_name": "Kerinci", - "autonym": "Kerinci", - "speakers": 373836, - "family": "Austronesian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "kvx", - "language_name": "Parkari Koli", - "autonym": "Parkari Koli", - "speakers": 373602, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "dz", - "language_name": "Dzongkha", - "autonym": "རྫོང་ཁ", - "speakers": 370341, - "family": "Bookkeeping", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "pko", - "language_name": "Pökoot", - "autonym": "Pökoot", - "speakers": 369343, - "family": "Nilotic", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "dar", - "language_name": "Dargwa", - "autonym": "Dargwa", - "speakers": 368477, - "family": "Nakh-Daghestanian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "lif", - "language_name": "Limbu", - "autonym": "Limbu", - "speakers": 368085, - "family": "Sino-Tibetan", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "fj", - "language_name": "Fijian", - "autonym": "Fijian", - "speakers": 365030, - "family": "Austronesian", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "thr", - "language_name": "Rana Tharu", - "autonym": "Rana Tharu", - "speakers": 363935, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "bkm", - "language_name": "Kom", - "autonym": "Kom", - "speakers": 360685, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "is", - "language_name": "Icelandic", - "autonym": "Íslenska", - "speakers": 350734, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "khw", - "language_name": "Khowar", - "autonym": "Khowar", - "speakers": 350252, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "lbw", - "language_name": "Tolaki", - "autonym": "Tolaki", - "speakers": 347134, - "family": "Austronesian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "nxq", - "language_name": "Naxi", - "autonym": "Naxi", - "speakers": 334565, - "family": "Sino-Tibetan", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "mgp", - "language_name": "Eastern Magar", - "autonym": "Eastern Magar", - "speakers": 333607, - "family": "Sino-Tibetan", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "bax", - "language_name": "Bamun", - "autonym": "Bamun", - "speakers": 332940, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "bas", - "language_name": "Basaa", - "autonym": "Ɓàsàa", - "speakers": 332940, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "khq", - "language_name": "Koyra Chiini", - "autonym": "Koyra Ciini", - "speakers": 332408, - "family": "Songhay", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "mvy", - "language_name": "Indus Kohistani", - "autonym": "Indus Kohistani", - "speakers": 326901, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "gay", - "language_name": "Gayo", - "autonym": "Gayo", - "speakers": 320431, - "family": "Austronesian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "zdj", - "language_name": "Ngazidja Comorian", - "autonym": "Ngazidja Comorian", - "speakers": 313124, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "bua", - "language_name": "Buriat", - "autonym": "Buriat", - "speakers": 311788, - "family": "Mongolic-Khitan", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "bto", - "language_name": "Rinconada Bikol", - "autonym": "Rinconada Bikol", - "speakers": 305707, - "family": "Austronesian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "byv", - "language_name": "Medumba", - "autonym": "Medumba", - "speakers": 305195, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "njo", - "language_name": "Ao Naga", - "autonym": "Ao Naga", - "speakers": 305001, - "family": "Sino-Tibetan", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "bfq", - "language_name": "Badaga", - "autonym": "Badaga", - "speakers": 305001, - "family": "Dravidian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "thq", - "language_name": "Kochila Tharu", - "autonym": "Kochila Tharu", - "speakers": 303279, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "mdf", - "language_name": "Moksha", - "autonym": "Мокшень Кяль", - "speakers": 297616, - "family": "Uralic", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "rob", - "language_name": "Tae'", - "autonym": "Tae'", - "speakers": 293729, - "family": "Austronesian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "nzi", - "language_name": "Nzima", - "autonym": "Nzima", - "speakers": 293402, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "naq", - "language_name": "Nama", - "autonym": "Khoekhoegowab", - "speakers": 289308, - "family": "Khoe-Kwadi", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "wni", - "language_name": "Ndzwani Comorian", - "autonym": "Ndzwani Comorian", - "speakers": 287736, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "kum", - "language_name": "Kumyk", - "autonym": "Kumyk", - "speakers": 283444, - "family": "Turkic", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "mua", - "language_name": "Mundang", - "autonym": "Mundaŋ", - "speakers": 277450, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "arn", - "language_name": "Mapuche", - "autonym": "Mapudungun", - "speakers": 272802, - "family": "Araucanian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "cja", - "language_name": "Western Cham", - "autonym": "Western Cham", - "speakers": 270832, - "family": "Austronesian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "bi", - "language_name": "Bislama", - "autonym": "Bislama", - "speakers": 268500, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "khb", - "language_name": "Lü", - "autonym": "Lü", - "speakers": 264864, - "family": "Tai-Kadai", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "tdd", - "language_name": "Tai Nüa", - "autonym": "Tai Nüa", - "speakers": 264864, - "family": "Tai-Kadai", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "kxp", - "language_name": "Wadiyara Koli", - "autonym": "Wadiyara Koli", - "speakers": 256851, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "gjk", - "language_name": "Kachi Koli", - "autonym": "Kachi Koli", - "speakers": 256851, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "lez", - "language_name": "Lezghian", - "autonym": "Lezghian", - "speakers": 255100, - "family": "Nakh-Daghestanian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "kv", - "language_name": "Komi", - "autonym": "Komi", - "speakers": 255100, - "family": "Uralic", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "sm", - "language_name": "Samoan", - "autonym": "Samoan", - "speakers": 252717, - "family": "Austronesian", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "mrd", - "language_name": "Western Magar", - "autonym": "Western Magar", - "speakers": 251722, - "family": "Sino-Tibetan", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "saq", - "language_name": "Samburu", - "autonym": "Kisampur", - "speakers": 246228, - "family": "Nilotic", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "crh", - "language_name": "Crimean Tatar", - "autonym": "Crimean Tatar", - "speakers": 245968, - "family": "Turkic", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "mdr", - "language_name": "Mandar", - "autonym": "Mandar", - "speakers": 245664, - "family": "Austronesian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "sxn", - "language_name": "Sangir", - "autonym": "Sangir", - "speakers": 245664, - "family": "Austronesian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "ext", - "language_name": "Extremaduran", - "autonym": "Extremaduran", - "speakers": 245077, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "nch", - "language_name": "Central Huasteca Nahuatl", - "autonym": "Central Huasteca Nahuatl", - "speakers": 244435, - "family": "Uto-Aztecan", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "zea", - "language_name": "Zeelandic", - "autonym": "Zeelandic", - "speakers": 241926, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "krc", - "language_name": "Karachay-Balkar", - "autonym": "Karachay-Balkar", - "speakers": 240927, - "family": "Turkic", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "ksh", - "language_name": "Colognian", - "autonym": "Kölsch", - "speakers": 240479, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "hz", - "language_name": "Herero", - "autonym": "Herero", - "speakers": 239336, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "sav", - "language_name": "Saafi-Saafi", - "autonym": "Saafi-Saafi", - "speakers": 236046, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "zag", - "language_name": "Zaghawa", - "autonym": "Zaghawa", - "speakers": 232364, - "family": "Saharan", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "inh", - "language_name": "Ingush", - "autonym": "Ingush", - "speakers": 226755, - "family": "Nakh-Daghestanian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "ssy", - "language_name": "Saho", - "autonym": "Saho", - "speakers": 218923, - "family": "Afro-Asiatic", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "dtm", - "language_name": "Tomo Kan Dogon", - "autonym": "Tomo Kan Dogon", - "speakers": 215087, - "family": "Dogon", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "pap", - "language_name": "Papiamento", - "autonym": "Papiamentu", - "speakers": 211640, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "syr", - "language_name": "Syriac", - "autonym": "ܣܘܪܝܝܐ", - "speakers": 210659, - "family": "Afro-Asiatic", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "tog", - "language_name": "Nyasa Tonga", - "autonym": "Nyasa Tonga", - "speakers": 207727, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "maf", - "language_name": "Mafa", - "autonym": "Mafa", - "speakers": 205313, - "family": "Afro-Asiatic", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "puu", - "language_name": "Punu", - "autonym": "Punu", - "speakers": 200782, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "kcg", - "language_name": "Tyap", - "autonym": "Katab", - "speakers": 199046, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "kao", - "language_name": "Xaasongaxango", - "autonym": "Xaasongaxango", - "speakers": 195534, - "family": "Mande", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "tyv", - "language_name": "Tuvinian", - "autonym": "Tuvinian", - "speakers": 184239, - "family": "Turkic", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "dtp", - "language_name": "Central Dusun", - "autonym": "Central Dusun", - "speakers": 182852, - "family": "Austronesian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "ria", - "language_name": "Riang (India)", - "autonym": "Riang (India)", - "speakers": 172392, - "family": "Sino-Tibetan", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "swb", - "language_name": "Comorian", - "autonym": "Comorian", - "speakers": 170720, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "bmq", - "language_name": "Bomu", - "autonym": "Bomu", - "speakers": 168159, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "ltg", - "language_name": "Latgalian", - "autonym": "Latgalian", - "speakers": 167429, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "nv", - "language_name": "Navajo", - "autonym": "Diné Bizaad", - "speakers": 166320, - "family": "Athabaskan-Eyak-Tlingit", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "bze", - "language_name": "Jenaama Bozo", - "autonym": "Jenaama Bozo", - "speakers": 166204, - "family": "Mande", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "co", - "language_name": "Corsican", - "autonym": "Corsu", - "speakers": 162836, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "bfd", - "language_name": "Bafut", - "autonym": "Bafut", - "speakers": 158146, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "xsr", - "language_name": "Sherpa", - "autonym": "Sherpa", - "speakers": 157705, - "family": "Sino-Tibetan", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "kiu", - "language_name": "Kirmanjki", - "autonym": "Kirmanjki", - "speakers": 155833, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "ho", - "language_name": "Hiri Motu", - "autonym": "Hiri Motu", - "speakers": 152449, - "family": "Pidgin", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "kkj", - "language_name": "Kako", - "autonym": "Kakɔ", - "speakers": 149823, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "bss", - "language_name": "Akoose", - "autonym": "Akoose", - "speakers": 149823, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "sly", - "language_name": "Selayar", - "autonym": "Selayar", - "speakers": 144194, - "family": "Austronesian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "mi", - "language_name": "Māori", - "autonym": "Māori", - "speakers": 137913, - "family": "Austronesian", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "rjs", - "language_name": "Rajbanshi", - "autonym": "Rajbanshi", - "speakers": 133443, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "dua", - "language_name": "Duala", - "autonym": "Duálá", - "speakers": 133176, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "guc", - "language_name": "Wayuu", - "autonym": "Wayuu", - "speakers": 132529, - "family": "Arawakan", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "vai", - "language_name": "Vai", - "autonym": "ꕙꔤ", - "speakers": 131906, - "family": "Mande", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "taj", - "language_name": "Eastern Tamang", - "autonym": "Eastern Tamang", - "speakers": 130410, - "family": "Sino-Tibetan", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "mgo", - "language_name": "Metaʼ", - "autonym": "Metaʼ", - "speakers": 130401, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "pdc", - "language_name": "Pennsylvania German", - "autonym": "Pennsylvania German", - "speakers": 129729, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "rwk", - "language_name": "Rwa", - "autonym": "Kiruwa", - "speakers": 128816, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "trw", - "language_name": "Torwali", - "autonym": "توروالی", - "speakers": 123756, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "mfv", - "language_name": "Mandjak", - "autonym": "Mandjak", - "speakers": 121170, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "tsj", - "language_name": "Tshangla", - "autonym": "Tshangla", - "speakers": 117348, - "family": "Sino-Tibetan", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "sbp", - "language_name": "Sangu", - "autonym": "Ishisangu", - "speakers": 117106, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "krl", - "language_name": "Karelian", - "autonym": "Karelian", - "speakers": 116212, - "family": "Uralic", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "lad", - "language_name": "Ladino", - "autonym": "Ladino", - "speakers": 112781, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "ife", - "language_name": "Ifè", - "autonym": "Ifè", - "speakers": 111910, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "gag", - "language_name": "Gagauz", - "autonym": "Gagauz", - "speakers": 111028, - "family": "Turkic", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "lbe", - "language_name": "Lak", - "autonym": "Lak", - "speakers": 110543, - "family": "Nakh-Daghestanian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "sdc", - "language_name": "Sassarese Sardinian", - "autonym": "Sassarese Sardinian", - "speakers": 106085, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "to", - "language_name": "Tongan", - "autonym": "Lea Fakatonga", - "speakers": 100790, - "family": "Austronesian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "bjt", - "language_name": "Balanta-Ganja", - "autonym": "Balanta-Ganja", - "speakers": 95992, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "jgo", - "language_name": "Ngomba", - "autonym": "Ndaꞌa", - "speakers": 94333, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "crs", - "language_name": "Seselwa Creole French", - "autonym": "Seselwa Creole French", - "speakers": 94061, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "ab", - "language_name": "Abkhazian", - "autonym": "Аԥсшәа", - "speakers": 91953, - "family": "Abkhaz-Adyge", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "ty", - "language_name": "Tahitian", - "autonym": "Tahitian", - "speakers": 91488, - "family": "Austronesian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "iu", - "language_name": "Inuktitut", - "autonym": "Inuktitut", - "speakers": 90466, - "family": "Eskimo-Aleut", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "pdt", - "language_name": "Plautdietsch", - "autonym": "Plautdietsch", - "speakers": 90466, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "bpy", - "language_name": "Bishnupriya", - "autonym": "Bishnupriya", - "speakers": 90174, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "ksf", - "language_name": "Bafia", - "autonym": "Rikpa", - "speakers": 88784, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "gvr", - "language_name": "Gurung", - "autonym": "Gurung", - "speakers": 87951, - "family": "Sino-Tibetan", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "cjm", - "language_name": "Eastern Cham", - "autonym": "Eastern Cham", - "speakers": 87862, - "family": "Austronesian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "lcp", - "language_name": "Western Lawa", - "autonym": "Western Lawa", - "speakers": 87751, - "family": "Austroasiatic", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "knf", - "language_name": "Mankanya", - "autonym": "Mankanya", - "speakers": 83151, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "lep", - "language_name": "Lepcha", - "autonym": "Lepcha", - "speakers": 79743, - "family": "Sino-Tibetan", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "byn", - "language_name": "Blin", - "autonym": "Blin", - "speakers": 79056, - "family": "Afro-Asiatic", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "btv", - "language_name": "Bateri", - "autonym": "Bateri", - "speakers": 78843, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "tkt", - "language_name": "Kathoriya Tharu", - "autonym": "Kathoriya Tharu", - "speakers": 72787, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "gd", - "language_name": "Scottish Gaelic", - "autonym": "Gàidhlig", - "speakers": 72337, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "fo", - "language_name": "Faroese", - "autonym": "Føroyskt", - "speakers": 71351, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "vro", - "language_name": "Võro", - "autonym": "Võro", - "speakers": 70031, - "family": "Uralic", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "ken", - "language_name": "Kenyang", - "autonym": "Kɛnyaŋ", - "speakers": 69362, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "gil", - "language_name": "Gilbertese", - "autonym": "Gilbertese", - "speakers": 67078, - "family": "Austronesian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "bvb", - "language_name": "Bube", - "autonym": "Bube", - "speakers": 66058, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "mwv", - "language_name": "Mentawai", - "autonym": "Mentawai", - "speakers": 64086, - "family": "Austronesian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "frp", - "language_name": "Arpitan", - "autonym": "Arpitan", - "speakers": 63777, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "koi", - "language_name": "Komi-Permyak", - "autonym": "Komi-Permyak", - "speakers": 63775, - "family": "Uralic", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "kfo", - "language_name": "Koro", - "autonym": "Koro", - "speakers": 63207, - "family": "Mande", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "mh", - "language_name": "Marshallese", - "autonym": "Marshallese", - "speakers": 56879, - "family": "Austronesian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "fit", - "language_name": "Tornedalen Finnish", - "autonym": "Tornedalen Finnish", - "speakers": 56114, - "family": "Uralic", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "kl", - "language_name": "Kalaallisut", - "autonym": "Kalaallisut", - "speakers": 55440, - "family": "Eskimo-Aleut", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "bra", - "language_name": "Braj", - "autonym": "Braj", - "speakers": 54370, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "gcr", - "language_name": "Guianese Creole French", - "autonym": "Guianese Creole French", - "speakers": 51872, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "se", - "language_name": "Northern Sami", - "autonym": "Davvisámegiella", - "speakers": 51530, - "family": "Uralic", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "blo", - "language_name": "Anii", - "autonym": "Anii Kagɩja", - "speakers": 51507, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "kgp", - "language_name": "Kaingang", - "autonym": "Kanhgág", - "speakers": 50812, - "family": "Nuclear-Macro-Je", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "csb", - "language_name": "Kashubian", - "autonym": "Kashubian", - "speakers": 49767, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "bqv", - "language_name": "Koro Wachi", - "autonym": "Koro Wachi", - "speakers": 46718, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "ch", - "language_name": "Chamorro", - "autonym": "Chamorro", - "speakers": 46325, - "family": "Austronesian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "cch", - "language_name": "Atsam", - "autonym": "Atsam", - "speakers": 44946, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "buc", - "language_name": "Bushi", - "autonym": "Bushi", - "speakers": 44620, - "family": "Austronesian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "rm", - "language_name": "Romansh", - "autonym": "Rumantsch", - "speakers": 42020, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "agq", - "language_name": "Aghem", - "autonym": "Aghem", - "speakers": 38843, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "kxv", - "language_name": "Kuvi", - "autonym": "Kuvi", - "speakers": 38457, - "family": "Dravidian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "snf", - "language_name": "Noon", - "autonym": "Noon", - "speakers": 37767, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "fur", - "language_name": "Friulian", - "autonym": "Furlan", - "speakers": 37442, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "tdh", - "language_name": "Thulung", - "autonym": "Thulung", - "speakers": 36393, - "family": "Sino-Tibetan", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "egl", - "language_name": "Emilian", - "autonym": "Emilian", - "speakers": 31201, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "chk", - "language_name": "Chuukese", - "autonym": "Chuukese", - "speakers": 30731, - "family": "Austronesian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "mrj", - "language_name": "Western Mari", - "autonym": "Western Mari", - "speakers": 29762, - "family": "Uralic", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "haw", - "language_name": "Hawaiian", - "autonym": "ʻŌlelo HawaiʻI", - "speakers": 29605, - "family": "Austronesian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "mro", - "language_name": "Mru", - "autonym": "Mru", - "speakers": 29277, - "family": "Sino-Tibetan", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "frc", - "language_name": "Cajun French", - "autonym": "Cajun French", - "speakers": 27942, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "yrl", - "language_name": "Nheengatu", - "autonym": "Nheẽgatu", - "speakers": 26171, - "family": "Tupian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "an", - "language_name": "Aragonese", - "autonym": "Aragonés", - "speakers": 26008, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "chr", - "language_name": "Cherokee", - "autonym": "Ꮳꮃꭹ", - "speakers": 25613, - "family": "Iroquoian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "rmo", - "language_name": "Sinte Romani", - "autonym": "Sinte Romani", - "speakers": 24372, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "oj", - "language_name": "Ojibwa", - "autonym": "Ojibwa", - "speakers": 23747, - "family": "Algic", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "pon", - "language_name": "Pohnpeian", - "autonym": "Pohnpeian", - "speakers": 23560, - "family": "Austronesian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "lzz", - "language_name": "Laz", - "autonym": "Laz", - "speakers": 22965, - "family": "Kartvelian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "ttt", - "language_name": "Muslim Tat", - "autonym": "Muslim Tat", - "speakers": 22453, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "esu", - "language_name": "Central Yupik", - "autonym": "Central Yupik", - "speakers": 20956, - "family": "Eskimo-Aleut", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "dak", - "language_name": "Dakota", - "autonym": "Dakota", - "speakers": 20832, - "family": "Siouan", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "alt", - "language_name": "Southern Altai", - "autonym": "Southern Altai", - "speakers": 19841, - "family": "Turkic", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "amo", - "language_name": "Amo", - "autonym": "Amo", - "speakers": 18620, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "gub", - "language_name": "Guajajára", - "autonym": "Guajajára", - "speakers": 17784, - "family": "Tupian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "hnn", - "language_name": "Hanunoo", - "autonym": "Hanunoo", - "speakers": 17469, - "family": "Austronesian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "tkr", - "language_name": "Tsakhur", - "autonym": "Tsakhur", - "speakers": 16329, - "family": "Nakh-Daghestanian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "pau", - "language_name": "Palauan", - "autonym": "Palauan", - "speakers": 16047, - "family": "Austronesian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "sa", - "language_name": "Sanskrit", - "autonym": "संस्कृत भाषा", - "speakers": 15913, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "bsc", - "language_name": "Bassari", - "autonym": "Bassari", - "speakers": 15264, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "ojs", - "language_name": "Oji-Cree", - "autonym": "Oji-Cree", - "speakers": 15078, - "family": "Algic", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "kht", - "language_name": "Khamti", - "autonym": "Khamti", - "speakers": 13527, - "family": "Tai-Kadai", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "hsb", - "language_name": "Upper Sorbian", - "autonym": "Hornjoserbšćina", - "speakers": 12826, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "chp", - "language_name": "Chipewyan", - "autonym": "Chipewyan", - "speakers": 12816, - "family": "Athabaskan-Eyak-Tlingit", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "moe", - "language_name": "Innu-aimun", - "autonym": "Innu-Aimun", - "speakers": 12062, - "family": "Algic", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "sli", - "language_name": "Lower Silesian", - "autonym": "Lower Silesian", - "speakers": 11868, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "wae", - "language_name": "Walser", - "autonym": "Walser", - "speakers": 11377, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "cho", - "language_name": "Choctaw", - "autonym": "Chahta", - "speakers": 10977, - "family": "Muskogean", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "tbw", - "language_name": "Tagbanwa", - "autonym": "Tagbanwa", - "speakers": 10045, - "family": "Austronesian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "xav", - "language_name": "Xavánte", - "autonym": "Xavánte", - "speakers": 9951, - "family": "Nuclear-Macro-Je", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "tvl", - "language_name": "Tuvalu", - "autonym": "Tuvalu", - "speakers": 9868, - "family": "Austronesian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "frr", - "language_name": "Northern Frisian", - "autonym": "Nordfriisk", - "speakers": 9619, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "rug", - "language_name": "Roviana", - "autonym": "Roviana", - "speakers": 9591, - "family": "Austronesian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "wls", - "language_name": "Wallisian", - "autonym": "Wallisian", - "speakers": 9512, - "family": "Austronesian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "rmu", - "language_name": "Tavringer Romani", - "autonym": "Tavringer Romani", - "speakers": 9488, - "family": "Speech Register", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "cr", - "language_name": "Cree", - "autonym": "Cree", - "speakers": 9047, - "family": "Algic", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "nmg", - "language_name": "Kwasio", - "autonym": "Kwasio", - "speakers": 8878, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "lkt", - "language_name": "Lakota", - "autonym": "LakȟólʼIyapi", - "speakers": 8316, - "family": "Siouan", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "kos", - "language_name": "Kosraean", - "autonym": "Kosraean", - "speakers": 7990, - "family": "Austronesian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "ik", - "language_name": "Inupiaq", - "autonym": "Inupiaq", - "speakers": 7983, - "family": "Eskimo-Aleut", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "gbz", - "language_name": "Zoroastrian Dari", - "autonym": "Zoroastrian Dari", - "speakers": 7983, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "twq", - "language_name": "Tasawaq", - "autonym": "Tasawaq Senni", - "speakers": 7970, - "family": "Songhay", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "bku", - "language_name": "Buhid", - "autonym": "Buhid", - "speakers": 7970, - "family": "Austronesian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "mic", - "language_name": "Mi'kmaw", - "autonym": "LʼNuiʼSuti", - "speakers": 7916, - "family": "Algic", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "mey", - "language_name": "Hassaniyya", - "autonym": "Hassaniyya", - "speakers": 7239, - "family": "Afro-Asiatic", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "dsb", - "language_name": "Lower Sorbian", - "autonym": "Dolnoserbšćina", - "speakers": 6974, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "na", - "language_name": "Nauru", - "autonym": "Nauru", - "speakers": 6930, - "family": "Austronesian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "lwl", - "language_name": "Eastern Lawa", - "autonym": "Eastern Lawa", - "speakers": 6898, - "family": "Austroasiatic", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "yap", - "language_name": "Yapese", - "autonym": "Yapese", - "speakers": 6556, - "family": "Austronesian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "atj", - "language_name": "Atikamekw", - "autonym": "Atikamekw", - "speakers": 6408, - "family": "Algic", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "pms", - "language_name": "Piedmontese", - "autonym": "Piedmontese", - "speakers": 6178, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "rmf", - "language_name": "Kalo Finnish Romani", - "autonym": "Kalo Finnish Romani", - "speakers": 5015, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "bla", - "language_name": "Siksiká", - "autonym": "Siksiká", - "speakers": 4900, - "family": "Algic", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "fud", - "language_name": "East Futuna", - "autonym": "East Futuna", - "speakers": 4756, - "family": "Austronesian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "trv", - "language_name": "Taroko", - "autonym": "Patas Taroko", - "speakers": 4721, - "family": "Austronesian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "crk", - "language_name": "Plains Cree", - "autonym": "Plains Cree", - "speakers": 4146, - "family": "Algic", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "saf", - "language_name": "Safaliba", - "autonym": "Safaliba", - "speakers": 4108, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "mus", - "language_name": "Muscogee", - "autonym": "Mvskoke", - "speakers": 3992, - "family": "Muskogean", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "vep", - "language_name": "Veps", - "autonym": "Veps", - "speakers": 3543, - "family": "Uralic", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "tnr", - "language_name": "Ménik", - "autonym": "Ménik", - "speakers": 3305, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "vic", - "language_name": "Virgin Islands Creole English", - "autonym": "Virgin Islands Creole English", - "speakers": 3113, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "tru", - "language_name": "Turoyo", - "autonym": "Turoyo", - "speakers": 3035, - "family": "Afro-Asiatic", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "uli", - "language_name": "Ulithian", - "autonym": "Ulithian", - "speakers": 2971, - "family": "Austronesian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "rtm", - "language_name": "Rotuman", - "autonym": "Rotuman", - "speakers": 2527, - "family": "Austronesian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "wbp", - "language_name": "Warlpiri", - "autonym": "Warlpiri", - "speakers": 2496, - "family": "Pama-Nyungan", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "yav", - "language_name": "Yangben", - "autonym": "Nuasue", - "speakers": 2303, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "den", - "language_name": "Slave", - "autonym": "Slave", - "speakers": 2299, - "family": "Athabaskan-Eyak-Tlingit", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "dgr", - "language_name": "Dogrib", - "autonym": "Dogrib", - "speakers": 2111, - "family": "Athabaskan-Eyak-Tlingit", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "frs", - "language_name": "Eastern Frisian", - "autonym": "Eastern Frisian", - "speakers": 2004, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "kw", - "language_name": "Cornish", - "autonym": "Kernewek", - "speakers": 1973, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "csw", - "language_name": "Swampy Cree", - "autonym": "ᓀᐦᐃᓇᐍᐏᐣ", - "speakers": 1809, - "family": "Algic", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "moh", - "language_name": "Mohawk", - "autonym": "KanienʼKéha", - "speakers": 1772, - "family": "Iroquoian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "gv", - "language_name": "Manx", - "autonym": "Gaelg", - "speakers": 1719, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "smj", - "language_name": "Lule Sami", - "autonym": "Julevsámegiella", - "speakers": 1530, - "family": "Uralic", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "nsk", - "language_name": "Naskapi", - "autonym": "Naskapi", - "speakers": 1395, - "family": "Algic", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "tkl", - "language_name": "Tokelau", - "autonym": "Tokelau", - "speakers": 1285, - "family": "Austronesian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "niu", - "language_name": "Niuean", - "autonym": "Niuean", - "speakers": 1120, - "family": "Austronesian", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "stq", - "language_name": "Saterland Frisian", - "autonym": "Saterland Frisian", - "speakers": 962, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "sei", - "language_name": "Seri", - "autonym": "Seri", - "speakers": 901, - "family": null, - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "clc", - "language_name": "Chilcotin", - "autonym": "Chilcotin", - "speakers": 867, - "family": "Athabaskan-Eyak-Tlingit", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "la", - "language_name": "Latin", - "autonym": "Lingua Latina", - "speakers": 820, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "hur", - "language_name": "Halkomelem", - "autonym": "Halkomelem", - "speakers": 716, - "family": "Salishan", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "crg", - "language_name": "Michif", - "autonym": "Michif", - "speakers": 678, - "family": "Algic", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "sms", - "language_name": "Skolt Sami", - "autonym": "SääʹMǩiõll", - "speakers": 613, - "family": "Uralic", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "smn", - "language_name": "Inari Sami", - "autonym": "Anarâškielâ", - "speakers": 613, - "family": "Uralic", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "lil", - "language_name": "Lillooet", - "autonym": "Lillooet", - "speakers": 528, - "family": "Salishan", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "oka", - "language_name": "Okanagan", - "autonym": "Okanagan", - "speakers": 490, - "family": "Salishan", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "pqm", - "language_name": "Maliseet-Passamaquoddy", - "autonym": "Maliseet-Passamaquoddy", - "speakers": 490, - "family": "Algic", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "kwk", - "language_name": "Kwakʼwala", - "autonym": "KwakʼWala", - "speakers": 377, - "family": "Wakashan", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "crl", - "language_name": "Northern East Cree", - "autonym": "Northern East Cree", - "speakers": 377, - "family": "Algic", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "gwi", - "language_name": "Gwichʼin", - "autonym": "GwichʼIn", - "speakers": 302, - "family": "Athabaskan-Eyak-Tlingit", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "eo", - "language_name": "Esperanto", - "autonym": "Esperanto", - "speakers": 301, - "family": "Artificial Language", - "average": 0.0, - "in_benchmark": true, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "sma", - "language_name": "Southern Sami", - "autonym": "Åarjelsaemien Gïele", - "speakers": 296, - "family": "Uralic", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "tsd", - "language_name": "Tsakonian", - "autonym": "Tsakonian", - "speakers": 202, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "izh", - "language_name": "Ingrian", - "autonym": "Ingrian", - "speakers": 142, - "family": "Uralic", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "ia", - "language_name": "Interlingua", - "autonym": "Interlingua", - "speakers": 136, - "family": "Artificial Language", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "aro", - "language_name": "Araona", - "autonym": "Araona", - "speakers": 105, - "family": "Pano-Tacanan", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "prg", - "language_name": "Prussian", - "autonym": "Prūsiskan", - "speakers": 38, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "ie", - "language_name": "Interlingue", - "autonym": "Interlingue", - "speakers": 1, - "family": "Artificial Language", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "lzh", - "language_name": "Literary Chinese", - "autonym": "Literary Chinese", - "speakers": 0, - "family": "Sino-Tibetan", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "io", - "language_name": "Ido", - "autonym": "Ido", - "speakers": 0, - "family": "Artificial Language", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "jbo", - "language_name": "Lojban", - "autonym": "La .Lojban.", - "speakers": 0, - "family": "Artificial Language", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "jut", - "language_name": "Jutish", - "autonym": "Jutish", - "speakers": 0, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "vot", - "language_name": "Votic", - "autonym": "Votic", - "speakers": 0, - "family": "Uralic", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "gez", - "language_name": "Geez", - "autonym": "Geez", - "speakers": 0, - "family": "Afro-Asiatic", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "osa", - "language_name": "Osage", - "autonym": "𐓏𐓘𐓻𐓘𐓻𐓟", - "speakers": 0, - "family": "Siouan", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "rgn", - "language_name": "Romagnol", - "autonym": "Romagnol", - "speakers": 0, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "cu", - "language_name": "Church Slavic", - "autonym": "Church Slavic", - "speakers": 0, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "sgs", - "language_name": "Samogitian", - "autonym": "Samogitian", - "speakers": 0, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "ann", - "language_name": "Obolo", - "autonym": "Obolo", - "speakers": 0, - "family": "Atlantic-Congo", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "cic", - "language_name": "Chickasaw", - "autonym": "Chikashshanompaʼ", - "speakers": 0, - "family": "Muskogean", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "cad", - "language_name": "Caddo", - "autonym": "Caddo", - "speakers": 0, - "family": "Caddoan", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - }, - { - "bcp_47": "pfl", - "language_name": "Palatine German", - "autonym": "Palatine German", - "speakers": 0, - "family": "Indo-European", - "average": 0.0, - "in_benchmark": false, - "NaN": 0.0, - "classification_accuracy": 0.0, - "language_modeling_chrf": 0.0, - "translation_bleu": 0.0, - "translation_chrf": 0.0 - } - ], - "dataset_table": [ - { - "name": "FLORES+", - "author": "Meta", - "author_url": "https://ai.meta.com", - "url": "https://huggingface.co/datasets/openlanguagedata/flores_plus", - "n_languages": 200, - "tasks": [ - "translation", - "classification", - "language_modeling" - ], - "parallel": 1.0, - "base": "FLORES", - "implemented": 1.0 - }, - { - "name": "FLEURS", - "author": "Meta", - "author_url": "https://ai.meta.com", - "url": "https://huggingface.co/datasets/google/fleurs", - "n_languages": 102, - "tasks": [ - "speech_recognition" - ], - "parallel": 1.0, - "base": "FLORES", - "implemented": 1.0 - }, - { - "name": "CommonVoice", - "author": "Mozilla", - "author_url": "https://mozilla.ai", - "url": "https://huggingface.co/datasets/mozilla-foundation/common_voice_17_0", - "n_languages": 124, - "tasks": [ - "speech_recognition" - ], - "parallel": null, - "base": null, - "implemented": null - }, - { - "name": "MMMLU", - "author": "OpenAI", - "author_url": "https://openai.com", - "url": "https://huggingface.co/datasets/openai/MMMLU", - "n_languages": 14, - "tasks": [ - "question_answering" - ], - "parallel": 1.0, - "base": "MMLU", - "implemented": null - }, - { - "name": "AfriMMLU", - "author": "Masakhane", - "author_url": "https://www.masakhane.io", - "url": "https://huggingface.co/datasets/masakhane/afrimmlu", - "n_languages": 17, - "tasks": [ - "question_answering" - ], - "parallel": 1.0, - "base": "MMLU", - "implemented": null - }, - { - "name": "Okapi MMLU", - "author": "Academic", - "author_url": null, - "url": "https://huggingface.co/datasets/jon-tow/okapi_mmlu", - "n_languages": 16, - "tasks": [ - "question_answering" - ], - "parallel": 1.0, - "base": "MMLU", - "implemented": null - }, - { - "name": "MMLU-X", - "author": "OpenGPT-X", - "author_url": null, - "url": "https://huggingface.co/datasets/openGPT-X/mmlux", - "n_languages": 20, - "tasks": [ - "question_answering" - ], - "parallel": 1.0, - "base": "MMLU", - "implemented": null - }, - { - "name": "Global MMLU", - "author": "Cohere", - "author_url": "https://cohere.com", - "url": "https://huggingface.co/datasets/CohereForAI/Global-MMLU", - "n_languages": 42, - "tasks": [ - "question_answering" - ], - "parallel": 1.0, - "base": "MMLU", - "implemented": null - }, - { - "name": "MGSM", - "author": "Google", - "author_url": "https://google.com", - "url": "https://huggingface.co/datasets/juletxara/mgsm", - "n_languages": 10, - "tasks": [ - "math" - ], - "parallel": 1.0, - "base": "MGSM", - "implemented": null - }, - { - "name": "AfriMGSM", - "author": "Masakhane", - "author_url": "https://www.masakhane.io", - "url": "https://huggingface.co/datasets/masakhane/afrimgsm", - "n_languages": 18, - "tasks": [ - "math" - ], - "parallel": 1.0, - "base": "MGSM", - "implemented": null - }, - { - "name": "GSM8K-X", - "author": "OpenGPT-X", - "author_url": null, - "url": "https://huggingface.co/datasets/openGPT-X/gsm8kx", - "n_languages": 20, - "tasks": [ - "math" - ], - "parallel": 1.0, - "base": "MGSM", - "implemented": null - }, - { - "name": "Okapi ARC Challenge", - "author": "Academic", - "author_url": null, - "url": "https://huggingface.co/datasets/jon-tow/okapi_arc_challenge", - "n_languages": 31, - "tasks": [ - "question_answering" - ], - "parallel": 1.0, - "base": "AI2 ARC", - "implemented": null - }, - { - "name": "Uhuru ARC Easy", - "author": "Masakhane", - "author_url": "https://www.masakhane.io", - "url": "https://huggingface.co/datasets/masakhane/uhura-arc-easy", - "n_languages": 6, - "tasks": [ - "question_answering" - ], - "parallel": 1.0, - "base": "AI2 ARC", - "implemented": null - }, - { - "name": "Arc-X", - "author": "OpenGPT-X", - "author_url": null, - "url": "https://huggingface.co/datasets/openGPT-X/arcx", - "n_languages": 20, - "tasks": [ - "question_answering" - ], - "parallel": 1.0, - "base": "AI2 ARC", - "implemented": null - }, - { - "name": "Okapi TruthfulQA", - "author": "Academic", - "author_url": null, - "url": "https://huggingface.co/datasets/jon-tow/okapi_truthfulqa/tree/main/data", - "n_languages": 31, - "tasks": [ - "question_answering" - ], - "parallel": 1.0, - "base": "TruthfulQA", - "implemented": null - }, - { - "name": "Uhura TruthfulQA", - "author": "Masakhane", - "author_url": "https://www.masakhane.io", - "url": "https://huggingface.co/datasets/masakhane/uhura-truthfulqa", - "n_languages": 6, - "tasks": [ - "question_answering" - ], - "parallel": 1.0, - "base": "TruthfulQA", - "implemented": null - }, - { - "name": "TruthfulQA-X", - "author": "OpenGPT-X", - "author_url": null, - "url": "https://huggingface.co/datasets/openGPT-X/truthfulqax", - "n_languages": 20, - "tasks": [ - "question_answering" - ], - "parallel": 1.0, - "base": "TruthfulQA", - "implemented": null - }, - { - "name": "XNLI", - "author": "Meta", - "author_url": "https://ai.meta.com", - "url": "https://huggingface.co/datasets/facebook/xnli", - "n_languages": 14, - "tasks": [ - "classification" - ], - "parallel": 1.0, - "base": "XNLI", - "implemented": null - }, - { - "name": "AfriXNLI", - "author": "Masakhane", - "author_url": "https://www.masakhane.io", - "url": "https://huggingface.co/datasets/masakhane/afrixnli", - "n_languages": 18, - "tasks": [ - "classification" - ], - "parallel": 1.0, - "base": "XNLI", - "implemented": null - }, - { - "name": "Okapi HellaSwag", - "author": "Academic", - "author_url": null, - "url": "https://huggingface.co/datasets/jon-tow/okapi_hellaswag", - "n_languages": 31, - "tasks": [ - "question_answering" - ], - "parallel": 1.0, - "base": "HellaSwag", - "implemented": null - }, - { - "name": "HellaSwag-X", - "author": "OpenGPT-X", - "author_url": null, - "url": "https://huggingface.co/datasets/openGPT-X/hellaswagx", - "n_languages": 20, - "tasks": [ - "question_answering" - ], - "parallel": 1.0, - "base": "HellaSwag", - "implemented": null - }, - { - "name": "WikiANN / PAN-X", - "author": "Academic", - "author_url": null, - "url": "https://huggingface.co/datasets/unimelb-nlp/wikiann", - "n_languages": 176, - "tasks": [ - "ner" - ], - "parallel": 0.0, - "base": null, - "implemented": null - }, - { - "name": "MSVAMP", - "author": "Microsoft", - "author_url": "https://microsoft.ai", - "url": "https://huggingface.co/datasets/Mathoctopus/MSVAMP", - "n_languages": 10, - "tasks": [ - "math" - ], - "parallel": 1.0, - "base": null, - "implemented": null - }, - { - "name": "XLSUM", - "author": "Academic", - "author_url": null, - "url": "https://huggingface.co/datasets/csebuetnlp/xlsum", - "n_languages": 45, - "tasks": [ - "summarization" - ], - "parallel": 1.0, - "base": null, - "implemented": null - }, - { - "name": "SEA-IFEVAL", - "author": "AI Singapore", - "author_url": "https://aisingapore.org", - "url": "https://huggingface.co/datasets/aisingapore/instruction_following-ifeval", - "n_languages": 7, - "tasks": [ - "instruction_following" - ], - "parallel": 1.0, - "base": "IFEVAL", - "implemented": null - }, - { - "name": "XTREME", - "author": "Google", - "author_url": "https://google.com", - "url": "https://huggingface.co/datasets/google/xtreme", - "n_languages": 40, - "tasks": [ - "translation", - "classification", - "question_answering", - "ner" - ], - "parallel": null, - "base": null, - "implemented": null - }, - { - "name": "XGLUE", - "author": "Microsoft", - "author_url": "https://microsoft.ai", - "url": "https://huggingface.co/datasets/microsoft/xglue", - "n_languages": 18, - "tasks": [ - "pos" - ], - "parallel": null, - "base": "GLUE", - "implemented": null - }, - { - "name": "IndicGLUE", - "author": "AI4Bharat", - "author_url": "https://models.ai4bharat.org", - "url": "https://huggingface.co/datasets/ai4bharat/indic_glue", - "n_languages": 11, - "tasks": [ - "question_answering" - ], - "parallel": null, - "base": "GLUE", - "implemented": null - }, - { - "name": "Opus Gnome", - "author": "Helsinki NLP", - "author_url": null, - "url": "https://huggingface.co/datasets/Helsinki-NLP/opus_gnome", - "n_languages": 187, - "tasks": [ - "translation" - ], - "parallel": 1.0, - "base": null, - "implemented": null - }, - { - "name": "Opus Paracrawl", - "author": "Helsinki NLP", - "author_url": null, - "url": "https://huggingface.co/datasets/Helsinki-NLP/opus_paracrawl", - "n_languages": 43, - "tasks": [ - "translation" - ], - "parallel": 0.0, - "base": null, - "implemented": null - }, - { - "name": "CCAligned", - "author": "Meta", - "author_url": "https://ai.meta.com", - "url": "https://huggingface.co/datasets/ahelk/ccaligned_multilingual", - "n_languages": 137, - "tasks": [ - "translation" - ], - "parallel": 0.0, - "base": null, - "implemented": null - }, - { - "name": "OPUS Collection", - "author": "Helsinki NLP", - "author_url": null, - "url": "https://opus.nlpl.eu", - "n_languages": 747, - "tasks": [ - "translation" - ], - "parallel": 0.0, - "base": null, - "implemented": null - }, - { - "name": "MasakhaNER", - "author": "Masakhane", - "author_url": "https://www.masakhane.io", - "url": "https://huggingface.co/datasets/masakhane/masakhaner", - "n_languages": 10, - "tasks": [ - "ner" - ], - "parallel": null, - "base": null, - "implemented": null - }, - { - "name": "Multilingual Sentiments", - "author": "Academic", - "author_url": null, - "url": "https://huggingface.co/datasets/tyqiangz/multilingual-sentiments", - "n_languages": 12, - "tasks": [ - "sentiment_analysis" - ], - "parallel": null, - "base": null, - "implemented": null - }, - { - "name": "CulturaX", - "author": "Academic", - "author_url": null, - "url": "https://huggingface.co/datasets/uonlp/CulturaX", - "n_languages": 167, - "tasks": [ - "language_modeling" - ], - "parallel": 0.0, - "base": null, - "implemented": null - }, - { - "name": "Tülu 3 SFT Mixture", - "author": "AllenAI", - "author_url": "https://allenai.org", - "url": "https://huggingface.co/datasets/allenai/tulu-3-sft-mixture", - "n_languages": 70, - "tasks": [ - "instruction_following" - ], - "parallel": 0.0, - "base": null, - "implemented": null - }, - { - "name": "xP3", - "author": "BigScience", - "author_url": "https://bigscience.huggingface.co", - "url": "https://huggingface.co/datasets/bigscience/xP3", - "n_languages": 46, - "tasks": [ - "instruction_following" - ], - "parallel": 0.0, - "base": null, - "implemented": null - }, - { - "name": "Aya", - "author": "Cohere", - "author_url": "https://cohere.com", - "url": "https://huggingface.co/datasets/CohereForAI/aya_dataset", - "n_languages": 65, - "tasks": [ - "instruction_following" - ], - "parallel": null, - "base": null, - "implemented": null - }, - { - "name": "Lanfrica", - "author": "Lanfrica", - "author_url": "https://lanfrica.com", - "url": "https://lanfrica.com/records?language=yor&task=machine%20translation", - "n_languages": 2200, - "tasks": [ - "datasets" - ], - "parallel": null, - "base": null, - "implemented": null - }, - { - "name": "HuggingFace Languages", - "author": "HuggingFace", - "author_url": "https://huggingface.co", - "url": "https://huggingface.co/languages", - "n_languages": 4680, - "tasks": [ - "datasets", - "models" - ], - "parallel": null, - "base": null, - "implemented": null - }, - { - "name": "HuggingFace Multilingual Datasets", - "author": "HuggingFace", - "author_url": "https://huggingface.co", - "url": "https://huggingface.co/datasets?other=multilinguality:multilingual", - "n_languages": 2012, - "tasks": [ - "datasets" - ], - "parallel": 0.0, - "base": null, - "implemented": null - } - ], - "countries": { - "AC": { - "score": 0.47, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 931, - "score": 0.47 - } - ] - }, - "AE": { - "score": 0.40140041521976655, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 4996040, - "score": 0.47 - }, - { - "name": "Arabic", - "bcp_47": "ar", - "population": 7793822, - "score": 0.42 - }, - { - "name": "Persian", - "bcp_47": "fa", - "population": 189850, - "score": 0.41 - }, - { - "name": "Pashto", - "bcp_47": "ps", - "population": 289770, - "score": 0.0 - }, - { - "name": "Malayalam", - "bcp_47": "ml", - "population": 699446, - "score": 0.0 - }, - { - "name": "Baluchi", - "bcp_47": "bal", - "population": 229818, - "score": 0.0 - } - ] - }, - "AG": { - "score": 0.4696346724027672, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 84434, - "score": 0.47 - }, - { - "name": "Portuguese", - "bcp_47": "pt", - "population": 1571, - "score": 0.45 - } - ] - }, - "AI": { - "score": 0.47, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 17186, - "score": 0.47 - } - ] - }, - "AQ": { - "score": 0.47, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 300, - "score": 0.47 - } - ] - }, - "AR": { - "score": 0.45083230214508235, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 3183537, - "score": 0.47 - }, - { - "name": "Spanish", - "bcp_47": "es", - "population": 45479100, - "score": 0.45 - }, - { - "name": "Guarani", - "bcp_47": "gn", - "population": 21375, - "score": 0.0 - }, - { - "name": "Welsh", - "bcp_47": "cy", - "population": 30016, - "score": 0.0 - } - ] - }, - "AS": { - "score": 0.23260142212865204, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 47954, - "score": 0.47 - }, - { - "name": "Samoan", - "bcp_47": "sm", - "population": 48943, - "score": 0.0 - } - ] - }, - "AT": { - "score": 0.31771431191158667, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 6467398, - "score": 0.47 - }, - { - "name": "French", - "bcp_47": "fr", - "population": 974540, - "score": 0.46 - }, - { - "name": "German", - "bcp_47": "de", - "population": 8593666, - "score": 0.49 - }, - { - "name": "Italian", - "bcp_47": "it", - "population": 797350, - "score": 0.47 - }, - { - "name": "Bavarian", - "bcp_47": "bar", - "population": 8416478, - "score": 0.0 - }, - { - "name": "Hungarian", - "bcp_47": "hu", - "population": 23035, - "score": 0.0 - }, - { - "name": "Croatian", - "bcp_47": "hr", - "population": 106313, - "score": 0.0 - }, - { - "name": "Slovenian", - "bcp_47": "sl", - "population": 32780, - "score": 0.0 - } - ] - }, - "AU": { - "score": 0.46970357171432847, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 24447840, - "score": 0.47 - }, - { - "name": "Chinese", - "bcp_47": "zh", - "population": 534796, - "score": 0.46 - }, - { - "name": "Italian", - "bcp_47": "it", - "population": 483864, - "score": 0.47 - }, - { - "name": "Hmong Njua", - "bcp_47": "hnj", - "population": 2190, - "score": 0.0 - }, - { - "name": "Warlpiri", - "bcp_47": "wbp", - "population": 2496, - "score": 0.0 - } - ] - }, - "AW": { - "score": 0.0073216055759017535, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 2986, - "score": 0.47 - }, - { - "name": "Dutch", - "bcp_47": "nl", - "population": 115845, - "score": 0.0 - }, - { - "name": "Papiamento", - "bcp_47": "pap", - "population": 72851, - "score": 0.0 - } - ] - }, - "BA": { - "score": 0.07690910954274856, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 1726016, - "score": 0.47 - }, - { - "name": "Serbian", - "bcp_47": "sr", - "population": 767118, - "score": 0.0 - }, - { - "name": "Bosnian", - "bcp_47": "bs", - "population": 7594468, - "score": 0.0 - }, - { - "name": "Croatian", - "bcp_47": "hr", - "population": 460271, - "score": 0.0 - } - ] - }, - "BB": { - "score": 0.4699999999999999, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 294560, - "score": 0.47 - } - ] - }, - "BD": { - "score": 0.3554705133359761, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 29277180, - "score": 0.47 - }, - { - "name": "Bangla", - "bcp_47": "bn", - "population": 159397980, - "score": 0.38 - }, - { - "name": "Burmese", - "bcp_47": "my", - "population": 341567, - "score": 0.0 - }, - { - "name": "Rangpuri", - "bcp_47": "rkt", - "population": 10572315, - "score": 0.0 - }, - { - "name": "Sylheti", - "bcp_47": "syl", - "population": 8132550, - "score": 0.0 - }, - { - "name": "Rohingya", - "bcp_47": "rhg", - "population": 862050, - "score": 0.0 - }, - { - "name": "Manipuri", - "bcp_47": "mni", - "population": 17892, - "score": 0.0 - }, - { - "name": "Garo", - "bcp_47": "grt", - "population": 118735, - "score": 0.0 - }, - { - "name": "Chakma", - "bcp_47": "ccp", - "population": 357832, - "score": 0.0 - }, - { - "name": "Mru", - "bcp_47": "mro", - "population": 29277, - "score": 0.0 - } - ] - }, - "BE": { - "score": 0.29499472599184506, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 6915213, - "score": 0.47 - }, - { - "name": "French", - "bcp_47": "fr", - "population": 4453866, - "score": 0.46 - }, - { - "name": "German", - "bcp_47": "de", - "population": 2578554, - "score": 0.49 - }, - { - "name": "Dutch", - "bcp_47": "nl", - "population": 6446385, - "score": 0.0 - }, - { - "name": "West Flemish", - "bcp_47": "vls", - "population": 1172070, - "score": 0.0 - }, - { - "name": "Walloon", - "bcp_47": "wa", - "population": 679801, - "score": 0.0 - } - ] - }, - "BG": { - "score": 0.18479041916167663, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 1741725, - "score": 0.47 - }, - { - "name": "Russian", - "bcp_47": "ru", - "population": 1602387, - "score": 0.45 - }, - { - "name": "German", - "bcp_47": "de", - "population": 557352, - "score": 0.49 - }, - { - "name": "Turkish", - "bcp_47": "tr", - "population": 766359, - "score": 0.44 - }, - { - "name": "Bulgarian", - "bcp_47": "bg", - "population": 6966900, - "score": 0.0 - } - ] - }, - "BI": { - "score": 0.2226670965568091, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 6289, - "score": 0.47 - }, - { - "name": "French", - "bcp_47": "fr", - "population": 7000822, - "score": 0.46 - }, - { - "name": "Swahili", - "bcp_47": "sw", - "population": 6408, - "score": 0.45 - }, - { - "name": "Rundi", - "bcp_47": "rn", - "population": 7475454, - "score": 0.0 - } - ] - }, - "BM": { - "score": 0.47, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 66010, - "score": 0.47 - } - ] - }, - "BN": { - "score": 0.05292700193318268, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 7896, - "score": 0.47 - }, - { - "name": "Chinese", - "bcp_47": "zh", - "population": 51093, - "score": 0.46 - }, - { - "name": "Malay", - "bcp_47": "ms", - "population": 455189, - "score": 0.0 - } - ] - }, - "BR": { - "score": 0.45070787745315494, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 16937280, - "score": 0.47 - }, - { - "name": "Spanish", - "bcp_47": "es", - "population": 76218, - "score": 0.45 - }, - { - "name": "Portuguese", - "bcp_47": "pt", - "population": 192661560, - "score": 0.45 - }, - { - "name": "German", - "bcp_47": "de", - "population": 1778414, - "score": 0.49 - }, - { - "name": "Japanese", - "bcp_47": "ja", - "population": 444604, - "score": 0.46 - }, - { - "name": "Korean", - "bcp_47": "ko", - "population": 44460, - "score": 0.41 - }, - { - "name": "Italian", - "bcp_47": "it", - "population": 592805, - "score": 0.47 - }, - { - "name": "Venetian", - "bcp_47": "vec", - "population": 508118, - "score": 0.0 - }, - { - "name": "Kaingang", - "bcp_47": "kgp", - "population": 50812, - "score": 0.0 - }, - { - "name": "Nheengatu", - "bcp_47": "yrl", - "population": 21172, - "score": 0.0 - }, - { - "name": "Guajajára", - "bcp_47": "gub", - "population": 17784, - "score": 0.0 - }, - { - "name": "Xavánte", - "bcp_47": "xav", - "population": 9951, - "score": 0.0 - } - ] - }, - "BS": { - "score": 0.47, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 337721, - "score": 0.47 - } - ] - }, - "BT": { - "score": 0.05505863086648988, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 86055, - "score": 0.47 - }, - { - "name": "Nepali", - "bcp_47": "ne", - "population": 132994, - "score": 0.0 - }, - { - "name": "Dzongkha", - "bcp_47": "dz", - "population": 367689, - "score": 0.0 - }, - { - "name": "Tshangla", - "bcp_47": "tsj", - "population": 117348, - "score": 0.0 - }, - { - "name": "Lepcha", - "bcp_47": "lep", - "population": 30510, - "score": 0.0 - } - ] - }, - "BV": { - "score": 0.47, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 1, - "score": 0.47 - } - ] - }, - "BW": { - "score": 0.26574054482622333, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 1876956, - "score": 0.47 - }, - { - "name": "Afrikaans", - "bcp_47": "af", - "population": 6025, - "score": 0.0 - }, - { - "name": "Tswana", - "bcp_47": "tn", - "population": 1436683, - "score": 0.0 - } - ] - }, - "BZ": { - "score": 0.4656250134412544, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 399598, - "score": 0.47 - }, - { - "name": "Spanish", - "bcp_47": "es", - "population": 111887, - "score": 0.45 - } - ] - }, - "CA": { - "score": 0.4538591979207903, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 32416926, - "score": 0.47 - }, - { - "name": "Chinese", - "bcp_47": "zh", - "population": 678494, - "score": 0.46 - }, - { - "name": "Hindi", - "bcp_47": "hi", - "population": 188470, - "score": 0.46 - }, - { - "name": "Spanish", - "bcp_47": "es", - "population": 603106, - "score": 0.45 - }, - { - "name": "Arabic", - "bcp_47": "ar", - "population": 565412, - "score": 0.42 - }, - { - "name": "Urdu", - "bcp_47": "ur", - "population": 286475, - "score": 0.42 - }, - { - "name": "French", - "bcp_47": "fr", - "population": 11308230, - "score": 0.46 - }, - { - "name": "Bangla", - "bcp_47": "bn", - "population": 90466, - "score": 0.38 - }, - { - "name": "Portuguese", - "bcp_47": "pt", - "population": 229934, - "score": 0.45 - }, - { - "name": "Punjabi", - "bcp_47": "pa", - "population": 603106, - "score": 0.43 - }, - { - "name": "Russian", - "bcp_47": "ru", - "population": 211087, - "score": 0.45 - }, - { - "name": "German", - "bcp_47": "de", - "population": 294014, - "score": 0.49 - }, - { - "name": "Japanese", - "bcp_47": "ja", - "population": 52772, - "score": 0.46 - }, - { - "name": "Vietnamese", - "bcp_47": "vi", - "population": 184701, - "score": 0.45 - }, - { - "name": "Tamil", - "bcp_47": "ta", - "population": 184701, - "score": 0.41 - }, - { - "name": "Persian", - "bcp_47": "fa", - "population": 245012, - "score": 0.41 - }, - { - "name": "Turkish", - "bcp_47": "tr", - "population": 37694, - "score": 0.44 - }, - { - "name": "Cantonese", - "bcp_47": "yue", - "population": 640800, - "score": 0.39 - }, - { - "name": "Korean", - "bcp_47": "ko", - "population": 169623, - "score": 0.41 - }, - { - "name": "Italian", - "bcp_47": "it", - "population": 343016, - "score": 0.47 - }, - { - "name": "Filipino", - "bcp_47": "fil", - "population": 565412, - "score": 0.42 - }, - { - "name": "Gujarati", - "bcp_47": "gu", - "population": 135699, - "score": 0.42 - }, - { - "name": "Polish", - "bcp_47": "pl", - "population": 173393, - "score": 0.0 - }, - { - "name": "Dutch", - "bcp_47": "nl", - "population": 56541, - "score": 0.0 - }, - { - "name": "Ukrainian", - "bcp_47": "uk", - "population": 75388, - "score": 0.0 - }, - { - "name": "Romanian", - "bcp_47": "ro", - "population": 101774, - "score": 0.0 - }, - { - "name": "Somali", - "bcp_47": "so", - "population": 49002, - "score": 0.0 - }, - { - "name": "Serbian", - "bcp_47": "sr", - "population": 64080, - "score": 0.0 - }, - { - "name": "Hungarian", - "bcp_47": "hu", - "population": 49002, - "score": 0.0 - }, - { - "name": "Greek", - "bcp_47": "el", - "population": 124391, - "score": 0.0 - }, - { - "name": "Croatian", - "bcp_47": "hr", - "population": 45233, - "score": 0.0 - }, - { - "name": "Waray", - "bcp_47": "war", - "population": 678, - "score": 0.0 - }, - { - "name": "Inuktitut", - "bcp_47": "iu", - "population": 90466, - "score": 0.0 - }, - { - "name": "Plautdietsch", - "bcp_47": "pdt", - "population": 90466, - "score": 0.0 - }, - { - "name": "Ojibwa", - "bcp_47": "oj", - "population": 23747, - "score": 0.0 - }, - { - "name": "Dakota", - "bcp_47": "dak", - "population": 1206, - "score": 0.0 - }, - { - "name": "Oji-Cree", - "bcp_47": "ojs", - "population": 15078, - "score": 0.0 - }, - { - "name": "Chipewyan", - "bcp_47": "chp", - "population": 12816, - "score": 0.0 - }, - { - "name": "Innu-aimun", - "bcp_47": "moe", - "population": 12062, - "score": 0.0 - }, - { - "name": "Cree", - "bcp_47": "cr", - "population": 9047, - "score": 0.0 - }, - { - "name": "Mi'kmaw", - "bcp_47": "mic", - "population": 7916, - "score": 0.0 - }, - { - "name": "Atikamekw", - "bcp_47": "atj", - "population": 6408, - "score": 0.0 - }, - { - "name": "Siksiká", - "bcp_47": "bla", - "population": 4900, - "score": 0.0 - }, - { - "name": "Plains Cree", - "bcp_47": "crk", - "population": 4146, - "score": 0.0 - }, - { - "name": "Slave", - "bcp_47": "den", - "population": 2299, - "score": 0.0 - }, - { - "name": "Dogrib", - "bcp_47": "dgr", - "population": 2111, - "score": 0.0 - }, - { - "name": "Swampy Cree", - "bcp_47": "csw", - "population": 1809, - "score": 0.0 - }, - { - "name": "Mohawk", - "bcp_47": "moh", - "population": 1772, - "score": 0.0 - }, - { - "name": "Naskapi", - "bcp_47": "nsk", - "population": 1395, - "score": 0.0 - }, - { - "name": "Chilcotin", - "bcp_47": "clc", - "population": 867, - "score": 0.0 - }, - { - "name": "Halkomelem", - "bcp_47": "hur", - "population": 716, - "score": 0.0 - }, - { - "name": "Michif", - "bcp_47": "crg", - "population": 678, - "score": 0.0 - }, - { - "name": "Lillooet", - "bcp_47": "lil", - "population": 528, - "score": 0.0 - }, - { - "name": "Okanagan", - "bcp_47": "oka", - "population": 490, - "score": 0.0 - }, - { - "name": "Maliseet-Passamaquoddy", - "bcp_47": "pqm", - "population": 490, - "score": 0.0 - }, - { - "name": "Kwakʼwala", - "bcp_47": "kwk", - "population": 377, - "score": 0.0 - }, - { - "name": "Northern East Cree", - "bcp_47": "crl", - "population": 377, - "score": 0.0 - }, - { - "name": "Gwichʼin", - "bcp_47": "gwi", - "population": 302, - "score": 0.0 - } - ] - }, - "CC": { - "score": 0.07964765100671141, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 101, - "score": 0.47 - }, - { - "name": "Malay", - "bcp_47": "ms", - "population": 495, - "score": 0.0 - } - ] - }, - "CH": { - "score": 0.33368138748580556, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 5126434, - "score": 0.47 - }, - { - "name": "French", - "bcp_47": "fr", - "population": 1764838, - "score": 0.46 - }, - { - "name": "Portuguese", - "bcp_47": "pt", - "population": 285736, - "score": 0.45 - }, - { - "name": "German", - "bcp_47": "de", - "population": 6134913, - "score": 0.49 - }, - { - "name": "Italian", - "bcp_47": "it", - "population": 361372, - "score": 0.47 - }, - { - "name": "Swiss German", - "bcp_47": "gsw", - "population": 5462594, - "score": 0.0 - }, - { - "name": "Lombard", - "bcp_47": "lmo", - "population": 344564, - "score": 0.0 - }, - { - "name": "Romansh", - "bcp_47": "rm", - "population": 42020, - "score": 0.0 - }, - { - "name": "Sinte Romani", - "bcp_47": "rmo", - "population": 24372, - "score": 0.0 - }, - { - "name": "Walser", - "bcp_47": "wae", - "population": 10085, - "score": 0.0 - } - ] - }, - "CK": { - "score": 0.47, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 8574, - "score": 0.47 - } - ] - }, - "CL": { - "score": 0.44555045871559634, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 1727746, - "score": 0.47 - }, - { - "name": "Spanish", - "bcp_47": "es", - "population": 17823064, - "score": 0.45 - }, - { - "name": "Mapuche", - "bcp_47": "arn", - "population": 272802, - "score": 0.0 - } - ] - }, - "CM": { - "score": 0.3722156934094152, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 10543100, - "score": 0.47 - }, - { - "name": "Arabic", - "bcp_47": "ar", - "population": 108206, - "score": 0.42 - }, - { - "name": "French", - "bcp_47": "fr", - "population": 18866600, - "score": 0.46 - }, - { - "name": "Hausa", - "bcp_47": "ha", - "population": 38843, - "score": 0.0 - }, - { - "name": "Fula", - "bcp_47": "ff", - "population": 998820, - "score": 0.0 - }, - { - "name": "Bulu", - "bcp_47": "bum", - "population": 1276270, - "score": 0.0 - }, - { - "name": "Ewondo", - "bcp_47": "ewo", - "population": 860095, - "score": 0.0 - }, - { - "name": "Yemba", - "bcp_47": "ybb", - "population": 443920, - "score": 0.0 - }, - { - "name": "Ngiemboon", - "bcp_47": "nnh", - "population": 388430, - "score": 0.0 - }, - { - "name": "Ghomala", - "bcp_47": "bbj", - "population": 388430, - "score": 0.0 - }, - { - "name": "Kom", - "bcp_47": "bkm", - "population": 360685, - "score": 0.0 - }, - { - "name": "Bamun", - "bcp_47": "bax", - "population": 332940, - "score": 0.0 - }, - { - "name": "Basaa", - "bcp_47": "bas", - "population": 332940, - "score": 0.0 - }, - { - "name": "Medumba", - "bcp_47": "byv", - "population": 305195, - "score": 0.0 - }, - { - "name": "Mundang", - "bcp_47": "mua", - "population": 277450, - "score": 0.0 - }, - { - "name": "Mafa", - "bcp_47": "maf", - "population": 205313, - "score": 0.0 - }, - { - "name": "Bafut", - "bcp_47": "bfd", - "population": 158146, - "score": 0.0 - }, - { - "name": "Kako", - "bcp_47": "kkj", - "population": 149823, - "score": 0.0 - }, - { - "name": "Akoose", - "bcp_47": "bss", - "population": 149823, - "score": 0.0 - }, - { - "name": "Duala", - "bcp_47": "dua", - "population": 133176, - "score": 0.0 - }, - { - "name": "Metaʼ", - "bcp_47": "mgo", - "population": 130401, - "score": 0.0 - }, - { - "name": "Ngomba", - "bcp_47": "jgo", - "population": 94333, - "score": 0.0 - }, - { - "name": "Bafia", - "bcp_47": "ksf", - "population": 88784, - "score": 0.0 - }, - { - "name": "Kenyang", - "bcp_47": "ken", - "population": 69362, - "score": 0.0 - }, - { - "name": "Aghem", - "bcp_47": "agq", - "population": 38843, - "score": 0.0 - }, - { - "name": "Kwasio", - "bcp_47": "nmg", - "population": 8878, - "score": 0.0 - }, - { - "name": "Yangben", - "bcp_47": "yav", - "population": 2303, - "score": 0.0 - } - ] - }, - "CN": { - "score": 0.38724457341349466, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 62731, - "score": 0.47 - }, - { - "name": "Chinese", - "bcp_47": "zh", - "population": 1254618000, - "score": 0.46 - }, - { - "name": "Russian", - "bcp_47": "ru", - "population": 13940, - "score": 0.45 - }, - { - "name": "Vietnamese", - "bcp_47": "vi", - "population": 6970, - "score": 0.45 - }, - { - "name": "Wu Chinese", - "bcp_47": "wuu", - "population": 83641200, - "score": 0.0 - }, - { - "name": "Cantonese", - "bcp_47": "yue", - "population": 72489040, - "score": 0.39 - }, - { - "name": "Korean", - "bcp_47": "ko", - "population": 2091030, - "score": 0.41 - }, - { - "name": "Xiang Chinese", - "bcp_47": "hsn", - "population": 40426580, - "score": 0.0 - }, - { - "name": "Uzbek", - "bcp_47": "uz", - "population": 5576, - "score": 0.0 - }, - { - "name": "Hakka Chinese", - "bcp_47": "hak", - "population": 32062460, - "score": 0.0 - }, - { - "name": "Min Nan Chinese", - "bcp_47": "nan", - "population": 26486380, - "score": 0.0 - }, - { - "name": "Gan Chinese", - "bcp_47": "gan", - "population": 23698340, - "score": 0.0 - }, - { - "name": "Kazakh", - "bcp_47": "kk", - "population": 1184917, - "score": 0.0 - }, - { - "name": "Sichuan Yi", - "bcp_47": "ii", - "population": 8364120, - "score": 0.0 - }, - { - "name": "Uyghur", - "bcp_47": "ug", - "population": 7667110, - "score": 0.0 - }, - { - "name": "Mongolian", - "bcp_47": "mn", - "population": 3624452, - "score": 0.0 - }, - { - "name": "Zhuang", - "bcp_47": "za", - "population": 4321462, - "score": 0.0 - }, - { - "name": "Kyrgyz", - "bcp_47": "ky", - "population": 473967, - "score": 0.0 - }, - { - "name": "Tibetan", - "bcp_47": "bo", - "population": 2788040, - "score": 0.0 - }, - { - "name": "Hmong Njua", - "bcp_47": "hnj", - "population": 55761, - "score": 0.0 - }, - { - "name": "Lisu", - "bcp_47": "lis", - "population": 627309, - "score": 0.0 - }, - { - "name": "Naxi", - "bcp_47": "nxq", - "population": 334565, - "score": 0.0 - }, - { - "name": "Lü", - "bcp_47": "khb", - "population": 264864, - "score": 0.0 - }, - { - "name": "Tai Nüa", - "bcp_47": "tdd", - "population": 264864, - "score": 0.0 - }, - { - "name": "Western Lawa", - "bcp_47": "lcp", - "population": 80853, - "score": 0.0 - }, - { - "name": "Literary Chinese", - "bcp_47": "lzh", - "population": 0, - "score": 0.0 - } - ] - }, - "CP": { - "score": 0.47, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 1, - "score": 0.47 - } - ] - }, - "CQ": { - "score": 0.47, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 482, - "score": 0.47 - } - ] - }, - "CX": { - "score": 0.47, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 1389, - "score": 0.47 - } - ] - }, - "CY": { - "score": 0.2404799926753925, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 924676, - "score": 0.47 - }, - { - "name": "Arabic", - "bcp_47": "ar", - "population": 1267, - "score": 0.42 - }, - { - "name": "French", - "bcp_47": "fr", - "population": 88668, - "score": 0.46 - }, - { - "name": "Turkish", - "bcp_47": "tr", - "population": 291336, - "score": 0.44 - }, - { - "name": "Greek", - "bcp_47": "el", - "population": 1203346, - "score": 0.0 - }, - { - "name": "Armenian", - "bcp_47": "hy", - "population": 2787, - "score": 0.0 - } - ] - }, - "CZ": { - "score": 0.12805930282531847, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 2889675, - "score": 0.47 - }, - { - "name": "German", - "bcp_47": "de", - "population": 1605375, - "score": 0.49 - }, - { - "name": "Polish", - "bcp_47": "pl", - "population": 52442, - "score": 0.0 - }, - { - "name": "Czech", - "bcp_47": "cs", - "population": 10488450, - "score": 0.0 - }, - { - "name": "Slovak", - "bcp_47": "sk", - "population": 1712400, - "score": 0.0 - } - ] - }, - "DE": { - "score": 0.3765932308207555, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 51302208, - "score": 0.47 - }, - { - "name": "Spanish", - "bcp_47": "es", - "population": 4809582, - "score": 0.45 - }, - { - "name": "French", - "bcp_47": "fr", - "population": 14428746, - "score": 0.46 - }, - { - "name": "Russian", - "bcp_47": "ru", - "population": 4809582, - "score": 0.45 - }, - { - "name": "German", - "bcp_47": "de", - "population": 72945327, - "score": 0.49 - }, - { - "name": "Turkish", - "bcp_47": "tr", - "population": 2003992, - "score": 0.44 - }, - { - "name": "Italian", - "bcp_47": "it", - "population": 5611179, - "score": 0.47 - }, - { - "name": "Polish", - "bcp_47": "pl", - "population": 232463, - "score": 0.0 - }, - { - "name": "Dutch", - "bcp_47": "nl", - "population": 7214373, - "score": 0.0 - }, - { - "name": "Bavarian", - "bcp_47": "bar", - "population": 13627149, - "score": 0.0 - }, - { - "name": "Greek", - "bcp_47": "el", - "population": 304607, - "score": 0.0 - }, - { - "name": "Low German", - "bcp_47": "nds", - "population": 9619164, - "score": 0.0 - }, - { - "name": "Swiss German", - "bcp_47": "gsw", - "population": 1843673, - "score": 0.0 - }, - { - "name": "Danish", - "bcp_47": "da", - "population": 1603194, - "score": 0.0 - }, - { - "name": "Kurdish", - "bcp_47": "ku", - "population": 529054, - "score": 0.0 - }, - { - "name": "Croatian", - "bcp_47": "hr", - "population": 633262, - "score": 0.0 - }, - { - "name": "Main-Franconian", - "bcp_47": "vmf", - "population": 4809582, - "score": 0.0 - }, - { - "name": "Swabian", - "bcp_47": "swg", - "population": 801597, - "score": 0.0 - }, - { - "name": "Colognian", - "bcp_47": "ksh", - "population": 240479, - "score": 0.0 - }, - { - "name": "Upper Sorbian", - "bcp_47": "hsb", - "population": 12826, - "score": 0.0 - }, - { - "name": "Northern Frisian", - "bcp_47": "frr", - "population": 9619, - "score": 0.0 - }, - { - "name": "Lower Sorbian", - "bcp_47": "dsb", - "population": 6974, - "score": 0.0 - }, - { - "name": "Eastern Frisian", - "bcp_47": "frs", - "population": 2004, - "score": 0.0 - }, - { - "name": "Saterland Frisian", - "bcp_47": "stq", - "population": 962, - "score": 0.0 - }, - { - "name": "Palatine German", - "bcp_47": "pfl", - "population": 0, - "score": 0.0 - } - ] - }, - "DG": { - "score": 0.47, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 495, - "score": 0.47 - } - ] - }, - "DK": { - "score": 0.2649269539952979, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 5047693, - "score": 0.47 - }, - { - "name": "German", - "bcp_47": "de", - "population": 2758623, - "score": 0.49 - }, - { - "name": "Swedish", - "bcp_47": "sv", - "population": 763023, - "score": 0.0 - }, - { - "name": "Danish", - "bcp_47": "da", - "population": 5458551, - "score": 0.0 - }, - { - "name": "Faroese", - "bcp_47": "fo", - "population": 22304, - "score": 0.0 - }, - { - "name": "Kalaallisut", - "bcp_47": "kl", - "population": 7043, - "score": 0.0 - }, - { - "name": "Jutish", - "bcp_47": "jut", - "population": 0, - "score": 0.0 - } - ] - }, - "DM": { - "score": 0.47000000000000003, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 69788, - "score": 0.47 - } - ] - }, - "DO": { - "score": 0.45001946876617066, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 7980, - "score": 0.47 - }, - { - "name": "Spanish", - "bcp_47": "es", - "population": 8189766, - "score": 0.45 - } - ] - }, - "DZ": { - "score": 0.2271637127514295, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 3008103, - "score": 0.47 - }, - { - "name": "Arabic", - "bcp_47": "ar", - "population": 31799946, - "score": 0.42 - }, - { - "name": "French", - "bcp_47": "fr", - "population": 8594580, - "score": 0.46 - }, - { - "name": "Algerian Arabic", - "bcp_47": "arq", - "population": 35667507, - "score": 0.0 - }, - { - "name": "Kabyle", - "bcp_47": "kab", - "population": 3351886, - "score": 0.0 - } - ] - }, - "EE": { - "score": 0.23907703243578238, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 614310, - "score": 0.47 - }, - { - "name": "Russian", - "bcp_47": "ru", - "population": 688027, - "score": 0.45 - }, - { - "name": "Finnish", - "bcp_47": "fi", - "population": 258010, - "score": 0.0 - }, - { - "name": "Estonian", - "bcp_47": "et", - "population": 872320, - "score": 0.0 - }, - { - "name": "Võro", - "bcp_47": "vro", - "population": 70031, - "score": 0.0 - }, - { - "name": "Interlingue", - "bcp_47": "ie", - "population": 1, - "score": 0.0 - } - ] - }, - "EG": { - "score": 0.4156717299521135, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 36443400, - "score": 0.47 - }, - { - "name": "Arabic", - "bcp_47": "ar", - "population": 97876560, - "score": 0.42 - }, - { - "name": "Egyptian Arabic", - "bcp_47": "arz", - "population": 66639360, - "score": 0.38 - }, - { - "name": "Greek", - "bcp_47": "el", - "population": 63516, - "score": 0.0 - } - ] - }, - "ER": { - "score": 0.1980585154915333, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 3587908, - "score": 0.47 - }, - { - "name": "Arabic", - "bcp_47": "ar", - "population": 297979, - "score": 0.42 - }, - { - "name": "Tigrinya", - "bcp_47": "ti", - "population": 3648720, - "score": 0.0 - }, - { - "name": "Afar", - "bcp_47": "aa", - "population": 218923, - "score": 0.0 - }, - { - "name": "Tigre", - "bcp_47": "tig", - "population": 1094616, - "score": 0.0 - }, - { - "name": "Saho", - "bcp_47": "ssy", - "population": 218923, - "score": 0.0 - }, - { - "name": "Blin", - "bcp_47": "byn", - "population": 79056, - "score": 0.0 - } - ] - }, - "ES": { - "score": 0.37009809252734244, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 12003792, - "score": 0.47 - }, - { - "name": "Spanish", - "bcp_47": "es", - "population": 49515642, - "score": 0.45 - }, - { - "name": "Catalan", - "bcp_47": "ca", - "population": 8502686, - "score": 0.0 - }, - { - "name": "Galician", - "bcp_47": "gl", - "population": 3501106, - "score": 0.0 - }, - { - "name": "Occitan", - "bcp_47": "oc", - "population": 4952, - "score": 0.0 - }, - { - "name": "Basque", - "bcp_47": "eu", - "population": 1000316, - "score": 0.0 - }, - { - "name": "Asturian", - "bcp_47": "ast", - "population": 650205, - "score": 0.0 - }, - { - "name": "Extremaduran", - "bcp_47": "ext", - "population": 245077, - "score": 0.0 - }, - { - "name": "Aragonese", - "bcp_47": "an", - "population": 26008, - "score": 0.0 - } - ] - }, - "ET": { - "score": 0.15951065509076556, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 46488590, - "score": 0.47 - }, - { - "name": "Amharic", - "bcp_47": "am", - "population": 35677290, - "score": 0.0 - }, - { - "name": "Oromo", - "bcp_47": "om", - "population": 34596160, - "score": 0.0 - }, - { - "name": "Somali", - "bcp_47": "so", - "population": 6486780, - "score": 0.0 - }, - { - "name": "Tigrinya", - "bcp_47": "ti", - "population": 6486780, - "score": 0.0 - }, - { - "name": "Sidamo", - "bcp_47": "sid", - "population": 3783955, - "score": 0.0 - }, - { - "name": "Afar", - "bcp_47": "aa", - "population": 1513582, - "score": 0.0 - }, - { - "name": "Wolaytta", - "bcp_47": "wal", - "population": 1946034, - "score": 0.0 - }, - { - "name": "Geez", - "bcp_47": "gez", - "population": 0, - "score": 0.0 - } - ] - }, - "FI": { - "score": 0.18533875082776866, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 3900169, - "score": 0.47 - }, - { - "name": "Russian", - "bcp_47": "ru", - "population": 45131, - "score": 0.45 - }, - { - "name": "German", - "bcp_47": "de", - "population": 1002901, - "score": 0.49 - }, - { - "name": "Swedish", - "bcp_47": "sv", - "population": 2451535, - "score": 0.0 - }, - { - "name": "Finnish", - "bcp_47": "fi", - "population": 5237370, - "score": 0.0 - }, - { - "name": "Estonian", - "bcp_47": "et", - "population": 6129, - "score": 0.0 - }, - { - "name": "Northern Sami", - "bcp_47": "se", - "population": 2006, - "score": 0.0 - }, - { - "name": "Kalo Finnish Romani", - "bcp_47": "rmf", - "population": 5015, - "score": 0.0 - }, - { - "name": "Skolt Sami", - "bcp_47": "sms", - "population": 613, - "score": 0.0 - }, - { - "name": "Inari Sami", - "bcp_47": "smn", - "population": 613, - "score": 0.0 - } - ] - }, - "FJ": { - "score": 0.2951391687808469, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 879816, - "score": 0.47 - }, - { - "name": "Hindi", - "bcp_47": "hi", - "population": 411829, - "score": 0.46 - }, - { - "name": "Fiji Hindi", - "bcp_47": "hif", - "population": 383749, - "score": 0.0 - }, - { - "name": "Fijian", - "bcp_47": "fj", - "population": 365030, - "score": 0.0 - }, - { - "name": "Rotuman", - "bcp_47": "rtm", - "population": 2527, - "score": 0.0 - } - ] - }, - "FK": { - "score": 0.47, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 2814, - "score": 0.47 - } - ] - }, - "FM": { - "score": 0.2107792806285859, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 58389, - "score": 0.47 - }, - { - "name": "Chuukese", - "bcp_47": "chk", - "population": 30731, - "score": 0.0 - }, - { - "name": "Pohnpeian", - "bcp_47": "pon", - "population": 23560, - "score": 0.0 - }, - { - "name": "Kosraean", - "bcp_47": "kos", - "population": 7990, - "score": 0.0 - }, - { - "name": "Yapese", - "bcp_47": "yap", - "population": 6556, - "score": 0.0 - }, - { - "name": "Ulithian", - "bcp_47": "uli", - "population": 2971, - "score": 0.0 - } - ] - }, - "FR": { - "score": 0.4436463938115849, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 26460798, - "score": 0.47 - }, - { - "name": "Spanish", - "bcp_47": "es", - "population": 8820266, - "score": 0.45 - }, - { - "name": "French", - "bcp_47": "fr", - "population": 67169718, - "score": 0.46 - }, - { - "name": "Portuguese", - "bcp_47": "pt", - "population": 882027, - "score": 0.45 - }, - { - "name": "German", - "bcp_47": "de", - "population": 3392410, - "score": 0.49 - }, - { - "name": "Italian", - "bcp_47": "it", - "population": 1153419, - "score": 0.47 - }, - { - "name": "Dutch", - "bcp_47": "nl", - "population": 88203, - "score": 0.0 - }, - { - "name": "Catalan", - "bcp_47": "ca", - "population": 115342, - "score": 0.0 - }, - { - "name": "Swiss German", - "bcp_47": "gsw", - "population": 617419, - "score": 0.0 - }, - { - "name": "Occitan", - "bcp_47": "oc", - "population": 2035446, - "score": 0.0 - }, - { - "name": "Basque", - "bcp_47": "eu", - "population": 88203, - "score": 0.0 - }, - { - "name": "Hmong Njua", - "bcp_47": "hnj", - "population": 128912, - "score": 0.0 - }, - { - "name": "Picard", - "bcp_47": "pcd", - "population": 746330, - "score": 0.0 - }, - { - "name": "Breton", - "bcp_47": "br", - "population": 563140, - "score": 0.0 - }, - { - "name": "Corsican", - "bcp_47": "co", - "population": 162836, - "score": 0.0 - }, - { - "name": "Arpitan", - "bcp_47": "frp", - "population": 63777, - "score": 0.0 - }, - { - "name": "Interlingua", - "bcp_47": "ia", - "population": 136, - "score": 0.0 - } - ] - }, - "GB": { - "score": 0.43956766255639257, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 64445878, - "score": 0.47 - }, - { - "name": "Chinese", - "bcp_47": "zh", - "population": 197283, - "score": 0.46 - }, - { - "name": "Spanish", - "bcp_47": "es", - "population": 5260888, - "score": 0.45 - }, - { - "name": "Arabic", - "bcp_47": "ar", - "population": 197283, - "score": 0.42 - }, - { - "name": "Urdu", - "bcp_47": "ur", - "population": 2301638, - "score": 0.42 - }, - { - "name": "French", - "bcp_47": "fr", - "population": 15125053, - "score": 0.46 - }, - { - "name": "Bangla", - "bcp_47": "bn", - "population": 263044, - "score": 0.38 - }, - { - "name": "Portuguese", - "bcp_47": "pt", - "population": 131522, - "score": 0.45 - }, - { - "name": "Punjabi", - "bcp_47": "pa", - "population": 2367400, - "score": 0.43 - }, - { - "name": "German", - "bcp_47": "de", - "population": 5918499, - "score": 0.49 - }, - { - "name": "Tamil", - "bcp_47": "ta", - "population": 2104355, - "score": 0.41 - }, - { - "name": "Turkish", - "bcp_47": "tr", - "population": 131522, - "score": 0.44 - }, - { - "name": "Italian", - "bcp_47": "it", - "population": 131522, - "score": 0.47 - }, - { - "name": "Gujarati", - "bcp_47": "gu", - "population": 1907072, - "score": 0.42 - }, - { - "name": "Polish", - "bcp_47": "pl", - "population": 2630444, - "score": 0.0 - }, - { - "name": "Somali", - "bcp_47": "so", - "population": 131522, - "score": 0.0 - }, - { - "name": "Lithuanian", - "bcp_47": "lt", - "population": 131522, - "score": 0.0 - }, - { - "name": "Scots", - "bcp_47": "sco", - "population": 1644028, - "score": 0.0 - }, - { - "name": "Irish", - "bcp_47": "ga", - "population": 98642, - "score": 0.0 - }, - { - "name": "Welsh", - "bcp_47": "cy", - "population": 854894, - "score": 0.0 - }, - { - "name": "Scottish Gaelic", - "bcp_47": "gd", - "population": 72337, - "score": 0.0 - }, - { - "name": "Cornish", - "bcp_47": "kw", - "population": 1973, - "score": 0.0 - } - ] - }, - "GD": { - "score": 0.47, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 108570, - "score": 0.47 - } - ] - }, - "GG": { - "score": 0.47, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 67052, - "score": 0.47 - } - ] - }, - "GH": { - "score": 0.11322182754078493, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 6161442, - "score": 0.47 - }, - { - "name": "Hausa", - "bcp_47": "ha", - "population": 252326, - "score": 0.0 - }, - { - "name": "Akan", - "bcp_47": "ak", - "population": 11442678, - "score": 0.0 - }, - { - "name": "Fula", - "bcp_47": "ff", - "population": 0, - "score": 0.0 - }, - { - "name": "Ewe", - "bcp_47": "ee", - "population": 3227422, - "score": 0.0 - }, - { - "name": "Abron", - "bcp_47": "abr", - "population": 1467010, - "score": 0.0 - }, - { - "name": "Frafra", - "bcp_47": "gur", - "population": 1026907, - "score": 0.0 - }, - { - "name": "Adangme", - "bcp_47": "ada", - "population": 880206, - "score": 0.0 - }, - { - "name": "Ga", - "bcp_47": "gaa", - "population": 821526, - "score": 0.0 - }, - { - "name": "Nzima", - "bcp_47": "nzi", - "population": 293402, - "score": 0.0 - }, - { - "name": "Safaliba", - "bcp_47": "saf", - "population": 4108, - "score": 0.0 - } - ] - }, - "GI": { - "score": 0.46230789234169806, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 23665, - "score": 0.47 - }, - { - "name": "Spanish", - "bcp_47": "es", - "population": 14790, - "score": 0.45 - } - ] - }, - "GM": { - "score": 0.27246376811594203, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 869600, - "score": 0.47 - }, - { - "name": "Fula", - "bcp_47": "ff", - "population": 0, - "score": 0.0 - }, - { - "name": "Mandingo", - "bcp_47": "man", - "population": 630460, - "score": 0.0 - } - ] - }, - "GR": { - "score": 0.18194383576443016, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 5409621, - "score": 0.47 - }, - { - "name": "French", - "bcp_47": "fr", - "population": 954639, - "score": 0.46 - }, - { - "name": "German", - "bcp_47": "de", - "population": 530355, - "score": 0.49 - }, - { - "name": "Turkish", - "bcp_47": "tr", - "population": 127285, - "score": 0.44 - }, - { - "name": "Greek", - "bcp_47": "el", - "population": 10501029, - "score": 0.0 - }, - { - "name": "Bulgarian", - "bcp_47": "bg", - "population": 28639, - "score": 0.0 - }, - { - "name": "Albanian", - "bcp_47": "sq", - "population": 9971, - "score": 0.0 - }, - { - "name": "Macedonian", - "bcp_47": "mk", - "population": 169714, - "score": 0.0 - }, - { - "name": "Pontic", - "bcp_47": "pnt", - "population": 392463, - "score": 0.0 - }, - { - "name": "Tsakonian", - "bcp_47": "tsd", - "population": 202, - "score": 0.0 - } - ] - }, - "GS": { - "score": 0.4699999999999999, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 20, - "score": 0.47 - } - ] - }, - "GU": { - "score": 0.37849481059730655, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 153321, - "score": 0.47 - }, - { - "name": "Chamorro", - "bcp_47": "ch", - "population": 37067, - "score": 0.0 - } - ] - }, - "GY": { - "score": 0.47000000000000003, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 750204, - "score": 0.47 - } - ] - }, - "HK": { - "score": 0.4359751035397035, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 3697454, - "score": 0.47 - }, - { - "name": "Chinese", - "bcp_47": "zh", - "population": 7249910, - "score": 0.46 - }, - { - "name": "Cantonese", - "bcp_47": "yue", - "population": 6524919, - "score": 0.39 - } - ] - }, - "HM": { - "score": 0.47, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 1, - "score": 0.47 - } - ] - }, - "HN": { - "score": 0.45011218630076477, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 40635, - "score": 0.47 - }, - { - "name": "Spanish", - "bcp_47": "es", - "population": 7203565, - "score": 0.45 - } - ] - }, - "HR": { - "score": 0.15823024946225459, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 2071598, - "score": 0.47 - }, - { - "name": "Italian", - "bcp_47": "it", - "population": 67644, - "score": 0.47 - }, - { - "name": "Croatian", - "bcp_47": "hr", - "population": 4185472, - "score": 0.0 - }, - { - "name": "Venetian", - "bcp_47": "vec", - "population": 29594, - "score": 0.0 - } - ] - }, - "HU": { - "score": 0.13756219151316587, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 1954366, - "score": 0.47 - }, - { - "name": "French", - "bcp_47": "fr", - "population": 293155, - "score": 0.46 - }, - { - "name": "German", - "bcp_47": "de", - "population": 1758929, - "score": 0.49 - }, - { - "name": "Romanian", - "bcp_47": "ro", - "population": 96741, - "score": 0.0 - }, - { - "name": "Hungarian", - "bcp_47": "hu", - "population": 9771830, - "score": 0.0 - }, - { - "name": "Croatian", - "bcp_47": "hr", - "population": 31270, - "score": 0.0 - }, - { - "name": "Slovak", - "bcp_47": "sk", - "population": 11726, - "score": 0.0 - }, - { - "name": "Slovenian", - "bcp_47": "sl", - "population": 4984, - "score": 0.0 - } - ] - }, - "IE": { - "score": 0.3932846989826846, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 5073039, - "score": 0.47 - }, - { - "name": "French", - "bcp_47": "fr", - "population": 880017, - "score": 0.46 - }, - { - "name": "Irish", - "bcp_47": "ga", - "population": 1138845, - "score": 0.0 - } - ] - }, - "IL": { - "score": 0.21817259544999, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 7374158, - "score": 0.47 - }, - { - "name": "Arabic", - "bcp_47": "ar", - "population": 1735096, - "score": 0.42 - }, - { - "name": "Russian", - "bcp_47": "ru", - "population": 954303, - "score": 0.45 - }, - { - "name": "Malayalam", - "bcp_47": "ml", - "population": 7981, - "score": 0.0 - }, - { - "name": "Polish", - "bcp_47": "pl", - "population": 130132, - "score": 0.0 - }, - { - "name": "North Levantine Arabic", - "bcp_47": "apc", - "population": 1474832, - "score": 0.0 - }, - { - "name": "Amharic", - "bcp_47": "am", - "population": 51185, - "score": 0.0 - }, - { - "name": "Romanian", - "bcp_47": "ro", - "population": 320993, - "score": 0.0 - }, - { - "name": "Hungarian", - "bcp_47": "hu", - "population": 86755, - "score": 0.0 - }, - { - "name": "Tigrinya", - "bcp_47": "ti", - "population": 10411, - "score": 0.0 - }, - { - "name": "Hebrew", - "bcp_47": "he", - "population": 8675480, - "score": 0.0 - }, - { - "name": "Yiddish", - "bcp_47": "yi", - "population": 260264, - "score": 0.0 - }, - { - "name": "Ladino", - "bcp_47": "lad", - "population": 112781, - "score": 0.0 - } - ] - }, - "IM": { - "score": 0.4612389121429656, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 90499, - "score": 0.47 - }, - { - "name": "Manx", - "bcp_47": "gv", - "population": 1719, - "score": 0.0 - } - ] - }, - "IN": { - "score": 0.3397907454052606, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 251957100, - "score": 0.47 - }, - { - "name": "Hindi", - "bcp_47": "hi", - "population": 545022990, - "score": 0.46 - }, - { - "name": "Urdu", - "bcp_47": "ur", - "population": 66304500, - "score": 0.42 - }, - { - "name": "Bangla", - "bcp_47": "bn", - "population": 107413290, - "score": 0.38 - }, - { - "name": "Punjabi", - "bcp_47": "pa", - "population": 37130520, - "score": 0.43 - }, - { - "name": "Telugu", - "bcp_47": "te", - "population": 95478480, - "score": 0.41 - }, - { - "name": "Western Panjabi", - "bcp_47": "lah", - "population": 33152, - "score": 0.0 - }, - { - "name": "Marathi", - "bcp_47": "mr", - "population": 92826300, - "score": 0.45 - }, - { - "name": "Tamil", - "bcp_47": "ta", - "population": 78239310, - "score": 0.41 - }, - { - "name": "Gujarati", - "bcp_47": "gu", - "population": 59674050, - "score": 0.42 - }, - { - "name": "Kannada", - "bcp_47": "kn", - "population": 49065330, - "score": 0.0 - }, - { - "name": "Malayalam", - "bcp_47": "ml", - "population": 42434880, - "score": 0.0 - }, - { - "name": "Odia", - "bcp_47": "or", - "population": 42434880, - "score": 0.0 - }, - { - "name": "Sindhi", - "bcp_47": "sd", - "population": 5304360, - "score": 0.0 - }, - { - "name": "Bhojpuri", - "bcp_47": "bho", - "population": 30500070, - "score": 0.0 - }, - { - "name": "Awadhi", - "bcp_47": "awa", - "population": 25195710, - "score": 0.0 - }, - { - "name": "Nepali", - "bcp_47": "ne", - "population": 7426104, - "score": 0.0 - }, - { - "name": "Maithili", - "bcp_47": "mai", - "population": 15913080, - "score": 0.0 - }, - { - "name": "Assamese", - "bcp_47": "as", - "population": 17239170, - "score": 0.0 - }, - { - "name": "Rangpuri", - "bcp_47": "rkt", - "population": 5702187, - "score": 0.0 - }, - { - "name": "Magahi", - "bcp_47": "mag", - "population": 15913080, - "score": 0.0 - }, - { - "name": "Haryanvi", - "bcp_47": "bgc", - "population": 15913080, - "score": 0.0 - }, - { - "name": "Marwari", - "bcp_47": "mwr", - "population": 15913080, - "score": 0.0 - }, - { - "name": "Chhattisgarhi", - "bcp_47": "hne", - "population": 14586990, - "score": 0.0 - }, - { - "name": "Deccan", - "bcp_47": "dcc", - "population": 13128291, - "score": 0.0 - }, - { - "name": "Kanauji", - "bcp_47": "bjj", - "population": 7426104, - "score": 0.0 - }, - { - "name": "Santali", - "bcp_47": "sat", - "population": 7293495, - "score": 0.0 - }, - { - "name": "Mewati", - "bcp_47": "wtm", - "population": 6100014, - "score": 0.0 - }, - { - "name": "Kashmiri", - "bcp_47": "ks", - "population": 5436969, - "score": 0.0 - }, - { - "name": "Konkani", - "bcp_47": "kok", - "population": 4906533, - "score": 0.0 - }, - { - "name": "Goan Konkani", - "bcp_47": "gom", - "population": 4243488, - "score": 0.0 - }, - { - "name": "Shekhawati", - "bcp_47": "swv", - "population": 3713052, - "score": 0.0 - }, - { - "name": "Lambadi", - "bcp_47": "lmn", - "population": 3580443, - "score": 0.0 - }, - { - "name": "Garhwali", - "bcp_47": "gbm", - "population": 3580443, - "score": 0.0 - }, - { - "name": "Gondi", - "bcp_47": "gon", - "population": 3182616, - "score": 0.0 - }, - { - "name": "Tibetan", - "bcp_47": "bo", - "population": 145870, - "score": 0.0 - }, - { - "name": "Kumaoni", - "bcp_47": "kfy", - "population": 2917398, - "score": 0.0 - }, - { - "name": "Dogri", - "bcp_47": "doi", - "population": 2652180, - "score": 0.0 - }, - { - "name": "Kurukh", - "bcp_47": "kru", - "population": 2519571, - "score": 0.0 - }, - { - "name": "Sadri", - "bcp_47": "sck", - "population": 2386962, - "score": 0.0 - }, - { - "name": "Waddar", - "bcp_47": "wbq", - "population": 2386962, - "score": 0.0 - }, - { - "name": "Kangri", - "bcp_47": "xnr", - "population": 2121744, - "score": 0.0 - }, - { - "name": "Wagdi", - "bcp_47": "wbr", - "population": 1989135, - "score": 0.0 - }, - { - "name": "Tulu", - "bcp_47": "tcy", - "population": 1989135, - "score": 0.0 - }, - { - "name": "Khandesi", - "bcp_47": "khn", - "population": 1989135, - "score": 0.0 - }, - { - "name": "Bodo", - "bcp_47": "brx", - "population": 1856526, - "score": 0.0 - }, - { - "name": "Nimadi", - "bcp_47": "noe", - "population": 1723917, - "score": 0.0 - }, - { - "name": "Bhili", - "bcp_47": "bhb", - "population": 1591308, - "score": 0.0 - }, - { - "name": "Manipuri", - "bcp_47": "mni", - "population": 1458699, - "score": 0.0 - }, - { - "name": "Rajasthani", - "bcp_47": "raj", - "population": 1326090, - "score": 0.0 - }, - { - "name": "Ho", - "bcp_47": "hoc", - "population": 1312829, - "score": 0.0 - }, - { - "name": "Mewari", - "bcp_47": "mtr", - "population": 1286307, - "score": 0.0 - }, - { - "name": "Mundari", - "bcp_47": "unr", - "population": 1246525, - "score": 0.0 - }, - { - "name": "Bhilali", - "bcp_47": "bhi", - "population": 1220003, - "score": 0.0 - }, - { - "name": "Hadothi", - "bcp_47": "hoj", - "population": 1087394, - "score": 0.0 - }, - { - "name": "Khasi", - "bcp_47": "kha", - "population": 1060872, - "score": 0.0 - }, - { - "name": "Kachhi", - "bcp_47": "kfr", - "population": 994568, - "score": 0.0 - }, - { - "name": "Garo", - "bcp_47": "grt", - "population": 702828, - "score": 0.0 - }, - { - "name": "Chakma", - "bcp_47": "ccp", - "population": 371305, - "score": 0.0 - }, - { - "name": "Bagheli", - "bcp_47": "bfy", - "population": 490653, - "score": 0.0 - }, - { - "name": "Munda", - "bcp_47": "unx", - "population": 636523, - "score": 0.0 - }, - { - "name": "Balti", - "bcp_47": "bft", - "population": 82218, - "score": 0.0 - }, - { - "name": "Sirmauri", - "bcp_47": "srx", - "population": 464132, - "score": 0.0 - }, - { - "name": "Divehi", - "bcp_47": "dv", - "population": 3978, - "score": 0.0 - }, - { - "name": "Saurashtra", - "bcp_47": "saz", - "population": 384566, - "score": 0.0 - }, - { - "name": "Dzongkha", - "bcp_47": "dz", - "population": 2652, - "score": 0.0 - }, - { - "name": "Limbu", - "bcp_47": "lif", - "population": 34478, - "score": 0.0 - }, - { - "name": "Ao Naga", - "bcp_47": "njo", - "population": 305001, - "score": 0.0 - }, - { - "name": "Badaga", - "bcp_47": "bfq", - "population": 305001, - "score": 0.0 - }, - { - "name": "Riang (India)", - "bcp_47": "ria", - "population": 172392, - "score": 0.0 - }, - { - "name": "Bishnupriya", - "bcp_47": "bpy", - "population": 90174, - "score": 0.0 - }, - { - "name": "Lepcha", - "bcp_47": "lep", - "population": 46413, - "score": 0.0 - }, - { - "name": "Bateri", - "bcp_47": "btv", - "population": 34478, - "score": 0.0 - }, - { - "name": "Braj", - "bcp_47": "bra", - "population": 54370, - "score": 0.0 - }, - { - "name": "Kuvi", - "bcp_47": "kxv", - "population": 38457, - "score": 0.0 - }, - { - "name": "Sanskrit", - "bcp_47": "sa", - "population": 15913, - "score": 0.0 - }, - { - "name": "Khamti", - "bcp_47": "kht", - "population": 9283, - "score": 0.0 - } - ] - }, - "IO": { - "score": 0.47, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 3500, - "score": 0.47 - } - ] - }, - "IQ": { - "score": 0.357837983423388, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 13605445, - "score": 0.47 - }, - { - "name": "Arabic", - "bcp_47": "ar", - "population": 26433436, - "score": 0.42 - }, - { - "name": "Persian", - "bcp_47": "fa", - "population": 338192, - "score": 0.41 - }, - { - "name": "Azerbaijani", - "bcp_47": "az", - "population": 699709, - "score": 0.0 - }, - { - "name": "Central Kurdish", - "bcp_47": "ckb", - "population": 7774540, - "score": 0.0 - }, - { - "name": "Northern Luri", - "bcp_47": "lrc", - "population": 237123, - "score": 0.0 - }, - { - "name": "Syriac", - "bcp_47": "syr", - "population": 194364, - "score": 0.0 - } - ] - }, - "IT": { - "score": 0.43224641662655555, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 21216918, - "score": 0.47 - }, - { - "name": "French", - "bcp_47": "fr", - "population": 3931370, - "score": 0.46 - }, - { - "name": "German", - "bcp_47": "de", - "population": 998443, - "score": 0.49 - }, - { - "name": "Italian", - "bcp_47": "it", - "population": 59282565, - "score": 0.47 - }, - { - "name": "Greek", - "bcp_47": "el", - "population": 21841, - "score": 0.0 - }, - { - "name": "Catalan", - "bcp_47": "ca", - "population": 21841, - "score": 0.0 - }, - { - "name": "Croatian", - "bcp_47": "hr", - "population": 3495, - "score": 0.0 - }, - { - "name": "Lombard", - "bcp_47": "lmo", - "population": 3556954, - "score": 0.0 - }, - { - "name": "Slovenian", - "bcp_47": "sl", - "population": 106085, - "score": 0.0 - }, - { - "name": "Venetian", - "bcp_47": "vec", - "population": 811235, - "score": 0.0 - }, - { - "name": "Sardinian", - "bcp_47": "sc", - "population": 1060846, - "score": 0.0 - }, - { - "name": "Neapolitan", - "bcp_47": "nap", - "population": 605306, - "score": 0.0 - }, - { - "name": "Ligurian", - "bcp_47": "lij", - "population": 536663, - "score": 0.0 - }, - { - "name": "Sicilian", - "bcp_47": "scn", - "population": 511702, - "score": 0.0 - }, - { - "name": "Sassarese Sardinian", - "bcp_47": "sdc", - "population": 106085, - "score": 0.0 - }, - { - "name": "Friulian", - "bcp_47": "fur", - "population": 37442, - "score": 0.0 - }, - { - "name": "Emilian", - "bcp_47": "egl", - "population": 31201, - "score": 0.0 - }, - { - "name": "Piedmontese", - "bcp_47": "pms", - "population": 6178, - "score": 0.0 - }, - { - "name": "Romagnol", - "bcp_47": "rgn", - "population": 0, - "score": 0.0 - } - ] - }, - "JE": { - "score": 0.47000000000000003, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 96019, - "score": 0.47 - } - ] - }, - "JM": { - "score": 0.2386528447990708, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 2752399, - "score": 0.47 - }, - { - "name": "Jamaican Creole English", - "bcp_47": "jam", - "population": 2668142, - "score": 0.0 - } - ] - }, - "JO": { - "score": 0.29928909952606636, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 4869270, - "score": 0.47 - }, - { - "name": "Arabic", - "bcp_47": "ar", - "population": 10820600, - "score": 0.42 - }, - { - "name": "North Levantine Arabic", - "bcp_47": "apc", - "population": 7141596, - "score": 0.0 - } - ] - }, - "KE": { - "score": 0.2501476621404106, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 10170301, - "score": 0.47 - }, - { - "name": "Arabic", - "bcp_47": "ar", - "population": 24623, - "score": 0.42 - }, - { - "name": "Punjabi", - "bcp_47": "pa", - "population": 10170, - "score": 0.43 - }, - { - "name": "Swahili", - "bcp_47": "sw", - "population": 35328414, - "score": 0.45 - }, - { - "name": "Gujarati", - "bcp_47": "gu", - "population": 4978, - "score": 0.42 - }, - { - "name": "Oromo", - "bcp_47": "om", - "population": 251581, - "score": 0.0 - }, - { - "name": "Somali", - "bcp_47": "so", - "population": 695863, - "score": 0.0 - }, - { - "name": "Kikuyu", - "bcp_47": "ki", - "population": 9099743, - "score": 0.0 - }, - { - "name": "Luyia", - "bcp_47": "luy", - "population": 5888069, - "score": 0.0 - }, - { - "name": "Luo (Kenya and Tanzania)", - "bcp_47": "luo", - "population": 5245734, - "score": 0.0 - }, - { - "name": "Kamba", - "bcp_47": "kam", - "population": 4068120, - "score": 0.0 - }, - { - "name": "Kalenjin", - "bcp_47": "kln", - "population": 4068120, - "score": 0.0 - }, - { - "name": "Gusii", - "bcp_47": "guz", - "population": 2622867, - "score": 0.0 - }, - { - "name": "Meru", - "bcp_47": "mer", - "population": 2141116, - "score": 0.0 - }, - { - "name": "Teso", - "bcp_47": "teo", - "population": 396106, - "score": 0.0 - }, - { - "name": "Masai", - "bcp_47": "mas", - "population": 856446, - "score": 0.0 - }, - { - "name": "Embu", - "bcp_47": "ebu", - "population": 802918, - "score": 0.0 - }, - { - "name": "Taita", - "bcp_47": "dav", - "population": 438929, - "score": 0.0 - }, - { - "name": "Pökoot", - "bcp_47": "pko", - "population": 369343, - "score": 0.0 - }, - { - "name": "Samburu", - "bcp_47": "saq", - "population": 246228, - "score": 0.0 - } - ] - }, - "KI": { - "score": 0.29374934311302925, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 111796, - "score": 0.47 - }, - { - "name": "Gilbertese", - "bcp_47": "gil", - "population": 67078, - "score": 0.0 - } - ] - }, - "KN": { - "score": 0.47, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 52745, - "score": 0.47 - } - ] - }, - "KY": { - "score": 0.47, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 60705, - "score": 0.47 - } - ] - }, - "KZ": { - "score": 0.2671643693028198, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 2863785, - "score": 0.47 - }, - { - "name": "Russian", - "bcp_47": "ru", - "population": 13746168, - "score": 0.45 - }, - { - "name": "German", - "bcp_47": "de", - "population": 1221882, - "score": 0.49 - }, - { - "name": "Kazakh", - "bcp_47": "kk", - "population": 12218816, - "score": 0.0 - }, - { - "name": "Uyghur", - "bcp_47": "ug", - "population": 381838, - "score": 0.0 - } - ] - }, - "LB": { - "score": 0.236164974261225, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 2187844, - "score": 0.47 - }, - { - "name": "Arabic", - "bcp_47": "ar", - "population": 4703865, - "score": 0.42 - }, - { - "name": "French", - "bcp_47": "fr", - "population": 20238, - "score": 0.46 - }, - { - "name": "North Levantine Arabic", - "bcp_47": "apc", - "population": 5469610, - "score": 0.0 - }, - { - "name": "Kurdish", - "bcp_47": "ku", - "population": 92983, - "score": 0.0 - }, - { - "name": "Armenian", - "bcp_47": "hy", - "population": 284420, - "score": 0.0 - } - ] - }, - "LC": { - "score": 0.47000000000000003, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 149838, - "score": 0.47 - } - ] - }, - "LK": { - "score": 0.11666666666666665, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 2288920, - "score": 0.47 - }, - { - "name": "Tamil", - "bcp_47": "ta", - "population": 3433380, - "score": 0.41 - }, - { - "name": "Sinhala", - "bcp_47": "si", - "population": 15564656, - "score": 0.0 - } - ] - }, - "LR": { - "score": 0.3897881418272767, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 4210839, - "score": 0.47 - }, - { - "name": "Fula", - "bcp_47": "ff", - "population": 0, - "score": 0.0 - }, - { - "name": "Mende", - "bcp_47": "men", - "population": 24352, - "score": 0.0 - }, - { - "name": "Kpelle", - "bcp_47": "kpe", - "population": 710262, - "score": 0.0 - }, - { - "name": "Vai", - "bcp_47": "vai", - "population": 131906, - "score": 0.0 - } - ] - }, - "LS": { - "score": 0.08912144167455979, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 531719, - "score": 0.47 - }, - { - "name": "Zulu", - "bcp_47": "zu", - "population": 275706, - "score": 0.0 - }, - { - "name": "Xhosa", - "bcp_47": "xh", - "population": 19496, - "score": 0.0 - }, - { - "name": "Southern Sotho", - "bcp_47": "st", - "population": 1929943, - "score": 0.0 - }, - { - "name": "Swati", - "bcp_47": "ss", - "population": 47264, - "score": 0.0 - } - ] - }, - "LT": { - "score": 0.2785320836068621, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 1037955, - "score": 0.47 - }, - { - "name": "Russian", - "bcp_47": "ru", - "population": 2185168, - "score": 0.45 - }, - { - "name": "German", - "bcp_47": "de", - "population": 382404, - "score": 0.49 - }, - { - "name": "Lithuanian", - "bcp_47": "lt", - "population": 2349056, - "score": 0.0 - }, - { - "name": "Samogitian", - "bcp_47": "sgs", - "population": 0, - "score": 0.0 - } - ] - }, - "LU": { - "score": 0.3612802832567923, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 351893, - "score": 0.47 - }, - { - "name": "French", - "bcp_47": "fr", - "population": 546691, - "score": 0.46 - }, - { - "name": "Portuguese", - "bcp_47": "pt", - "population": 100541, - "score": 0.45 - }, - { - "name": "German", - "bcp_47": "de", - "population": 395880, - "score": 0.49 - }, - { - "name": "Luxembourgish", - "bcp_47": "lb", - "population": 421015, - "score": 0.0 - } - ] - }, - "LV": { - "score": 0.2515919974081345, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 865366, - "score": 0.47 - }, - { - "name": "Russian", - "bcp_47": "ru", - "population": 714867, - "score": 0.45 - }, - { - "name": "Latvian", - "bcp_47": "lv", - "population": 1147550, - "score": 0.0 - }, - { - "name": "Latgalian", - "bcp_47": "ltg", - "population": 167429, - "score": 0.0 - } - ] - }, - "MA": { - "score": 0.1728843489070226, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 4978638, - "score": 0.47 - }, - { - "name": "Spanish", - "bcp_47": "es", - "population": 23115, - "score": 0.45 - }, - { - "name": "Arabic", - "bcp_47": "ar", - "population": 22048254, - "score": 0.42 - }, - { - "name": "French", - "bcp_47": "fr", - "population": 7112340, - "score": 0.46 - }, - { - "name": "Moroccan Arabic", - "bcp_47": "ary", - "population": 30938679, - "score": 0.0 - }, - { - "name": "Standard Moroccan Tamazight", - "bcp_47": "zgh", - "population": 7823574, - "score": 0.0 - }, - { - "name": "Tachelhit", - "bcp_47": "shi", - "population": 6187736, - "score": 0.0 - }, - { - "name": "Riffian", - "bcp_47": "rif", - "population": 3485046, - "score": 0.0 - }, - { - "name": "Central Atlas Tamazight", - "bcp_47": "tzm", - "population": 3485047, - "score": 0.0 - } - ] - }, - "MG": { - "score": 0.22711864406779658, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 4852026, - "score": 0.47 - }, - { - "name": "French", - "bcp_47": "fr", - "population": 18599433, - "score": 0.46 - }, - { - "name": "Malagasy", - "bcp_47": "mg", - "population": 24260130, - "score": 0.0 - } - ] - }, - "MH": { - "score": 0.2633143913036755, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 72463, - "score": 0.47 - }, - { - "name": "Marshallese", - "bcp_47": "mh", - "population": 56879, - "score": 0.0 - } - ] - }, - "MO": { - "score": 0.4597552187538731, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 14133, - "score": 0.47 - }, - { - "name": "Chinese", - "bcp_47": "zh", - "population": 632892, - "score": 0.46 - }, - { - "name": "Portuguese", - "bcp_47": "pt", - "population": 30723, - "score": 0.45 - } - ] - }, - "MP": { - "score": 0.39643436802596876, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 49890, - "score": 0.47 - }, - { - "name": "Chamorro", - "bcp_47": "ch", - "population": 9258, - "score": 0.0 - } - ] - }, - "MS": { - "score": 0.47000000000000003, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 3492, - "score": 0.47 - } - ] - }, - "MT": { - "score": 0.28525492889983195, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 402395, - "score": 0.47 - }, - { - "name": "French", - "bcp_47": "fr", - "population": 50299, - "score": 0.46 - }, - { - "name": "Italian", - "bcp_47": "it", - "population": 256070, - "score": 0.47 - }, - { - "name": "Maltese", - "bcp_47": "mt", - "population": 457267, - "score": 0.0 - } - ] - }, - "MU": { - "score": 0.19243355389764255, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 993146, - "score": 0.47 - }, - { - "name": "Urdu", - "bcp_47": "ur", - "population": 71727, - "score": 0.42 - }, - { - "name": "French", - "bcp_47": "fr", - "population": 41381, - "score": 0.46 - }, - { - "name": "Tamil", - "bcp_47": "ta", - "population": 34484, - "score": 0.41 - }, - { - "name": "Bhojpuri", - "bcp_47": "bho", - "population": 372430, - "score": 0.0 - }, - { - "name": "Morisyen", - "bcp_47": "mfe", - "population": 1241433, - "score": 0.0 - } - ] - }, - "MV": { - "score": 0.20375720139116277, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 293928, - "score": 0.47 - }, - { - "name": "Divehi", - "bcp_47": "dv", - "population": 384066, - "score": 0.0 - } - ] - }, - "MW": { - "score": 0.21818583638561564, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 13353858, - "score": 0.47 - }, - { - "name": "Nyanja", - "bcp_47": "ny", - "population": 13353858, - "score": 0.0 - }, - { - "name": "Zulu", - "bcp_47": "zu", - "population": 69949, - "score": 0.0 - }, - { - "name": "Tumbuka", - "bcp_47": "tum", - "population": 1780514, - "score": 0.0 - }, - { - "name": "Nyasa Tonga", - "bcp_47": "tog", - "population": 207727, - "score": 0.0 - } - ] - }, - "MX": { - "score": 0.4435481398281213, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 16724500, - "score": 0.47 - }, - { - "name": "Spanish", - "bcp_47": "es", - "population": 106779500, - "score": 0.45 - }, - { - "name": "Venetian", - "bcp_47": "vec", - "population": 2444, - "score": 0.0 - }, - { - "name": "Yucateco", - "bcp_47": "yua", - "population": 861955, - "score": 0.0 - }, - { - "name": "Eastern Huasteca Nahuatl", - "bcp_47": "nhe", - "population": 501735, - "score": 0.0 - }, - { - "name": "Western Huasteca Nahuatl", - "bcp_47": "nhw", - "population": 501735, - "score": 0.0 - }, - { - "name": "Central Mazahua", - "bcp_47": "maz", - "population": 437410, - "score": 0.0 - }, - { - "name": "Central Huasteca Nahuatl", - "bcp_47": "nch", - "population": 244435, - "score": 0.0 - }, - { - "name": "Seri", - "bcp_47": "sei", - "population": 901, - "score": 0.0 - } - ] - }, - "MY": { - "score": 0.1619475361727729, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 6856941, - "score": 0.47 - }, - { - "name": "Chinese", - "bcp_47": "zh", - "population": 5550857, - "score": 0.46 - }, - { - "name": "Javanese", - "bcp_47": "jv", - "population": 391825, - "score": 0.41 - }, - { - "name": "Tamil", - "bcp_47": "ta", - "population": 1371388, - "score": 0.41 - }, - { - "name": "Malayalam", - "bcp_47": "ml", - "population": 48978, - "score": 0.0 - }, - { - "name": "Malay", - "bcp_47": "ms", - "population": 24489075, - "score": 0.0 - }, - { - "name": "Buginese", - "bcp_47": "bug", - "population": 25795, - "score": 0.0 - }, - { - "name": "Banjar", - "bcp_47": "bjn", - "population": 4898, - "score": 0.0 - }, - { - "name": "Iban", - "bcp_47": "iba", - "population": 816302, - "score": 0.0 - }, - { - "name": "Negeri Sembilan Malay", - "bcp_47": "zmi", - "population": 391825, - "score": 0.0 - }, - { - "name": "Central Dusun", - "bcp_47": "dtp", - "population": 182852, - "score": 0.0 - } - ] - }, - "NA": { - "score": 0.023383111654627774, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 184105, - "score": 0.47 - }, - { - "name": "German", - "bcp_47": "de", - "population": 23671, - "score": 0.49 - }, - { - "name": "Afrikaans", - "bcp_47": "af", - "population": 1972552, - "score": 0.0 - }, - { - "name": "Tswana", - "bcp_47": "tn", - "population": 14728, - "score": 0.0 - }, - { - "name": "Kuanyama", - "bcp_47": "kj", - "population": 920524, - "score": 0.0 - }, - { - "name": "Ndonga", - "bcp_47": "ng", - "population": 552315, - "score": 0.0 - }, - { - "name": "Nama", - "bcp_47": "naq", - "population": 289308, - "score": 0.0 - }, - { - "name": "Herero", - "bcp_47": "hz", - "population": 239336, - "score": 0.0 - } - ] - }, - "NF": { - "score": 0.47, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 1678, - "score": 0.47 - } - ] - }, - "NG": { - "score": 0.19759994365435074, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 113434840, - "score": 0.47 - }, - { - "name": "Arabic", - "bcp_47": "ar", - "population": 151960, - "score": 0.42 - }, - { - "name": "Nigerian Pidgin", - "bcp_47": "pcm", - "population": 44945880, - "score": 0.0 - }, - { - "name": "Hausa", - "bcp_47": "ha", - "population": 29963920, - "score": 0.0 - }, - { - "name": "Yoruba", - "bcp_47": "yo", - "population": 27823640, - "score": 0.0 - }, - { - "name": "Igbo", - "bcp_47": "ig", - "population": 27823640, - "score": 0.0 - }, - { - "name": "Nigerian Fulfulde", - "bcp_47": "fuv", - "population": 14339876, - "score": 0.0 - }, - { - "name": "Fula", - "bcp_47": "ff", - "population": 0, - "score": 0.0 - }, - { - "name": "Tiv", - "bcp_47": "tiv", - "population": 3424448, - "score": 0.0 - }, - { - "name": "Ibibio", - "bcp_47": "ibb", - "population": 2996392, - "score": 0.0 - }, - { - "name": "Efik", - "bcp_47": "efi", - "population": 2996392, - "score": 0.0 - }, - { - "name": "Bini", - "bcp_47": "bin", - "population": 1519599, - "score": 0.0 - }, - { - "name": "Jju", - "bcp_47": "kaj", - "population": 449459, - "score": 0.0 - }, - { - "name": "Tyap", - "bcp_47": "kcg", - "population": 199046, - "score": 0.0 - }, - { - "name": "Atsam", - "bcp_47": "cch", - "population": 44946, - "score": 0.0 - }, - { - "name": "Amo", - "bcp_47": "amo", - "population": 18620, - "score": 0.0 - }, - { - "name": "Obolo", - "bcp_47": "ann", - "population": 0, - "score": 0.0 - } - ] - }, - "NL": { - "score": 0.28688749989149553, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 15552360, - "score": 0.47 - }, - { - "name": "French", - "bcp_47": "fr", - "population": 5011316, - "score": 0.46 - }, - { - "name": "Indonesian", - "bcp_47": "id", - "population": 311047, - "score": 0.47 - }, - { - "name": "German", - "bcp_47": "de", - "population": 12269084, - "score": 0.49 - }, - { - "name": "Turkish", - "bcp_47": "tr", - "population": 207365, - "score": 0.44 - }, - { - "name": "Dutch", - "bcp_47": "nl", - "population": 17280400, - "score": 0.0 - }, - { - "name": "Low German", - "bcp_47": "nds", - "population": 1900844, - "score": 0.0 - }, - { - "name": "Riffian", - "bcp_47": "rif", - "population": 207365, - "score": 0.0 - }, - { - "name": "Limburgish", - "bcp_47": "li", - "population": 950422, - "score": 0.0 - }, - { - "name": "Western Frisian", - "bcp_47": "fy", - "population": 743057, - "score": 0.0 - }, - { - "name": "Gronings", - "bcp_47": "gos", - "population": 622094, - "score": 0.0 - }, - { - "name": "Zeelandic", - "bcp_47": "zea", - "population": 241926, - "score": 0.0 - } - ] - }, - "NP": { - "score": 0.018334010922876218, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 909837, - "score": 0.47 - }, - { - "name": "Hindi", - "bcp_47": "hi", - "population": 127377, - "score": 0.46 - }, - { - "name": "Bangla", - "bcp_47": "bn", - "population": 28508, - "score": 0.38 - }, - { - "name": "Bhojpuri", - "bcp_47": "bho", - "population": 2062297, - "score": 0.0 - }, - { - "name": "Awadhi", - "bcp_47": "awa", - "population": 667214, - "score": 0.0 - }, - { - "name": "Nepali", - "bcp_47": "ne", - "population": 13344276, - "score": 0.0 - }, - { - "name": "Maithili", - "bcp_47": "mai", - "population": 3336069, - "score": 0.0 - }, - { - "name": "Tibetan", - "bcp_47": "bo", - "population": 72787, - "score": 0.0 - }, - { - "name": "Mundari", - "bcp_47": "unr", - "population": 5762, - "score": 0.0 - }, - { - "name": "Newari", - "bcp_47": "new", - "population": 1000821, - "score": 0.0 - }, - { - "name": "Jumli", - "bcp_47": "jml", - "population": 970493, - "score": 0.0 - }, - { - "name": "Dotyali", - "bcp_47": "dty", - "population": 758198, - "score": 0.0 - }, - { - "name": "Bagheli", - "bcp_47": "bfy", - "population": 163771, - "score": 0.0 - }, - { - "name": "Dangaura Tharu", - "bcp_47": "thl", - "population": 606558, - "score": 0.0 - }, - { - "name": "Bantawa", - "bcp_47": "bap", - "population": 454918, - "score": 0.0 - }, - { - "name": "Western Tamang", - "bcp_47": "tdg", - "population": 394263, - "score": 0.0 - }, - { - "name": "Limbu", - "bcp_47": "lif", - "population": 333607, - "score": 0.0 - }, - { - "name": "Rana Tharu", - "bcp_47": "thr", - "population": 363935, - "score": 0.0 - }, - { - "name": "Eastern Magar", - "bcp_47": "mgp", - "population": 333607, - "score": 0.0 - }, - { - "name": "Kochila Tharu", - "bcp_47": "thq", - "population": 303279, - "score": 0.0 - }, - { - "name": "Western Magar", - "bcp_47": "mrd", - "population": 251722, - "score": 0.0 - }, - { - "name": "Sherpa", - "bcp_47": "xsr", - "population": 157705, - "score": 0.0 - }, - { - "name": "Rajbanshi", - "bcp_47": "rjs", - "population": 133443, - "score": 0.0 - }, - { - "name": "Eastern Tamang", - "bcp_47": "taj", - "population": 130410, - "score": 0.0 - }, - { - "name": "Gurung", - "bcp_47": "gvr", - "population": 87951, - "score": 0.0 - }, - { - "name": "Lepcha", - "bcp_47": "lep", - "population": 2820, - "score": 0.0 - }, - { - "name": "Kathoriya Tharu", - "bcp_47": "tkt", - "population": 72787, - "score": 0.0 - }, - { - "name": "Thulung", - "bcp_47": "tdh", - "population": 36393, - "score": 0.0 - } - ] - }, - "NR": { - "score": 0.2699324324324324, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 9350, - "score": 0.47 - }, - { - "name": "Nauru", - "bcp_47": "na", - "population": 6930, - "score": 0.0 - } - ] - }, - "NU": { - "score": 0.235, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 1120, - "score": 0.47 - }, - { - "name": "Niuean", - "bcp_47": "niu", - "population": 1120, - "score": 0.0 - } - ] - }, - "NZ": { - "score": 0.45694448388813996, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 4826970, - "score": 0.47 - }, - { - "name": "Māori", - "bcp_47": "mi", - "population": 137913, - "score": 0.0 - } - ] - }, - "PA": { - "score": 0.4533854469232938, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 545171, - "score": 0.47 - }, - { - "name": "Chinese", - "bcp_47": "zh", - "population": 5841, - "score": 0.46 - }, - { - "name": "Spanish", - "bcp_47": "es", - "population": 2686915, - "score": 0.45 - } - ] - }, - "PG": { - "score": 0.19090169012205813, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 3629730, - "score": 0.47 - }, - { - "name": "Tok Pisin", - "bcp_47": "tpi", - "population": 5154217, - "score": 0.0 - }, - { - "name": "Hiri Motu", - "bcp_47": "ho", - "population": 152449, - "score": 0.0 - } - ] - }, - "PH": { - "score": 0.32615211365536473, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 69875840, - "score": 0.47 - }, - { - "name": "Chinese", - "bcp_47": "zh", - "population": 797021, - "score": 0.46 - }, - { - "name": "Spanish", - "bcp_47": "es", - "population": 33846110, - "score": 0.45 - }, - { - "name": "Filipino", - "bcp_47": "fil", - "population": 65508600, - "score": 0.42 - }, - { - "name": "Cebuano", - "bcp_47": "ceb", - "population": 26203440, - "score": 0.0 - }, - { - "name": "Iloko", - "bcp_47": "ilo", - "population": 10481376, - "score": 0.0 - }, - { - "name": "Hiligaynon", - "bcp_47": "hil", - "population": 9171204, - "score": 0.0 - }, - { - "name": "Bikol", - "bcp_47": "bik", - "population": 3275430, - "score": 0.0 - }, - { - "name": "Waray", - "bcp_47": "war", - "population": 3166249, - "score": 0.0 - }, - { - "name": "Pampanga", - "bcp_47": "pam", - "population": 2511163, - "score": 0.0 - }, - { - "name": "West Albay Bikol", - "bcp_47": "fbl", - "population": 2511163, - "score": 0.0 - }, - { - "name": "Pangasinan", - "bcp_47": "pag", - "population": 1528534, - "score": 0.0 - }, - { - "name": "Maguindanaon", - "bcp_47": "mdh", - "population": 1310172, - "score": 0.0 - }, - { - "name": "Tausug", - "bcp_47": "tsg", - "population": 1200991, - "score": 0.0 - }, - { - "name": "Capiznon", - "bcp_47": "cps", - "population": 720595, - "score": 0.0 - }, - { - "name": "Kinaray-a", - "bcp_47": "krj", - "population": 425806, - "score": 0.0 - }, - { - "name": "Rinconada Bikol", - "bcp_47": "bto", - "population": 305707, - "score": 0.0 - }, - { - "name": "Hanunoo", - "bcp_47": "hnn", - "population": 17469, - "score": 0.0 - }, - { - "name": "Tagbanwa", - "bcp_47": "tbw", - "population": 10045, - "score": 0.0 - }, - { - "name": "Buhid", - "bcp_47": "bku", - "population": 7970, - "score": 0.0 - } - ] - }, - "PK": { - "score": 0.30567966556461956, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 116750500, - "score": 0.47 - }, - { - "name": "Urdu", - "bcp_47": "ur", - "population": 221825950, - "score": 0.42 - }, - { - "name": "Punjabi", - "bcp_47": "pa", - "population": 163450700, - "score": 0.43 - }, - { - "name": "Western Panjabi", - "bcp_47": "lah", - "population": 93400400, - "score": 0.0 - }, - { - "name": "Persian", - "bcp_47": "fa", - "population": 1541107, - "score": 0.41 - }, - { - "name": "Pashto", - "bcp_47": "ps", - "population": 37360160, - "score": 0.0 - }, - { - "name": "Sindhi", - "bcp_47": "sd", - "population": 35025150, - "score": 0.0 - }, - { - "name": "Saraiki", - "bcp_47": "skr", - "population": 28020120, - "score": 0.0 - }, - { - "name": "Tajik", - "bcp_47": "tg", - "population": 770553, - "score": 0.0 - }, - { - "name": "Baluchi", - "bcp_47": "bal", - "population": 6071026, - "score": 0.0 - }, - { - "name": "Kashmiri", - "bcp_47": "ks", - "population": 161116, - "score": 0.0 - }, - { - "name": "Northern Hindko", - "bcp_47": "hno", - "population": 3969517, - "score": 0.0 - }, - { - "name": "Brahui", - "bcp_47": "brh", - "population": 3035513, - "score": 0.0 - }, - { - "name": "Western Balochi", - "bcp_47": "bgn", - "population": 1330956, - "score": 0.0 - }, - { - "name": "Southern Hindko", - "bcp_47": "hnd", - "population": 957354, - "score": 0.0 - }, - { - "name": "Balti", - "bcp_47": "bft", - "population": 420302, - "score": 0.0 - }, - { - "name": "Gujari", - "bcp_47": "gju", - "population": 467002, - "score": 0.0 - }, - { - "name": "Parkari Koli", - "bcp_47": "kvx", - "population": 373602, - "score": 0.0 - }, - { - "name": "Khowar", - "bcp_47": "khw", - "population": 350252, - "score": 0.0 - }, - { - "name": "Indus Kohistani", - "bcp_47": "mvy", - "population": 326901, - "score": 0.0 - }, - { - "name": "Wadiyara Koli", - "bcp_47": "kxp", - "population": 256851, - "score": 0.0 - }, - { - "name": "Kachi Koli", - "bcp_47": "gjk", - "population": 256851, - "score": 0.0 - }, - { - "name": "Torwali", - "bcp_47": "trw", - "population": 123756, - "score": 0.0 - }, - { - "name": "Bateri", - "bcp_47": "btv", - "population": 44365, - "score": 0.0 - } - ] - }, - "PL": { - "score": 0.19542647519424666, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 12633159, - "score": 0.47 - }, - { - "name": "Russian", - "bcp_47": "ru", - "population": 6890814, - "score": 0.45 - }, - { - "name": "German", - "bcp_47": "de", - "population": 7273637, - "score": 0.49 - }, - { - "name": "Polish", - "bcp_47": "pl", - "population": 36751008, - "score": 0.0 - }, - { - "name": "Ukrainian", - "bcp_47": "uk", - "population": 149301, - "score": 0.0 - }, - { - "name": "Belarusian", - "bcp_47": "be", - "population": 222037, - "score": 0.0 - }, - { - "name": "Lithuanian", - "bcp_47": "lt", - "population": 8039, - "score": 0.0 - }, - { - "name": "Silesian", - "bcp_47": "szl", - "population": 497670, - "score": 0.0 - }, - { - "name": "Kashubian", - "bcp_47": "csb", - "population": 49767, - "score": 0.0 - }, - { - "name": "Lower Silesian", - "bcp_47": "sli", - "population": 11868, - "score": 0.0 - }, - { - "name": "Prussian", - "bcp_47": "prg", - "population": 38, - "score": 0.0 - } - ] - }, - "PM": { - "score": 0.46035150375939854, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 187, - "score": 0.47 - }, - { - "name": "French", - "bcp_47": "fr", - "population": 5133, - "score": 0.46 - } - ] - }, - "PN": { - "score": 0.4699999999999999, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 46, - "score": 0.47 - } - ] - }, - "PR": { - "score": 0.4572058813018271, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 1562644, - "score": 0.47 - }, - { - "name": "Spanish", - "bcp_47": "es", - "population": 2774491, - "score": 0.45 - } - ] - }, - "PT": { - "score": 0.4542324762390237, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 2781729, - "score": 0.47 - }, - { - "name": "Spanish", - "bcp_47": "es", - "population": 1030270, - "score": 0.45 - }, - { - "name": "French", - "bcp_47": "fr", - "population": 1545405, - "score": 0.46 - }, - { - "name": "Portuguese", - "bcp_47": "pt", - "population": 9890592, - "score": 0.45 - }, - { - "name": "Galician", - "bcp_47": "gl", - "population": 14424, - "score": 0.0 - } - ] - }, - "PW": { - "score": 0.04945299431247909, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 1887, - "score": 0.47 - }, - { - "name": "Palauan", - "bcp_47": "pau", - "population": 16047, - "score": 0.0 - } - ] - }, - "RO": { - "score": 0.1743772772485309, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 6603899, - "score": 0.47 - }, - { - "name": "Spanish", - "bcp_47": "es", - "population": 2130290, - "score": 0.45 - }, - { - "name": "French", - "bcp_47": "fr", - "population": 3621493, - "score": 0.46 - }, - { - "name": "German", - "bcp_47": "de", - "population": 44736, - "score": 0.49 - }, - { - "name": "Turkish", - "bcp_47": "tr", - "population": 27694, - "score": 0.44 - }, - { - "name": "Polish", - "bcp_47": "pl", - "population": 2769, - "score": 0.0 - }, - { - "name": "Romanian", - "bcp_47": "ro", - "population": 19172610, - "score": 0.0 - }, - { - "name": "Serbian", - "bcp_47": "sr", - "population": 25563, - "score": 0.0 - }, - { - "name": "Hungarian", - "bcp_47": "hu", - "population": 1405991, - "score": 0.0 - }, - { - "name": "Greek", - "bcp_47": "el", - "population": 4048, - "score": 0.0 - }, - { - "name": "Bulgarian", - "bcp_47": "bg", - "population": 6817, - "score": 0.0 - } - ] - }, - "RW": { - "score": 0.07670541959715828, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 1906860, - "score": 0.47 - }, - { - "name": "French", - "bcp_47": "fr", - "population": 2288, - "score": 0.46 - }, - { - "name": "Kinyarwanda", - "bcp_47": "rw", - "population": 9788548, - "score": 0.0 - } - ] - }, - "SB": { - "score": 0.25627042630612157, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 685097, - "score": 0.47 - }, - { - "name": "Pijin", - "bcp_47": "pis", - "population": 561780, - "score": 0.0 - }, - { - "name": "Roviana", - "bcp_47": "rug", - "population": 9591, - "score": 0.0 - } - ] - }, - "SC": { - "score": 0.23194000733562617, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 36473, - "score": 0.47 - }, - { - "name": "French", - "bcp_47": "fr", - "population": 57589, - "score": 0.46 - }, - { - "name": "Seselwa Creole French", - "bcp_47": "crs", - "population": 94061, - "score": 0.0 - } - ] - }, - "SD": { - "score": 0.40445504435404195, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 27792576, - "score": 0.47 - }, - { - "name": "Arabic", - "bcp_47": "ar", - "population": 27792576, - "score": 0.42 - }, - { - "name": "Hausa", - "bcp_47": "ha", - "population": 820109, - "score": 0.0 - }, - { - "name": "Beja", - "bcp_47": "bej", - "population": 2460326, - "score": 0.0 - }, - { - "name": "Fur", - "bcp_47": "fvr", - "population": 1230163, - "score": 0.0 - }, - { - "name": "Masalit", - "bcp_47": "mls", - "population": 451060, - "score": 0.0 - }, - { - "name": "Nobiin", - "bcp_47": "fia", - "population": 378161, - "score": 0.0 - }, - { - "name": "Zaghawa", - "bcp_47": "zag", - "population": 232364, - "score": 0.0 - } - ] - }, - "SE": { - "score": 0.21941169569516628, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 8774150, - "score": 0.47 - }, - { - "name": "Swedish", - "bcp_47": "sv", - "population": 9692375, - "score": 0.0 - }, - { - "name": "Finnish", - "bcp_47": "fi", - "population": 224455, - "score": 0.0 - }, - { - "name": "Yiddish", - "bcp_47": "yi", - "population": 2959, - "score": 0.0 - }, - { - "name": "Tornedalen Finnish", - "bcp_47": "fit", - "population": 56114, - "score": 0.0 - }, - { - "name": "Northern Sami", - "bcp_47": "se", - "population": 33668, - "score": 0.0 - }, - { - "name": "Tavringer Romani", - "bcp_47": "rmu", - "population": 9488, - "score": 0.0 - }, - { - "name": "Lule Sami", - "bcp_47": "smj", - "population": 1530, - "score": 0.0 - }, - { - "name": "Southern Sami", - "bcp_47": "sma", - "population": 296, - "score": 0.0 - }, - { - "name": "Interlingua", - "bcp_47": "ia", - "population": 0, - "score": 0.0 - } - ] - }, - "SG": { - "score": 0.4294592881506046, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 5774984, - "score": 0.47 - }, - { - "name": "Chinese", - "bcp_47": "zh", - "population": 4781438, - "score": 0.46 - }, - { - "name": "Punjabi", - "bcp_47": "pa", - "population": 9314, - "score": 0.43 - }, - { - "name": "Tamil", - "bcp_47": "ta", - "population": 130403, - "score": 0.41 - }, - { - "name": "Malayalam", - "bcp_47": "ml", - "population": 9935, - "score": 0.0 - }, - { - "name": "Malay", - "bcp_47": "ms", - "population": 869352, - "score": 0.0 - } - ] - }, - "SH": { - "score": 0.47, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 5425, - "score": 0.47 - } - ] - }, - "SI": { - "score": 0.1928028123892293, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 1240581, - "score": 0.47 - }, - { - "name": "German", - "bcp_47": "de", - "population": 883126, - "score": 0.49 - }, - { - "name": "Italian", - "bcp_47": "it", - "population": 3995, - "score": 0.47 - }, - { - "name": "Hungarian", - "bcp_47": "hu", - "population": 9252, - "score": 0.0 - }, - { - "name": "Croatian", - "bcp_47": "hr", - "population": 1282635, - "score": 0.0 - }, - { - "name": "Slovenian", - "bcp_47": "sl", - "population": 1829332, - "score": 0.0 - }, - { - "name": "Venetian", - "bcp_47": "vec", - "population": 29438, - "score": 0.0 - } - ] - }, - "SK": { - "score": 0.11567670853229638, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 1414556, - "score": 0.47 - }, - { - "name": "German", - "bcp_47": "de", - "population": 1196932, - "score": 0.49 - }, - { - "name": "Polish", - "bcp_47": "pl", - "population": 50598, - "score": 0.0 - }, - { - "name": "Ukrainian", - "bcp_47": "uk", - "population": 103371, - "score": 0.0 - }, - { - "name": "Czech", - "bcp_47": "cs", - "population": 2557082, - "score": 0.0 - }, - { - "name": "Hungarian", - "bcp_47": "hu", - "population": 598466, - "score": 0.0 - }, - { - "name": "Slovak", - "bcp_47": "sk", - "population": 4896540, - "score": 0.0 - } - ] - }, - "SL": { - "score": 0.08989072161019854, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 2318726, - "score": 0.47 - }, - { - "name": "Fula", - "bcp_47": "ff", - "population": 0, - "score": 0.0 - }, - { - "name": "Krio", - "bcp_47": "kri", - "population": 6293684, - "score": 0.0 - }, - { - "name": "Mende", - "bcp_47": "men", - "population": 1788731, - "score": 0.0 - }, - { - "name": "Timne", - "bcp_47": "tem", - "population": 1722482, - "score": 0.0 - } - ] - }, - "SS": { - "score": 0.4031879322739386, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 2851524, - "score": 0.47 - }, - { - "name": "Arabic", - "bcp_47": "ar", - "population": 2851524, - "score": 0.42 - }, - { - "name": "Nuer", - "bcp_47": "nus", - "population": 591427, - "score": 0.0 - } - ] - }, - "SX": { - "score": 0.41148919399949146, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 29816, - "score": 0.47 - }, - { - "name": "Spanish", - "bcp_47": "es", - "population": 4823, - "score": 0.45 - }, - { - "name": "Dutch", - "bcp_47": "nl", - "population": 1578, - "score": 0.0 - }, - { - "name": "Virgin Islands Creole English", - "bcp_47": "vic", - "population": 3113, - "score": 0.0 - } - ] - }, - "SZ": { - "score": 0.2566553218261588, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 883584, - "score": 0.47 - }, - { - "name": "Zulu", - "bcp_47": "zu", - "population": 75105, - "score": 0.0 - }, - { - "name": "Tsonga", - "bcp_47": "ts", - "population": 18776, - "score": 0.0 - }, - { - "name": "Swati", - "bcp_47": "ss", - "population": 640598, - "score": 0.0 - } - ] - }, - "TA": { - "score": 0.47, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 272, - "score": 0.47 - } - ] - }, - "TC": { - "score": 0.47, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 54807, - "score": 0.47 - } - ] - }, - "TH": { - "score": 0.0855764589364112, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 18623898, - "score": 0.47 - }, - { - "name": "Chinese", - "bcp_47": "zh", - "population": 1241593, - "score": 0.46 - }, - { - "name": "Thai", - "bcp_47": "th", - "population": 55181920, - "score": 0.0 - }, - { - "name": "Northeastern Thai", - "bcp_47": "tts", - "population": 16554576, - "score": 0.0 - }, - { - "name": "Northern Thai", - "bcp_47": "nod", - "population": 6621830, - "score": 0.0 - }, - { - "name": "Southern Thai", - "bcp_47": "sou", - "population": 5518192, - "score": 0.0 - }, - { - "name": "Shan", - "bcp_47": "shn", - "population": 66218, - "score": 0.0 - }, - { - "name": "Pattani Malay", - "bcp_47": "mfa", - "population": 3448870, - "score": 0.0 - }, - { - "name": "Northern Khmer", - "bcp_47": "kxm", - "population": 1172616, - "score": 0.0 - }, - { - "name": "Mon", - "bcp_47": "mnw", - "population": 117262, - "score": 0.0 - }, - { - "name": "Hmong Njua", - "bcp_47": "hnj", - "population": 67598, - "score": 0.0 - }, - { - "name": "Kuy", - "bcp_47": "kdt", - "population": 331092, - "score": 0.0 - }, - { - "name": "Western Lawa", - "bcp_47": "lcp", - "population": 6898, - "score": 0.0 - }, - { - "name": "Eastern Lawa", - "bcp_47": "lwl", - "population": 6898, - "score": 0.0 - } - ] - }, - "TK": { - "score": 0.235, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 1285, - "score": 0.47 - }, - { - "name": "Tokelau", - "bcp_47": "tkl", - "population": 1285, - "score": 0.0 - } - ] - }, - "TO": { - "score": 0.10699318758285631, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 29707, - "score": 0.47 - }, - { - "name": "Tongan", - "bcp_47": "to", - "population": 100790, - "score": 0.0 - } - ] - }, - "TR": { - "score": 0.38853953080443926, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 13942975, - "score": 0.47 - }, - { - "name": "Arabic", - "bcp_47": "ar", - "population": 459298, - "score": 0.42 - }, - { - "name": "Turkish", - "bcp_47": "tr", - "population": 76276275, - "score": 0.44 - }, - { - "name": "North Levantine Arabic", - "bcp_47": "apc", - "population": 4264910, - "score": 0.0 - }, - { - "name": "Uzbek", - "bcp_47": "uz", - "population": 1968, - "score": 0.0 - }, - { - "name": "Azerbaijani", - "bcp_47": "az", - "population": 1140044, - "score": 0.0 - }, - { - "name": "Serbian", - "bcp_47": "sr", - "population": 22965, - "score": 0.0 - }, - { - "name": "Kazakh", - "bcp_47": "kk", - "population": 574, - "score": 0.0 - }, - { - "name": "Greek", - "bcp_47": "el", - "population": 4019, - "score": 0.0 - }, - { - "name": "Bulgarian", - "bcp_47": "bg", - "population": 344474, - "score": 0.0 - }, - { - "name": "Kurdish", - "bcp_47": "ku", - "population": 4510962, - "score": 0.0 - }, - { - "name": "Albanian", - "bcp_47": "sq", - "population": 17224, - "score": 0.0 - }, - { - "name": "Armenian", - "bcp_47": "hy", - "population": 45930, - "score": 0.0 - }, - { - "name": "Georgian", - "bcp_47": "ka", - "population": 45930, - "score": 0.0 - }, - { - "name": "Kyrgyz", - "bcp_47": "ky", - "population": 1148, - "score": 0.0 - }, - { - "name": "Zaza", - "bcp_47": "zza", - "population": 1148245, - "score": 0.0 - }, - { - "name": "Kabardian", - "bcp_47": "kbd", - "population": 631535, - "score": 0.0 - }, - { - "name": "Adyghe", - "bcp_47": "ady", - "population": 319868, - "score": 0.0 - }, - { - "name": "Balkan Gagauz Turkish", - "bcp_47": "bgx", - "population": 377280, - "score": 0.0 - }, - { - "name": "Kirmanjki", - "bcp_47": "kiu", - "population": 155833, - "score": 0.0 - }, - { - "name": "Abkhazian", - "bcp_47": "ab", - "population": 4019, - "score": 0.0 - }, - { - "name": "Laz", - "bcp_47": "lzz", - "population": 22965, - "score": 0.0 - }, - { - "name": "Turoyo", - "bcp_47": "tru", - "population": 3035, - "score": 0.0 - } - ] - }, - "TT": { - "score": 0.4699230225360422, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 1063735, - "score": 0.47 - }, - { - "name": "Spanish", - "bcp_47": "es", - "population": 4110, - "score": 0.45 - } - ] - }, - "TV": { - "score": 0.04582220596305103, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 1066, - "score": 0.47 - }, - { - "name": "Tuvalu", - "bcp_47": "tvl", - "population": 9868, - "score": 0.0 - } - ] - }, - "TZ": { - "score": 0.3952631230768349, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 40401432, - "score": 0.47 - }, - { - "name": "Swahili", - "bcp_47": "sw", - "population": 52697520, - "score": 0.45 - }, - { - "name": "Sukuma", - "bcp_47": "suk", - "population": 5094094, - "score": 0.0 - }, - { - "name": "Nyamwezi", - "bcp_47": "nym", - "population": 1932242, - "score": 0.0 - }, - { - "name": "Masai", - "bcp_47": "mas", - "population": 878292, - "score": 0.0 - }, - { - "name": "Makonde", - "bcp_47": "kde", - "population": 1463820, - "score": 0.0 - }, - { - "name": "Bena", - "bcp_47": "bez", - "population": 995398, - "score": 0.0 - }, - { - "name": "Shambala", - "bcp_47": "ksb", - "population": 995398, - "score": 0.0 - }, - { - "name": "Mbunga", - "bcp_47": "mgy", - "population": 819739, - "score": 0.0 - }, - { - "name": "Asu", - "bcp_47": "asa", - "population": 702634, - "score": 0.0 - }, - { - "name": "Langi", - "bcp_47": "lag", - "population": 509409, - "score": 0.0 - }, - { - "name": "Vunjo", - "bcp_47": "vun", - "population": 433291, - "score": 0.0 - }, - { - "name": "Rombo", - "bcp_47": "rof", - "population": 433291, - "score": 0.0 - }, - { - "name": "Machame", - "bcp_47": "jmc", - "population": 433291, - "score": 0.0 - }, - { - "name": "Rwa", - "bcp_47": "rwk", - "population": 128816, - "score": 0.0 - }, - { - "name": "Sangu", - "bcp_47": "sbp", - "population": 117106, - "score": 0.0 - } - ] - }, - "UG": { - "score": 0.2797477934487195, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 1686867, - "score": 0.47 - }, - { - "name": "Hindi", - "bcp_47": "hi", - "population": 2206, - "score": 0.46 - }, - { - "name": "Swahili", - "bcp_47": "sw", - "population": 32439750, - "score": 0.45 - }, - { - "name": "Kinyarwanda", - "bcp_47": "rw", - "population": 908313, - "score": 0.0 - }, - { - "name": "Ganda", - "bcp_47": "lg", - "population": 5622890, - "score": 0.0 - }, - { - "name": "Nyankole", - "bcp_47": "nyn", - "population": 2724939, - "score": 0.0 - }, - { - "name": "Chiga", - "bcp_47": "cgg", - "population": 2335662, - "score": 0.0 - }, - { - "name": "Soga", - "bcp_47": "xog", - "population": 2292409, - "score": 0.0 - }, - { - "name": "Teso", - "bcp_47": "teo", - "population": 1686867, - "score": 0.0 - }, - { - "name": "Lango (Uganda)", - "bcp_47": "laj", - "population": 1643614, - "score": 0.0 - }, - { - "name": "Acoli", - "bcp_47": "ach", - "population": 1600361, - "score": 0.0 - }, - { - "name": "Masaaba", - "bcp_47": "myx", - "population": 1254337, - "score": 0.0 - }, - { - "name": "Tooro", - "bcp_47": "ttj", - "population": 821807, - "score": 0.0 - } - ] - }, - "UM": { - "score": 0.4699999999999999, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 316, - "score": 0.47 - } - ] - }, - "US": { - "score": 0.46680423711359387, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 319333440, - "score": 0.47 - }, - { - "name": "Chinese", - "bcp_47": "zh", - "population": 2295209, - "score": 0.46 - }, - { - "name": "Spanish", - "bcp_47": "es", - "population": 31933344, - "score": 0.45 - }, - { - "name": "French", - "bcp_47": "fr", - "population": 1862778, - "score": 0.46 - }, - { - "name": "Russian", - "bcp_47": "ru", - "population": 798334, - "score": 0.45 - }, - { - "name": "German", - "bcp_47": "de", - "population": 1563403, - "score": 0.49 - }, - { - "name": "Vietnamese", - "bcp_47": "vi", - "population": 1130973, - "score": 0.45 - }, - { - "name": "Korean", - "bcp_47": "ko", - "population": 997917, - "score": 0.41 - }, - { - "name": "Italian", - "bcp_47": "it", - "population": 1130973, - "score": 0.47 - }, - { - "name": "Filipino", - "bcp_47": "fil", - "population": 1397084, - "score": 0.42 - }, - { - "name": "Yiddish", - "bcp_47": "yi", - "population": 162993, - "score": 0.0 - }, - { - "name": "Hmong Njua", - "bcp_47": "hnj", - "population": 116424, - "score": 0.0 - }, - { - "name": "Navajo", - "bcp_47": "nv", - "population": 166320, - "score": 0.0 - }, - { - "name": "Pennsylvania German", - "bcp_47": "pdc", - "population": 129729, - "score": 0.0 - }, - { - "name": "Hawaiian", - "bcp_47": "haw", - "population": 29605, - "score": 0.0 - }, - { - "name": "Cajun French", - "bcp_47": "frc", - "population": 27942, - "score": 0.0 - }, - { - "name": "Cherokee", - "bcp_47": "chr", - "population": 25613, - "score": 0.0 - }, - { - "name": "Central Yupik", - "bcp_47": "esu", - "population": 20956, - "score": 0.0 - }, - { - "name": "Dakota", - "bcp_47": "dak", - "population": 19626, - "score": 0.0 - }, - { - "name": "Choctaw", - "bcp_47": "cho", - "population": 10977, - "score": 0.0 - }, - { - "name": "Lakota", - "bcp_47": "lkt", - "population": 8316, - "score": 0.0 - }, - { - "name": "Inupiaq", - "bcp_47": "ik", - "population": 7983, - "score": 0.0 - }, - { - "name": "Muscogee", - "bcp_47": "mus", - "population": 3992, - "score": 0.0 - }, - { - "name": "Ido", - "bcp_47": "io", - "population": 0, - "score": 0.0 - }, - { - "name": "Lojban", - "bcp_47": "jbo", - "population": 0, - "score": 0.0 - }, - { - "name": "Osage", - "bcp_47": "osa", - "population": 0, - "score": 0.0 - }, - { - "name": "Chickasaw", - "bcp_47": "cic", - "population": 0, - "score": 0.0 - }, - { - "name": "Caddo", - "bcp_47": "cad", - "population": 0, - "score": 0.0 - } - ] - }, - "VC": { - "score": 0.47, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 97334, - "score": 0.47 - } - ] - }, - "VG": { - "score": 0.47, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 36633, - "score": 0.47 - } - ] - }, - "VI": { - "score": 0.47000000000000003, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 79676, - "score": 0.47 - } - ] - }, - "VU": { - "score": 0.27807137424430545, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 247616, - "score": 0.47 - }, - { - "name": "French", - "bcp_47": "fr", - "population": 149166, - "score": 0.46 - }, - { - "name": "Bislama", - "bcp_47": "bi", - "population": 268500, - "score": 0.0 - } - ] - }, - "WS": { - "score": 0.00966643114975511, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 4279, - "score": 0.47 - }, - { - "name": "Samoan", - "bcp_47": "sm", - "population": 203774, - "score": 0.0 - } - ] - }, - "YE": { - "score": 0.4254216867469879, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 2689596, - "score": 0.47 - }, - { - "name": "Arabic", - "bcp_47": "ar", - "population": 22114456, - "score": 0.42 - } - ] - }, - "ZA": { - "score": 0.12442237800209865, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 17503716, - "score": 0.47 - }, - { - "name": "Hindi", - "bcp_47": "hi", - "population": 1129272, - "score": 0.46 - }, - { - "name": "Swahili", - "bcp_47": "sw", - "population": 1016, - "score": 0.45 - }, - { - "name": "Zulu", - "bcp_47": "zu", - "population": 13551264, - "score": 0.0 - }, - { - "name": "Xhosa", - "bcp_47": "xh", - "population": 10163448, - "score": 0.0 - }, - { - "name": "Afrikaans", - "bcp_47": "af", - "population": 7340268, - "score": 0.0 - }, - { - "name": "Southern Sotho", - "bcp_47": "st", - "population": 4460624, - "score": 0.0 - }, - { - "name": "Tswana", - "bcp_47": "tn", - "population": 4630015, - "score": 0.0 - }, - { - "name": "Northern Sotho", - "bcp_47": "nso", - "population": 5307578, - "score": 0.0 - }, - { - "name": "Tsonga", - "bcp_47": "ts", - "population": 2484398, - "score": 0.0 - }, - { - "name": "Swati", - "bcp_47": "ss", - "population": 1524517, - "score": 0.0 - }, - { - "name": "Venda", - "bcp_47": "ve", - "population": 1298663, - "score": 0.0 - }, - { - "name": "South Ndebele", - "bcp_47": "nr", - "population": 903418, - "score": 0.0 - } - ] - }, - "ZM": { - "score": 0.11058823529411763, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 2788256, - "score": 0.47 - }, - { - "name": "Nyanja", - "bcp_47": "ny", - "population": 2613990, - "score": 0.0 - }, - { - "name": "Bemba", - "bcp_47": "bem", - "population": 5402246, - "score": 0.0 - }, - { - "name": "Lozi", - "bcp_47": "loz", - "population": 1045596, - "score": 0.0 - } - ] - }, - "ZW": { - "score": 0.12681485053220737, - "languages": [ - { - "name": "English", - "bcp_47": "en", - "population": 6109446, - "score": 0.47 - }, - { - "name": "Nyanja", - "bcp_47": "ny", - "population": 276380, - "score": 0.0 - }, - { - "name": "Shona", - "bcp_47": "sn", - "population": 11782503, - "score": 0.0 - }, - { - "name": "Tswana", - "bcp_47": "tn", - "population": 32002, - "score": 0.0 - }, - { - "name": "Ndau", - "bcp_47": "ndc", - "population": 887324, - "score": 0.0 - }, - { - "name": "North Ndebele", - "bcp_47": "nd", - "population": 1745556, - "score": 0.0 - }, - { - "name": "Venda", - "bcp_47": "ve", - "population": 93096, - "score": 0.0 - }, - { - "name": "Manyika", - "bcp_47": "mxc", - "population": 945510, - "score": 0.0 - }, - { - "name": "Kalanga", - "bcp_47": "kck", - "population": 770954, - "score": 0.0 - } - ] - }, - "GF": { - "score": 0.33892599990709343, - "languages": [ - { - "name": "Chinese", - "bcp_47": "zh", - "population": 4988, - "score": 0.46 - }, - { - "name": "French", - "bcp_47": "fr", - "population": 153622, - "score": 0.46 - }, - { - "name": "Hmong Njua", - "bcp_47": "hnj", - "population": 4788, - "score": 0.0 - }, - { - "name": "Guianese Creole French", - "bcp_47": "gcr", - "population": 51872, - "score": 0.0 - } - ] - }, - "ID": { - "score": 0.3194548673228042, - "languages": [ - { - "name": "Chinese", - "bcp_47": "zh", - "population": 2456639, - "score": 0.46 - }, - { - "name": "Indonesian", - "bcp_47": "id", - "population": 170896640, - "score": 0.47 - }, - { - "name": "Javanese", - "bcp_47": "jv", - "population": 90788840, - "score": 0.41 - }, - { - "name": "Malay", - "bcp_47": "ms", - "population": 12283196, - "score": 0.0 - }, - { - "name": "Sundanese", - "bcp_47": "su", - "population": 32043120, - "score": 0.0 - }, - { - "name": "Madurese", - "bcp_47": "mad", - "population": 16822638, - "score": 0.0 - }, - { - "name": "Minangkabau", - "bcp_47": "min", - "population": 8010780, - "score": 0.0 - }, - { - "name": "Betawi", - "bcp_47": "bew", - "population": 5607546, - "score": 0.0 - }, - { - "name": "Balinese", - "bcp_47": "ban", - "population": 4806468, - "score": 0.0 - }, - { - "name": "Buginese", - "bcp_47": "bug", - "population": 4272416, - "score": 0.0 - }, - { - "name": "Banjar", - "bcp_47": "bjn", - "population": 4005390, - "score": 0.0 - }, - { - "name": "Achinese", - "bcp_47": "ace", - "population": 3738364, - "score": 0.0 - }, - { - "name": "Sasak", - "bcp_47": "sas", - "population": 2590152, - "score": 0.0 - }, - { - "name": "Batak Toba", - "bcp_47": "bbc", - "population": 2456639, - "score": 0.0 - }, - { - "name": "Makasar", - "bcp_47": "mak", - "population": 1949290, - "score": 0.0 - }, - { - "name": "Lampung Api", - "bcp_47": "ljp", - "population": 1842479, - "score": 0.0 - }, - { - "name": "Rejang", - "bcp_47": "rej", - "population": 1228320, - "score": 0.0 - }, - { - "name": "Gorontalo", - "bcp_47": "gor", - "population": 1094807, - "score": 0.0 - }, - { - "name": "Ngaju", - "bcp_47": "nij", - "population": 987996, - "score": 0.0 - }, - { - "name": "Komering", - "bcp_47": "kge", - "population": 854483, - "score": 0.0 - }, - { - "name": "Uab Meto", - "bcp_47": "aoz", - "population": 720970, - "score": 0.0 - }, - { - "name": "Kerinci", - "bcp_47": "kvr", - "population": 373836, - "score": 0.0 - }, - { - "name": "Tolaki", - "bcp_47": "lbw", - "population": 347134, - "score": 0.0 - }, - { - "name": "Gayo", - "bcp_47": "gay", - "population": 320431, - "score": 0.0 - }, - { - "name": "Tae'", - "bcp_47": "rob", - "population": 293729, - "score": 0.0 - }, - { - "name": "Mandar", - "bcp_47": "mdr", - "population": 245664, - "score": 0.0 - }, - { - "name": "Sangir", - "bcp_47": "sxn", - "population": 245664, - "score": 0.0 - }, - { - "name": "Selayar", - "bcp_47": "sly", - "population": 144194, - "score": 0.0 - }, - { - "name": "Mentawai", - "bcp_47": "mwv", - "population": 64086, - "score": 0.0 - } - ] - }, - "MN": { - "score": 0.006903243016889744, - "languages": [ - { - "name": "Chinese", - "bcp_47": "zh", - "population": 44352, - "score": 0.46 - }, - { - "name": "Russian", - "bcp_47": "ru", - "population": 4118, - "score": 0.45 - }, - { - "name": "Kazakh", - "bcp_47": "kk", - "population": 228098, - "score": 0.0 - }, - { - "name": "Uyghur", - "bcp_47": "ug", - "population": 1014, - "score": 0.0 - }, - { - "name": "Mongolian", - "bcp_47": "mn", - "population": 2946268, - "score": 0.0 - } - ] - }, - "PF": { - "score": 0.3171135805738615, - "languages": [ - { - "name": "Chinese", - "bcp_47": "zh", - "population": 23019, - "score": 0.46 - }, - { - "name": "French", - "bcp_47": "fr", - "population": 180024, - "score": 0.46 - }, - { - "name": "Tahitian", - "bcp_47": "ty", - "population": 91488, - "score": 0.0 - } - ] - }, - "SR": { - "score": 0.003172691176168042, - "languages": [ - { - "name": "Chinese", - "bcp_47": "zh", - "population": 6705, - "score": 0.46 - }, - { - "name": "Dutch", - "bcp_47": "nl", - "population": 548612, - "score": 0.0 - }, - { - "name": "Hmong Njua", - "bcp_47": "hnj", - "population": 2316, - "score": 0.0 - }, - { - "name": "Sranan Tongo", - "bcp_47": "srn", - "population": 414507, - "score": 0.0 - } - ] - }, - "TW": { - "score": 0.45990317007579645, - "languages": [ - { - "name": "Chinese", - "bcp_47": "zh", - "population": 22422850, - "score": 0.46 - }, - { - "name": "Taroko", - "bcp_47": "trv", - "population": 4721, - "score": 0.0 - } - ] - }, - "VN": { - "score": 0.44527479082463184, - "languages": [ - { - "name": "Chinese", - "bcp_47": "zh", - "population": 1085934, - "score": 0.46 - }, - { - "name": "Vietnamese", - "bcp_47": "vi", - "population": 84900318, - "score": 0.45 - }, - { - "name": "Hmong Njua", - "bcp_47": "hnj", - "population": 167826, - "score": 0.0 - }, - { - "name": "Tai Dam", - "bcp_47": "blt", - "population": 681177, - "score": 0.0 - }, - { - "name": "Eastern Cham", - "bcp_47": "cjm", - "population": 87862, - "score": 0.0 - } - ] - }, - "AD": { - "score": 0.2246305418719212, - "languages": [ - { - "name": "Spanish", - "bcp_47": "es", - "population": 33110, - "score": 0.45 - }, - { - "name": "French", - "bcp_47": "fr", - "population": 5775, - "score": 0.46 - }, - { - "name": "Catalan", - "bcp_47": "ca", - "population": 39270, - "score": 0.0 - } - ] - }, - "BO": { - "score": 0.24195487707764574, - "languages": [ - { - "name": "Spanish", - "bcp_47": "es", - "population": 7100339, - "score": 0.45 - }, - { - "name": "Quechua", - "bcp_47": "qu", - "population": 3724768, - "score": 0.0 - }, - { - "name": "Guarani", - "bcp_47": "gn", - "population": 52380, - "score": 0.0 - }, - { - "name": "Aymara", - "bcp_47": "ay", - "population": 2327980, - "score": 0.0 - }, - { - "name": "Araona", - "bcp_47": "aro", - "population": 105, - "score": 0.0 - } - ] - }, - "CO": { - "score": 0.4486679880632671, - "languages": [ - { - "name": "Spanish", - "bcp_47": "es", - "population": 45648864, - "score": 0.45 - }, - { - "name": "Wayuu", - "bcp_47": "guc", - "population": 132529, - "score": 0.0 - }, - { - "name": "Nheengatu", - "bcp_47": "yrl", - "population": 2994, - "score": 0.0 - } - ] - }, - "CR": { - "score": 0.45, - "languages": [ - { - "name": "Spanish", - "bcp_47": "es", - "population": 4843090, - "score": 0.45 - } - ] - }, - "CU": { - "score": 0.45, - "languages": [ - { - "name": "Spanish", - "bcp_47": "es", - "population": 11059100, - "score": 0.45 - } - ] - }, - "CW": { - "score": 0.01842639268626111, - "languages": [ - { - "name": "Spanish", - "bcp_47": "es", - "population": 5751, - "score": 0.45 - }, - { - "name": "Dutch", - "bcp_47": "nl", - "population": 12108, - "score": 0.0 - }, - { - "name": "Papiamento", - "bcp_47": "pap", - "population": 122589, - "score": 0.0 - } - ] - }, - "EA": { - "score": 0.45, - "languages": [ - { - "name": "Spanish", - "bcp_47": "es", - "population": 147000, - "score": 0.45 - } - ] - }, - "EC": { - "score": 0.36394271816229906, - "languages": [ - { - "name": "Spanish", - "bcp_47": "es", - "population": 16228704, - "score": 0.45 - }, - { - "name": "Quechua", - "bcp_47": "qu", - "population": 2873833, - "score": 0.0 - }, - { - "name": "Chimborazo Highland Quichua", - "bcp_47": "qug", - "population": 963579, - "score": 0.0 - } - ] - }, - "GQ": { - "score": 0.27923739669086073, - "languages": [ - { - "name": "Spanish", - "bcp_47": "es", - "population": 727475, - "score": 0.45 - }, - { - "name": "French", - "bcp_47": "fr", - "population": 73584, - "score": 0.46 - }, - { - "name": "Portuguese", - "bcp_47": "pt", - "population": 1, - "score": 0.45 - }, - { - "name": "Fang", - "bcp_47": "fan", - "population": 426451, - "score": 0.0 - }, - { - "name": "Bube", - "bcp_47": "bvb", - "population": 66058, - "score": 0.0 - } - ] - }, - "GT": { - "score": 0.4185, - "languages": [ - { - "name": "Spanish", - "bcp_47": "es", - "population": 15952569, - "score": 0.45 - }, - { - "name": "Kʼicheʼ", - "bcp_47": "quc", - "population": 1200731, - "score": 0.0 - } - ] - }, - "IC": { - "score": 0.45, - "languages": [ - { - "name": "Spanish", - "bcp_47": "es", - "population": 2056618, - "score": 0.45 - } - ] - }, - "NI": { - "score": 0.45, - "languages": [ - { - "name": "Spanish", - "bcp_47": "es", - "population": 4838683, - "score": 0.45 - } - ] - }, - "PE": { - "score": 0.3666294642857143, - "languages": [ - { - "name": "Spanish", - "bcp_47": "es", - "population": 23297950, - "score": 0.45 - }, - { - "name": "Quechua", - "bcp_47": "qu", - "population": 4787250, - "score": 0.0 - }, - { - "name": "Aymara", - "bcp_47": "ay", - "population": 510640, - "score": 0.0 - } - ] - }, - "PY": { - "score": 0.03322879759433273, - "languages": [ - { - "name": "Spanish", - "bcp_47": "es", - "population": 230134, - "score": 0.45 - }, - { - "name": "German", - "bcp_47": "de", - "population": 208559, - "score": 0.49 - }, - { - "name": "Guarani", - "bcp_47": "gn", - "population": 5753352, - "score": 0.0 - } - ] - }, - "SV": { - "score": 0.45000000000000007, - "languages": [ - { - "name": "Spanish", - "bcp_47": "es", - "population": 5768179, - "score": 0.45 - } - ] - }, - "UY": { - "score": 0.45000000000000007, - "languages": [ - { - "name": "Spanish", - "bcp_47": "es", - "population": 2981097, - "score": 0.45 - } - ] - }, - "VE": { - "score": 0.4499615909817796, - "languages": [ - { - "name": "Spanish", - "bcp_47": "es", - "population": 23488572, - "score": 0.45 - }, - { - "name": "Nheengatu", - "bcp_47": "yrl", - "population": 2005, - "score": 0.0 - } - ] - }, - "BH": { - "score": 0.4046511627906977, - "languages": [ - { - "name": "Arabic", - "bcp_47": "ar", - "population": 1309350, - "score": 0.42 - }, - { - "name": "Malayalam", - "bcp_47": "ml", - "population": 49665, - "score": 0.0 - } - ] - }, - "DJ": { - "score": 0.04363652160028553, - "languages": [ - { - "name": "Arabic", - "bcp_47": "ar", - "population": 67292, - "score": 0.42 - }, - { - "name": "French", - "bcp_47": "fr", - "population": 19358, - "score": 0.46 - }, - { - "name": "Somali", - "bcp_47": "so", - "population": 377940, - "score": 0.0 - }, - { - "name": "Afar", - "bcp_47": "aa", - "population": 387158, - "score": 0.0 - } - ] - }, - "EH": { - "score": 0.42, - "languages": [ - { - "name": "Arabic", - "bcp_47": "ar", - "population": 652271, - "score": 0.42 - } - ] - }, - "IR": { - "score": 0.23949254115959248, - "languages": [ - { - "name": "Arabic", - "bcp_47": "ar", - "population": 1698466, - "score": 0.42 - }, - { - "name": "Persian", - "bcp_47": "fa", - "population": 63692475, - "score": 0.41 - }, - { - "name": "Pashto", - "bcp_47": "ps", - "population": 135877, - "score": 0.0 - }, - { - "name": "Azerbaijani", - "bcp_47": "az", - "population": 20381592, - "score": 0.0 - }, - { - "name": "Kazakh", - "bcp_47": "kk", - "population": 2972, - "score": 0.0 - }, - { - "name": "Central Kurdish", - "bcp_47": "ckb", - "population": 3312009, - "score": 0.0 - }, - { - "name": "Baluchi", - "bcp_47": "bal", - "population": 1698466, - "score": 0.0 - }, - { - "name": "Turkmen", - "bcp_47": "tk", - "population": 2377852, - "score": 0.0 - }, - { - "name": "Armenian", - "bcp_47": "hy", - "population": 203816, - "score": 0.0 - }, - { - "name": "Mazanderani", - "bcp_47": "mzn", - "population": 4246165, - "score": 0.0 - }, - { - "name": "Gilaki", - "bcp_47": "glk", - "population": 3906472, - "score": 0.0 - }, - { - "name": "Georgian", - "bcp_47": "ka", - "population": 60296, - "score": 0.0 - }, - { - "name": "Southern Kurdish", - "bcp_47": "sdh", - "population": 3142162, - "score": 0.0 - }, - { - "name": "Western Balochi", - "bcp_47": "bgn", - "population": 475570, - "score": 0.0 - }, - { - "name": "Northern Luri", - "bcp_47": "lrc", - "population": 1783389, - "score": 0.0 - }, - { - "name": "Domari", - "bcp_47": "rmt", - "population": 1613543, - "score": 0.0 - }, - { - "name": "Bakhtiari", - "bcp_47": "bqi", - "population": 1188926, - "score": 0.0 - }, - { - "name": "Southern Luri", - "bcp_47": "luz", - "population": 1019080, - "score": 0.0 - }, - { - "name": "Parsi-Dari", - "bcp_47": "prd", - "population": 424616, - "score": 0.0 - }, - { - "name": "Laki", - "bcp_47": "lki", - "population": 645417, - "score": 0.0 - }, - { - "name": "Zoroastrian Dari", - "bcp_47": "gbz", - "population": 7983, - "score": 0.0 - } - ] - }, - "KM": { - "score": 0.27709828190644586, - "languages": [ - { - "name": "Arabic", - "bcp_47": "ar", - "population": 558545, - "score": 0.42 - }, - { - "name": "French", - "bcp_47": "fr", - "population": 473917, - "score": 0.46 - }, - { - "name": "Ngazidja Comorian", - "bcp_47": "zdj", - "population": 313124, - "score": 0.0 - }, - { - "name": "Ndzwani Comorian", - "bcp_47": "wni", - "population": 287736, - "score": 0.0 - } - ] - }, - "KW": { - "score": 0.42, - "languages": [ - { - "name": "Arabic", - "bcp_47": "ar", - "population": 2993710, - "score": 0.42 - } - ] - }, - "LY": { - "score": 0.42, - "languages": [ - { - "name": "Arabic", - "bcp_47": "ar", - "population": 5099000, - "score": 0.42 - } - ] - }, - "ML": { - "score": 0.17298209200310574, - "languages": [ - { - "name": "Arabic", - "bcp_47": "ar", - "population": 175981, - "score": 0.42 - }, - { - "name": "French", - "bcp_47": "fr", - "population": 8994564, - "score": 0.46 - }, - { - "name": "Bambara", - "bcp_47": "bm", - "population": 9385632, - "score": 0.0 - }, - { - "name": "Tamashek", - "bcp_47": "tmh", - "population": 410621, - "score": 0.0 - }, - { - "name": "Maasina Fulfulde", - "bcp_47": "ffm", - "population": 1505612, - "score": 0.0 - }, - { - "name": "Soninke", - "bcp_47": "snk", - "population": 1153651, - "score": 0.0 - }, - { - "name": "Kita Maninkakan", - "bcp_47": "mwk", - "population": 977670, - "score": 0.0 - }, - { - "name": "Koyraboro Senni", - "bcp_47": "ses", - "population": 664816, - "score": 0.0 - }, - { - "name": "Koyra Chiini", - "bcp_47": "khq", - "population": 332408, - "score": 0.0 - }, - { - "name": "Tomo Kan Dogon", - "bcp_47": "dtm", - "population": 215087, - "score": 0.0 - }, - { - "name": "Xaasongaxango", - "bcp_47": "kao", - "population": 195534, - "score": 0.0 - }, - { - "name": "Bomu", - "bcp_47": "bmq", - "population": 168159, - "score": 0.0 - }, - { - "name": "Jenaama Bozo", - "bcp_47": "bze", - "population": 166204, - "score": 0.0 - } - ] - }, - "MR": { - "score": 0.4031496171525996, - "languages": [ - { - "name": "Arabic", - "bcp_47": "ar", - "population": 3404658, - "score": 0.42 - }, - { - "name": "French", - "bcp_47": "fr", - "population": 680932, - "score": 0.46 - }, - { - "name": "Wolof", - "bcp_47": "wo", - "population": 10014, - "score": 0.0 - }, - { - "name": "Fula", - "bcp_47": "ff", - "population": 228312, - "score": 0.0 - } - ] - }, - "NE": { - "score": 0.13395381465163778, - "languages": [ - { - "name": "Arabic", - "bcp_47": "ar", - "population": 47822, - "score": 0.42 - }, - { - "name": "French", - "bcp_47": "fr", - "population": 6603996, - "score": 0.46 - }, - { - "name": "Hausa", - "bcp_47": "ha", - "population": 9336684, - "score": 0.0 - }, - { - "name": "Fula", - "bcp_47": "ff", - "population": 0, - "score": 0.0 - }, - { - "name": "Zarma", - "bcp_47": "dje", - "population": 3871308, - "score": 0.0 - }, - { - "name": "Tamashek", - "bcp_47": "tmh", - "population": 1366344, - "score": 0.0 - }, - { - "name": "Central-Eastern Niger Fulfulde", - "bcp_47": "fuq", - "population": 1594068, - "score": 0.0 - }, - { - "name": "Tasawaq", - "bcp_47": "twq", - "population": 7970, - "score": 0.0 - } - ] - }, - "OM": { - "score": 0.3961930102252659, - "languages": [ - { - "name": "Arabic", - "bcp_47": "ar", - "population": 3778520, - "score": 0.42 - }, - { - "name": "Persian", - "bcp_47": "fa", - "population": 43849, - "score": 0.41 - }, - { - "name": "Baluchi", - "bcp_47": "bal", - "population": 228577, - "score": 0.0 - } - ] - }, - "PS": { - "score": 0.22459893546675047, - "languages": [ - { - "name": "Arabic", - "bcp_47": "ar", - "population": 4818260, - "score": 0.42 - }, - { - "name": "North Levantine Arabic", - "bcp_47": "apc", - "population": 4191886, - "score": 0.0 - } - ] - }, - "QA": { - "score": 0.41777205848450016, - "languages": [ - { - "name": "Arabic", - "bcp_47": "ar", - "population": 2175311, - "score": 0.42 - }, - { - "name": "Persian", - "bcp_47": "fa", - "population": 268859, - "score": 0.41 - }, - { - "name": "Malayalam", - "bcp_47": "ml", - "population": 6599, - "score": 0.0 - } - ] - }, - "SA": { - "score": 0.4077669902912621, - "languages": [ - { - "name": "Arabic", - "bcp_47": "ar", - "population": 34173500, - "score": 0.42 - }, - { - "name": "Najdi Arabic", - "bcp_47": "ars", - "population": 1025205, - "score": 0.0 - } - ] - }, - "SO": { - "score": 0.1326691120161243, - "languages": [ - { - "name": "Arabic", - "bcp_47": "ar", - "population": 3997414, - "score": 0.42 - }, - { - "name": "Swahili", - "bcp_47": "sw", - "population": 235142, - "score": 0.45 - }, - { - "name": "Oromo", - "bcp_47": "om", - "population": 49380, - "score": 0.0 - }, - { - "name": "Somali", - "bcp_47": "so", - "population": 9170538, - "score": 0.0 - } - ] - }, - "SY": { - "score": 0.20086954810836308, - "languages": [ - { - "name": "Arabic", - "bcp_47": "ar", - "population": 15518720, - "score": 0.42 - }, - { - "name": "French", - "bcp_47": "fr", - "population": 1144506, - "score": 0.46 - }, - { - "name": "North Levantine Arabic", - "bcp_47": "apc", - "population": 16488640, - "score": 0.0 - }, - { - "name": "Kurdish", - "bcp_47": "ku", - "population": 1551872, - "score": 0.0 - }, - { - "name": "Armenian", - "bcp_47": "hy", - "population": 349171, - "score": 0.0 - }, - { - "name": "Syriac", - "bcp_47": "syr", - "population": 16295, - "score": 0.0 - } - ] - }, - "TD": { - "score": 0.4441860465116279, - "languages": [ - { - "name": "Arabic", - "bcp_47": "ar", - "population": 2869158, - "score": 0.42 - }, - { - "name": "French", - "bcp_47": "fr", - "population": 4388124, - "score": 0.46 - } - ] - }, - "TJ": { - "score": 0.05075244729560809, - "languages": [ - { - "name": "Arabic", - "bcp_47": "ar", - "population": 976, - "score": 0.42 - }, - { - "name": "Russian", - "bcp_47": "ru", - "population": 1064840, - "score": 0.45 - }, - { - "name": "Persian", - "bcp_47": "fa", - "population": 69215, - "score": 0.41 - }, - { - "name": "Tajik", - "bcp_47": "tg", - "population": 8873670, - "score": 0.0 - } - ] - }, - "TN": { - "score": 0.28283464566929134, - "languages": [ - { - "name": "Arabic", - "bcp_47": "ar", - "population": 10549080, - "score": 0.42 - }, - { - "name": "French", - "bcp_47": "fr", - "population": 8673688, - "score": 0.46 - }, - { - "name": "Tunisian Arabic", - "bcp_47": "aeb", - "population": 10549080, - "score": 0.0 - } - ] - }, - "BF": { - "score": 0.1076595744680851, - "languages": [ - { - "name": "French", - "bcp_47": "fr", - "population": 4583788, - "score": 0.46 - }, - { - "name": "Mossi", - "bcp_47": "mos", - "population": 8334160, - "score": 0.0 - }, - { - "name": "Fula", - "bcp_47": "ff", - "population": 0, - "score": 0.0 - }, - { - "name": "Dyula", - "bcp_47": "dyu", - "population": 6667328, - "score": 0.0 - } - ] - }, - "BJ": { - "score": 0.24029850746268658, - "languages": [ - { - "name": "French", - "bcp_47": "fr", - "population": 4502610, - "score": 0.46 - }, - { - "name": "Yoruba", - "bcp_47": "yo", - "population": 861928, - "score": 0.0 - }, - { - "name": "Fon", - "bcp_47": "fon", - "population": 3216150, - "score": 0.0 - }, - { - "name": "Anii", - "bcp_47": "blo", - "population": 38594, - "score": 0.0 - } - ] - }, - "BL": { - "score": 0.46, - "languages": [ - { - "name": "French", - "bcp_47": "fr", - "population": 6837, - "score": 0.46 - } - ] - }, - "CD": { - "score": 0.34013185580025246, - "languages": [ - { - "name": "French", - "bcp_47": "fr", - "population": 3867640, - "score": 0.46 - }, - { - "name": "Swahili", - "bcp_47": "sw", - "population": 50890000, - "score": 0.45 - }, - { - "name": "Kinyarwanda", - "bcp_47": "rw", - "population": 386764, - "score": 0.0 - }, - { - "name": "Luba-Lulua", - "bcp_47": "lua", - "population": 9770880, - "score": 0.0 - }, - { - "name": "Lingala", - "bcp_47": "ln", - "population": 3155180, - "score": 0.0 - }, - { - "name": "Luba-Katanga", - "bcp_47": "lu", - "population": 2340940, - "score": 0.0 - }, - { - "name": "Kongo", - "bcp_47": "kg", - "population": 1526700, - "score": 0.0 - }, - { - "name": "Mongo", - "bcp_47": "lol", - "population": 620858, - "score": 0.0 - } - ] - }, - "CF": { - "score": 0.22943811316779433, - "languages": [ - { - "name": "French", - "bcp_47": "fr", - "population": 2935521, - "score": 0.46 - }, - { - "name": "Lingala", - "bcp_47": "ln", - "population": 14378, - "score": 0.0 - }, - { - "name": "Sango", - "bcp_47": "sg", - "population": 2935521, - "score": 0.0 - } - ] - }, - "CG": { - "score": 0.4472221914876915, - "languages": [ - { - "name": "French", - "bcp_47": "fr", - "population": 4446179, - "score": 0.46 - }, - { - "name": "Lingala", - "bcp_47": "ln", - "population": 127034, - "score": 0.0 - } - ] - }, - "CI": { - "score": 0.32809315344736595, - "languages": [ - { - "name": "French", - "bcp_47": "fr", - "population": 13465739, - "score": 0.46 - }, - { - "name": "Baoulé", - "bcp_47": "bci", - "population": 3022921, - "score": 0.0 - }, - { - "name": "Cebaara Senoufo", - "bcp_47": "sef", - "population": 1181687, - "score": 0.0 - }, - { - "name": "Dan", - "bcp_47": "dnj", - "population": 1099244, - "score": 0.0 - }, - { - "name": "Koro", - "bcp_47": "kfo", - "population": 63207, - "score": 0.0 - }, - { - "name": "Koro Wachi", - "bcp_47": "bqv", - "population": 46718, - "score": 0.0 - } - ] - }, - "GA": { - "score": 0.4024999642024461, - "languages": [ - { - "name": "French", - "bcp_47": "fr", - "population": 1405473, - "score": 0.46 - }, - { - "name": "Punu", - "bcp_47": "puu", - "population": 200782, - "score": 0.0 - } - ] - }, - "GN": { - "score": 0.13640082022253552, - "languages": [ - { - "name": "French", - "bcp_47": "fr", - "population": 3632946, - "score": 0.46 - }, - { - "name": "Fula", - "bcp_47": "ff", - "population": 3257124, - "score": 0.0 - }, - { - "name": "Mandingo", - "bcp_47": "man", - "population": 2881302, - "score": 0.0 - }, - { - "name": "Susu", - "bcp_47": "sus", - "population": 1378014, - "score": 0.0 - }, - { - "name": "Kpelle", - "bcp_47": "kpe", - "population": 476041, - "score": 0.0 - }, - { - "name": "N’Ko", - "bcp_47": "nqo", - "population": 626370, - "score": 0.0 - } - ] - }, - "GP": { - "score": 0.46, - "languages": [ - { - "name": "French", - "bcp_47": "fr", - "population": 407498, - "score": 0.46 - } - ] - }, - "HT": { - "score": 0.025227556257943377, - "languages": [ - { - "name": "French", - "bcp_47": "fr", - "population": 520187, - "score": 0.46 - }, - { - "name": "Haitian Creole", - "bcp_47": "ht", - "population": 8964918, - "score": 0.0 - } - ] - }, - "MC": { - "score": 0.4600000000000001, - "languages": [ - { - "name": "French", - "bcp_47": "fr", - "population": 38610, - "score": 0.46 - } - ] - }, - "MF": { - "score": 0.46, - "languages": [ - { - "name": "French", - "bcp_47": "fr", - "population": 32556, - "score": 0.46 - } - ] - }, - "MQ": { - "score": 0.4600000000000001, - "languages": [ - { - "name": "French", - "bcp_47": "fr", - "population": 427408, - "score": 0.46 - } - ] - }, - "NC": { - "score": 0.46, - "languages": [ - { - "name": "French", - "bcp_47": "fr", - "population": 278409, - "score": 0.46 - } - ] - }, - "RE": { - "score": 0.26908571814147125, - "languages": [ - { - "name": "French", - "bcp_47": "fr", - "population": 700950, - "score": 0.46 - }, - { - "name": "Tamil", - "bcp_47": "ta", - "population": 118138, - "score": 0.41 - }, - { - "name": "Réunion Creole French", - "bcp_47": "rcf", - "population": 559185, - "score": 0.0 - } - ] - }, - "SN": { - "score": 0.1219628328989918, - "languages": [ - { - "name": "French", - "bcp_47": "fr", - "population": 6137196, - "score": 0.46 - }, - { - "name": "Wolof", - "bcp_47": "wo", - "population": 11015480, - "score": 0.0 - }, - { - "name": "Fula", - "bcp_47": "ff", - "population": 3304644, - "score": 0.0 - }, - { - "name": "Serer", - "bcp_47": "srr", - "population": 1731004, - "score": 0.0 - }, - { - "name": "Jola-Fonyi", - "bcp_47": "dyo", - "population": 409146, - "score": 0.0 - }, - { - "name": "Saafi-Saafi", - "bcp_47": "sav", - "population": 236046, - "score": 0.0 - }, - { - "name": "Mandjak", - "bcp_47": "mfv", - "population": 121170, - "score": 0.0 - }, - { - "name": "Balanta-Ganja", - "bcp_47": "bjt", - "population": 95992, - "score": 0.0 - }, - { - "name": "Mankanya", - "bcp_47": "knf", - "population": 33046, - "score": 0.0 - }, - { - "name": "Noon", - "bcp_47": "snf", - "population": 37767, - "score": 0.0 - }, - { - "name": "Bassari", - "bcp_47": "bsc", - "population": 15264, - "score": 0.0 - }, - { - "name": "Hassaniyya", - "bcp_47": "mey", - "population": 7239, - "score": 0.0 - }, - { - "name": "Ménik", - "bcp_47": "tnr", - "population": 3305, - "score": 0.0 - } - ] - }, - "TF": { - "score": 0.46, - "languages": [ - { - "name": "French", - "bcp_47": "fr", - "population": 140, - "score": 0.46 - } - ] - }, - "TG": { - "score": 0.353178050842427, - "languages": [ - { - "name": "French", - "bcp_47": "fr", - "population": 5251148, - "score": 0.46 - }, - { - "name": "Ewe", - "bcp_47": "ee", - "population": 1463435, - "score": 0.0 - }, - { - "name": "Ifè", - "bcp_47": "ife", - "population": 111910, - "score": 0.0 - }, - { - "name": "Anii", - "bcp_47": "blo", - "population": 12913, - "score": 0.0 - } - ] - }, - "WF": { - "score": 0.16000548496206235, - "languages": [ - { - "name": "French", - "bcp_47": "fr", - "population": 7610, - "score": 0.46 - }, - { - "name": "Wallisian", - "bcp_47": "wls", - "population": 9512, - "score": 0.0 - }, - { - "name": "East Futuna", - "bcp_47": "fud", - "population": 4756, - "score": 0.0 - } - ] - }, - "YT": { - "score": 0.15850059031877214, - "languages": [ - { - "name": "French", - "bcp_47": "fr", - "population": 110580, - "score": 0.46 - }, - { - "name": "Swahili", - "bcp_47": "sw", - "population": 2716, - "score": 0.45 - }, - { - "name": "Comorian", - "bcp_47": "swb", - "population": 170720, - "score": 0.0 - }, - { - "name": "Bushi", - "bcp_47": "buc", - "population": 44620, - "score": 0.0 - } - ] - }, - "AO": { - "score": 0.2478014326653792, - "languages": [ - { - "name": "Portuguese", - "bcp_47": "pt", - "population": 21789941, - "score": 0.45 - }, - { - "name": "Umbundu", - "bcp_47": "umb", - "population": 9431467, - "score": 0.0 - }, - { - "name": "Kimbundu", - "bcp_47": "kmb", - "population": 8130575, - "score": 0.0 - }, - { - "name": "Lingala", - "bcp_47": "ln", - "population": 217899, - "score": 0.0 - } - ] - }, - "CV": { - "score": 0.20479048002332564, - "languages": [ - { - "name": "Portuguese", - "bcp_47": "pt", - "population": 443274, - "score": 0.45 - }, - { - "name": "Kabuverdianu", - "bcp_47": "kea", - "population": 530762, - "score": 0.0 - } - ] - }, - "GW": { - "score": 0.43859551519338624, - "languages": [ - { - "name": "Portuguese", - "bcp_47": "pt", - "population": 1927100, - "score": 0.45 - }, - { - "name": "Fula", - "bcp_47": "ff", - "population": 4, - "score": 0.0 - }, - { - "name": "Mankanya", - "bcp_47": "knf", - "population": 50105, - "score": 0.0 - } - ] - }, - "MZ": { - "score": 0.1480934184335346, - "languages": [ - { - "name": "Portuguese", - "bcp_47": "pt", - "population": 8126514, - "score": 0.45 - }, - { - "name": "Swahili", - "bcp_47": "sw", - "population": 9330, - "score": 0.45 - }, - { - "name": "Nyanja", - "bcp_47": "ny", - "population": 782553, - "score": 0.0 - }, - { - "name": "Zulu", - "bcp_47": "zu", - "population": 1806, - "score": 0.0 - }, - { - "name": "Tsonga", - "bcp_47": "ts", - "population": 2377758, - "score": 0.0 - }, - { - "name": "Makhuwa", - "bcp_47": "vmw", - "population": 3912766, - "score": 0.0 - }, - { - "name": "Ndau", - "bcp_47": "ndc", - "population": 2979722, - "score": 0.0 - }, - { - "name": "Lomwe", - "bcp_47": "ngl", - "population": 2046678, - "score": 0.0 - }, - { - "name": "Sena", - "bcp_47": "seh", - "population": 1384517, - "score": 0.0 - }, - { - "name": "Makhuwa-Meetto", - "bcp_47": "mgh", - "population": 1354419, - "score": 0.0 - }, - { - "name": "Ronga", - "bcp_47": "rng", - "population": 1023339, - "score": 0.0 - }, - { - "name": "Yao", - "bcp_47": "yao", - "population": 722357, - "score": 0.0 - } - ] - }, - "ST": { - "score": 0.45, - "languages": [ - { - "name": "Portuguese", - "bcp_47": "pt", - "population": 179454, - "score": 0.45 - } - ] - }, - "TL": { - "score": 0.225, - "languages": [ - { - "name": "Portuguese", - "bcp_47": "pt", - "population": 816395, - "score": 0.45 - }, - { - "name": "Tetum", - "bcp_47": "tet", - "population": 816395, - "score": 0.0 - } - ] - }, - "BY": { - "score": 0.04821427057437069, - "languages": [ - { - "name": "Russian", - "bcp_47": "ru", - "population": 1137350, - "score": 0.45 - }, - { - "name": "Belarusian", - "bcp_47": "be", - "population": 9477920, - "score": 0.0 - } - ] - }, - "GE": { - "score": 0.03423789210395573, - "languages": [ - { - "name": "Russian", - "bcp_47": "ru", - "population": 359730, - "score": 0.45 - }, - { - "name": "Kurdish", - "bcp_47": "ku", - "population": 35573, - "score": 0.0 - }, - { - "name": "Armenian", - "bcp_47": "hy", - "population": 279790, - "score": 0.0 - }, - { - "name": "Georgian", - "bcp_47": "ka", - "population": 3437420, - "score": 0.0 - }, - { - "name": "Ossetic", - "bcp_47": "os", - "population": 87934, - "score": 0.0 - }, - { - "name": "Mingrelian", - "bcp_47": "xmf", - "population": 439670, - "score": 0.0 - }, - { - "name": "Abkhazian", - "bcp_47": "ab", - "population": 87934, - "score": 0.0 - } - ] - }, - "KG": { - "score": 0.19285714285714287, - "languages": [ - { - "name": "Russian", - "bcp_47": "ru", - "population": 2147364, - "score": 0.45 - }, - { - "name": "Kyrgyz", - "bcp_47": "ky", - "population": 2863152, - "score": 0.0 - } - ] - }, - "MD": { - "score": 0.014563109130777574, - "languages": [ - { - "name": "Russian", - "bcp_47": "ru", - "population": 100935, - "score": 0.45 - }, - { - "name": "Ukrainian", - "bcp_47": "uk", - "population": 471030, - "score": 0.0 - }, - { - "name": "Romanian", - "bcp_47": "ro", - "population": 2119635, - "score": 0.0 - }, - { - "name": "Bulgarian", - "bcp_47": "bg", - "population": 316263, - "score": 0.0 - }, - { - "name": "Gagauz", - "bcp_47": "gag", - "population": 111028, - "score": 0.0 - } - ] - }, - "RU": { - "score": 0.4065329789745318, - "languages": [ - { - "name": "Russian", - "bcp_47": "ru", - "population": 133218680, - "score": 0.45 - }, - { - "name": "Azerbaijani", - "bcp_47": "az", - "population": 131801, - "score": 0.0 - }, - { - "name": "Serbian", - "bcp_47": "sr", - "population": 4960, - "score": 0.0 - }, - { - "name": "Mongolian", - "bcp_47": "mn", - "population": 2126, - "score": 0.0 - }, - { - "name": "Finnish", - "bcp_47": "fi", - "population": 17007, - "score": 0.0 - }, - { - "name": "Armenian", - "bcp_47": "hy", - "population": 1190465, - "score": 0.0 - }, - { - "name": "Tatar", - "bcp_47": "tt", - "population": 1984108, - "score": 0.0 - }, - { - "name": "Chuvash", - "bcp_47": "cv", - "population": 1842386, - "score": 0.0 - }, - { - "name": "Bashkir", - "bcp_47": "ba", - "population": 1842386, - "score": 0.0 - }, - { - "name": "Kabardian", - "bcp_47": "kbd", - "population": 439338, - "score": 0.0 - }, - { - "name": "Chechen", - "bcp_47": "ce", - "population": 935365, - "score": 0.0 - }, - { - "name": "Avaric", - "bcp_47": "av", - "population": 552716, - "score": 0.0 - }, - { - "name": "Ossetic", - "bcp_47": "os", - "population": 453510, - "score": 0.0 - }, - { - "name": "Udmurt", - "bcp_47": "udm", - "population": 538544, - "score": 0.0 - }, - { - "name": "Mari", - "bcp_47": "chm", - "population": 524371, - "score": 0.0 - }, - { - "name": "Yakut", - "bcp_47": "sah", - "population": 453510, - "score": 0.0 - }, - { - "name": "Adyghe", - "bcp_47": "ady", - "population": 124715, - "score": 0.0 - }, - { - "name": "Erzya", - "bcp_47": "myv", - "population": 439338, - "score": 0.0 - }, - { - "name": "Dargwa", - "bcp_47": "dar", - "population": 368477, - "score": 0.0 - }, - { - "name": "Buriat", - "bcp_47": "bua", - "population": 311788, - "score": 0.0 - }, - { - "name": "Moksha", - "bcp_47": "mdf", - "population": 297616, - "score": 0.0 - }, - { - "name": "Kumyk", - "bcp_47": "kum", - "population": 283444, - "score": 0.0 - }, - { - "name": "Lezghian", - "bcp_47": "lez", - "population": 255100, - "score": 0.0 - }, - { - "name": "Komi", - "bcp_47": "kv", - "population": 255100, - "score": 0.0 - }, - { - "name": "Karachay-Balkar", - "bcp_47": "krc", - "population": 240927, - "score": 0.0 - }, - { - "name": "Ingush", - "bcp_47": "inh", - "population": 226755, - "score": 0.0 - }, - { - "name": "Tuvinian", - "bcp_47": "tyv", - "population": 184239, - "score": 0.0 - }, - { - "name": "Karelian", - "bcp_47": "krl", - "population": 116212, - "score": 0.0 - }, - { - "name": "Lak", - "bcp_47": "lbe", - "population": 110543, - "score": 0.0 - }, - { - "name": "Komi-Permyak", - "bcp_47": "koi", - "population": 63775, - "score": 0.0 - }, - { - "name": "Western Mari", - "bcp_47": "mrj", - "population": 29762, - "score": 0.0 - }, - { - "name": "Southern Altai", - "bcp_47": "alt", - "population": 19841, - "score": 0.0 - }, - { - "name": "Veps", - "bcp_47": "vep", - "population": 3543, - "score": 0.0 - }, - { - "name": "Ingrian", - "bcp_47": "izh", - "population": 142, - "score": 0.0 - }, - { - "name": "Votic", - "bcp_47": "vot", - "population": 0, - "score": 0.0 - }, - { - "name": "Church Slavic", - "bcp_47": "cu", - "population": 0, - "score": 0.0 - } - ] - }, - "SJ": { - "score": 0.20059435364041606, - "languages": [ - { - "name": "Russian", - "bcp_47": "ru", - "population": 1200, - "score": 0.45 - }, - { - "name": "Norwegian Bokmål", - "bcp_47": "nb", - "population": 1492, - "score": 0.0 - } - ] - }, - "TM": { - "score": 0.059080984625687366, - "languages": [ - { - "name": "Russian", - "bcp_47": "ru", - "population": 663436, - "score": 0.45 - }, - { - "name": "Uzbek", - "bcp_47": "uz", - "population": 497577, - "score": 0.0 - }, - { - "name": "Turkmen", - "bcp_47": "tk", - "population": 3870041, - "score": 0.0 - }, - { - "name": "Kurdish", - "bcp_47": "ku", - "population": 22115, - "score": 0.0 - } - ] - }, - "UA": { - "score": 0.17534632621240526, - "languages": [ - { - "name": "Russian", - "bcp_47": "ru", - "population": 20204534, - "score": 0.45 - }, - { - "name": "Turkish", - "bcp_47": "tr", - "population": 184476, - "score": 0.44 - }, - { - "name": "Polish", - "bcp_47": "pl", - "population": 1054150, - "score": 0.0 - }, - { - "name": "Ukrainian", - "bcp_47": "uk", - "population": 28549885, - "score": 0.0 - }, - { - "name": "Romanian", - "bcp_47": "ro", - "population": 228399, - "score": 0.0 - }, - { - "name": "Hungarian", - "bcp_47": "hu", - "population": 162515, - "score": 0.0 - }, - { - "name": "Greek", - "bcp_47": "el", - "population": 7028, - "score": 0.0 - }, - { - "name": "Belarusian", - "bcp_47": "be", - "population": 364560, - "score": 0.0 - }, - { - "name": "Bulgarian", - "bcp_47": "bg", - "population": 215222, - "score": 0.0 - }, - { - "name": "Yiddish", - "bcp_47": "yi", - "population": 570998, - "score": 0.0 - }, - { - "name": "Rusyn", - "bcp_47": "rue", - "population": 527075, - "score": 0.0 - }, - { - "name": "Crimean Tatar", - "bcp_47": "crh", - "population": 245968, - "score": 0.0 - } - ] - }, - "UZ": { - "score": 0.05701615696541229, - "languages": [ - { - "name": "Russian", - "bcp_47": "ru", - "population": 4279156, - "score": 0.45 - }, - { - "name": "Turkish", - "bcp_47": "tr", - "population": 232297, - "score": 0.44 - }, - { - "name": "Uzbek", - "bcp_47": "uz", - "population": 30565400, - "score": 0.0 - }, - { - "name": "Kara-Kalpak", - "bcp_47": "kaa", - "population": 489046, - "score": 0.0 - } - ] - }, - "LI": { - "score": 0.26022294592577516, - "languages": [ - { - "name": "German", - "bcp_47": "de", - "population": 39137, - "score": 0.49 - }, - { - "name": "Swiss German", - "bcp_47": "gsw", - "population": 33266, - "score": 0.0 - }, - { - "name": "Walser", - "bcp_47": "wae", - "population": 1292, - "score": 0.0 - } - ] - }, - "JP": { - "score": 0.4560515108353953, - "languages": [ - { - "name": "Japanese", - "bcp_47": "ja", - "population": 119231650, - "score": 0.46 - }, - { - "name": "Korean", - "bcp_47": "ko", - "population": 652636, - "score": 0.41 - }, - { - "name": "Central Okinawan", - "bcp_47": "ryu", - "population": 966404, - "score": 0.0 - } - ] - }, - "AF": { - "score": 0.19133182400153392, - "languages": [ - { - "name": "Persian", - "bcp_47": "fa", - "population": 18321900, - "score": 0.41 - }, - { - "name": "Pashto", - "bcp_47": "ps", - "population": 15756834, - "score": 0.0 - }, - { - "name": "Uzbek", - "bcp_47": "uz", - "population": 1722259, - "score": 0.0 - }, - { - "name": "Kazakh", - "bcp_47": "kk", - "population": 2015, - "score": 0.0 - }, - { - "name": "Uyghur", - "bcp_47": "ug", - "population": 3005, - "score": 0.0 - }, - { - "name": "Turkmen", - "bcp_47": "tk", - "population": 622945, - "score": 0.0 - }, - { - "name": "Hazaragi", - "bcp_47": "haz", - "population": 2161984, - "score": 0.0 - }, - { - "name": "Western Balochi", - "bcp_47": "bgn", - "population": 230856, - "score": 0.0 - }, - { - "name": "Parsi-Dari", - "bcp_47": "prd", - "population": 439726, - "score": 0.0 - } - ] - }, - "MK": { - "score": 0.016125668065966572, - "languages": [ - { - "name": "Turkish", - "bcp_47": "tr", - "population": 74409, - "score": 0.44 - }, - { - "name": "Albanian", - "bcp_47": "sq", - "population": 531492, - "score": 0.0 - }, - { - "name": "Macedonian", - "bcp_47": "mk", - "population": 1424400, - "score": 0.0 - } - ] - }, - "KP": { - "score": 0.41, - "languages": [ - { - "name": "Korean", - "bcp_47": "ko", - "population": 22566280, - "score": 0.41 - } - ] - }, - "KR": { - "score": 0.41, - "languages": [ - { - "name": "Korean", - "bcp_47": "ko", - "population": 51835100, - "score": 0.41 - } - ] - }, - "SM": { - "score": 0.4654018916371436, - "languages": [ - { - "name": "Italian", - "bcp_47": "it", - "population": 30466, - "score": 0.47 - }, - { - "name": "Esperanto", - "bcp_47": "eo", - "population": 301, - "score": 0.0 - } - ] - }, - "VA": { - "score": 0.235, - "languages": [ - { - "name": "Italian", - "bcp_47": "it", - "population": 820, - "score": 0.47 - }, - { - "name": "Latin", - "bcp_47": "la", - "population": 820, - "score": 0.0 - } - ] - }, - "MM": { - "score": 0.0, - "languages": [ - { - "name": "Burmese", - "bcp_47": "my", - "population": 36217664, - "score": 0.0 - }, - { - "name": "Shan", - "bcp_47": "shn", - "population": 3621766, - "score": 0.0 - }, - { - "name": "Rohingya", - "bcp_47": "rhg", - "population": 962032, - "score": 0.0 - }, - { - "name": "Mon", - "bcp_47": "mnw", - "population": 848852, - "score": 0.0 - }, - { - "name": "Kachin", - "bcp_47": "kac", - "population": 962032, - "score": 0.0 - }, - { - "name": "Hmong Njua", - "bcp_47": "hnj", - "population": 12450, - "score": 0.0 - }, - { - "name": "Khamti", - "bcp_47": "kht", - "population": 4244, - "score": 0.0 - } - ] - }, - "AM": { - "score": 0.0, - "languages": [ - { - "name": "Azerbaijani", - "bcp_47": "az", - "population": 0, - "score": 0.0 - }, - { - "name": "Kurdish", - "bcp_47": "ku", - "population": 99704, - "score": 0.0 - }, - { - "name": "Armenian", - "bcp_47": "hy", - "population": 2960894, - "score": 0.0 - } - ] - }, - "AZ": { - "score": 0.0, - "languages": [ - { - "name": "Azerbaijani", - "bcp_47": "az", - "population": 10093536, - "score": 0.0 - }, - { - "name": "Kurdish", - "bcp_47": "ku", - "population": 24494, - "score": 0.0 - }, - { - "name": "Talysh", - "bcp_47": "tly", - "population": 1000168, - "score": 0.0 - }, - { - "name": "Muslim Tat", - "bcp_47": "ttt", - "population": 22453, - "score": 0.0 - }, - { - "name": "Tsakhur", - "bcp_47": "tkr", - "population": 16329, - "score": 0.0 - } - ] - }, - "BQ": { - "score": 0.0, - "languages": [ - { - "name": "Dutch", - "bcp_47": "nl", - "population": 1600, - "score": 0.0 - }, - { - "name": "Papiamento", - "bcp_47": "pap", - "population": 16200, - "score": 0.0 - } - ] - }, - "RS": { - "score": 0.0, - "languages": [ - { - "name": "Ukrainian", - "bcp_47": "uk", - "population": 0, - "score": 0.0 - }, - { - "name": "Romanian", - "bcp_47": "ro", - "population": 147256, - "score": 0.0 - }, - { - "name": "Serbian", - "bcp_47": "sr", - "population": 13884096, - "score": 0.0 - }, - { - "name": "Hungarian", - "bcp_47": "hu", - "population": 336584, - "score": 0.0 - }, - { - "name": "Croatian", - "bcp_47": "hr", - "population": 65213, - "score": 0.0 - }, - { - "name": "Albanian", - "bcp_47": "sq", - "population": 1332312, - "score": 0.0 - }, - { - "name": "Slovak", - "bcp_47": "sk", - "population": 59603, - "score": 0.0 - } - ] - }, - "ME": { - "score": 0.0, - "languages": [ - { - "name": "Serbian", - "bcp_47": "sr", - "population": 640352, - "score": 0.0 - }, - { - "name": "Albanian", - "bcp_47": "sq", - "population": 48179, - "score": 0.0 - } - ] - }, - "XK": { - "score": 0.0, - "languages": [ - { - "name": "Serbian", - "bcp_47": "sr", - "population": 193276, - "score": 0.0 - }, - { - "name": "Albanian", - "bcp_47": "sq", - "population": 1778148, - "score": 0.0 - }, - { - "name": "Gheg Albanian", - "bcp_47": "aln", - "population": 1430250, - "score": 0.0 - } - ] - }, - "KH": { - "score": 0.0, - "languages": [ - { - "name": "Khmer", - "bcp_47": "km", - "population": 15065030, - "score": 0.0 - }, - { - "name": "Kuy", - "bcp_47": "kdt", - "population": 18620, - "score": 0.0 - }, - { - "name": "Western Cham", - "bcp_47": "cja", - "population": 270832, - "score": 0.0 - } - ] - }, - "AX": { - "score": 0.0, - "languages": [ - { - "name": "Swedish", - "bcp_47": "sv", - "population": 25938, - "score": 0.0 - } - ] - }, - "AL": { - "score": 0.0, - "languages": [ - { - "name": "Greek", - "bcp_47": "el", - "population": 58417, - "score": 0.0 - }, - { - "name": "Albanian", - "bcp_47": "sq", - "population": 3074580, - "score": 0.0 - }, - { - "name": "Macedonian", - "bcp_47": "mk", - "population": 14451, - "score": 0.0 - } - ] - }, - "GL": { - "score": 0.0, - "languages": [ - { - "name": "Danish", - "bcp_47": "da", - "population": 8066, - "score": 0.0 - }, - { - "name": "Kalaallisut", - "bcp_47": "kl", - "population": 48397, - "score": 0.0 - } - ] - }, - "IS": { - "score": 0.0, - "languages": [ - { - "name": "Danish", - "bcp_47": "da", - "population": 2245, - "score": 0.0 - }, - { - "name": "Icelandic", - "bcp_47": "is", - "population": 350734, - "score": 0.0 - } - ] - }, - "NO": { - "score": 0.0, - "languages": [ - { - "name": "Norwegian Bokmål", - "bcp_47": "nb", - "population": 5467440, - "score": 0.0 - }, - { - "name": "Norwegian", - "bcp_47": "no", - "population": 5467440, - "score": 0.0 - }, - { - "name": "Norwegian Nynorsk", - "bcp_47": "nn", - "population": 1366860, - "score": 0.0 - }, - { - "name": "Northern Sami", - "bcp_47": "se", - "population": 15856, - "score": 0.0 - } - ] - }, - "LA": { - "score": 0.0, - "languages": [ - { - "name": "Lao", - "bcp_47": "lo", - "population": 5138706, - "score": 0.0 - }, - { - "name": "Hmong Njua", - "bcp_47": "hnj", - "population": 223422, - "score": 0.0 - }, - { - "name": "Khmu", - "bcp_47": "kjg", - "population": 431949, - "score": 0.0 - }, - { - "name": "Kuy", - "bcp_47": "kdt", - "population": 71495, - "score": 0.0 - } - ] - }, - "FO": { - "score": 0.0, - "languages": [ - { - "name": "Faroese", - "bcp_47": "fo", - "population": 49047, - "score": 0.0 - } - ] - } - } -} \ No newline at end of file