diff --git a/data/Abkhaz-Adyghe.json b/data/Abkhaz-Adyghe.json index fa2edb3b4d2d733a1117c7ea9f63440223b89bac..f2915490ace18360d607d77bb065b49ea49c9b10 100644 --- a/data/Abkhaz-Adyghe.json +++ b/data/Abkhaz-Adyghe.json @@ -1,18 +1,22 @@ { "name": "Abkhaz-Adyghe", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Abkhaz-Abazin", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Abkhaz", + "depth": 2, "iso_1_code": "ab", "iso_3_code": "abk", "children": [], + "family": "Abkhaz-Adyghe", "tokenizers": {}, "node_i": "2", "native_tokenizers": [], @@ -22,9 +26,11 @@ }, { "name": "Abaza", + "depth": 2, "iso_1_code": null, "iso_3_code": "abq", "children": [], + "family": "Abkhaz-Adyghe", "tokenizers": {}, "node_i": "3", "native_tokenizers": [], @@ -33,6 +39,7 @@ ] } ], + "family": "Abkhaz-Adyghe", "tokenizers": {}, "node_i": "1", "native_tokenizers": [], @@ -40,14 +47,17 @@ }, { "name": "Circassian", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Adyghe", + "depth": 2, "iso_1_code": null, "iso_3_code": "ady", "children": [], + "family": "Abkhaz-Adyghe", "tokenizers": {}, "node_i": "5", "native_tokenizers": [], @@ -57,9 +67,11 @@ }, { "name": "Kabardian", + "depth": 2, "iso_1_code": null, "iso_3_code": "kbd", "children": [], + "family": "Abkhaz-Adyghe", "tokenizers": {}, "node_i": "6", "native_tokenizers": [], @@ -68,6 +80,7 @@ ] } ], + "family": "Abkhaz-Adyghe", "tokenizers": {}, "node_i": "4", "native_tokenizers": [], @@ -75,26 +88,31 @@ }, { "name": "Ubyx", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ubykh", + "depth": 2, "iso_1_code": null, "iso_3_code": "uby", "children": [], + "family": "Abkhaz-Adyghe", "tokenizers": {}, "node_i": "8", "native_tokenizers": [], "scripts": [] } ], + "family": "Abkhaz-Adyghe", "tokenizers": {}, "node_i": "7", "native_tokenizers": [], "scripts": [] } ], + "family": "Abkhaz-Adyghe", "tokenizers": {}, "node_i": "0", "native_tokenizers": [], diff --git a/data/Afro-Asiatic.json b/data/Afro-Asiatic.json index d2acc0027fa08c8f36583faa27f421e6f1b4cfa2..00e95b1576b595b271f49d2fd6f17d31c482c321 100644 --- a/data/Afro-Asiatic.json +++ b/data/Afro-Asiatic.json @@ -1,18 +1,22 @@ { "name": "Afro-Asiatic", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Berber", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Guanche", + "depth": 2, "iso_1_code": null, "iso_3_code": "gnc", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "11", "native_tokenizers": [], @@ -20,19 +24,23 @@ }, { "name": "Eastern", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Awjila-Sokna", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Awjilah", + "depth": 4, "iso_1_code": null, "iso_3_code": "auj", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "14", "native_tokenizers": [], @@ -40,15 +48,18 @@ }, { "name": "Sawknah", + "depth": 4, "iso_1_code": null, "iso_3_code": "swn", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "15", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "13", "native_tokenizers": [], @@ -56,26 +67,31 @@ }, { "name": "Siwa", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Siwi", + "depth": 4, "iso_1_code": null, "iso_3_code": "siz", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "17", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "16", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "12", "native_tokenizers": [], @@ -83,14 +99,17 @@ }, { "name": "Northern", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chenoua", + "depth": 3, "iso_1_code": null, "iso_3_code": "cnu", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "19", "native_tokenizers": [], @@ -98,14 +117,17 @@ }, { "name": "Atlas", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Judeo-Berber", + "depth": 4, "iso_1_code": null, "iso_3_code": "jbe", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "21", "native_tokenizers": [], @@ -113,18 +135,12 @@ }, { "name": "Tachelhit", + "depth": 4, "iso_1_code": null, "iso_3_code": "shi", "children": [], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "22", "native_tokenizers": [], "scripts": [ @@ -133,9 +149,11 @@ }, { "name": "Tamazight, Central Atlas", + "depth": 4, "iso_1_code": null, "iso_3_code": "tzm", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "23", "native_tokenizers": [], @@ -145,9 +163,11 @@ }, { "name": "Tamazight, Standard Moroccan", + "depth": 4, "iso_1_code": null, "iso_3_code": "zgh", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "24", "native_tokenizers": [], @@ -156,38 +176,26 @@ ] } ], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "20", "native_tokenizers": [], "scripts": [] }, { "name": "Kabyle", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kabyle", + "depth": 4, "iso_1_code": null, "iso_3_code": "kab", "children": [], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "26", "native_tokenizers": [], "scripts": [ @@ -195,34 +203,31 @@ ] } ], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "25", "native_tokenizers": [], "scripts": [] }, { "name": "Zenati", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "East", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ghadam\u00e8s", + "depth": 5, "iso_1_code": null, "iso_3_code": "gha", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "29", "native_tokenizers": [], @@ -230,9 +235,11 @@ }, { "name": "Nafusi", + "depth": 5, "iso_1_code": null, "iso_3_code": "jbn", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "30", "native_tokenizers": [], @@ -240,15 +247,18 @@ }, { "name": "Sened", + "depth": 5, "iso_1_code": null, "iso_3_code": "sds", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "31", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "28", "native_tokenizers": [], @@ -256,20 +266,24 @@ }, { "name": "Ghomara", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ghomara", + "depth": 5, "iso_1_code": null, "iso_3_code": "gho", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "33", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "32", "native_tokenizers": [], @@ -277,14 +291,17 @@ }, { "name": "Mzab-Wargla", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Taznatit", + "depth": 5, "iso_1_code": null, "iso_3_code": "grr", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "35", "native_tokenizers": [], @@ -292,9 +309,11 @@ }, { "name": "Tumzabt", + "depth": 5, "iso_1_code": null, "iso_3_code": "mzb", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "36", "native_tokenizers": [], @@ -302,9 +321,11 @@ }, { "name": "Tagargrent", + "depth": 5, "iso_1_code": null, "iso_3_code": "oua", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "37", "native_tokenizers": [], @@ -312,15 +333,18 @@ }, { "name": "Tamazight, Temacine", + "depth": 5, "iso_1_code": null, "iso_3_code": "tjo", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "38", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "34", "native_tokenizers": [], @@ -328,14 +352,17 @@ }, { "name": "Riff", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tarifit", + "depth": 5, "iso_1_code": null, "iso_3_code": "rif", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "40", "native_tokenizers": [], @@ -343,15 +370,18 @@ }, { "name": "Senhaja Berber", + "depth": 5, "iso_1_code": null, "iso_3_code": "sjs", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "41", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "39", "native_tokenizers": [], @@ -359,20 +389,24 @@ }, { "name": "Shawiya", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tachawit", + "depth": 5, "iso_1_code": null, "iso_3_code": "shy", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "43", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "42", "native_tokenizers": [], @@ -380,69 +414,63 @@ }, { "name": "Tidikelt", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tamazight, Tidikelt", + "depth": 5, "iso_1_code": null, "iso_3_code": "tia", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "45", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "44", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "27", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "18", "native_tokenizers": [], "scripts": [] }, { "name": "Tamasheq", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Northern", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tamahaq, Tahaggart", + "depth": 4, "iso_1_code": null, "iso_3_code": "thv", "children": [], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "48", "native_tokenizers": [], "scripts": [ @@ -450,38 +478,26 @@ ] } ], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "47", "native_tokenizers": [], "scripts": [] }, { "name": "Southern", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tamasheq", + "depth": 4, "iso_1_code": null, "iso_3_code": "taq", "children": [], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "50", "native_tokenizers": [], "scripts": [ @@ -491,9 +507,11 @@ }, { "name": "Tamajeq, Tayart", + "depth": 4, "iso_1_code": null, "iso_3_code": "thz", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "51", "native_tokenizers": [], @@ -501,18 +519,12 @@ }, { "name": "Tamajaq, Tawallammat", + "depth": 4, "iso_1_code": null, "iso_3_code": "ttq", "children": [], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "52", "native_tokenizers": [], "scripts": [ @@ -521,43 +533,32 @@ ] } ], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "49", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "46", "native_tokenizers": [], "scripts": [] }, { "name": "Zenaga", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tetserret", + "depth": 3, "iso_1_code": null, "iso_3_code": "tez", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "54", "native_tokenizers": [], @@ -565,64 +566,67 @@ }, { "name": "Zenaga", + "depth": 3, "iso_1_code": null, "iso_3_code": "zen", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "55", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "53", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "10", "native_tokenizers": [], "scripts": [] }, { "name": "Chadic", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Biu-Mandara", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "A", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "A.1", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Eastern", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Boga", + "depth": 6, "iso_1_code": null, "iso_3_code": "bvw", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "61", "native_tokenizers": [], @@ -630,9 +634,11 @@ }, { "name": "Ga\u2019anda", + "depth": 6, "iso_1_code": null, "iso_3_code": "gqa", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "62", "native_tokenizers": [], @@ -640,15 +646,18 @@ }, { "name": "Hwana", + "depth": 6, "iso_1_code": null, "iso_3_code": "hwo", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "63", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "60", "native_tokenizers": [], @@ -656,14 +665,17 @@ }, { "name": "Western", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Jara", + "depth": 6, "iso_1_code": null, "iso_3_code": "jaf", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "65", "native_tokenizers": [], @@ -671,21 +683,25 @@ }, { "name": "Tera", + "depth": 6, "iso_1_code": null, "iso_3_code": "ttr", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "66", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "64", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "59", "native_tokenizers": [], @@ -693,14 +709,17 @@ }, { "name": "A.2", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nggwahyi", + "depth": 5, "iso_1_code": null, "iso_3_code": "ngx", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "68", "native_tokenizers": [], @@ -708,14 +727,17 @@ }, { "name": "1", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bura-Pabir", + "depth": 6, "iso_1_code": null, "iso_3_code": "bwr", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "70", "native_tokenizers": [], @@ -723,9 +745,11 @@ }, { "name": "Kibaku", + "depth": 6, "iso_1_code": null, "iso_3_code": "ckl", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "71", "native_tokenizers": [], @@ -733,9 +757,11 @@ }, { "name": "Kofa", + "depth": 6, "iso_1_code": null, "iso_3_code": "kso", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "72", "native_tokenizers": [], @@ -743,15 +769,18 @@ }, { "name": "Putai", + "depth": 6, "iso_1_code": null, "iso_3_code": "mfl", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "73", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "69", "native_tokenizers": [], @@ -759,14 +788,17 @@ }, { "name": "2", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nya Huba", + "depth": 6, "iso_1_code": null, "iso_3_code": "hbb", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "75", "native_tokenizers": [], @@ -774,9 +806,11 @@ }, { "name": "Marghi South", + "depth": 6, "iso_1_code": null, "iso_3_code": "mfm", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "76", "native_tokenizers": [], @@ -784,21 +818,25 @@ }, { "name": "Marghi Central", + "depth": 6, "iso_1_code": null, "iso_3_code": "mrt", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "77", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "74", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "67", "native_tokenizers": [], @@ -806,23 +844,18 @@ }, { "name": "A.3", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bana", + "depth": 5, "iso_1_code": null, "iso_3_code": "bcw", "children": [], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "79", "native_tokenizers": [], "scripts": [ @@ -831,9 +864,11 @@ }, { "name": "Kirya-Konzel", + "depth": 5, "iso_1_code": null, "iso_3_code": "fkk", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "80", "native_tokenizers": [], @@ -841,18 +876,12 @@ }, { "name": "Kamwe", + "depth": 5, "iso_1_code": null, "iso_3_code": "hig", "children": [], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "81", "native_tokenizers": [], "scripts": [ @@ -861,9 +890,11 @@ }, { "name": "Hya", + "depth": 5, "iso_1_code": null, "iso_3_code": "hya", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "82", "native_tokenizers": [], @@ -871,18 +902,12 @@ }, { "name": "Psikye", + "depth": 5, "iso_1_code": null, "iso_3_code": "kvj", "children": [], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "83", "native_tokenizers": [], "scripts": [ @@ -890,34 +915,31 @@ ] } ], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "78", "native_tokenizers": [], "scripts": [] }, { "name": "A.4", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Lamang", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Lamang", + "depth": 6, "iso_1_code": null, "iso_3_code": "hia", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "86", "native_tokenizers": [], @@ -925,9 +947,11 @@ }, { "name": "Vemgo-Mabas", + "depth": 6, "iso_1_code": null, "iso_3_code": "vem", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "87", "native_tokenizers": [], @@ -935,18 +959,12 @@ }, { "name": "Hdi", + "depth": 6, "iso_1_code": null, "iso_3_code": "xed", "children": [], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "88", "native_tokenizers": [], "scripts": [ @@ -954,34 +972,31 @@ ] } ], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "85", "native_tokenizers": [], "scripts": [] }, { "name": "Mandara Proper", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Glavda", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Cineni", + "depth": 7, "iso_1_code": null, "iso_3_code": "cie", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "91", "native_tokenizers": [], @@ -989,9 +1004,11 @@ }, { "name": "Dghwede", + "depth": 7, "iso_1_code": null, "iso_3_code": "dgh", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "92", "native_tokenizers": [], @@ -999,9 +1016,11 @@ }, { "name": "Guduf-Gava", + "depth": 7, "iso_1_code": null, "iso_3_code": "gdf", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "93", "native_tokenizers": [], @@ -1009,9 +1028,11 @@ }, { "name": "Glavda", + "depth": 7, "iso_1_code": null, "iso_3_code": "glw", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "94", "native_tokenizers": [], @@ -1019,15 +1040,18 @@ }, { "name": "Gvoko", + "depth": 7, "iso_1_code": null, "iso_3_code": "ngs", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "95", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "90", "native_tokenizers": [], @@ -1035,23 +1059,18 @@ }, { "name": "Mandara", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Wandala", + "depth": 7, "iso_1_code": null, "iso_3_code": "mfi", "children": [], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "97", "native_tokenizers": [], "scripts": [ @@ -1059,38 +1078,26 @@ ] } ], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "96", "native_tokenizers": [], "scripts": [] }, { "name": "Podoko", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Parkwa", + "depth": 7, "iso_1_code": null, "iso_3_code": "pbi", "children": [], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "99", "native_tokenizers": [], "scripts": [ @@ -1098,57 +1105,39 @@ ] } ], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "98", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "89", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "84", "native_tokenizers": [], "scripts": [] }, { "name": "A.5", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Baldemu", + "depth": 5, "iso_1_code": null, "iso_3_code": "bdn", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "101", "native_tokenizers": [], @@ -1156,9 +1145,11 @@ }, { "name": "Cuvok", + "depth": 5, "iso_1_code": null, "iso_3_code": "cuv", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "102", "native_tokenizers": [], @@ -1166,9 +1157,11 @@ }, { "name": "Dugwor", + "depth": 5, "iso_1_code": null, "iso_3_code": "dme", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "103", "native_tokenizers": [], @@ -1176,9 +1169,11 @@ }, { "name": "Giziga, North", + "depth": 5, "iso_1_code": null, "iso_3_code": "gis", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "104", "native_tokenizers": [], @@ -1186,18 +1181,12 @@ }, { "name": "Giziga", + "depth": 5, "iso_1_code": null, "iso_3_code": "giz", "children": [], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "105", "native_tokenizers": [], "scripts": [ @@ -1206,18 +1195,12 @@ }, { "name": "Zulgo-Gemzek", + "depth": 5, "iso_1_code": null, "iso_3_code": "gnd", "children": [], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "106", "native_tokenizers": [], "scripts": [ @@ -1226,18 +1209,12 @@ }, { "name": "Mafa", + "depth": 5, "iso_1_code": null, "iso_3_code": "maf", "children": [], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "107", "native_tokenizers": [], "scripts": [ @@ -1246,18 +1223,12 @@ }, { "name": "Merey", + "depth": 5, "iso_1_code": null, "iso_3_code": "meq", "children": [], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "108", "native_tokenizers": [], "scripts": [ @@ -1266,18 +1237,12 @@ }, { "name": "Matal", + "depth": 5, "iso_1_code": null, "iso_3_code": "mfh", "children": [], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "109", "native_tokenizers": [], "scripts": [ @@ -1286,9 +1251,11 @@ }, { "name": "Mefele", + "depth": 5, "iso_1_code": null, "iso_3_code": "mfj", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "110", "native_tokenizers": [], @@ -1296,18 +1263,12 @@ }, { "name": "Mofu, North", + "depth": 5, "iso_1_code": null, "iso_3_code": "mfk", "children": [], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "111", "native_tokenizers": [], "scripts": [ @@ -1316,18 +1277,12 @@ }, { "name": "Mofu-Gudur", + "depth": 5, "iso_1_code": null, "iso_3_code": "mif", "children": [], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "112", "native_tokenizers": [], "scripts": [ @@ -1336,9 +1291,11 @@ }, { "name": "Vame", + "depth": 5, "iso_1_code": null, "iso_3_code": "mlr", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "113", "native_tokenizers": [], @@ -1346,9 +1303,11 @@ }, { "name": "Moloko", + "depth": 5, "iso_1_code": null, "iso_3_code": "mlw", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "114", "native_tokenizers": [], @@ -1356,18 +1315,12 @@ }, { "name": "Mbuko", + "depth": 5, "iso_1_code": null, "iso_3_code": "mqb", "children": [], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "115", "native_tokenizers": [], "scripts": [ @@ -1376,18 +1329,12 @@ }, { "name": "Muyang", + "depth": 5, "iso_1_code": null, "iso_3_code": "muy", "children": [], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "116", "native_tokenizers": [], "scripts": [ @@ -1396,9 +1343,11 @@ }, { "name": "Mada", + "depth": 5, "iso_1_code": null, "iso_3_code": "mxu", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "117", "native_tokenizers": [], @@ -1406,44 +1355,43 @@ }, { "name": "Wuzlam", + "depth": 5, "iso_1_code": null, "iso_3_code": "udl", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "118", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "100", "native_tokenizers": [], "scripts": [] }, { "name": "A.6", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Sukur", + "depth": 5, "iso_1_code": null, "iso_3_code": "syk", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "120", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "119", "native_tokenizers": [], @@ -1451,14 +1399,17 @@ }, { "name": "A.7", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Buwal", + "depth": 5, "iso_1_code": null, "iso_3_code": "bhs", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "122", "native_tokenizers": [], @@ -1466,18 +1417,12 @@ }, { "name": "Daba", + "depth": 5, "iso_1_code": null, "iso_3_code": "dbq", "children": [], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "123", "native_tokenizers": [], "scripts": [ @@ -1486,9 +1431,11 @@ }, { "name": "Mazagway-Hidi", + "depth": 5, "iso_1_code": null, "iso_3_code": "dkx", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "124", "native_tokenizers": [], @@ -1496,9 +1443,11 @@ }, { "name": "Gavar", + "depth": 5, "iso_1_code": null, "iso_3_code": "gou", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "125", "native_tokenizers": [], @@ -1506,9 +1455,11 @@ }, { "name": "Mina", + "depth": 5, "iso_1_code": null, "iso_3_code": "hna", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "126", "native_tokenizers": [], @@ -1516,38 +1467,36 @@ }, { "name": "Mbudum", + "depth": 5, "iso_1_code": null, "iso_3_code": "xmd", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "127", "native_tokenizers": [], - "scripts": [] - } - ], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" + "scripts": [] } - }, + ], + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "121", "native_tokenizers": [], "scripts": [] }, { "name": "A.8", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bacama", + "depth": 5, "iso_1_code": null, "iso_3_code": "bcy", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "129", "native_tokenizers": [], @@ -1555,9 +1504,11 @@ }, { "name": "Bata", + "depth": 5, "iso_1_code": null, "iso_3_code": "bta", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "130", "native_tokenizers": [], @@ -1565,9 +1516,11 @@ }, { "name": "Fali Muchella", + "depth": 5, "iso_1_code": null, "iso_3_code": "fli", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "131", "native_tokenizers": [], @@ -1575,18 +1528,12 @@ }, { "name": "Gude", + "depth": 5, "iso_1_code": null, "iso_3_code": "gde", "children": [], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "132", "native_tokenizers": [], "scripts": [ @@ -1595,9 +1542,11 @@ }, { "name": "Gudu", + "depth": 5, "iso_1_code": null, "iso_3_code": "gdu", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "133", "native_tokenizers": [], @@ -1605,9 +1554,11 @@ }, { "name": "Holma", + "depth": 5, "iso_1_code": null, "iso_3_code": "hod", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "134", "native_tokenizers": [], @@ -1615,9 +1566,11 @@ }, { "name": "Jimjimen", + "depth": 5, "iso_1_code": null, "iso_3_code": "jim", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "135", "native_tokenizers": [], @@ -1625,9 +1578,11 @@ }, { "name": "Ngwaba", + "depth": 5, "iso_1_code": null, "iso_3_code": "ngw", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "136", "native_tokenizers": [], @@ -1635,9 +1590,11 @@ }, { "name": "Nzanyi", + "depth": 5, "iso_1_code": null, "iso_3_code": "nja", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "137", "native_tokenizers": [], @@ -1645,9 +1602,11 @@ }, { "name": "Sharwa", + "depth": 5, "iso_1_code": null, "iso_3_code": "swq", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "138", "native_tokenizers": [], @@ -1655,9 +1614,11 @@ }, { "name": "Tsuvan", + "depth": 5, "iso_1_code": null, "iso_3_code": "tsh", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "139", "native_tokenizers": [], @@ -1665,57 +1626,49 @@ }, { "name": "Zizilivakan", + "depth": 5, "iso_1_code": null, "iso_3_code": "ziz", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "140", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "128", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "58", "native_tokenizers": [], "scripts": [] }, { "name": "B", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "B.1", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Auyokawa", + "depth": 5, "iso_1_code": null, "iso_3_code": "auo", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "143", "native_tokenizers": [], @@ -1723,9 +1676,11 @@ }, { "name": "Jilbe", + "depth": 5, "iso_1_code": null, "iso_3_code": "jie", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "144", "native_tokenizers": [], @@ -1733,20 +1688,24 @@ }, { "name": "Buduma", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Buduma", + "depth": 6, "iso_1_code": null, "iso_3_code": "bdm", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "146", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "145", "native_tokenizers": [], @@ -1754,14 +1713,17 @@ }, { "name": "Jina", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Jina", + "depth": 6, "iso_1_code": null, "iso_3_code": "jia", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "148", "native_tokenizers": [], @@ -1769,15 +1731,18 @@ }, { "name": "Majera", + "depth": 6, "iso_1_code": null, "iso_3_code": "xmj", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "149", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "147", "native_tokenizers": [], @@ -1785,19 +1750,23 @@ }, { "name": "Kotoko Proper", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "North", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Afade", + "depth": 7, "iso_1_code": null, "iso_3_code": "aal", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "152", "native_tokenizers": [], @@ -1805,9 +1774,11 @@ }, { "name": "Mpade", + "depth": 7, "iso_1_code": null, "iso_3_code": "mpi", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "153", "native_tokenizers": [], @@ -1815,9 +1786,11 @@ }, { "name": "Maslam", + "depth": 7, "iso_1_code": null, "iso_3_code": "msv", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "154", "native_tokenizers": [], @@ -1825,15 +1798,18 @@ }, { "name": "Malgbe", + "depth": 7, "iso_1_code": null, "iso_3_code": "mxf", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "155", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "151", "native_tokenizers": [], @@ -1841,14 +1817,17 @@ }, { "name": "South", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Lagwan", + "depth": 7, "iso_1_code": null, "iso_3_code": "kot", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "157", "native_tokenizers": [], @@ -1856,27 +1835,32 @@ }, { "name": "Mser", + "depth": 7, "iso_1_code": null, "iso_3_code": "kqx", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "158", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "156", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "150", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "142", "native_tokenizers": [], @@ -1884,14 +1868,17 @@ }, { "name": "B.2", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Muskum", + "depth": 5, "iso_1_code": null, "iso_3_code": "mje", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "160", "native_tokenizers": [], @@ -1899,9 +1886,11 @@ }, { "name": "Mbara", + "depth": 5, "iso_1_code": null, "iso_3_code": "mpk", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "161", "native_tokenizers": [], @@ -1909,18 +1898,12 @@ }, { "name": "Musgu", + "depth": 5, "iso_1_code": null, "iso_3_code": "mug", "children": [], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "162", "native_tokenizers": [], "scripts": [ @@ -1928,52 +1911,33 @@ ] } ], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "159", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "141", "native_tokenizers": [], "scripts": [] }, { "name": "C", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Gidar", + "depth": 4, "iso_1_code": null, "iso_3_code": "gid", "children": [], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "164", "native_tokenizers": [], "scripts": [ @@ -1981,53 +1945,44 @@ ] } ], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "163", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "57", "native_tokenizers": [], "scripts": [] }, { "name": "East", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "A", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "A.1", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Buso", + "depth": 5, "iso_1_code": null, "iso_3_code": "bso", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "168", "native_tokenizers": [], @@ -2035,14 +1990,17 @@ }, { "name": "1", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mulgi", + "depth": 6, "iso_1_code": null, "iso_3_code": "mvh", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "170", "native_tokenizers": [], @@ -2050,9 +2008,11 @@ }, { "name": "Ndam", + "depth": 6, "iso_1_code": null, "iso_3_code": "ndm", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "171", "native_tokenizers": [], @@ -2060,9 +2020,11 @@ }, { "name": "Soumraye", + "depth": 6, "iso_1_code": null, "iso_3_code": "sor", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "172", "native_tokenizers": [], @@ -2070,18 +2032,12 @@ }, { "name": "Tumak", + "depth": 6, "iso_1_code": null, "iso_3_code": "tmc", "children": [], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "173", "native_tokenizers": [], "scripts": [ @@ -2089,29 +2045,25 @@ ] } ], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "169", "native_tokenizers": [], "scripts": [] }, { "name": "2", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Boor", + "depth": 6, "iso_1_code": null, "iso_3_code": "bvf", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "175", "native_tokenizers": [], @@ -2119,9 +2071,11 @@ }, { "name": "Gadang", + "depth": 6, "iso_1_code": null, "iso_3_code": "gdk", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "176", "native_tokenizers": [], @@ -2129,9 +2083,11 @@ }, { "name": "Miltu", + "depth": 6, "iso_1_code": null, "iso_3_code": "mlj", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "177", "native_tokenizers": [], @@ -2139,58 +2095,50 @@ }, { "name": "Sarua", + "depth": 6, "iso_1_code": null, "iso_3_code": "swy", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "178", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "174", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "167", "native_tokenizers": [], "scripts": [] }, { "name": "A.2", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "1", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kimr\u00e9", + "depth": 6, "iso_1_code": null, "iso_3_code": "kqp", "children": [], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "181", "native_tokenizers": [], "scripts": [ @@ -2199,18 +2147,12 @@ }, { "name": "Lele", + "depth": 6, "iso_1_code": null, "iso_3_code": "lln", "children": [], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "182", "native_tokenizers": [], "scripts": [ @@ -2219,38 +2161,36 @@ }, { "name": "Nancere", + "depth": 6, "iso_1_code": null, "iso_3_code": "nnc", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "183", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "180", "native_tokenizers": [], "scripts": [] }, { "name": "2", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Gabri", + "depth": 6, "iso_1_code": null, "iso_3_code": "gab", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "185", "native_tokenizers": [], @@ -2258,9 +2198,11 @@ }, { "name": "Kabalai", + "depth": 6, "iso_1_code": null, "iso_3_code": "kvf", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "186", "native_tokenizers": [], @@ -2268,53 +2210,44 @@ }, { "name": "Tobanga", + "depth": 6, "iso_1_code": null, "iso_3_code": "tng", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "187", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "184", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "179", "native_tokenizers": [], "scripts": [] }, { "name": "A.3", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kera", + "depth": 5, "iso_1_code": null, "iso_3_code": "ker", "children": [], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "189", "native_tokenizers": [], "scripts": [ @@ -2323,62 +2256,55 @@ }, { "name": "Kwang", + "depth": 5, "iso_1_code": null, "iso_3_code": "kvi", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "190", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "188", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "166", "native_tokenizers": [], "scripts": [] }, { "name": "B", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "B.1", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "1", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bidiyo", + "depth": 6, "iso_1_code": null, "iso_3_code": "bid", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "194", "native_tokenizers": [], @@ -2386,18 +2312,12 @@ }, { "name": "Dangal\u00e9at", + "depth": 6, "iso_1_code": null, "iso_3_code": "daa", "children": [], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "195", "native_tokenizers": [], "scripts": [ @@ -2406,9 +2326,11 @@ }, { "name": "Jonkor Bourmataguil", + "depth": 6, "iso_1_code": null, "iso_3_code": "jeu", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "196", "native_tokenizers": [], @@ -2416,9 +2338,11 @@ }, { "name": "Mawa", + "depth": 6, "iso_1_code": null, "iso_3_code": "mcw", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "197", "native_tokenizers": [], @@ -2426,9 +2350,11 @@ }, { "name": "Migaama", + "depth": 6, "iso_1_code": null, "iso_3_code": "mmy", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "198", "native_tokenizers": [], @@ -2436,9 +2362,11 @@ }, { "name": "Mogum", + "depth": 6, "iso_1_code": null, "iso_3_code": "mou", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "199", "native_tokenizers": [], @@ -2446,9 +2374,11 @@ }, { "name": "Mabire", + "depth": 6, "iso_1_code": null, "iso_3_code": "muj", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "200", "native_tokenizers": [], @@ -2456,38 +2386,36 @@ }, { "name": "Ubi", + "depth": 6, "iso_1_code": null, "iso_3_code": "ubi", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "201", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "193", "native_tokenizers": [], "scripts": [] }, { "name": "2", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Birgit", + "depth": 6, "iso_1_code": null, "iso_3_code": "btf", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "203", "native_tokenizers": [], @@ -2495,9 +2423,11 @@ }, { "name": "Kajakse", + "depth": 6, "iso_1_code": null, "iso_3_code": "ckq", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "204", "native_tokenizers": [], @@ -2505,9 +2435,11 @@ }, { "name": "Masmaje", + "depth": 6, "iso_1_code": null, "iso_3_code": "mes", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "205", "native_tokenizers": [], @@ -2515,9 +2447,11 @@ }, { "name": "Mubi", + "depth": 6, "iso_1_code": null, "iso_3_code": "mub", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "206", "native_tokenizers": [], @@ -2525,9 +2459,11 @@ }, { "name": "Toram", + "depth": 6, "iso_1_code": null, "iso_3_code": "trj", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "207", "native_tokenizers": [], @@ -2535,50 +2471,50 @@ }, { "name": "Zerenkel", + "depth": 6, "iso_1_code": null, "iso_3_code": "zrn", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "208", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "202", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "192", "native_tokenizers": [], "scripts": [] }, { "name": "B.2", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mukulu", + "depth": 5, "iso_1_code": null, "iso_3_code": "moz", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "210", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "209", "native_tokenizers": [], @@ -2586,14 +2522,17 @@ }, { "name": "B.3", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Barein", + "depth": 5, "iso_1_code": null, "iso_3_code": "bva", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "212", "native_tokenizers": [], @@ -2601,9 +2540,11 @@ }, { "name": "Saba", + "depth": 5, "iso_1_code": null, "iso_3_code": "saa", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "213", "native_tokenizers": [], @@ -2611,9 +2552,11 @@ }, { "name": "Sokoro", + "depth": 5, "iso_1_code": null, "iso_3_code": "sok", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "214", "native_tokenizers": [], @@ -2621,58 +2564,50 @@ }, { "name": "Tamki", + "depth": 5, "iso_1_code": null, "iso_3_code": "tax", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "215", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "211", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "191", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "165", "native_tokenizers": [], "scripts": [] }, { "name": "Masa", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Herd\u00e9", + "depth": 3, "iso_1_code": null, "iso_3_code": "hed", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "217", "native_tokenizers": [], @@ -2680,9 +2615,11 @@ }, { "name": "P\u00e9v\u00e9", + "depth": 3, "iso_1_code": null, "iso_3_code": "lme", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "218", "native_tokenizers": [], @@ -2690,18 +2627,12 @@ }, { "name": "Masana", + "depth": 3, "iso_1_code": null, "iso_3_code": "mcn", "children": [], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "219", "native_tokenizers": [], "scripts": [ @@ -2710,38 +2641,26 @@ }, { "name": "Marba", + "depth": 3, "iso_1_code": null, "iso_3_code": "mpg", "children": [], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "220", "native_tokenizers": [], "scripts": [ "Latn" - ] - }, - { - "name": "Musey", - "iso_1_code": null, - "iso_3_code": "mse", - "children": [], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + ] + }, + { + "name": "Musey", + "depth": 3, + "iso_1_code": null, + "iso_3_code": "mse", + "children": [], + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "221", "native_tokenizers": [], "scripts": [ @@ -2750,9 +2669,11 @@ }, { "name": "Ngete", + "depth": 3, "iso_1_code": null, "iso_3_code": "nnn", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "222", "native_tokenizers": [], @@ -2760,9 +2681,11 @@ }, { "name": "Mesme", + "depth": 3, "iso_1_code": null, "iso_3_code": "zim", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "223", "native_tokenizers": [], @@ -2770,48 +2693,48 @@ }, { "name": "Zumaya", + "depth": 3, "iso_1_code": null, "iso_3_code": "zuy", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "224", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "216", "native_tokenizers": [], "scripts": [] }, { "name": "West", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "A", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "A.1", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Gwandara", + "depth": 5, "iso_1_code": null, "iso_3_code": "gwn", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "228", "native_tokenizers": [], @@ -2819,18 +2742,12 @@ }, { "name": "Hausa", + "depth": 5, "iso_1_code": "ha", "iso_3_code": "hau", "children": [], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "229", "native_tokenizers": [], "scripts": [ @@ -2838,39 +2755,37 @@ ] } ], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "227", "native_tokenizers": [], "scripts": [] }, { "name": "A.2", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bole", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bole Proper", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bole", + "depth": 7, "iso_1_code": null, "iso_3_code": "bol", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "233", "native_tokenizers": [], @@ -2878,9 +2793,11 @@ }, { "name": "Bure", + "depth": 7, "iso_1_code": null, "iso_3_code": "bvh", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "234", "native_tokenizers": [], @@ -2888,9 +2805,11 @@ }, { "name": "Beele", + "depth": 7, "iso_1_code": null, "iso_3_code": "bxq", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "235", "native_tokenizers": [], @@ -2898,9 +2817,11 @@ }, { "name": "Deno", + "depth": 7, "iso_1_code": null, "iso_3_code": "dbb", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "236", "native_tokenizers": [], @@ -2908,9 +2829,11 @@ }, { "name": "Daza", + "depth": 7, "iso_1_code": null, "iso_3_code": "dzd", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "237", "native_tokenizers": [], @@ -2918,9 +2841,11 @@ }, { "name": "Geruma", + "depth": 7, "iso_1_code": null, "iso_3_code": "gea", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "238", "native_tokenizers": [], @@ -2928,9 +2853,11 @@ }, { "name": "Gera", + "depth": 7, "iso_1_code": null, "iso_3_code": "gew", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "239", "native_tokenizers": [], @@ -2938,9 +2865,11 @@ }, { "name": "Galambi", + "depth": 7, "iso_1_code": null, "iso_3_code": "glo", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "240", "native_tokenizers": [], @@ -2948,9 +2877,11 @@ }, { "name": "Giiwo", + "depth": 7, "iso_1_code": null, "iso_3_code": "kks", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "241", "native_tokenizers": [], @@ -2958,9 +2889,11 @@ }, { "name": "Kubi", + "depth": 7, "iso_1_code": null, "iso_3_code": "kof", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "242", "native_tokenizers": [], @@ -2968,9 +2901,11 @@ }, { "name": "Kholok", + "depth": 7, "iso_1_code": null, "iso_3_code": "ktc", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "243", "native_tokenizers": [], @@ -2978,9 +2913,11 @@ }, { "name": "Maaka", + "depth": 7, "iso_1_code": null, "iso_3_code": "mew", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "244", "native_tokenizers": [], @@ -2988,9 +2925,11 @@ }, { "name": "Ngamo", + "depth": 7, "iso_1_code": null, "iso_3_code": "nbh", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "245", "native_tokenizers": [], @@ -2998,15 +2937,18 @@ }, { "name": "Nyam", + "depth": 7, "iso_1_code": null, "iso_3_code": "nmi", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "246", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "232", "native_tokenizers": [], @@ -3014,26 +2956,31 @@ }, { "name": "Karekare", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Karekare", + "depth": 7, "iso_1_code": null, "iso_3_code": "kai", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "248", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "247", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "231", "native_tokenizers": [], @@ -3041,25 +2988,30 @@ }, { "name": "Tangale", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dera", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dera", + "depth": 7, "iso_1_code": null, "iso_3_code": "kna", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "251", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "250", "native_tokenizers": [], @@ -3067,14 +3019,17 @@ }, { "name": "Tangale Proper", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kutto", + "depth": 7, "iso_1_code": null, "iso_3_code": "kpa", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "253", "native_tokenizers": [], @@ -3082,9 +3037,11 @@ }, { "name": "Kwaami", + "depth": 7, "iso_1_code": null, "iso_3_code": "ksq", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "254", "native_tokenizers": [], @@ -3092,9 +3049,11 @@ }, { "name": "Kushi", + "depth": 7, "iso_1_code": null, "iso_3_code": "kuh", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "255", "native_tokenizers": [], @@ -3102,9 +3061,11 @@ }, { "name": "Pero", + "depth": 7, "iso_1_code": null, "iso_3_code": "pip", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "256", "native_tokenizers": [], @@ -3112,9 +3073,11 @@ }, { "name": "Piya-Kwonci", + "depth": 7, "iso_1_code": null, "iso_3_code": "piy", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "257", "native_tokenizers": [], @@ -3122,27 +3085,32 @@ }, { "name": "Tangale", + "depth": 7, "iso_1_code": null, "iso_3_code": "tan", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "258", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "252", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "249", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "230", "native_tokenizers": [], @@ -3150,19 +3118,23 @@ }, { "name": "A.3", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Angas Proper", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Jakattoe", + "depth": 6, "iso_1_code": null, "iso_3_code": "jrt", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "261", "native_tokenizers": [], @@ -3170,14 +3142,17 @@ }, { "name": "1", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ngas", + "depth": 7, "iso_1_code": null, "iso_3_code": "anc", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "263", "native_tokenizers": [], @@ -3185,9 +3160,11 @@ }, { "name": "Cakfem-Mushere", + "depth": 7, "iso_1_code": null, "iso_3_code": "cky", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "264", "native_tokenizers": [], @@ -3195,9 +3172,11 @@ }, { "name": "Belning", + "depth": 7, "iso_1_code": null, "iso_3_code": "glb", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "265", "native_tokenizers": [], @@ -3205,9 +3184,11 @@ }, { "name": "Kofyar", + "depth": 7, "iso_1_code": null, "iso_3_code": "kwl", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "266", "native_tokenizers": [], @@ -3215,9 +3196,11 @@ }, { "name": "Miship", + "depth": 7, "iso_1_code": null, "iso_3_code": "mjs", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "267", "native_tokenizers": [], @@ -3225,9 +3208,11 @@ }, { "name": "Nteng", + "depth": 7, "iso_1_code": null, "iso_3_code": "nqt", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "268", "native_tokenizers": [], @@ -3235,18 +3220,12 @@ }, { "name": "Mwaghavul", + "depth": 7, "iso_1_code": null, "iso_3_code": "sur", "children": [], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "269", "native_tokenizers": [], "scripts": [ @@ -3254,29 +3233,25 @@ ] } ], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "262", "native_tokenizers": [], "scripts": [] }, { "name": "2", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Goemai", + "depth": 7, "iso_1_code": null, "iso_3_code": "ank", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "271", "native_tokenizers": [], @@ -3284,9 +3259,11 @@ }, { "name": "Koenoem", + "depth": 7, "iso_1_code": null, "iso_3_code": "kcs", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "272", "native_tokenizers": [], @@ -3294,9 +3271,11 @@ }, { "name": "Tehl", + "depth": 7, "iso_1_code": null, "iso_3_code": "mtl", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "273", "native_tokenizers": [], @@ -3304,9 +3283,11 @@ }, { "name": "Piapung", + "depth": 7, "iso_1_code": null, "iso_3_code": "pcw", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "274", "native_tokenizers": [], @@ -3314,84 +3295,81 @@ }, { "name": "Tal", + "depth": 7, "iso_1_code": null, "iso_3_code": "tal", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "275", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "270", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "260", "native_tokenizers": [], "scripts": [] }, { "name": "Yiwom", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ywom", + "depth": 6, "iso_1_code": null, "iso_3_code": "gek", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "277", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "276", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "259", "native_tokenizers": [], "scripts": [] }, { "name": "A.4", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Fyer", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Fyer", + "depth": 6, "iso_1_code": null, "iso_3_code": "fie", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "280", "native_tokenizers": [], @@ -3399,15 +3377,18 @@ }, { "name": "Rom", + "depth": 6, "iso_1_code": null, "iso_3_code": "tdk", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "281", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "279", "native_tokenizers": [], @@ -3415,14 +3396,17 @@ }, { "name": "Ron Proper", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ron", + "depth": 6, "iso_1_code": null, "iso_3_code": "cla", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "283", "native_tokenizers": [], @@ -3430,9 +3414,11 @@ }, { "name": "Duhwa", + "depth": 6, "iso_1_code": null, "iso_3_code": "kbz", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "284", "native_tokenizers": [], @@ -3440,9 +3426,11 @@ }, { "name": "Kulere", + "depth": 6, "iso_1_code": null, "iso_3_code": "kul", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "285", "native_tokenizers": [], @@ -3450,9 +3438,11 @@ }, { "name": "Mindat", + "depth": 6, "iso_1_code": null, "iso_3_code": "mmf", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "286", "native_tokenizers": [], @@ -3460,55 +3450,56 @@ }, { "name": "Sya", + "depth": 6, "iso_1_code": null, "iso_3_code": "scw", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "287", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "282", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "278", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "226", "native_tokenizers": [], "scripts": [] }, { "name": "B", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "B.1", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Teshenawa", + "depth": 5, "iso_1_code": null, "iso_3_code": "twc", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "290", "native_tokenizers": [], @@ -3516,14 +3507,17 @@ }, { "name": "Bade Proper", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bade", + "depth": 6, "iso_1_code": null, "iso_3_code": "bde", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "292", "native_tokenizers": [], @@ -3531,15 +3525,18 @@ }, { "name": "Ngizim", + "depth": 6, "iso_1_code": null, "iso_3_code": "ngi", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "293", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "291", "native_tokenizers": [], @@ -3547,26 +3544,31 @@ }, { "name": "Duwai", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Duwai", + "depth": 6, "iso_1_code": null, "iso_3_code": "dbp", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "295", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "294", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "289", "native_tokenizers": [], @@ -3574,14 +3576,17 @@ }, { "name": "B.2", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ajawa", + "depth": 5, "iso_1_code": null, "iso_3_code": "ajw", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "297", "native_tokenizers": [], @@ -3589,9 +3594,11 @@ }, { "name": "Burku", + "depth": 5, "iso_1_code": null, "iso_3_code": "bbt", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "298", "native_tokenizers": [], @@ -3599,9 +3606,11 @@ }, { "name": "Dirya", + "depth": 5, "iso_1_code": null, "iso_3_code": "dwa", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "299", "native_tokenizers": [], @@ -3609,9 +3618,11 @@ }, { "name": "Zibinju", + "depth": 5, "iso_1_code": null, "iso_3_code": "jmb", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "300", "native_tokenizers": [], @@ -3619,9 +3630,11 @@ }, { "name": "Kariya", + "depth": 5, "iso_1_code": null, "iso_3_code": "kil", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "301", "native_tokenizers": [], @@ -3629,9 +3642,11 @@ }, { "name": "Vune mi", + "depth": 5, "iso_1_code": null, "iso_3_code": "mkf", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "302", "native_tokenizers": [], @@ -3639,9 +3654,11 @@ }, { "name": "Pa\u2019anci", + "depth": 5, "iso_1_code": null, "iso_3_code": "pqa", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "303", "native_tokenizers": [], @@ -3649,9 +3666,11 @@ }, { "name": "Siri", + "depth": 5, "iso_1_code": null, "iso_3_code": "sir", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "304", "native_tokenizers": [], @@ -3659,9 +3678,11 @@ }, { "name": "Choogen", + "depth": 5, "iso_1_code": null, "iso_3_code": "tgd", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "305", "native_tokenizers": [], @@ -3669,15 +3690,18 @@ }, { "name": "Warji", + "depth": 5, "iso_1_code": null, "iso_3_code": "wji", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "306", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "296", "native_tokenizers": [], @@ -3685,14 +3709,17 @@ }, { "name": "B.3", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dass", + "depth": 5, "iso_1_code": null, "iso_3_code": "dot", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "308", "native_tokenizers": [], @@ -3700,14 +3727,17 @@ }, { "name": "Boghom", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Boghom", + "depth": 6, "iso_1_code": null, "iso_3_code": "bux", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "310", "native_tokenizers": [], @@ -3715,9 +3745,11 @@ }, { "name": "Kir-Balar", + "depth": 6, "iso_1_code": null, "iso_3_code": "kkr", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "311", "native_tokenizers": [], @@ -3725,15 +3757,18 @@ }, { "name": "Mansi", + "depth": 6, "iso_1_code": null, "iso_3_code": "zns", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "312", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "309", "native_tokenizers": [], @@ -3741,20 +3776,24 @@ }, { "name": "Eastern", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Jimi", + "depth": 6, "iso_1_code": null, "iso_3_code": "jmi", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "314", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "313", "native_tokenizers": [], @@ -3762,14 +3801,17 @@ }, { "name": "Guruntum", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Guruntum-Mbaaru", + "depth": 6, "iso_1_code": null, "iso_3_code": "grd", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "316", "native_tokenizers": [], @@ -3777,9 +3819,11 @@ }, { "name": "Juu", + "depth": 6, "iso_1_code": null, "iso_3_code": "juu", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "317", "native_tokenizers": [], @@ -3787,9 +3831,11 @@ }, { "name": "Tala", + "depth": 6, "iso_1_code": null, "iso_3_code": "tak", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "318", "native_tokenizers": [], @@ -3797,15 +3843,18 @@ }, { "name": "Zamwal", + "depth": 6, "iso_1_code": null, "iso_3_code": "zah", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "319", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "315", "native_tokenizers": [], @@ -3813,14 +3862,17 @@ }, { "name": "Zaar Proper", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Cha\u2019ari", + "depth": 6, "iso_1_code": null, "iso_3_code": "cxh", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "321", "native_tokenizers": [], @@ -3828,9 +3880,11 @@ }, { "name": "Dokshi", + "depth": 6, "iso_1_code": null, "iso_3_code": "dsk", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "322", "native_tokenizers": [], @@ -3838,9 +3892,11 @@ }, { "name": "Dyarim", + "depth": 6, "iso_1_code": null, "iso_3_code": "dyr", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "323", "native_tokenizers": [], @@ -3848,9 +3904,11 @@ }, { "name": "Gyaazi", + "depth": 6, "iso_1_code": null, "iso_3_code": "gyz", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "324", "native_tokenizers": [], @@ -3858,9 +3916,11 @@ }, { "name": "Luri", + "depth": 6, "iso_1_code": null, "iso_3_code": "ldd", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "325", "native_tokenizers": [], @@ -3868,9 +3928,11 @@ }, { "name": "Dir-Nyamzak-Mbarimi", + "depth": 6, "iso_1_code": null, "iso_3_code": "nzr", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "326", "native_tokenizers": [], @@ -3878,9 +3940,11 @@ }, { "name": "Pesse", + "depth": 6, "iso_1_code": null, "iso_3_code": "pze", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "327", "native_tokenizers": [], @@ -3888,18 +3952,12 @@ }, { "name": "Saya", + "depth": 6, "iso_1_code": null, "iso_3_code": "say", "children": [], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "328", "native_tokenizers": [], "scripts": [ @@ -3908,9 +3966,11 @@ }, { "name": "Tulai", + "depth": 6, "iso_1_code": null, "iso_3_code": "tvi", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "329", "native_tokenizers": [], @@ -3918,9 +3978,11 @@ }, { "name": "Buli", + "depth": 6, "iso_1_code": null, "iso_3_code": "uly", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "330", "native_tokenizers": [], @@ -3928,9 +3990,11 @@ }, { "name": "Zari", + "depth": 6, "iso_1_code": null, "iso_3_code": "zaz", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "331", "native_tokenizers": [], @@ -3938,9 +4002,11 @@ }, { "name": "Bu", + "depth": 6, "iso_1_code": null, "iso_3_code": "zbu", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "332", "native_tokenizers": [], @@ -3948,9 +4014,11 @@ }, { "name": "Zeem", + "depth": 6, "iso_1_code": null, "iso_3_code": "zem", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "333", "native_tokenizers": [], @@ -3958,110 +4026,83 @@ }, { "name": "Zul", + "depth": 6, "iso_1_code": null, "iso_3_code": "zlu", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "334", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "320", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "307", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "288", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "225", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "56", "native_tokenizers": [], "scripts": [] }, { "name": "Cushitic", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Central", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Eastern", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Xamtanga", + "depth": 4, "iso_1_code": null, "iso_3_code": "xan", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "338", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "337", "native_tokenizers": [], @@ -4069,20 +4110,24 @@ }, { "name": "Northern", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bilen", + "depth": 4, "iso_1_code": null, "iso_3_code": "byn", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "340", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "339", "native_tokenizers": [], @@ -4090,20 +4135,24 @@ }, { "name": "Southern", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Awngi", + "depth": 4, "iso_1_code": null, "iso_3_code": "awn", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "342", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "341", "native_tokenizers": [], @@ -4111,26 +4160,31 @@ }, { "name": "Western", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Qimant", + "depth": 4, "iso_1_code": null, "iso_3_code": "ahg", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "344", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "343", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "336", "native_tokenizers": [], @@ -4138,14 +4192,17 @@ }, { "name": "East", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Boon", + "depth": 3, "iso_1_code": null, "iso_3_code": "bnl", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "346", "native_tokenizers": [], @@ -4153,14 +4210,17 @@ }, { "name": "Dullay", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ale", + "depth": 4, "iso_1_code": null, "iso_3_code": "gwd", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "348", "native_tokenizers": [], @@ -4168,15 +4228,18 @@ }, { "name": "Tsamai", + "depth": 4, "iso_1_code": null, "iso_3_code": "tsb", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "349", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "347", "native_tokenizers": [], @@ -4184,14 +4247,17 @@ }, { "name": "Highland", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Alaba-K\u2019abeena", + "depth": 4, "iso_1_code": null, "iso_3_code": "alw", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "351", "native_tokenizers": [], @@ -4199,9 +4265,11 @@ }, { "name": "Burji", + "depth": 4, "iso_1_code": null, "iso_3_code": "bji", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "352", "native_tokenizers": [], @@ -4209,9 +4277,11 @@ }, { "name": "Gedeo", + "depth": 4, "iso_1_code": null, "iso_3_code": "drs", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "353", "native_tokenizers": [], @@ -4219,9 +4289,11 @@ }, { "name": "Hadiyya", + "depth": 4, "iso_1_code": null, "iso_3_code": "hdy", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "354", "native_tokenizers": [], @@ -4229,18 +4301,12 @@ }, { "name": "Kambaata", + "depth": 4, "iso_1_code": null, "iso_3_code": "ktb", "children": [], - "tokenizers": { - "Ethi": { - "full_object": "SpaCyTokenizer(\"am\")", - "original_lang_name": "amharic", - "original_lang_code": "amh", - "script": "Ethi", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "355", "native_tokenizers": [], "scripts": [ @@ -4249,9 +4315,11 @@ }, { "name": "Libido", + "depth": 4, "iso_1_code": null, "iso_3_code": "liq", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "356", "native_tokenizers": [], @@ -4259,18 +4327,12 @@ }, { "name": "Sidamo", + "depth": 4, "iso_1_code": null, "iso_3_code": "sid", "children": [], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "357", "native_tokenizers": [], "scripts": [ @@ -4278,36 +4340,25 @@ ] } ], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - }, - "Ethi": { - "full_object": "SpaCyTokenizer(\"am\")", - "original_lang_name": "amharic", - "original_lang_code": "amh", - "script": "Ethi", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "350", "native_tokenizers": [], "scripts": [] }, { "name": "Konso-Gidole", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mositacha", + "depth": 4, "iso_1_code": null, "iso_3_code": "dox", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "359", "native_tokenizers": [], @@ -4315,9 +4366,11 @@ }, { "name": "Dirasha", + "depth": 4, "iso_1_code": null, "iso_3_code": "gdl", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "360", "native_tokenizers": [], @@ -4325,18 +4378,12 @@ }, { "name": "Konso", + "depth": 4, "iso_1_code": null, "iso_3_code": "kxc", "children": [], - "tokenizers": { - "Ethi": { - "full_object": "SpaCyTokenizer(\"am\")", - "original_lang_name": "amharic", - "original_lang_code": "amh", - "script": "Ethi", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "361", "native_tokenizers": [], "scripts": [ @@ -4344,29 +4391,25 @@ ] } ], - "tokenizers": { - "Ethi": { - "full_object": "SpaCyTokenizer(\"am\")", - "original_lang_name": "amharic", - "original_lang_code": "amh", - "script": "Ethi", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "358", "native_tokenizers": [], "scripts": [] }, { "name": "Oromo", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Oromo, Borana-Arsi-Guji", + "depth": 4, "iso_1_code": "om", "iso_3_code": "gax", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "363", "native_tokenizers": [], @@ -4374,18 +4417,12 @@ }, { "name": "Oromo, West Central", + "depth": 4, "iso_1_code": "om", "iso_3_code": "gaz", "children": [], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "364", "native_tokenizers": [], "scripts": [ @@ -4394,18 +4431,12 @@ }, { "name": "Oromo, Eastern", + "depth": 4, "iso_1_code": "om", "iso_3_code": "hae", "children": [], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "365", "native_tokenizers": [], "scripts": [ @@ -4414,9 +4445,11 @@ }, { "name": "Orma", + "depth": 4, "iso_1_code": "om", "iso_3_code": "orc", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "366", "native_tokenizers": [], @@ -4424,38 +4457,36 @@ }, { "name": "Waata", + "depth": 4, "iso_1_code": null, "iso_3_code": "ssn", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "367", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "362", "native_tokenizers": [], "scripts": [] }, { "name": "Rendille-Boni", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Aweer", + "depth": 4, "iso_1_code": null, "iso_3_code": "bob", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "369", "native_tokenizers": [], @@ -4463,18 +4494,12 @@ }, { "name": "Rendille", + "depth": 4, "iso_1_code": null, "iso_3_code": "rel", "children": [], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "370", "native_tokenizers": [], "scripts": [ @@ -4482,29 +4507,25 @@ ] } ], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "368", "native_tokenizers": [], "scripts": [] }, { "name": "Saho-Afar", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Afar", + "depth": 4, "iso_1_code": "aa", "iso_3_code": "aar", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "372", "native_tokenizers": [], @@ -4512,15 +4533,18 @@ }, { "name": "Saho", + "depth": 4, "iso_1_code": null, "iso_3_code": "ssy", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "373", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "371", "native_tokenizers": [], @@ -4528,14 +4552,17 @@ }, { "name": "Somali", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dabarre", + "depth": 4, "iso_1_code": null, "iso_3_code": "dbr", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "375", "native_tokenizers": [], @@ -4543,9 +4570,11 @@ }, { "name": "Garre", + "depth": 4, "iso_1_code": null, "iso_3_code": "gex", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "376", "native_tokenizers": [], @@ -4553,9 +4582,11 @@ }, { "name": "Girirra", + "depth": 4, "iso_1_code": null, "iso_3_code": "gii", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "377", "native_tokenizers": [], @@ -4563,9 +4594,11 @@ }, { "name": "Jiiddu", + "depth": 4, "iso_1_code": null, "iso_3_code": "jii", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "378", "native_tokenizers": [], @@ -4573,18 +4606,12 @@ }, { "name": "Somali", + "depth": 4, "iso_1_code": "so", "iso_3_code": "som", "children": [], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "379", "native_tokenizers": [], "scripts": [ @@ -4593,9 +4620,11 @@ }, { "name": "Tunni", + "depth": 4, "iso_1_code": null, "iso_3_code": "tqq", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "380", "native_tokenizers": [], @@ -4603,38 +4632,36 @@ }, { "name": "Maay", + "depth": 4, "iso_1_code": null, "iso_3_code": "ymm", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "381", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "374", "native_tokenizers": [], "scripts": [] }, { "name": "Western Omo-Tana", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Arbore", + "depth": 4, "iso_1_code": null, "iso_3_code": "arv", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "383", "native_tokenizers": [], @@ -4642,9 +4669,11 @@ }, { "name": "Baiso", + "depth": 4, "iso_1_code": null, "iso_3_code": "bsw", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "384", "native_tokenizers": [], @@ -4652,18 +4681,12 @@ }, { "name": "Daasanach", + "depth": 4, "iso_1_code": null, "iso_3_code": "dsh", "children": [], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "385", "native_tokenizers": [], "scripts": [ @@ -4672,86 +4695,75 @@ }, { "name": "El Molo", + "depth": 4, "iso_1_code": null, "iso_3_code": "elo", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "386", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "382", "native_tokenizers": [], "scripts": [] }, { "name": "Yaaku", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Yaaku", + "depth": 4, "iso_1_code": null, "iso_3_code": "muu", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "388", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "387", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - }, - "Ethi": { - "full_object": "SpaCyTokenizer(\"am\")", - "original_lang_name": "amharic", - "original_lang_code": "amh", - "script": "Ethi", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "345", "native_tokenizers": [], "scripts": [] }, { "name": "North", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bedawiyet", + "depth": 3, "iso_1_code": null, "iso_3_code": "bej", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "390", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "389", "native_tokenizers": [], @@ -4759,14 +4771,17 @@ }, { "name": "South", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Aas\u00e1x", + "depth": 3, "iso_1_code": null, "iso_3_code": "aas", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "392", "native_tokenizers": [], @@ -4774,9 +4789,11 @@ }, { "name": "Burunge", + "depth": 3, "iso_1_code": null, "iso_3_code": "bds", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "393", "native_tokenizers": [], @@ -4784,9 +4801,11 @@ }, { "name": "Dahalo", + "depth": 3, "iso_1_code": null, "iso_3_code": "dal", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "394", "native_tokenizers": [], @@ -4794,9 +4813,11 @@ }, { "name": "Gorowa", + "depth": 3, "iso_1_code": null, "iso_3_code": "gow", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "395", "native_tokenizers": [], @@ -4804,18 +4825,12 @@ }, { "name": "Iraqw", + "depth": 3, "iso_1_code": null, "iso_3_code": "irk", "children": [], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "396", "native_tokenizers": [], "scripts": [ @@ -4824,9 +4839,11 @@ }, { "name": "Alagwa", + "depth": 3, "iso_1_code": null, "iso_3_code": "wbj", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "397", "native_tokenizers": [], @@ -4834,59 +4851,43 @@ }, { "name": "Kw\u2019adza", + "depth": 3, "iso_1_code": null, "iso_3_code": "wka", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "398", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "391", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - }, - "Ethi": { - "full_object": "SpaCyTokenizer(\"am\")", - "original_lang_name": "amharic", - "original_lang_code": "amh", - "script": "Ethi", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "335", "native_tokenizers": [], "scripts": [] }, { "name": "Egyptian", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Coptic", + "depth": 2, "iso_1_code": null, "iso_3_code": "cop", "children": [], + "family": "Afro-Asiatic", "tokenizers": { "Copt": { "full_object": "StanzaTokenizer(\"cop\")", @@ -4905,6 +4906,7 @@ ] } ], + "family": "Afro-Asiatic", "tokenizers": { "Copt": { "full_object": "StanzaTokenizer(\"cop\")", @@ -4920,24 +4922,29 @@ }, { "name": "Omotic", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "North", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dizoid", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dizin", + "depth": 4, "iso_1_code": null, "iso_3_code": "mdx", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "404", "native_tokenizers": [], @@ -4945,9 +4952,11 @@ }, { "name": "Nayi", + "depth": 4, "iso_1_code": null, "iso_3_code": "noz", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "405", "native_tokenizers": [], @@ -4955,15 +4964,18 @@ }, { "name": "Sheko", + "depth": 4, "iso_1_code": null, "iso_3_code": "she", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "406", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "403", "native_tokenizers": [], @@ -4971,30 +4983,36 @@ }, { "name": "Gonga-Gimojan", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Gimojan", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Janjero", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Yemsa", + "depth": 6, "iso_1_code": null, "iso_3_code": "jnj", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "410", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "409", "native_tokenizers": [], @@ -5002,25 +5020,30 @@ }, { "name": "Ometo-Gimira", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chara", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tsaara", + "depth": 7, "iso_1_code": null, "iso_3_code": "cra", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "413", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "412", "native_tokenizers": [], @@ -5028,20 +5051,24 @@ }, { "name": "Gimira", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bench", + "depth": 7, "iso_1_code": null, "iso_3_code": "bcq", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "415", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "414", "native_tokenizers": [], @@ -5049,23 +5076,18 @@ }, { "name": "Ometo", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Male", + "depth": 7, "iso_1_code": null, "iso_3_code": "mdy", "children": [], - "tokenizers": { - "Ethi": { - "full_object": "SpaCyTokenizer(\"am\")", - "original_lang_name": "amharic", - "original_lang_code": "amh", - "script": "Ethi", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "417", "native_tokenizers": [], "scripts": [ @@ -5074,14 +5096,17 @@ }, { "name": "Central", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dorze", + "depth": 8, "iso_1_code": null, "iso_3_code": "doz", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "419", "native_tokenizers": [], @@ -5089,18 +5114,12 @@ }, { "name": "Dawro", + "depth": 8, "iso_1_code": null, "iso_3_code": "dwr", "children": [], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "420", "native_tokenizers": [], "scripts": [ @@ -5109,25 +5128,12 @@ }, { "name": "Gamo", + "depth": 8, "iso_1_code": null, "iso_3_code": "gmv", "children": [], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - }, - "Ethi": { - "full_object": "SpaCyTokenizer(\"am\")", - "original_lang_name": "amharic", - "original_lang_code": "amh", - "script": "Ethi", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "421", "native_tokenizers": [], "scripts": [ @@ -5137,25 +5143,12 @@ }, { "name": "Gofa", + "depth": 8, "iso_1_code": null, "iso_3_code": "gof", "children": [], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - }, - "Ethi": { - "full_object": "SpaCyTokenizer(\"am\")", - "original_lang_name": "amharic", - "original_lang_code": "amh", - "script": "Ethi", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "422", "native_tokenizers": [], "scripts": [ @@ -5165,9 +5158,11 @@ }, { "name": "Melo", + "depth": 8, "iso_1_code": null, "iso_3_code": "mfx", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "423", "native_tokenizers": [], @@ -5175,9 +5170,11 @@ }, { "name": "Oyda", + "depth": 8, "iso_1_code": null, "iso_3_code": "oyd", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "424", "native_tokenizers": [], @@ -5185,25 +5182,12 @@ }, { "name": "Wolaytta", + "depth": 8, "iso_1_code": null, "iso_3_code": "wal", "children": [], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - }, - "Ethi": { - "full_object": "SpaCyTokenizer(\"am\")", - "original_lang_name": "amharic", - "original_lang_code": "amh", - "script": "Ethi", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "425", "native_tokenizers": [], "scripts": [ @@ -5212,36 +5196,25 @@ ] } ], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - }, - "Ethi": { - "full_object": "SpaCyTokenizer(\"am\")", - "original_lang_name": "amharic", - "original_lang_code": "amh", - "script": "Ethi", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "418", "native_tokenizers": [], "scripts": [] }, { "name": "East", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kachama-Ganjule", + "depth": 8, "iso_1_code": null, "iso_3_code": "kcx", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "427", "native_tokenizers": [], @@ -5249,18 +5222,12 @@ }, { "name": "Koorete", + "depth": 8, "iso_1_code": null, "iso_3_code": "kqy", "children": [], - "tokenizers": { - "Ethi": { - "full_object": "SpaCyTokenizer(\"am\")", - "original_lang_name": "amharic", - "original_lang_code": "amh", - "script": "Ethi", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "428", "native_tokenizers": [], "scripts": [ @@ -5269,133 +5236,95 @@ }, { "name": "Zayse", + "depth": 8, "iso_1_code": null, "iso_3_code": "zay", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "429", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Ethi": { - "full_object": "SpaCyTokenizer(\"am\")", - "original_lang_name": "amharic", - "original_lang_code": "amh", - "script": "Ethi", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "426", "native_tokenizers": [], "scripts": [] }, { "name": "West", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Basketo", + "depth": 8, "iso_1_code": null, "iso_3_code": "bst", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "431", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "430", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - }, - "Ethi": { - "full_object": "SpaCyTokenizer(\"am\")", - "original_lang_name": "amharic", - "original_lang_code": "amh", - "script": "Ethi", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "416", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - }, - "Ethi": { - "full_object": "SpaCyTokenizer(\"am\")", - "original_lang_name": "amharic", - "original_lang_code": "amh", - "script": "Ethi", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "411", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - }, - "Ethi": { - "full_object": "SpaCyTokenizer(\"am\")", - "original_lang_name": "amharic", - "original_lang_code": "amh", - "script": "Ethi", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "408", "native_tokenizers": [], "scripts": [] }, { "name": "Gonga", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Central", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Anfillo", + "depth": 6, "iso_1_code": null, "iso_3_code": "myo", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "434", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "433", "native_tokenizers": [], @@ -5403,20 +5332,24 @@ }, { "name": "North", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Borna", + "depth": 6, "iso_1_code": null, "iso_3_code": "bwo", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "436", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "435", "native_tokenizers": [], @@ -5424,23 +5357,18 @@ }, { "name": "South", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kafa", + "depth": 6, "iso_1_code": null, "iso_3_code": "kbr", "children": [], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "438", "native_tokenizers": [], "scripts": [ @@ -5449,73 +5377,50 @@ }, { "name": "Shekkacho", + "depth": 6, "iso_1_code": null, "iso_3_code": "moy", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "439", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "437", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "432", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - }, - "Ethi": { - "full_object": "SpaCyTokenizer(\"am\")", - "original_lang_name": "amharic", - "original_lang_code": "amh", - "script": "Ethi", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "407", "native_tokenizers": [], "scripts": [] }, { "name": "Mao", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ganza", + "depth": 4, "iso_1_code": null, "iso_3_code": "gza", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "441", "native_tokenizers": [], @@ -5523,9 +5428,11 @@ }, { "name": "Hozo", + "depth": 4, "iso_1_code": null, "iso_3_code": "hoz", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "442", "native_tokenizers": [], @@ -5533,9 +5440,11 @@ }, { "name": "Mawes Aasse", + "depth": 4, "iso_1_code": null, "iso_3_code": "myf", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "443", "native_tokenizers": [], @@ -5543,51 +5452,43 @@ }, { "name": "Seze", + "depth": 4, "iso_1_code": null, "iso_3_code": "sze", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "444", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "440", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - }, - "Ethi": { - "full_object": "SpaCyTokenizer(\"am\")", - "original_lang_name": "amharic", - "original_lang_code": "amh", - "script": "Ethi", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "402", "native_tokenizers": [], "scripts": [] }, { "name": "South", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Aari", + "depth": 3, "iso_1_code": null, "iso_3_code": "aiw", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "446", "native_tokenizers": [], @@ -5595,18 +5496,12 @@ }, { "name": "Hamer-Banna", + "depth": 3, "iso_1_code": null, "iso_3_code": "amf", "children": [], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "447", "native_tokenizers": [], "scripts": [ @@ -5615,9 +5510,11 @@ }, { "name": "Dime", + "depth": 3, "iso_1_code": null, "iso_3_code": "dim", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "448", "native_tokenizers": [], @@ -5625,9 +5522,11 @@ }, { "name": "Gayil", + "depth": 3, "iso_1_code": null, "iso_3_code": "gyl", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "449", "native_tokenizers": [], @@ -5635,64 +5534,49 @@ }, { "name": "Karo", + "depth": 3, "iso_1_code": null, "iso_3_code": "kxh", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "450", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "445", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - }, - "Ethi": { - "full_object": "SpaCyTokenizer(\"am\")", - "original_lang_name": "amharic", - "original_lang_code": "amh", - "script": "Ethi", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "401", "native_tokenizers": [], "scripts": [] }, { "name": "Semitic", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Central", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Faifi", + "depth": 3, "iso_1_code": null, "iso_3_code": "fif", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "453", "native_tokenizers": [], @@ -5700,9 +5584,11 @@ }, { "name": "R\u0101zi\u1e25\u012b", + "depth": 3, "iso_1_code": null, "iso_3_code": "rzh", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "454", "native_tokenizers": [], @@ -5710,19 +5596,23 @@ }, { "name": "Aramaic", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Eastern", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Syriac", + "depth": 5, "iso_1_code": null, "iso_3_code": "syc", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "457", "native_tokenizers": [], @@ -5732,19 +5622,23 @@ }, { "name": "Central", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Northeastern", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Assyrian Neo-Aramaic", + "depth": 7, "iso_1_code": null, "iso_3_code": "aii", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "460", "native_tokenizers": [], @@ -5754,9 +5648,11 @@ }, { "name": "Bohtan Neo-Aramaic", + "depth": 7, "iso_1_code": null, "iso_3_code": "bhn", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "461", "native_tokenizers": [], @@ -5764,9 +5660,11 @@ }, { "name": "Barzani-Sandu Jewish Neo-Aramaic", + "depth": 7, "iso_1_code": null, "iso_3_code": "bjf", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "462", "native_tokenizers": [], @@ -5774,9 +5672,11 @@ }, { "name": "Chaldean Neo-Aramaic", + "depth": 7, "iso_1_code": null, "iso_3_code": "cld", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "463", "native_tokenizers": [], @@ -5784,9 +5684,11 @@ }, { "name": "H\u00e9rtevin", + "depth": 7, "iso_1_code": null, "iso_3_code": "hrt", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "464", "native_tokenizers": [], @@ -5794,9 +5696,11 @@ }, { "name": "Koy Sanjaq Surat", + "depth": 7, "iso_1_code": null, "iso_3_code": "kqd", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "465", "native_tokenizers": [], @@ -5804,9 +5708,11 @@ }, { "name": "Senaya", + "depth": 7, "iso_1_code": null, "iso_3_code": "syn", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "466", "native_tokenizers": [], @@ -5814,9 +5720,11 @@ }, { "name": "Jewish Babylonian Aramaic", + "depth": 7, "iso_1_code": null, "iso_3_code": "tmr", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "467", "native_tokenizers": [], @@ -5824,14 +5732,17 @@ }, { "name": "Trans-Zab", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Inter-Zab Jewish Neo-Aramaic", + "depth": 8, "iso_1_code": null, "iso_3_code": "aij", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "469", "native_tokenizers": [], @@ -5839,9 +5750,11 @@ }, { "name": "Hulaul\u00e1", + "depth": 8, "iso_1_code": null, "iso_3_code": "huy", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "470", "native_tokenizers": [], @@ -5849,9 +5762,11 @@ }, { "name": "Lishana Deni", + "depth": 8, "iso_1_code": null, "iso_3_code": "lsd", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "471", "native_tokenizers": [], @@ -5859,21 +5774,25 @@ }, { "name": "Lish\u00e1n Noshan", + "depth": 8, "iso_1_code": null, "iso_3_code": "trg", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "472", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "468", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "459", "native_tokenizers": [], @@ -5881,14 +5800,17 @@ }, { "name": "Northwestern", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mlahs\u00f6", + "depth": 7, "iso_1_code": null, "iso_3_code": "lhs", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "474", "native_tokenizers": [], @@ -5896,21 +5818,25 @@ }, { "name": "Turoyo", + "depth": 7, "iso_1_code": null, "iso_3_code": "tru", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "475", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "473", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "458", "native_tokenizers": [], @@ -5918,14 +5844,17 @@ }, { "name": "Mandaic", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Neo-Mandaic", + "depth": 6, "iso_1_code": null, "iso_3_code": "mid", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "477", "native_tokenizers": [], @@ -5933,21 +5862,25 @@ }, { "name": "Mandaic, Classical", + "depth": 6, "iso_1_code": null, "iso_3_code": "myz", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "478", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "476", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "456", "native_tokenizers": [], @@ -5955,14 +5888,17 @@ }, { "name": "Western", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Western Neo-Aramaic", + "depth": 5, "iso_1_code": null, "iso_3_code": "amw", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "480", "native_tokenizers": [], @@ -5970,21 +5906,25 @@ }, { "name": "Samaritan Aramaic", + "depth": 5, "iso_1_code": null, "iso_3_code": "sam", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "481", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "479", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "455", "native_tokenizers": [], @@ -5992,19 +5932,23 @@ }, { "name": "South", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Arabic", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Arabic, Algerian Saharan", + "depth": 5, "iso_1_code": "ar", "iso_3_code": "aao", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "484", "native_tokenizers": [], @@ -6012,9 +5956,11 @@ }, { "name": "Arabic, Tajiki", + "depth": 5, "iso_1_code": "ar", "iso_3_code": "abh", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "485", "native_tokenizers": [], @@ -6022,9 +5968,11 @@ }, { "name": "Arabic, Baharna", + "depth": 5, "iso_1_code": "ar", "iso_3_code": "abv", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "486", "native_tokenizers": [], @@ -6032,9 +5980,11 @@ }, { "name": "Arabic, Mesopotamian", + "depth": 5, "iso_1_code": "ar", "iso_3_code": "acm", "children": [], + "family": "Afro-Asiatic", "tokenizers": { "Arab": { "full_object": "SpaCyTokenizer(\"ar\")", @@ -6054,9 +6004,11 @@ }, { "name": "Arabic, Ta\u2019izzi-Adeni", + "depth": 5, "iso_1_code": "ar", "iso_3_code": "acq", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "488", "native_tokenizers": [], @@ -6064,9 +6016,11 @@ }, { "name": "Arabic, Hijazi", + "depth": 5, "iso_1_code": "ar", "iso_3_code": "acw", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "489", "native_tokenizers": [], @@ -6074,9 +6028,11 @@ }, { "name": "Arabic, Omani", + "depth": 5, "iso_1_code": "ar", "iso_3_code": "acx", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "490", "native_tokenizers": [], @@ -6084,9 +6040,11 @@ }, { "name": "Arabic, Cypriot", + "depth": 5, "iso_1_code": "ar", "iso_3_code": "acy", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "491", "native_tokenizers": [], @@ -6094,9 +6052,11 @@ }, { "name": "Arabic, Dhofari", + "depth": 5, "iso_1_code": "ar", "iso_3_code": "adf", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "492", "native_tokenizers": [], @@ -6104,9 +6064,11 @@ }, { "name": "Arabic, Tunisian", + "depth": 5, "iso_1_code": "ar", "iso_3_code": "aeb", "children": [], + "family": "Afro-Asiatic", "tokenizers": { "Arab": { "full_object": "SpaCyTokenizer(\"ar\")", @@ -6126,9 +6088,11 @@ }, { "name": "Arabic, Sa\u2019idi", + "depth": 5, "iso_1_code": "ar", "iso_3_code": "aec", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "494", "native_tokenizers": [], @@ -6136,9 +6100,11 @@ }, { "name": "Arabic, Gulf", + "depth": 5, "iso_1_code": "ar", "iso_3_code": "afb", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "495", "native_tokenizers": [], @@ -6146,9 +6112,11 @@ }, { "name": "Arabic, Judeo-Moroccan", + "depth": 5, "iso_1_code": null, "iso_3_code": "aju", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "496", "native_tokenizers": [], @@ -6156,9 +6124,11 @@ }, { "name": "Arabic, Levantine", + "depth": 5, "iso_1_code": "ar", "iso_3_code": "apc", "children": [], + "family": "Afro-Asiatic", "tokenizers": { "Arab": { "full_object": "SpaCyTokenizer(\"ar\")", @@ -6178,9 +6148,11 @@ }, { "name": "Arabic, Sudanese", + "depth": 5, "iso_1_code": "ar", "iso_3_code": "apd", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "498", "native_tokenizers": [], @@ -6188,9 +6160,11 @@ }, { "name": "Arabic, Standard", + "depth": 5, "iso_1_code": "ar", "iso_3_code": "arb", "children": [], + "family": "Afro-Asiatic", "tokenizers": { "Arab": { "full_object": "SpaCyTokenizer(\"ar\")", @@ -6218,9 +6192,11 @@ }, { "name": "Arabic, Algerian", + "depth": 5, "iso_1_code": "ar", "iso_3_code": "arq", "children": [], + "family": "Afro-Asiatic", "tokenizers": { "Arab": { "full_object": "SpaCyTokenizer(\"ar\")", @@ -6240,9 +6216,11 @@ }, { "name": "Arabic, Najdi", + "depth": 5, "iso_1_code": "ar", "iso_3_code": "ars", "children": [], + "family": "Afro-Asiatic", "tokenizers": { "Arab": { "full_object": "SpaCyTokenizer(\"ar\")", @@ -6262,9 +6240,11 @@ }, { "name": "Arabic, Moroccan", + "depth": 5, "iso_1_code": "ar", "iso_3_code": "ary", "children": [], + "family": "Afro-Asiatic", "tokenizers": { "Arab": { "full_object": "SpaCyTokenizer(\"ar\")", @@ -6284,9 +6264,11 @@ }, { "name": "Arabic, Egyptian", + "depth": 5, "iso_1_code": "ar", "iso_3_code": "arz", "children": [], + "family": "Afro-Asiatic", "tokenizers": { "Arab": { "full_object": "SpaCyTokenizer(\"ar\")", @@ -6306,9 +6288,11 @@ }, { "name": "Arabic, Uzbeki", + "depth": 5, "iso_1_code": "ar", "iso_3_code": "auz", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "504", "native_tokenizers": [], @@ -6316,9 +6300,11 @@ }, { "name": "Arabic, Eastern Egyptian Bedawi", + "depth": 5, "iso_1_code": "ar", "iso_3_code": "avl", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "505", "native_tokenizers": [], @@ -6326,9 +6312,11 @@ }, { "name": "Arabic, Hadrami", + "depth": 5, "iso_1_code": "ar", "iso_3_code": "ayh", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "506", "native_tokenizers": [], @@ -6336,9 +6324,11 @@ }, { "name": "Arabic, Libyan", + "depth": 5, "iso_1_code": "ar", "iso_3_code": "ayl", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "507", "native_tokenizers": [], @@ -6346,9 +6336,11 @@ }, { "name": "Arabic, Sanaani", + "depth": 5, "iso_1_code": "ar", "iso_3_code": "ayn", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "508", "native_tokenizers": [], @@ -6356,9 +6348,11 @@ }, { "name": "Arabic, North Mesopotamian", + "depth": 5, "iso_1_code": "ar", "iso_3_code": "ayp", "children": [], + "family": "Afro-Asiatic", "tokenizers": { "Arab": { "full_object": "SpaCyTokenizer(\"ar\")", @@ -6378,9 +6372,11 @@ }, { "name": "Arabic, Judeo-Yemeni", + "depth": 5, "iso_1_code": null, "iso_3_code": "jye", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "510", "native_tokenizers": [], @@ -6388,9 +6384,11 @@ }, { "name": "Hassaniyya", + "depth": 5, "iso_1_code": null, "iso_3_code": "mey", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "511", "native_tokenizers": [], @@ -6398,9 +6396,11 @@ }, { "name": "Maltese", + "depth": 5, "iso_1_code": "mt", "iso_3_code": "mlt", "children": [], + "family": "Afro-Asiatic", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"mt\")", @@ -6420,9 +6420,11 @@ }, { "name": "Arabic, Chadian", + "depth": 5, "iso_1_code": "ar", "iso_3_code": "shu", "children": [], + "family": "Afro-Asiatic", "tokenizers": { "Arab": { "full_object": "SpaCyTokenizer(\"ar\")", @@ -6442,9 +6444,11 @@ }, { "name": "Arabic, Shihhi", + "depth": 5, "iso_1_code": "ar", "iso_3_code": "ssh", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "514", "native_tokenizers": [], @@ -6452,9 +6456,11 @@ }, { "name": "Arabic, Judeo-Iraqi", + "depth": 5, "iso_1_code": null, "iso_3_code": "yhd", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "515", "native_tokenizers": [], @@ -6462,15 +6468,18 @@ }, { "name": "Arabic, Judeo-Tripolitanian", + "depth": 5, "iso_1_code": null, "iso_3_code": "yud", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "516", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": { "Arab": { "full_object": "SpaCyTokenizer(\"ar\")", @@ -6493,14 +6502,17 @@ }, { "name": "Canaanite", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Hebrew, Ancient", + "depth": 5, "iso_1_code": null, "iso_3_code": "hbo", "children": [], + "family": "Afro-Asiatic", "tokenizers": { "Hebr": { "full_object": "StanzaTokenizer(\"hbo\")", @@ -6520,9 +6532,11 @@ }, { "name": "Hebrew", + "depth": 5, "iso_1_code": "he", "iso_3_code": "heb", "children": [], + "family": "Afro-Asiatic", "tokenizers": { "Hebr": { "full_object": "SpaCyTokenizer(\"he\")", @@ -6542,15 +6556,18 @@ }, { "name": "Samaritan Hebrew", + "depth": 5, "iso_1_code": null, "iso_3_code": "smp", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "520", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": { "Hebr": { "full_object": "SpaCyTokenizer(\"he\")", @@ -6565,6 +6582,7 @@ "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": { "Arab": { "full_object": "SpaCyTokenizer(\"ar\")", @@ -6593,6 +6611,7 @@ "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": { "Arab": { "full_object": "SpaCyTokenizer(\"ar\")", @@ -6622,24 +6641,29 @@ }, { "name": "South", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ethiopian", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "North", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dahalik", + "depth": 5, "iso_1_code": null, "iso_3_code": "dlk", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "524", "native_tokenizers": [], @@ -6647,9 +6671,11 @@ }, { "name": "Geez", + "depth": 5, "iso_1_code": null, "iso_3_code": "gez", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "525", "native_tokenizers": [], @@ -6657,9 +6683,11 @@ }, { "name": "Tigr\u00e9", + "depth": 5, "iso_1_code": null, "iso_3_code": "tig", "children": [], + "family": "Afro-Asiatic", "tokenizers": { "Ethi": { "full_object": "SpaCyTokenizer(\"ti\")", @@ -6677,9 +6705,11 @@ }, { "name": "Tigrigna", + "depth": 5, "iso_1_code": "ti", "iso_3_code": "tir", "children": [], + "family": "Afro-Asiatic", "tokenizers": { "Ethi": { "full_object": "SpaCyTokenizer(\"ti\")", @@ -6698,6 +6728,7 @@ ] } ], + "family": "Afro-Asiatic", "tokenizers": { "Ethi": { "full_object": "SpaCyTokenizer(\"ti\")", @@ -6713,24 +6744,29 @@ }, { "name": "South", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Outer", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "n-Group", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Gafat", + "depth": 7, "iso_1_code": null, "iso_3_code": "gft", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "531", "native_tokenizers": [], @@ -6738,15 +6774,18 @@ }, { "name": "Kistane", + "depth": 7, "iso_1_code": null, "iso_3_code": "gru", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "532", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "530", "native_tokenizers": [], @@ -6754,14 +6793,17 @@ }, { "name": "tt-Group", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Inor", + "depth": 7, "iso_1_code": null, "iso_3_code": "ior", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "534", "native_tokenizers": [], @@ -6769,9 +6811,11 @@ }, { "name": "Mesqan", + "depth": 7, "iso_1_code": null, "iso_3_code": "mvz", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "535", "native_tokenizers": [], @@ -6779,9 +6823,11 @@ }, { "name": "Mesmes", + "depth": 7, "iso_1_code": null, "iso_3_code": "mys", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "536", "native_tokenizers": [], @@ -6789,9 +6835,11 @@ }, { "name": "Sebat Bet Gurage", + "depth": 7, "iso_1_code": null, "iso_3_code": "sgw", "children": [], + "family": "Afro-Asiatic", "tokenizers": { "Ethi": { "full_object": "SpaCyTokenizer(\"am\")", @@ -6808,6 +6856,7 @@ ] } ], + "family": "Afro-Asiatic", "tokenizers": { "Ethi": { "full_object": "SpaCyTokenizer(\"am\")", @@ -6822,6 +6871,7 @@ "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": { "Ethi": { "full_object": "SpaCyTokenizer(\"am\")", @@ -6837,19 +6887,23 @@ }, { "name": "Transversal", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Amharic-Argobba", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Argobba", + "depth": 7, "iso_1_code": null, "iso_3_code": "agj", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "540", "native_tokenizers": [], @@ -6857,9 +6911,11 @@ }, { "name": "Amharic", + "depth": 7, "iso_1_code": "am", "iso_3_code": "amh", "children": [], + "family": "Afro-Asiatic", "tokenizers": { "Ethi": { "full_object": "SpaCyTokenizer(\"am\")", @@ -6878,6 +6934,7 @@ ] } ], + "family": "Afro-Asiatic", "tokenizers": { "Ethi": { "full_object": "SpaCyTokenizer(\"am\")", @@ -6893,14 +6950,17 @@ }, { "name": "Harari-East Gurage", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Harari", + "depth": 7, "iso_1_code": null, "iso_3_code": "har", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "543", "native_tokenizers": [], @@ -6908,9 +6968,11 @@ }, { "name": "Silt\u2019e", + "depth": 7, "iso_1_code": null, "iso_3_code": "stv", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "544", "native_tokenizers": [], @@ -6918,9 +6980,11 @@ }, { "name": "Wolane", + "depth": 7, "iso_1_code": null, "iso_3_code": "wle", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "545", "native_tokenizers": [], @@ -6928,21 +6992,25 @@ }, { "name": "Zay", + "depth": 7, "iso_1_code": null, "iso_3_code": "zwa", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "546", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "542", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": { "Ethi": { "full_object": "SpaCyTokenizer(\"am\")", @@ -6957,6 +7025,7 @@ "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": { "Ethi": { "full_object": "SpaCyTokenizer(\"am\")", @@ -6971,6 +7040,7 @@ "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": { "Ethi": { "full_object": "SpaCyTokenizer(\"am\")", @@ -6986,14 +7056,17 @@ }, { "name": "South Arabian", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bathari", + "depth": 4, "iso_1_code": null, "iso_3_code": "bhm", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "548", "native_tokenizers": [], @@ -7001,9 +7074,11 @@ }, { "name": "Mehri", + "depth": 4, "iso_1_code": null, "iso_3_code": "gdq", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "549", "native_tokenizers": [], @@ -7011,9 +7086,11 @@ }, { "name": "Hoby\u00f3t", + "depth": 4, "iso_1_code": null, "iso_3_code": "hoh", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "550", "native_tokenizers": [], @@ -7021,9 +7098,11 @@ }, { "name": "Harsusi", + "depth": 4, "iso_1_code": null, "iso_3_code": "hss", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "551", "native_tokenizers": [], @@ -7031,9 +7110,11 @@ }, { "name": "Shehri", + "depth": 4, "iso_1_code": null, "iso_3_code": "shv", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "552", "native_tokenizers": [], @@ -7041,21 +7122,25 @@ }, { "name": "Soqotri", + "depth": 4, "iso_1_code": null, "iso_3_code": "sqt", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "553", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "547", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": { "Ethi": { "full_object": "SpaCyTokenizer(\"am\")", @@ -7070,6 +7155,7 @@ "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": { "Arab": { "full_object": "SpaCyTokenizer(\"ar\")", @@ -7106,63 +7192,32 @@ }, { "name": "Unclassified", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ongota", + "depth": 2, "iso_1_code": null, "iso_3_code": "bxe", "children": [], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "555", "native_tokenizers": [], "scripts": [] } ], + "family": "Afro-Asiatic", "tokenizers": {}, "node_i": "554", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Copt": { - "full_object": "StanzaTokenizer(\"cop\")", - "original_lang_name": "coptic", - "original_lang_code": "cop", - "script": "Copt", - "class_name": "StanzaTokenizer" - }, - "Arab": { - "full_object": "SpaCyTokenizer(\"ar\")", - "original_lang_name": "arabic", - "original_lang_code": "ara", - "script": "Arab", - "class_name": "SpaCyTokenizer" - }, - "Latn": { - "full_object": "StanzaTokenizer(\"mt\")", - "original_lang_name": "maltese", - "original_lang_code": "mlt", - "script": "Latn", - "class_name": "StanzaTokenizer" - }, - "Hebr": { - "full_object": "SpaCyTokenizer(\"he\")", - "original_lang_name": "hebrew", - "original_lang_code": "heb", - "script": "Hebr", - "class_name": "SpaCyTokenizer" - }, - "Ethi": { - "full_object": "SpaCyTokenizer(\"am\")", - "original_lang_name": "amharic", - "original_lang_code": "amh", - "script": "Ethi", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Afro-Asiatic", + "tokenizers": {}, "node_i": "9", "native_tokenizers": [], "scripts": [] diff --git a/data/Algic.json b/data/Algic.json index d50bab1c7ae72539ea64cb34d17c4ec8da0098e0..c2636295f810442d5e0f3138618b6ff0ce1e3248 100644 --- a/data/Algic.json +++ b/data/Algic.json @@ -1,18 +1,22 @@ { "name": "Algic", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Algonquian", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Blackfoot", + "depth": 2, "iso_1_code": null, "iso_3_code": "bla", "children": [], + "family": "Algic", "tokenizers": {}, "node_i": "558", "native_tokenizers": [], @@ -22,9 +26,11 @@ }, { "name": "Cheyenne", + "depth": 2, "iso_1_code": null, "iso_3_code": "chy", "children": [], + "family": "Algic", "tokenizers": {}, "node_i": "559", "native_tokenizers": [], @@ -32,9 +38,11 @@ }, { "name": "Menominee", + "depth": 2, "iso_1_code": null, "iso_3_code": "mez", "children": [], + "family": "Algic", "tokenizers": {}, "node_i": "560", "native_tokenizers": [], @@ -42,9 +50,11 @@ }, { "name": "Miami", + "depth": 2, "iso_1_code": null, "iso_3_code": "mia", "children": [], + "family": "Algic", "tokenizers": {}, "node_i": "561", "native_tokenizers": [], @@ -52,9 +62,11 @@ }, { "name": "Nawathinehena", + "depth": 2, "iso_1_code": null, "iso_3_code": "nwa", "children": [], + "family": "Algic", "tokenizers": {}, "node_i": "562", "native_tokenizers": [], @@ -62,9 +74,11 @@ }, { "name": "Shawnee", + "depth": 2, "iso_1_code": null, "iso_3_code": "sjw", "children": [], + "family": "Algic", "tokenizers": {}, "node_i": "563", "native_tokenizers": [], @@ -72,14 +86,17 @@ }, { "name": "Arapaho", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Arapaho", + "depth": 3, "iso_1_code": null, "iso_3_code": "arp", "children": [], + "family": "Algic", "tokenizers": {}, "node_i": "565", "native_tokenizers": [], @@ -89,15 +106,18 @@ }, { "name": "Gros Ventre", + "depth": 3, "iso_1_code": null, "iso_3_code": "ats", "children": [], + "family": "Algic", "tokenizers": {}, "node_i": "566", "native_tokenizers": [], "scripts": [] } ], + "family": "Algic", "tokenizers": {}, "node_i": "564", "native_tokenizers": [], @@ -105,14 +125,17 @@ }, { "name": "Cree-Montagnais", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Atikamekw", + "depth": 3, "iso_1_code": null, "iso_3_code": "atj", "children": [], + "family": "Algic", "tokenizers": {}, "node_i": "568", "native_tokenizers": [], @@ -122,9 +145,11 @@ }, { "name": "Cree, Southern East", + "depth": 3, "iso_1_code": "cr", "iso_3_code": "crj", "children": [], + "family": "Algic", "tokenizers": {}, "node_i": "569", "native_tokenizers": [], @@ -134,9 +159,11 @@ }, { "name": "Cree, Plains", + "depth": 3, "iso_1_code": "cr", "iso_3_code": "crk", "children": [], + "family": "Algic", "tokenizers": {}, "node_i": "570", "native_tokenizers": [], @@ -147,9 +174,11 @@ }, { "name": "Cree, Northern East", + "depth": 3, "iso_1_code": "cr", "iso_3_code": "crl", "children": [], + "family": "Algic", "tokenizers": {}, "node_i": "571", "native_tokenizers": [], @@ -159,9 +188,11 @@ }, { "name": "Cree, Moose", + "depth": 3, "iso_1_code": "cr", "iso_3_code": "crm", "children": [], + "family": "Algic", "tokenizers": {}, "node_i": "572", "native_tokenizers": [], @@ -171,9 +202,11 @@ }, { "name": "Cree, Swampy", + "depth": 3, "iso_1_code": "cr", "iso_3_code": "csw", "children": [], + "family": "Algic", "tokenizers": {}, "node_i": "573", "native_tokenizers": [], @@ -183,9 +216,11 @@ }, { "name": "Cree, Woods", + "depth": 3, "iso_1_code": "cr", "iso_3_code": "cwd", "children": [], + "family": "Algic", "tokenizers": {}, "node_i": "574", "native_tokenizers": [], @@ -195,9 +230,11 @@ }, { "name": "Innu", + "depth": 3, "iso_1_code": null, "iso_3_code": "moe", "children": [], + "family": "Algic", "tokenizers": {}, "node_i": "575", "native_tokenizers": [], @@ -205,15 +242,18 @@ }, { "name": "Naskapi", + "depth": 3, "iso_1_code": null, "iso_3_code": "nsk", "children": [], + "family": "Algic", "tokenizers": {}, "node_i": "576", "native_tokenizers": [], "scripts": [] } ], + "family": "Algic", "tokenizers": {}, "node_i": "567", "native_tokenizers": [], @@ -221,14 +261,17 @@ }, { "name": "Eastern Algonquian", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Carolina Algonquian", + "depth": 3, "iso_1_code": null, "iso_3_code": "crr", "children": [], + "family": "Algic", "tokenizers": {}, "node_i": "578", "native_tokenizers": [], @@ -236,9 +279,11 @@ }, { "name": "Etchemin", + "depth": 3, "iso_1_code": null, "iso_3_code": "etc", "children": [], + "family": "Algic", "tokenizers": {}, "node_i": "579", "native_tokenizers": [], @@ -246,9 +291,11 @@ }, { "name": "Mi\u2019kmaq", + "depth": 3, "iso_1_code": null, "iso_3_code": "mic", "children": [], + "family": "Algic", "tokenizers": {}, "node_i": "580", "native_tokenizers": [], @@ -258,9 +305,11 @@ }, { "name": "Powhatan", + "depth": 3, "iso_1_code": null, "iso_3_code": "pim", "children": [], + "family": "Algic", "tokenizers": {}, "node_i": "581", "native_tokenizers": [], @@ -268,9 +317,11 @@ }, { "name": "Malecite-Passamaquoddy", + "depth": 3, "iso_1_code": null, "iso_3_code": "pqm", "children": [], + "family": "Algic", "tokenizers": {}, "node_i": "582", "native_tokenizers": [], @@ -278,9 +329,11 @@ }, { "name": "Quiripi", + "depth": 3, "iso_1_code": null, "iso_3_code": "qyp", "children": [], + "family": "Algic", "tokenizers": {}, "node_i": "583", "native_tokenizers": [], @@ -288,9 +341,11 @@ }, { "name": "Wampanoag", + "depth": 3, "iso_1_code": null, "iso_3_code": "wam", "children": [], + "family": "Algic", "tokenizers": {}, "node_i": "584", "native_tokenizers": [], @@ -298,9 +353,11 @@ }, { "name": "Loup B", + "depth": 3, "iso_1_code": null, "iso_3_code": "xlb", "children": [], + "family": "Algic", "tokenizers": {}, "node_i": "585", "native_tokenizers": [], @@ -308,9 +365,11 @@ }, { "name": "Loup A", + "depth": 3, "iso_1_code": null, "iso_3_code": "xlo", "children": [], + "family": "Algic", "tokenizers": {}, "node_i": "586", "native_tokenizers": [], @@ -318,9 +377,11 @@ }, { "name": "Narragansett", + "depth": 3, "iso_1_code": null, "iso_3_code": "xnt", "children": [], + "family": "Algic", "tokenizers": {}, "node_i": "587", "native_tokenizers": [], @@ -328,9 +389,11 @@ }, { "name": "Mohegan-Pequot", + "depth": 3, "iso_1_code": null, "iso_3_code": "xpq", "children": [], + "family": "Algic", "tokenizers": {}, "node_i": "588", "native_tokenizers": [], @@ -338,14 +401,17 @@ }, { "name": "Abenaki", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Abenaki, Eastern", + "depth": 4, "iso_1_code": null, "iso_3_code": "aaq", "children": [], + "family": "Algic", "tokenizers": {}, "node_i": "590", "native_tokenizers": [], @@ -353,15 +419,18 @@ }, { "name": "Abenaki, Western", + "depth": 4, "iso_1_code": null, "iso_3_code": "abe", "children": [], + "family": "Algic", "tokenizers": {}, "node_i": "591", "native_tokenizers": [], "scripts": [] } ], + "family": "Algic", "tokenizers": {}, "node_i": "589", "native_tokenizers": [], @@ -369,14 +438,17 @@ }, { "name": "Delaware", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mahican", + "depth": 4, "iso_1_code": null, "iso_3_code": "mjy", "children": [], + "family": "Algic", "tokenizers": {}, "node_i": "593", "native_tokenizers": [], @@ -384,9 +456,11 @@ }, { "name": "Munsee", + "depth": 4, "iso_1_code": null, "iso_3_code": "umu", "children": [], + "family": "Algic", "tokenizers": {}, "node_i": "594", "native_tokenizers": [], @@ -394,15 +468,18 @@ }, { "name": "Unami", + "depth": 4, "iso_1_code": null, "iso_3_code": "unm", "children": [], + "family": "Algic", "tokenizers": {}, "node_i": "595", "native_tokenizers": [], "scripts": [] } ], + "family": "Algic", "tokenizers": {}, "node_i": "592", "native_tokenizers": [], @@ -410,14 +487,17 @@ }, { "name": "Nanticoke-Conoy", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nanticoke", + "depth": 4, "iso_1_code": null, "iso_3_code": "nnt", "children": [], + "family": "Algic", "tokenizers": {}, "node_i": "597", "native_tokenizers": [], @@ -425,21 +505,25 @@ }, { "name": "Piscataway", + "depth": 4, "iso_1_code": null, "iso_3_code": "psy", "children": [], + "family": "Algic", "tokenizers": {}, "node_i": "598", "native_tokenizers": [], "scripts": [] } ], + "family": "Algic", "tokenizers": {}, "node_i": "596", "native_tokenizers": [], "scripts": [] } ], + "family": "Algic", "tokenizers": {}, "node_i": "577", "native_tokenizers": [], @@ -447,14 +531,17 @@ }, { "name": "Fox", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kickapoo", + "depth": 3, "iso_1_code": null, "iso_3_code": "kic", "children": [], + "family": "Algic", "tokenizers": {}, "node_i": "600", "native_tokenizers": [], @@ -462,15 +549,18 @@ }, { "name": "Meskwaki", + "depth": 3, "iso_1_code": null, "iso_3_code": "sac", "children": [], + "family": "Algic", "tokenizers": {}, "node_i": "601", "native_tokenizers": [], "scripts": [] } ], + "family": "Algic", "tokenizers": {}, "node_i": "599", "native_tokenizers": [], @@ -478,14 +568,17 @@ }, { "name": "Ojibwa-Potawatomi", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Algonquin", + "depth": 3, "iso_1_code": null, "iso_3_code": "alq", "children": [], + "family": "Algic", "tokenizers": {}, "node_i": "603", "native_tokenizers": [], @@ -495,9 +588,11 @@ }, { "name": "Chippewa", + "depth": 3, "iso_1_code": "oj", "iso_3_code": "ciw", "children": [], + "family": "Algic", "tokenizers": {}, "node_i": "604", "native_tokenizers": [], @@ -505,9 +600,11 @@ }, { "name": "Ojibwa, Northwestern", + "depth": 3, "iso_1_code": "oj", "iso_3_code": "ojb", "children": [], + "family": "Algic", "tokenizers": {}, "node_i": "605", "native_tokenizers": [], @@ -518,9 +615,11 @@ }, { "name": "Ojibwa, Central", + "depth": 3, "iso_1_code": "oj", "iso_3_code": "ojc", "children": [], + "family": "Algic", "tokenizers": {}, "node_i": "606", "native_tokenizers": [], @@ -528,9 +627,11 @@ }, { "name": "Ojibwa, Eastern", + "depth": 3, "iso_1_code": "oj", "iso_3_code": "ojg", "children": [], + "family": "Algic", "tokenizers": {}, "node_i": "607", "native_tokenizers": [], @@ -538,9 +639,11 @@ }, { "name": "Oji-Cree", + "depth": 3, "iso_1_code": "oj", "iso_3_code": "ojs", "children": [], + "family": "Algic", "tokenizers": {}, "node_i": "608", "native_tokenizers": [], @@ -548,9 +651,11 @@ }, { "name": "Ojibwa, Western", + "depth": 3, "iso_1_code": "oj", "iso_3_code": "ojw", "children": [], + "family": "Algic", "tokenizers": {}, "node_i": "609", "native_tokenizers": [], @@ -558,9 +663,11 @@ }, { "name": "Ottawa", + "depth": 3, "iso_1_code": "oj", "iso_3_code": "otw", "children": [], + "family": "Algic", "tokenizers": {}, "node_i": "610", "native_tokenizers": [], @@ -570,9 +677,11 @@ }, { "name": "Potawatomi", + "depth": 3, "iso_1_code": null, "iso_3_code": "pot", "children": [], + "family": "Algic", "tokenizers": {}, "node_i": "611", "native_tokenizers": [], @@ -581,12 +690,14 @@ ] } ], + "family": "Algic", "tokenizers": {}, "node_i": "602", "native_tokenizers": [], "scripts": [] } ], + "family": "Algic", "tokenizers": {}, "node_i": "557", "native_tokenizers": [], @@ -594,14 +705,17 @@ }, { "name": "Ritwan", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Wiyot", + "depth": 2, "iso_1_code": null, "iso_3_code": "wiy", "children": [], + "family": "Algic", "tokenizers": {}, "node_i": "613", "native_tokenizers": [], @@ -609,21 +723,25 @@ }, { "name": "Yurok", + "depth": 2, "iso_1_code": null, "iso_3_code": "yur", "children": [], + "family": "Algic", "tokenizers": {}, "node_i": "614", "native_tokenizers": [], "scripts": [] } ], + "family": "Algic", "tokenizers": {}, "node_i": "612", "native_tokenizers": [], "scripts": [] } ], + "family": "Algic", "tokenizers": {}, "node_i": "556", "native_tokenizers": [], diff --git a/data/Amto-Musan.json b/data/Amto-Musan.json index 4b4642a906e7ae8605121a52c0c9bb72582443d7..148d13812d295a4ab0234a8c0cd0f9576c5554f5 100644 --- a/data/Amto-Musan.json +++ b/data/Amto-Musan.json @@ -1,13 +1,16 @@ { "name": "Amto-Musan", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Amto", + "depth": 1, "iso_1_code": null, "iso_3_code": "amt", "children": [], + "family": "Amto-Musan", "tokenizers": {}, "node_i": "616", "native_tokenizers": [], @@ -15,15 +18,18 @@ }, { "name": "Siawi", + "depth": 1, "iso_1_code": null, "iso_3_code": "mmp", "children": [], + "family": "Amto-Musan", "tokenizers": {}, "node_i": "617", "native_tokenizers": [], "scripts": [] } ], + "family": "Amto-Musan", "tokenizers": {}, "node_i": "615", "native_tokenizers": [], diff --git a/data/Andamanese.json b/data/Andamanese.json index 71dfdf3055dcfe2e23bb159745e5f4b99bbd50ba..270a3178e4978b49dfbc2785f582736fe7ed90da 100644 --- a/data/Andamanese.json +++ b/data/Andamanese.json @@ -1,18 +1,22 @@ { "name": "Andamanese", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Great Andamanese", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Great Andamanese, Mixed", + "depth": 2, "iso_1_code": null, "iso_3_code": "gac", "children": [], + "family": "Andamanese", "tokenizers": {}, "node_i": "620", "native_tokenizers": [], @@ -20,14 +24,17 @@ }, { "name": "Central", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Aka-Bea", + "depth": 3, "iso_1_code": null, "iso_3_code": "abj", "children": [], + "family": "Andamanese", "tokenizers": {}, "node_i": "622", "native_tokenizers": [], @@ -35,9 +42,11 @@ }, { "name": "Akar-Bale", + "depth": 3, "iso_1_code": null, "iso_3_code": "acl", "children": [], + "family": "Andamanese", "tokenizers": {}, "node_i": "623", "native_tokenizers": [], @@ -45,9 +54,11 @@ }, { "name": "Aka-Kede", + "depth": 3, "iso_1_code": null, "iso_3_code": "akx", "children": [], + "family": "Andamanese", "tokenizers": {}, "node_i": "624", "native_tokenizers": [], @@ -55,9 +66,11 @@ }, { "name": "Aka-Kol", + "depth": 3, "iso_1_code": null, "iso_3_code": "aky", "children": [], + "family": "Andamanese", "tokenizers": {}, "node_i": "625", "native_tokenizers": [], @@ -65,9 +78,11 @@ }, { "name": "A-Pucikwar", + "depth": 3, "iso_1_code": null, "iso_3_code": "apq", "children": [], + "family": "Andamanese", "tokenizers": {}, "node_i": "626", "native_tokenizers": [], @@ -75,15 +90,18 @@ }, { "name": "Oko-Juwoi", + "depth": 3, "iso_1_code": null, "iso_3_code": "okj", "children": [], + "family": "Andamanese", "tokenizers": {}, "node_i": "627", "native_tokenizers": [], "scripts": [] } ], + "family": "Andamanese", "tokenizers": {}, "node_i": "621", "native_tokenizers": [], @@ -91,14 +109,17 @@ }, { "name": "Northern", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Aka-Cari", + "depth": 3, "iso_1_code": null, "iso_3_code": "aci", "children": [], + "family": "Andamanese", "tokenizers": {}, "node_i": "629", "native_tokenizers": [], @@ -106,9 +127,11 @@ }, { "name": "Aka-Kora", + "depth": 3, "iso_1_code": null, "iso_3_code": "ack", "children": [], + "family": "Andamanese", "tokenizers": {}, "node_i": "630", "native_tokenizers": [], @@ -116,9 +139,11 @@ }, { "name": "Aka-Jeru", + "depth": 3, "iso_1_code": null, "iso_3_code": "akj", "children": [], + "family": "Andamanese", "tokenizers": {}, "node_i": "631", "native_tokenizers": [], @@ -126,21 +151,25 @@ }, { "name": "Aka-Bo", + "depth": 3, "iso_1_code": null, "iso_3_code": "akm", "children": [], + "family": "Andamanese", "tokenizers": {}, "node_i": "632", "native_tokenizers": [], "scripts": [] } ], + "family": "Andamanese", "tokenizers": {}, "node_i": "628", "native_tokenizers": [], "scripts": [] } ], + "family": "Andamanese", "tokenizers": {}, "node_i": "619", "native_tokenizers": [], @@ -148,14 +177,17 @@ }, { "name": "South Andamanese", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Jarawa", + "depth": 2, "iso_1_code": null, "iso_3_code": "anq", "children": [], + "family": "Andamanese", "tokenizers": {}, "node_i": "634", "native_tokenizers": [], @@ -163,9 +195,11 @@ }, { "name": "\u00d6\u00f1ge", + "depth": 2, "iso_1_code": null, "iso_3_code": "oon", "children": [], + "family": "Andamanese", "tokenizers": {}, "node_i": "635", "native_tokenizers": [], @@ -173,21 +207,25 @@ }, { "name": "Sentinel", + "depth": 2, "iso_1_code": null, "iso_3_code": "std", "children": [], + "family": "Andamanese", "tokenizers": {}, "node_i": "636", "native_tokenizers": [], "scripts": [] } ], + "family": "Andamanese", "tokenizers": {}, "node_i": "633", "native_tokenizers": [], "scripts": [] } ], + "family": "Andamanese", "tokenizers": {}, "node_i": "618", "native_tokenizers": [], diff --git a/data/Arafundi.json b/data/Arafundi.json index d9346dfe62024b7e51cb32a8c0d8a9fe00279f0d..51d314397bef31752ccbeb1787c3632cb6985446 100644 --- a/data/Arafundi.json +++ b/data/Arafundi.json @@ -1,13 +1,16 @@ { "name": "Arafundi", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Andai", + "depth": 1, "iso_1_code": null, "iso_3_code": "afd", "children": [], + "family": "Arafundi", "tokenizers": {}, "node_i": "638", "native_tokenizers": [], @@ -15,9 +18,11 @@ }, { "name": "Nanubae", + "depth": 1, "iso_1_code": null, "iso_3_code": "afk", "children": [], + "family": "Arafundi", "tokenizers": {}, "node_i": "639", "native_tokenizers": [], @@ -25,15 +30,18 @@ }, { "name": "Tapei", + "depth": 1, "iso_1_code": null, "iso_3_code": "afp", "children": [], + "family": "Arafundi", "tokenizers": {}, "node_i": "640", "native_tokenizers": [], "scripts": [] } ], + "family": "Arafundi", "tokenizers": {}, "node_i": "637", "native_tokenizers": [], diff --git a/data/Arai (Left May).json b/data/Arai (Left May).json index ae8423a138bf040a9e2ed969f8fa93b366a27f2d..2b1f1f7fe5573a3925edb6a7b76badbb12b03f5c 100644 --- a/data/Arai (Left May).json +++ b/data/Arai (Left May).json @@ -1,13 +1,16 @@ { "name": "Arai (Left May)", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Sawiyanu", + "depth": 1, "iso_1_code": null, "iso_3_code": "amm", "children": [], + "family": "Arai (Left May)", "tokenizers": {}, "node_i": "642", "native_tokenizers": [], @@ -17,9 +20,11 @@ }, { "name": "Bo", + "depth": 1, "iso_1_code": null, "iso_3_code": "bpw", "children": [], + "family": "Arai (Left May)", "tokenizers": {}, "node_i": "643", "native_tokenizers": [], @@ -27,9 +32,11 @@ }, { "name": "Yawuno Teneyo", + "depth": 1, "iso_1_code": null, "iso_3_code": "itr", "children": [], + "family": "Arai (Left May)", "tokenizers": {}, "node_i": "644", "native_tokenizers": [], @@ -37,9 +44,11 @@ }, { "name": "Nakwi", + "depth": 1, "iso_1_code": null, "iso_3_code": "nax", "children": [], + "family": "Arai (Left May)", "tokenizers": {}, "node_i": "645", "native_tokenizers": [], @@ -47,9 +56,11 @@ }, { "name": "Nimo", + "depth": 1, "iso_1_code": null, "iso_3_code": "niw", "children": [], + "family": "Arai (Left May)", "tokenizers": {}, "node_i": "646", "native_tokenizers": [], @@ -57,15 +68,18 @@ }, { "name": "Owiniga", + "depth": 1, "iso_1_code": null, "iso_3_code": "owi", "children": [], + "family": "Arai (Left May)", "tokenizers": {}, "node_i": "647", "native_tokenizers": [], "scripts": [] } ], + "family": "Arai (Left May)", "tokenizers": {}, "node_i": "641", "native_tokenizers": [], diff --git a/data/Arauan.json b/data/Arauan.json index 0ba5f8d4e224d425adeaa3583d3f882e4896c3b6..91e746f917c5e4fe718a5b1b2d72c13ef2d96c2c 100644 --- a/data/Arauan.json +++ b/data/Arauan.json @@ -1,13 +1,16 @@ { "name": "Arauan", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Aru\u00e1", + "depth": 1, "iso_1_code": null, "iso_3_code": "aru", "children": [], + "family": "Arauan", "tokenizers": {}, "node_i": "649", "native_tokenizers": [], @@ -15,9 +18,11 @@ }, { "name": "Kulina", + "depth": 1, "iso_1_code": null, "iso_3_code": "cul", "children": [], + "family": "Arauan", "tokenizers": {}, "node_i": "650", "native_tokenizers": [], @@ -27,9 +32,11 @@ }, { "name": "Den\u00ed", + "depth": 1, "iso_1_code": null, "iso_3_code": "dny", "children": [], + "family": "Arauan", "tokenizers": {}, "node_i": "651", "native_tokenizers": [], @@ -37,9 +44,11 @@ }, { "name": "Paumar\u00ed", + "depth": 1, "iso_1_code": null, "iso_3_code": "pad", "children": [], + "family": "Arauan", "tokenizers": {}, "node_i": "652", "native_tokenizers": [], @@ -49,9 +58,11 @@ }, { "name": "Suruah\u00e1", + "depth": 1, "iso_1_code": null, "iso_3_code": "swx", "children": [], + "family": "Arauan", "tokenizers": {}, "node_i": "653", "native_tokenizers": [], @@ -59,14 +70,17 @@ }, { "name": "Jamamadi", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Jamamad\u00ed", + "depth": 2, "iso_1_code": null, "iso_3_code": "jaa", "children": [], + "family": "Arauan", "tokenizers": {}, "node_i": "655", "native_tokenizers": [], @@ -75,12 +89,14 @@ ] } ], + "family": "Arauan", "tokenizers": {}, "node_i": "654", "native_tokenizers": [], "scripts": [] } ], + "family": "Arauan", "tokenizers": {}, "node_i": "648", "native_tokenizers": [], diff --git a/data/Australian.json b/data/Australian.json index 9fe7c8ac8ca0163d0f831055778c5d862ebcc751..dbfbaac2b861fbd86341fea24ef750c0d1ace9d4 100644 --- a/data/Australian.json +++ b/data/Australian.json @@ -1,13 +1,16 @@ { "name": "Australian", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Lanima", + "depth": 1, "iso_1_code": null, "iso_3_code": "lnw", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "657", "native_tokenizers": [], @@ -15,14 +18,17 @@ }, { "name": "Bunaban", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bunuba", + "depth": 2, "iso_1_code": null, "iso_3_code": "bck", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "659", "native_tokenizers": [], @@ -30,15 +36,18 @@ }, { "name": "Gooniyandi", + "depth": 2, "iso_1_code": null, "iso_3_code": "gni", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "660", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "658", "native_tokenizers": [], @@ -46,24 +55,29 @@ }, { "name": "Daly", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bringen-Wagaydy", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bringen", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Marrithiyel", + "depth": 4, "iso_1_code": null, "iso_3_code": "mfr", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "664", "native_tokenizers": [], @@ -71,9 +85,11 @@ }, { "name": "Maridan", + "depth": 4, "iso_1_code": null, "iso_3_code": "zmd", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "665", "native_tokenizers": [], @@ -81,9 +97,11 @@ }, { "name": "Marti Ke", + "depth": 4, "iso_1_code": null, "iso_3_code": "zmg", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "666", "native_tokenizers": [], @@ -91,9 +109,11 @@ }, { "name": "Maridjabin", + "depth": 4, "iso_1_code": null, "iso_3_code": "zmj", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "667", "native_tokenizers": [], @@ -101,9 +121,11 @@ }, { "name": "Marimanindji", + "depth": 4, "iso_1_code": null, "iso_3_code": "zmm", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "668", "native_tokenizers": [], @@ -111,9 +133,11 @@ }, { "name": "Maringarr", + "depth": 4, "iso_1_code": null, "iso_3_code": "zmt", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "669", "native_tokenizers": [], @@ -121,15 +145,18 @@ }, { "name": "Mariyedi", + "depth": 4, "iso_1_code": null, "iso_3_code": "zmy", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "670", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "663", "native_tokenizers": [], @@ -137,14 +164,17 @@ }, { "name": "Wagaydy", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ami", + "depth": 4, "iso_1_code": null, "iso_3_code": "amy", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "672", "native_tokenizers": [], @@ -152,9 +182,11 @@ }, { "name": "Giyug", + "depth": 4, "iso_1_code": null, "iso_3_code": "giy", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "673", "native_tokenizers": [], @@ -162,9 +194,11 @@ }, { "name": "Wadjiginy", + "depth": 4, "iso_1_code": null, "iso_3_code": "wdj", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "674", "native_tokenizers": [], @@ -172,9 +206,11 @@ }, { "name": "Manda", + "depth": 4, "iso_1_code": null, "iso_3_code": "zma", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "675", "native_tokenizers": [], @@ -182,21 +218,25 @@ }, { "name": "Maranunggu", + "depth": 4, "iso_1_code": null, "iso_3_code": "zmr", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "676", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "671", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "662", "native_tokenizers": [], @@ -204,19 +244,23 @@ }, { "name": "Malagmalag", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Daly Proper", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kamu", + "depth": 4, "iso_1_code": null, "iso_3_code": "xmu", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "679", "native_tokenizers": [], @@ -224,15 +268,18 @@ }, { "name": "Matngala", + "depth": 4, "iso_1_code": null, "iso_3_code": "zml", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "680", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "678", "native_tokenizers": [], @@ -240,14 +287,17 @@ }, { "name": "Malagmalag Proper", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Malak Malak", + "depth": 4, "iso_1_code": null, "iso_3_code": "mpb", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "682", "native_tokenizers": [], @@ -255,21 +305,25 @@ }, { "name": "Kuwema", + "depth": 4, "iso_1_code": null, "iso_3_code": "woa", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "683", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "681", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "677", "native_tokenizers": [], @@ -277,20 +331,24 @@ }, { "name": "Marriammu", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Marriammu", + "depth": 3, "iso_1_code": null, "iso_3_code": "xru", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "685", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "684", "native_tokenizers": [], @@ -298,14 +356,17 @@ }, { "name": "Murrinh-Patha", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Murrinh-Patha", + "depth": 3, "iso_1_code": null, "iso_3_code": "mwf", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "687", "native_tokenizers": [], @@ -315,21 +376,25 @@ }, { "name": "Ngan\u2019gityemerri", + "depth": 3, "iso_1_code": null, "iso_3_code": "nam", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "688", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "686", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "661", "native_tokenizers": [], @@ -337,14 +402,17 @@ }, { "name": "Djamindjungan", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Djamindjung", + "depth": 2, "iso_1_code": null, "iso_3_code": "djd", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "690", "native_tokenizers": [], @@ -352,15 +420,18 @@ }, { "name": "Nungali", + "depth": 2, "iso_1_code": null, "iso_3_code": "nug", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "691", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "689", "native_tokenizers": [], @@ -368,14 +439,17 @@ }, { "name": "Djeragan", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Gadjerawang", + "depth": 2, "iso_1_code": null, "iso_3_code": "gdh", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "693", "native_tokenizers": [], @@ -383,9 +457,11 @@ }, { "name": "Kija", + "depth": 2, "iso_1_code": null, "iso_3_code": "gia", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "694", "native_tokenizers": [], @@ -393,15 +469,18 @@ }, { "name": "Miriwoong", + "depth": 2, "iso_1_code": null, "iso_3_code": "mep", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "695", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "692", "native_tokenizers": [], @@ -409,14 +488,17 @@ }, { "name": "Giimbiyu", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Erre", + "depth": 2, "iso_1_code": null, "iso_3_code": "err", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "697", "native_tokenizers": [], @@ -424,9 +506,11 @@ }, { "name": "Urningangg", + "depth": 2, "iso_1_code": null, "iso_3_code": "urc", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "698", "native_tokenizers": [], @@ -434,15 +518,18 @@ }, { "name": "Mangerr", + "depth": 2, "iso_1_code": null, "iso_3_code": "zme", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "699", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "696", "native_tokenizers": [], @@ -450,19 +537,23 @@ }, { "name": "Gunwingguan", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Burarran", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Burarra", + "depth": 3, "iso_1_code": null, "iso_3_code": "bvr", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "702", "native_tokenizers": [], @@ -472,9 +563,11 @@ }, { "name": "Djeebbana", + "depth": 3, "iso_1_code": null, "iso_3_code": "djj", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "703", "native_tokenizers": [], @@ -482,9 +575,11 @@ }, { "name": "Gurr-goni", + "depth": 3, "iso_1_code": null, "iso_3_code": "gge", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "704", "native_tokenizers": [], @@ -492,15 +587,18 @@ }, { "name": "Na-kara", + "depth": 3, "iso_1_code": null, "iso_3_code": "nck", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "705", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "701", "native_tokenizers": [], @@ -508,20 +606,24 @@ }, { "name": "Djauanic", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Djauan", + "depth": 3, "iso_1_code": null, "iso_3_code": "djn", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "707", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "706", "native_tokenizers": [], @@ -529,14 +631,17 @@ }, { "name": "Enindhilyagwa", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Anindilyakwa", + "depth": 3, "iso_1_code": null, "iso_3_code": "aoi", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "709", "native_tokenizers": [], @@ -546,9 +651,11 @@ }, { "name": "Ngandi", + "depth": 3, "iso_1_code": null, "iso_3_code": "nid", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "710", "native_tokenizers": [], @@ -556,9 +663,11 @@ }, { "name": "Nunggubuyu", + "depth": 3, "iso_1_code": null, "iso_3_code": "nuy", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "711", "native_tokenizers": [], @@ -567,6 +676,7 @@ ] } ], + "family": "Australian", "tokenizers": {}, "node_i": "708", "native_tokenizers": [], @@ -574,20 +684,24 @@ }, { "name": "Gagudjuan", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Gagadu", + "depth": 3, "iso_1_code": null, "iso_3_code": "gbu", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "713", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "712", "native_tokenizers": [], @@ -595,20 +709,24 @@ }, { "name": "Gungaraganyan", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kungarakany", + "depth": 3, "iso_1_code": null, "iso_3_code": "ggk", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "715", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "714", "native_tokenizers": [], @@ -616,14 +734,17 @@ }, { "name": "Gunwinggic", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Gunwinggu", + "depth": 3, "iso_1_code": null, "iso_3_code": "gup", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "717", "native_tokenizers": [], @@ -631,15 +752,18 @@ }, { "name": "Kunbarlang", + "depth": 3, "iso_1_code": null, "iso_3_code": "wlg", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "718", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "716", "native_tokenizers": [], @@ -647,20 +771,24 @@ }, { "name": "Mangarayic", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mangarrayi", + "depth": 3, "iso_1_code": null, "iso_3_code": "mpc", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "720", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "719", "native_tokenizers": [], @@ -668,14 +796,17 @@ }, { "name": "Maran", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Yugul", + "depth": 3, "iso_1_code": null, "iso_3_code": "ygu", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "722", "native_tokenizers": [], @@ -683,20 +814,24 @@ }, { "name": "Alawic", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Alawa", + "depth": 4, "iso_1_code": null, "iso_3_code": "alh", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "724", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "723", "native_tokenizers": [], @@ -704,14 +839,17 @@ }, { "name": "Mara", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Marra", + "depth": 4, "iso_1_code": null, "iso_3_code": "mec", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "726", "native_tokenizers": [], @@ -719,21 +857,25 @@ }, { "name": "Wandarang", + "depth": 4, "iso_1_code": null, "iso_3_code": "wnd", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "727", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "725", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "721", "native_tokenizers": [], @@ -741,20 +883,24 @@ }, { "name": "Ngalkbun", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dalabon", + "depth": 3, "iso_1_code": null, "iso_3_code": "ngk", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "729", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "728", "native_tokenizers": [], @@ -762,14 +908,17 @@ }, { "name": "Rembargic", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ngalakgan", + "depth": 3, "iso_1_code": null, "iso_3_code": "nig", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "731", "native_tokenizers": [], @@ -777,15 +926,18 @@ }, { "name": "Rembarrnga", + "depth": 3, "iso_1_code": null, "iso_3_code": "rmb", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "732", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "730", "native_tokenizers": [], @@ -793,20 +945,24 @@ }, { "name": "Wagiman", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Wagiman", + "depth": 3, "iso_1_code": null, "iso_3_code": "waq", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "734", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "733", "native_tokenizers": [], @@ -814,20 +970,24 @@ }, { "name": "Warayan", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Waray", + "depth": 3, "iso_1_code": null, "iso_3_code": "wrz", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "736", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "735", "native_tokenizers": [], @@ -835,14 +995,17 @@ }, { "name": "Yangmanic", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dagoman", + "depth": 3, "iso_1_code": null, "iso_3_code": "dgn", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "738", "native_tokenizers": [], @@ -850,9 +1013,11 @@ }, { "name": "Yangman", + "depth": 3, "iso_1_code": null, "iso_3_code": "jng", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "739", "native_tokenizers": [], @@ -860,21 +1025,25 @@ }, { "name": "Wardaman", + "depth": 3, "iso_1_code": null, "iso_3_code": "wrr", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "740", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "737", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "700", "native_tokenizers": [], @@ -882,20 +1051,24 @@ }, { "name": "Laragiyan", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Laragia", + "depth": 2, "iso_1_code": null, "iso_3_code": "lrg", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "742", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "741", "native_tokenizers": [], @@ -903,14 +1076,17 @@ }, { "name": "Limilngan-Wulna", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Limilngan", + "depth": 2, "iso_1_code": null, "iso_3_code": "lmc", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "744", "native_tokenizers": [], @@ -918,15 +1094,18 @@ }, { "name": "Wulna", + "depth": 2, "iso_1_code": null, "iso_3_code": "wux", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "745", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "743", "native_tokenizers": [], @@ -934,14 +1113,17 @@ }, { "name": "Nyulnyulan", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bardi", + "depth": 2, "iso_1_code": null, "iso_3_code": "bcj", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "747", "native_tokenizers": [], @@ -949,9 +1131,11 @@ }, { "name": "Djawi", + "depth": 2, "iso_1_code": null, "iso_3_code": "djw", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "748", "native_tokenizers": [], @@ -959,9 +1143,11 @@ }, { "name": "Dyaberdyaber", + "depth": 2, "iso_1_code": null, "iso_3_code": "dyb", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "749", "native_tokenizers": [], @@ -969,9 +1155,11 @@ }, { "name": "Dyugun", + "depth": 2, "iso_1_code": null, "iso_3_code": "dyd", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "750", "native_tokenizers": [], @@ -979,9 +1167,11 @@ }, { "name": "Nimanbur", + "depth": 2, "iso_1_code": null, "iso_3_code": "nmp", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "751", "native_tokenizers": [], @@ -989,9 +1179,11 @@ }, { "name": "Nyikina", + "depth": 2, "iso_1_code": null, "iso_3_code": "nyh", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "752", "native_tokenizers": [], @@ -999,9 +1191,11 @@ }, { "name": "Nyulnyul", + "depth": 2, "iso_1_code": null, "iso_3_code": "nyv", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "753", "native_tokenizers": [], @@ -1009,9 +1203,11 @@ }, { "name": "Warrwa", + "depth": 2, "iso_1_code": null, "iso_3_code": "wwr", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "754", "native_tokenizers": [], @@ -1019,9 +1215,11 @@ }, { "name": "Ngumbarl", + "depth": 2, "iso_1_code": null, "iso_3_code": "xnm", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "755", "native_tokenizers": [], @@ -1029,15 +1227,18 @@ }, { "name": "Yawuru", + "depth": 2, "iso_1_code": null, "iso_3_code": "ywr", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "756", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "746", "native_tokenizers": [], @@ -1045,14 +1246,17 @@ }, { "name": "Pama-Nyungan", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bidhawal", + "depth": 2, "iso_1_code": null, "iso_3_code": "ihw", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "758", "native_tokenizers": [], @@ -1060,9 +1264,11 @@ }, { "name": "Kurnai", + "depth": 2, "iso_1_code": null, "iso_3_code": "unn", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "759", "native_tokenizers": [], @@ -1070,9 +1276,11 @@ }, { "name": "Keerray-Woorroong", + "depth": 2, "iso_1_code": null, "iso_3_code": "wkr", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "760", "native_tokenizers": [], @@ -1080,9 +1288,11 @@ }, { "name": "Bindal", + "depth": 2, "iso_1_code": null, "iso_3_code": "xbd", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "761", "native_tokenizers": [], @@ -1090,9 +1300,11 @@ }, { "name": "Bigambal", + "depth": 2, "iso_1_code": null, "iso_3_code": "xbe", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "762", "native_tokenizers": [], @@ -1100,9 +1312,11 @@ }, { "name": "Yuyu", + "depth": 2, "iso_1_code": null, "iso_3_code": "yxu", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "763", "native_tokenizers": [], @@ -1110,14 +1324,17 @@ }, { "name": "Arandic", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Andegerebinha", + "depth": 3, "iso_1_code": null, "iso_3_code": "adg", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "765", "native_tokenizers": [], @@ -1125,9 +1342,11 @@ }, { "name": "Arrernte, Eastern", + "depth": 3, "iso_1_code": null, "iso_3_code": "aer", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "766", "native_tokenizers": [], @@ -1137,9 +1356,11 @@ }, { "name": "Alyawarr", + "depth": 3, "iso_1_code": null, "iso_3_code": "aly", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "767", "native_tokenizers": [], @@ -1149,9 +1370,11 @@ }, { "name": "Anmatyerr", + "depth": 3, "iso_1_code": null, "iso_3_code": "amx", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "768", "native_tokenizers": [], @@ -1161,9 +1384,11 @@ }, { "name": "Arrarnta, Western", + "depth": 3, "iso_1_code": null, "iso_3_code": "are", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "769", "native_tokenizers": [], @@ -1173,9 +1398,11 @@ }, { "name": "Ayerrerenge", + "depth": 3, "iso_1_code": null, "iso_3_code": "axe", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "770", "native_tokenizers": [], @@ -1183,9 +1410,11 @@ }, { "name": "Aranda, Lower Southern", + "depth": 3, "iso_1_code": null, "iso_3_code": "axl", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "771", "native_tokenizers": [], @@ -1193,15 +1422,18 @@ }, { "name": "Kaytetye", + "depth": 3, "iso_1_code": null, "iso_3_code": "gbb", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "772", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "764", "native_tokenizers": [], @@ -1209,20 +1441,24 @@ }, { "name": "Baagandji", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Paakantyi", + "depth": 3, "iso_1_code": null, "iso_3_code": "drl", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "774", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "773", "native_tokenizers": [], @@ -1230,14 +1466,17 @@ }, { "name": "Bandjalangic", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bandjalang", + "depth": 3, "iso_1_code": null, "iso_3_code": "bdy", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "776", "native_tokenizers": [], @@ -1245,9 +1484,11 @@ }, { "name": "Githabul", + "depth": 3, "iso_1_code": null, "iso_3_code": "gih", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "777", "native_tokenizers": [], @@ -1255,9 +1496,11 @@ }, { "name": "Arakwal", + "depth": 3, "iso_1_code": null, "iso_3_code": "rkw", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "778", "native_tokenizers": [], @@ -1265,15 +1508,18 @@ }, { "name": "Minjungbal", + "depth": 3, "iso_1_code": null, "iso_3_code": "xjb", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "779", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "775", "native_tokenizers": [], @@ -1281,14 +1527,17 @@ }, { "name": "Bungandidj", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Gunditjmara", + "depth": 3, "iso_1_code": null, "iso_3_code": "gjm", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "781", "native_tokenizers": [], @@ -1296,15 +1545,18 @@ }, { "name": "Bunganditj", + "depth": 3, "iso_1_code": null, "iso_3_code": "xbg", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "782", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "780", "native_tokenizers": [], @@ -1312,14 +1564,17 @@ }, { "name": "Durubulic", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Jandai", + "depth": 3, "iso_1_code": null, "iso_3_code": "jan", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "784", "native_tokenizers": [], @@ -1327,9 +1582,11 @@ }, { "name": "Nunukul", + "depth": 3, "iso_1_code": null, "iso_3_code": "xnu", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "785", "native_tokenizers": [], @@ -1337,15 +1594,18 @@ }, { "name": "Yagara", + "depth": 3, "iso_1_code": null, "iso_3_code": "yxg", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "786", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "783", "native_tokenizers": [], @@ -1353,14 +1613,17 @@ }, { "name": "Dyangadi", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dyangadi", + "depth": 3, "iso_1_code": null, "iso_3_code": "dyn", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "788", "native_tokenizers": [], @@ -1368,15 +1631,18 @@ }, { "name": "Nganyaywana", + "depth": 3, "iso_1_code": null, "iso_3_code": "nyx", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "789", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "787", "native_tokenizers": [], @@ -1384,14 +1650,17 @@ }, { "name": "Dyirbalic", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dyirbal", + "depth": 3, "iso_1_code": null, "iso_3_code": "dbl", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "791", "native_tokenizers": [], @@ -1399,9 +1668,11 @@ }, { "name": "Yuru", + "depth": 3, "iso_1_code": null, "iso_3_code": "ljx", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "792", "native_tokenizers": [], @@ -1409,9 +1680,11 @@ }, { "name": "Nyawaygi", + "depth": 3, "iso_1_code": null, "iso_3_code": "nyt", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "793", "native_tokenizers": [], @@ -1419,15 +1692,18 @@ }, { "name": "Warrgamay", + "depth": 3, "iso_1_code": null, "iso_3_code": "wgy", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "794", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "790", "native_tokenizers": [], @@ -1435,20 +1711,24 @@ }, { "name": "Flinders Island", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Flinders Island", + "depth": 3, "iso_1_code": null, "iso_3_code": "fln", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "796", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "795", "native_tokenizers": [], @@ -1456,14 +1736,17 @@ }, { "name": "Galgadungic", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kalkutung", + "depth": 3, "iso_1_code": null, "iso_3_code": "ktg", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "798", "native_tokenizers": [], @@ -1471,9 +1754,11 @@ }, { "name": "Wakabunga", + "depth": 3, "iso_1_code": null, "iso_3_code": "wwb", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "799", "native_tokenizers": [], @@ -1481,15 +1766,18 @@ }, { "name": "Yalarnnga", + "depth": 3, "iso_1_code": null, "iso_3_code": "ylr", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "800", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "797", "native_tokenizers": [], @@ -1497,14 +1785,17 @@ }, { "name": "Gumbaynggiric", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kumbainggar", + "depth": 3, "iso_1_code": null, "iso_3_code": "kgs", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "802", "native_tokenizers": [], @@ -1512,15 +1803,18 @@ }, { "name": "Yaygir", + "depth": 3, "iso_1_code": null, "iso_3_code": "xya", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "803", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "801", "native_tokenizers": [], @@ -1528,14 +1822,17 @@ }, { "name": "Guugu-Yimidhirr", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Barrow Point", + "depth": 3, "iso_1_code": null, "iso_3_code": "bpt", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "805", "native_tokenizers": [], @@ -1543,15 +1840,18 @@ }, { "name": "Guugu Yimidhirr", + "depth": 3, "iso_1_code": null, "iso_3_code": "kky", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "806", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "804", "native_tokenizers": [], @@ -1559,14 +1859,17 @@ }, { "name": "Kala Lagaw Ya", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kala Lagaw Ya", + "depth": 3, "iso_1_code": null, "iso_3_code": "mwp", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "808", "native_tokenizers": [], @@ -1575,6 +1878,7 @@ ] } ], + "family": "Australian", "tokenizers": {}, "node_i": "807", "native_tokenizers": [], @@ -1582,14 +1886,17 @@ }, { "name": "Karnic", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Karenggapa", + "depth": 3, "iso_1_code": null, "iso_3_code": "eaa", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "810", "native_tokenizers": [], @@ -1597,9 +1904,11 @@ }, { "name": "Kungardutyi", + "depth": 3, "iso_1_code": null, "iso_3_code": "gdt", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "811", "native_tokenizers": [], @@ -1607,9 +1916,11 @@ }, { "name": "Nhirrpi", + "depth": 3, "iso_1_code": null, "iso_3_code": "hrp", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "812", "native_tokenizers": [], @@ -1617,9 +1928,11 @@ }, { "name": "Kungkari", + "depth": 3, "iso_1_code": null, "iso_3_code": "lku", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "813", "native_tokenizers": [], @@ -1627,9 +1940,11 @@ }, { "name": "Ngantangarra", + "depth": 3, "iso_1_code": null, "iso_3_code": "ntg", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "814", "native_tokenizers": [], @@ -1637,9 +1952,11 @@ }, { "name": "Karuwali", + "depth": 3, "iso_1_code": null, "iso_3_code": "rxw", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "815", "native_tokenizers": [], @@ -1647,9 +1964,11 @@ }, { "name": "Wangkayutyuru", + "depth": 3, "iso_1_code": null, "iso_3_code": "wky", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "816", "native_tokenizers": [], @@ -1657,9 +1976,11 @@ }, { "name": "Pirriya", + "depth": 3, "iso_1_code": null, "iso_3_code": "xpa", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "817", "native_tokenizers": [], @@ -1667,9 +1988,11 @@ }, { "name": "Yarluyandi", + "depth": 3, "iso_1_code": null, "iso_3_code": "yry", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "818", "native_tokenizers": [], @@ -1677,9 +2000,11 @@ }, { "name": "Mayawali", + "depth": 3, "iso_1_code": null, "iso_3_code": "yxa", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "819", "native_tokenizers": [], @@ -1687,14 +2012,17 @@ }, { "name": "Karna", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Pirlatapa", + "depth": 4, "iso_1_code": null, "iso_3_code": "bxi", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "821", "native_tokenizers": [], @@ -1702,9 +2030,11 @@ }, { "name": "Diyari", + "depth": 4, "iso_1_code": null, "iso_3_code": "dif", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "822", "native_tokenizers": [], @@ -1712,9 +2042,11 @@ }, { "name": "Ngamini", + "depth": 4, "iso_1_code": null, "iso_3_code": "nmv", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "823", "native_tokenizers": [], @@ -1722,9 +2054,11 @@ }, { "name": "Yandruwandha", + "depth": 4, "iso_1_code": null, "iso_3_code": "ynd", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "824", "native_tokenizers": [], @@ -1732,15 +2066,18 @@ }, { "name": "Yawarawarga", + "depth": 4, "iso_1_code": null, "iso_3_code": "yww", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "825", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "820", "native_tokenizers": [], @@ -1748,14 +2085,17 @@ }, { "name": "Ngura", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Garlali", + "depth": 4, "iso_1_code": null, "iso_3_code": "gll", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "827", "native_tokenizers": [], @@ -1763,9 +2103,11 @@ }, { "name": "Badjiri", + "depth": 4, "iso_1_code": null, "iso_3_code": "jbi", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "828", "native_tokenizers": [], @@ -1773,9 +2115,11 @@ }, { "name": "Punthamara", + "depth": 4, "iso_1_code": null, "iso_3_code": "xpt", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "829", "native_tokenizers": [], @@ -1783,15 +2127,18 @@ }, { "name": "Wangkumara", + "depth": 4, "iso_1_code": null, "iso_3_code": "xwk", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "830", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "826", "native_tokenizers": [], @@ -1799,14 +2146,17 @@ }, { "name": "Palku", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Arabana", + "depth": 4, "iso_1_code": null, "iso_3_code": "ard", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "832", "native_tokenizers": [], @@ -1814,9 +2164,11 @@ }, { "name": "Pitta Pitta", + "depth": 4, "iso_1_code": null, "iso_3_code": "pit", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "833", "native_tokenizers": [], @@ -1824,9 +2176,11 @@ }, { "name": "Wangkangurru", + "depth": 4, "iso_1_code": null, "iso_3_code": "wgg", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "834", "native_tokenizers": [], @@ -1834,21 +2188,25 @@ }, { "name": "Wanggamala", + "depth": 4, "iso_1_code": null, "iso_3_code": "wnm", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "835", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "831", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "809", "native_tokenizers": [], @@ -1856,14 +2214,17 @@ }, { "name": "Kulin", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Daungwurrung", + "depth": 3, "iso_1_code": null, "iso_3_code": "dgw", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "837", "native_tokenizers": [], @@ -1871,9 +2232,11 @@ }, { "name": "Djadjawurrung", + "depth": 3, "iso_1_code": null, "iso_3_code": "dja", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "838", "native_tokenizers": [], @@ -1881,9 +2244,11 @@ }, { "name": "Madhi Madhi", + "depth": 3, "iso_1_code": null, "iso_3_code": "dmd", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "839", "native_tokenizers": [], @@ -1891,9 +2256,11 @@ }, { "name": "Ladji Ladji", + "depth": 3, "iso_1_code": null, "iso_3_code": "llj", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "840", "native_tokenizers": [], @@ -1901,9 +2268,11 @@ }, { "name": "Nari Nari", + "depth": 3, "iso_1_code": null, "iso_3_code": "rnr", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "841", "native_tokenizers": [], @@ -1911,9 +2280,11 @@ }, { "name": "Djabwurrung", + "depth": 3, "iso_1_code": null, "iso_3_code": "tjw", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "842", "native_tokenizers": [], @@ -1921,9 +2292,11 @@ }, { "name": "Wergaia", + "depth": 3, "iso_1_code": null, "iso_3_code": "weg", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "843", "native_tokenizers": [], @@ -1931,9 +2304,11 @@ }, { "name": "Wathawurrung", + "depth": 3, "iso_1_code": null, "iso_3_code": "wth", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "844", "native_tokenizers": [], @@ -1941,9 +2316,11 @@ }, { "name": "Woiwurrung", + "depth": 3, "iso_1_code": null, "iso_3_code": "wyi", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "845", "native_tokenizers": [], @@ -1951,9 +2328,11 @@ }, { "name": "Wadi Wadi", + "depth": 3, "iso_1_code": null, "iso_3_code": "xwd", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "846", "native_tokenizers": [], @@ -1961,9 +2340,11 @@ }, { "name": "Wemba Wemba", + "depth": 3, "iso_1_code": null, "iso_3_code": "xww", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "847", "native_tokenizers": [], @@ -1971,26 +2352,31 @@ }, { "name": "Western", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Barababaraba", + "depth": 4, "iso_1_code": null, "iso_3_code": "rbp", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "849", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "848", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "836", "native_tokenizers": [], @@ -1998,20 +2384,24 @@ }, { "name": "Lardil", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Lardil", + "depth": 3, "iso_1_code": null, "iso_3_code": "lbz", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "851", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "850", "native_tokenizers": [], @@ -2019,14 +2409,17 @@ }, { "name": "Maric", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bidjara", + "depth": 3, "iso_1_code": null, "iso_3_code": "bym", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "853", "native_tokenizers": [], @@ -2034,9 +2427,11 @@ }, { "name": "Biri", + "depth": 3, "iso_1_code": null, "iso_3_code": "bzr", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "854", "native_tokenizers": [], @@ -2044,9 +2439,11 @@ }, { "name": "Dhungaloo", + "depth": 3, "iso_1_code": null, "iso_3_code": "dhx", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "855", "native_tokenizers": [], @@ -2054,9 +2451,11 @@ }, { "name": "Gugu Badhun", + "depth": 3, "iso_1_code": null, "iso_3_code": "gdc", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "856", "native_tokenizers": [], @@ -2064,9 +2463,11 @@ }, { "name": "Gangulu", + "depth": 3, "iso_1_code": null, "iso_3_code": "gnl", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "857", "native_tokenizers": [], @@ -2074,9 +2475,11 @@ }, { "name": "Guwamu", + "depth": 3, "iso_1_code": null, "iso_3_code": "gwu", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "858", "native_tokenizers": [], @@ -2084,9 +2487,11 @@ }, { "name": "Gungabula", + "depth": 3, "iso_1_code": null, "iso_3_code": "gyf", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "859", "native_tokenizers": [], @@ -2094,9 +2499,11 @@ }, { "name": "Gunya", + "depth": 3, "iso_1_code": null, "iso_3_code": "gyy", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "860", "native_tokenizers": [], @@ -2104,9 +2511,11 @@ }, { "name": "Kunggari", + "depth": 3, "iso_1_code": null, "iso_3_code": "kgl", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "861", "native_tokenizers": [], @@ -2114,9 +2523,11 @@ }, { "name": "Yirandali", + "depth": 3, "iso_1_code": null, "iso_3_code": "ljw", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "862", "native_tokenizers": [], @@ -2124,9 +2535,11 @@ }, { "name": "Wadjigu", + "depth": 3, "iso_1_code": null, "iso_3_code": "wdu", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "863", "native_tokenizers": [], @@ -2134,9 +2547,11 @@ }, { "name": "Wadjabangayi", + "depth": 3, "iso_1_code": null, "iso_3_code": "wdy", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "864", "native_tokenizers": [], @@ -2144,9 +2559,11 @@ }, { "name": "Warungu", + "depth": 3, "iso_1_code": null, "iso_3_code": "wrg", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "865", "native_tokenizers": [], @@ -2154,9 +2571,11 @@ }, { "name": "Lower Burdekin", + "depth": 3, "iso_1_code": null, "iso_3_code": "xbb", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "866", "native_tokenizers": [], @@ -2164,9 +2583,11 @@ }, { "name": "Garingbal", + "depth": 3, "iso_1_code": null, "iso_3_code": "xgi", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "867", "native_tokenizers": [], @@ -2174,9 +2595,11 @@ }, { "name": "Dharumbal", + "depth": 3, "iso_1_code": null, "iso_3_code": "xgm", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "868", "native_tokenizers": [], @@ -2184,9 +2607,11 @@ }, { "name": "Guwa", + "depth": 3, "iso_1_code": null, "iso_3_code": "xgw", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "869", "native_tokenizers": [], @@ -2194,9 +2619,11 @@ }, { "name": "Wotjobaluk", + "depth": 3, "iso_1_code": null, "iso_3_code": "xwt", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "870", "native_tokenizers": [], @@ -2204,9 +2631,11 @@ }, { "name": "Yandjibara", + "depth": 3, "iso_1_code": null, "iso_3_code": "xyb", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "871", "native_tokenizers": [], @@ -2214,9 +2643,11 @@ }, { "name": "Yanda", + "depth": 3, "iso_1_code": null, "iso_3_code": "yda", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "872", "native_tokenizers": [], @@ -2224,9 +2655,11 @@ }, { "name": "Yiningayi", + "depth": 3, "iso_1_code": null, "iso_3_code": "ygi", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "873", "native_tokenizers": [], @@ -2234,9 +2667,11 @@ }, { "name": "Margany", + "depth": 3, "iso_1_code": null, "iso_3_code": "zmc", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "874", "native_tokenizers": [], @@ -2244,15 +2679,18 @@ }, { "name": "Mandandanyi", + "depth": 3, "iso_1_code": null, "iso_3_code": "zmk", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "875", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "852", "native_tokenizers": [], @@ -2260,20 +2698,24 @@ }, { "name": "Mbara", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mbara", + "depth": 3, "iso_1_code": null, "iso_3_code": "mvl", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "877", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "876", "native_tokenizers": [], @@ -2281,20 +2723,24 @@ }, { "name": "Muruwaric", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Muruwari", + "depth": 3, "iso_1_code": null, "iso_3_code": "zmu", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "879", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "878", "native_tokenizers": [], @@ -2302,14 +2748,17 @@ }, { "name": "Ngarinyeric-Yithayithic", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dadi Dadi", + "depth": 3, "iso_1_code": null, "iso_3_code": "dda", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "881", "native_tokenizers": [], @@ -2317,9 +2766,11 @@ }, { "name": "Ngarrindjeri", + "depth": 3, "iso_1_code": null, "iso_3_code": "nay", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "882", "native_tokenizers": [], @@ -2327,15 +2778,18 @@ }, { "name": "Ngayawung", + "depth": 3, "iso_1_code": null, "iso_3_code": "nwg", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "883", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "880", "native_tokenizers": [], @@ -2343,14 +2797,17 @@ }, { "name": "Pallanganmiddang", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dhudhuroa", + "depth": 3, "iso_1_code": null, "iso_3_code": "ddr", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "885", "native_tokenizers": [], @@ -2358,15 +2815,18 @@ }, { "name": "Pallanganmiddang", + "depth": 3, "iso_1_code": null, "iso_3_code": "pmd", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "886", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "884", "native_tokenizers": [], @@ -2374,14 +2834,17 @@ }, { "name": "Paman", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Olkol", + "depth": 3, "iso_1_code": null, "iso_3_code": "olk", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "888", "native_tokenizers": [], @@ -2389,9 +2852,11 @@ }, { "name": "Tagalaka", + "depth": 3, "iso_1_code": null, "iso_3_code": "tgz", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "889", "native_tokenizers": [], @@ -2399,9 +2864,11 @@ }, { "name": "Gudang", + "depth": 3, "iso_1_code": null, "iso_3_code": "xgd", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "890", "native_tokenizers": [], @@ -2409,9 +2876,11 @@ }, { "name": "Yatay", + "depth": 3, "iso_1_code": null, "iso_3_code": "yty", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "891", "native_tokenizers": [], @@ -2419,9 +2888,11 @@ }, { "name": "Yinwum", + "depth": 3, "iso_1_code": null, "iso_3_code": "yxm", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "892", "native_tokenizers": [], @@ -2429,20 +2900,24 @@ }, { "name": "Central Pama", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kunjen", + "depth": 4, "iso_1_code": null, "iso_3_code": "kjn", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "894", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "893", "native_tokenizers": [], @@ -2450,20 +2925,24 @@ }, { "name": "Coastal Pama", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Koko-Bera", + "depth": 4, "iso_1_code": null, "iso_3_code": "kkp", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "896", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "895", "native_tokenizers": [], @@ -2471,20 +2950,24 @@ }, { "name": "Flinders Pama", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Gugadj", + "depth": 4, "iso_1_code": null, "iso_3_code": "ggd", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "898", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "897", "native_tokenizers": [], @@ -2492,14 +2975,17 @@ }, { "name": "Lamalamic", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Lamalama", + "depth": 4, "iso_1_code": null, "iso_3_code": "lby", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "900", "native_tokenizers": [], @@ -2507,15 +2993,18 @@ }, { "name": "Morrobalama", + "depth": 4, "iso_1_code": null, "iso_3_code": "umg", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "901", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "899", "native_tokenizers": [], @@ -2523,14 +3012,17 @@ }, { "name": "Mayabic", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ngawun", + "depth": 4, "iso_1_code": null, "iso_3_code": "nxn", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "903", "native_tokenizers": [], @@ -2538,9 +3030,11 @@ }, { "name": "Wunumara", + "depth": 4, "iso_1_code": null, "iso_3_code": "wnn", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "904", "native_tokenizers": [], @@ -2548,9 +3042,11 @@ }, { "name": "Mayaguduna", + "depth": 4, "iso_1_code": null, "iso_3_code": "xmy", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "905", "native_tokenizers": [], @@ -2558,9 +3054,11 @@ }, { "name": "Mayi-Yapi", + "depth": 4, "iso_1_code": null, "iso_3_code": "xyj", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "906", "native_tokenizers": [], @@ -2568,9 +3066,11 @@ }, { "name": "Mayi-Kulan", + "depth": 4, "iso_1_code": null, "iso_3_code": "xyk", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "907", "native_tokenizers": [], @@ -2578,15 +3078,18 @@ }, { "name": "Mayi-Thakurti", + "depth": 4, "iso_1_code": null, "iso_3_code": "xyt", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "908", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "902", "native_tokenizers": [], @@ -2594,14 +3097,17 @@ }, { "name": "Mbariman", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Gugu Warra", + "depth": 4, "iso_1_code": null, "iso_3_code": "wrw", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "910", "native_tokenizers": [], @@ -2609,15 +3115,18 @@ }, { "name": "Mbariman-Gudhinma", + "depth": 4, "iso_1_code": null, "iso_3_code": "zmv", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "911", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "909", "native_tokenizers": [], @@ -2625,14 +3134,17 @@ }, { "name": "Middle Pama", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ayabadhu", + "depth": 4, "iso_1_code": null, "iso_3_code": "ayd", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "913", "native_tokenizers": [], @@ -2640,9 +3152,11 @@ }, { "name": "Pakanha", + "depth": 4, "iso_1_code": null, "iso_3_code": "pkn", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "914", "native_tokenizers": [], @@ -2650,9 +3164,11 @@ }, { "name": "Kuku-Ugbanh", + "depth": 4, "iso_1_code": null, "iso_3_code": "ugb", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "915", "native_tokenizers": [], @@ -2660,9 +3176,11 @@ }, { "name": "Kuku-Uwanh", + "depth": 4, "iso_1_code": null, "iso_3_code": "uwa", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "916", "native_tokenizers": [], @@ -2670,9 +3188,11 @@ }, { "name": "Wik-Epa", + "depth": 4, "iso_1_code": null, "iso_3_code": "wie", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "917", "native_tokenizers": [], @@ -2680,9 +3200,11 @@ }, { "name": "Wik-Keyangan", + "depth": 4, "iso_1_code": null, "iso_3_code": "wif", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "918", "native_tokenizers": [], @@ -2690,9 +3212,11 @@ }, { "name": "Wik Ngathan", + "depth": 4, "iso_1_code": null, "iso_3_code": "wig", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "919", "native_tokenizers": [], @@ -2700,9 +3224,11 @@ }, { "name": "Wik-Me\u2019anha", + "depth": 4, "iso_1_code": null, "iso_3_code": "wih", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "920", "native_tokenizers": [], @@ -2710,9 +3236,11 @@ }, { "name": "Wik-Iiyanh", + "depth": 4, "iso_1_code": null, "iso_3_code": "wij", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "921", "native_tokenizers": [], @@ -2720,9 +3248,11 @@ }, { "name": "Wikalkan", + "depth": 4, "iso_1_code": null, "iso_3_code": "wik", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "922", "native_tokenizers": [], @@ -2730,9 +3260,11 @@ }, { "name": "Wik-Mungkan", + "depth": 4, "iso_1_code": null, "iso_3_code": "wim", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "923", "native_tokenizers": [], @@ -2742,9 +3274,11 @@ }, { "name": "Wikngenchera", + "depth": 4, "iso_1_code": null, "iso_3_code": "wua", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "924", "native_tokenizers": [], @@ -2752,9 +3286,11 @@ }, { "name": "Kugu-Muminh", + "depth": 4, "iso_1_code": null, "iso_3_code": "xmh", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "925", "native_tokenizers": [], @@ -2762,9 +3298,11 @@ }, { "name": "Kuku-Mu\u2019inh", + "depth": 4, "iso_1_code": null, "iso_3_code": "xmp", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "926", "native_tokenizers": [], @@ -2772,15 +3310,18 @@ }, { "name": "Kuku-Mangk", + "depth": 4, "iso_1_code": null, "iso_3_code": "xmq", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "927", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "912", "native_tokenizers": [], @@ -2788,14 +3329,17 @@ }, { "name": "Norman Pama", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Areba", + "depth": 4, "iso_1_code": null, "iso_3_code": "aea", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "929", "native_tokenizers": [], @@ -2803,9 +3347,11 @@ }, { "name": "Gurdjar", + "depth": 4, "iso_1_code": null, "iso_3_code": "gdj", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "930", "native_tokenizers": [], @@ -2813,15 +3359,18 @@ }, { "name": "Kuthant", + "depth": 4, "iso_1_code": null, "iso_3_code": "xut", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "931", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "928", "native_tokenizers": [], @@ -2829,14 +3378,17 @@ }, { "name": "Northeastern Pama", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kanju", + "depth": 4, "iso_1_code": null, "iso_3_code": "kbe", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "933", "native_tokenizers": [], @@ -2844,9 +3396,11 @@ }, { "name": "Kuuku-Ya\u2019u", + "depth": 4, "iso_1_code": null, "iso_3_code": "kuy", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "934", "native_tokenizers": [], @@ -2854,15 +3408,18 @@ }, { "name": "Umpila", + "depth": 4, "iso_1_code": null, "iso_3_code": "ump", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "935", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "932", "native_tokenizers": [], @@ -2870,14 +3427,17 @@ }, { "name": "Northern Pama", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Alngith", + "depth": 4, "iso_1_code": null, "iso_3_code": "aid", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "937", "native_tokenizers": [], @@ -2885,9 +3445,11 @@ }, { "name": "Atampaya", + "depth": 4, "iso_1_code": null, "iso_3_code": "amz", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "938", "native_tokenizers": [], @@ -2895,9 +3457,11 @@ }, { "name": "Angkamuthi", + "depth": 4, "iso_1_code": null, "iso_3_code": "avm", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "939", "native_tokenizers": [], @@ -2905,9 +3469,11 @@ }, { "name": "Anguthimri", + "depth": 4, "iso_1_code": null, "iso_3_code": "awg", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "940", "native_tokenizers": [], @@ -2915,9 +3481,11 @@ }, { "name": "Ndra\u2019ngith", + "depth": 4, "iso_1_code": null, "iso_3_code": "dgt", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "941", "native_tokenizers": [], @@ -2925,9 +3493,11 @@ }, { "name": "Adithinngithigh", + "depth": 4, "iso_1_code": null, "iso_3_code": "dth", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "942", "native_tokenizers": [], @@ -2935,9 +3505,11 @@ }, { "name": "Awngthim", + "depth": 4, "iso_1_code": null, "iso_3_code": "gwm", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "943", "native_tokenizers": [], @@ -2945,9 +3517,11 @@ }, { "name": "Leningitij", + "depth": 4, "iso_1_code": null, "iso_3_code": "lnj", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "944", "native_tokenizers": [], @@ -2955,9 +3529,11 @@ }, { "name": "Arritinngithigh", + "depth": 4, "iso_1_code": null, "iso_3_code": "rrt", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "945", "native_tokenizers": [], @@ -2965,9 +3541,11 @@ }, { "name": "Tjungundji", + "depth": 4, "iso_1_code": null, "iso_3_code": "tjj", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "946", "native_tokenizers": [], @@ -2975,9 +3553,11 @@ }, { "name": "Uradhi", + "depth": 4, "iso_1_code": null, "iso_3_code": "urf", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "947", "native_tokenizers": [], @@ -2985,15 +3565,18 @@ }, { "name": "Mpalitjanh", + "depth": 4, "iso_1_code": null, "iso_3_code": "xpj", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "948", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "936", "native_tokenizers": [], @@ -3001,14 +3584,17 @@ }, { "name": "Rarmul Pama", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Aghu-Tharnggala", + "depth": 4, "iso_1_code": null, "iso_3_code": "gtu", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "950", "native_tokenizers": [], @@ -3016,9 +3602,11 @@ }, { "name": "Ikaranggal", + "depth": 4, "iso_1_code": null, "iso_3_code": "ikr", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "951", "native_tokenizers": [], @@ -3026,15 +3614,18 @@ }, { "name": "Thaypan", + "depth": 4, "iso_1_code": null, "iso_3_code": "typ", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "952", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "949", "native_tokenizers": [], @@ -3042,14 +3633,17 @@ }, { "name": "Southern Pama", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Barbaram", + "depth": 4, "iso_1_code": null, "iso_3_code": "vmb", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "954", "native_tokenizers": [], @@ -3057,15 +3651,18 @@ }, { "name": "Wamin", + "depth": 4, "iso_1_code": null, "iso_3_code": "wmi", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "955", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "953", "native_tokenizers": [], @@ -3073,14 +3670,17 @@ }, { "name": "Southwestern Pama", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kok-Nar", + "depth": 4, "iso_1_code": null, "iso_3_code": "gko", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "957", "native_tokenizers": [], @@ -3088,9 +3688,11 @@ }, { "name": "Koko Babangk", + "depth": 4, "iso_1_code": null, "iso_3_code": "okg", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "958", "native_tokenizers": [], @@ -3098,15 +3700,18 @@ }, { "name": "Kuuk-Yak", + "depth": 4, "iso_1_code": null, "iso_3_code": "uky", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "959", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "956", "native_tokenizers": [], @@ -3114,20 +3719,24 @@ }, { "name": "Umbindhamuic", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Umbindhamu", + "depth": 4, "iso_1_code": null, "iso_3_code": "umd", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "961", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "960", "native_tokenizers": [], @@ -3135,20 +3744,24 @@ }, { "name": "Western Pama", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kuuk Thayorre", + "depth": 4, "iso_1_code": null, "iso_3_code": "thd", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "963", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "962", "native_tokenizers": [], @@ -3156,14 +3769,17 @@ }, { "name": "Yir Yoront", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Yirrk-Mel", + "depth": 4, "iso_1_code": null, "iso_3_code": "yrm", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "965", "native_tokenizers": [], @@ -3171,21 +3787,25 @@ }, { "name": "Yir-Yoront", + "depth": 4, "iso_1_code": null, "iso_3_code": "yyr", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "966", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "964", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "887", "native_tokenizers": [], @@ -3193,14 +3813,17 @@ }, { "name": "South-West", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kalaamaya", + "depth": 3, "iso_1_code": null, "iso_3_code": "lkm", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "968", "native_tokenizers": [], @@ -3208,9 +3831,11 @@ }, { "name": "Walangama", + "depth": 3, "iso_1_code": null, "iso_3_code": "nlw", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "969", "native_tokenizers": [], @@ -3218,14 +3843,17 @@ }, { "name": "Coastal Ngayarda", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Djiwarli", + "depth": 4, "iso_1_code": null, "iso_3_code": "dze", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "971", "native_tokenizers": [], @@ -3233,9 +3861,11 @@ }, { "name": "Thiin", + "depth": 4, "iso_1_code": null, "iso_3_code": "iin", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "972", "native_tokenizers": [], @@ -3243,9 +3873,11 @@ }, { "name": "Nhuwala", + "depth": 4, "iso_1_code": null, "iso_3_code": "nhf", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "973", "native_tokenizers": [], @@ -3253,9 +3885,11 @@ }, { "name": "Ngarluma", + "depth": 4, "iso_1_code": null, "iso_3_code": "nrl", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "974", "native_tokenizers": [], @@ -3263,9 +3897,11 @@ }, { "name": "Kariyarra", + "depth": 4, "iso_1_code": null, "iso_3_code": "vka", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "975", "native_tokenizers": [], @@ -3273,9 +3909,11 @@ }, { "name": "Kurrama", + "depth": 4, "iso_1_code": null, "iso_3_code": "vku", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "976", "native_tokenizers": [], @@ -3283,9 +3921,11 @@ }, { "name": "Martuyhunira", + "depth": 4, "iso_1_code": null, "iso_3_code": "vma", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "977", "native_tokenizers": [], @@ -3293,15 +3933,18 @@ }, { "name": "Yindjibarndi", + "depth": 4, "iso_1_code": null, "iso_3_code": "yij", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "978", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "970", "native_tokenizers": [], @@ -3309,14 +3952,17 @@ }, { "name": "Dhalandji", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dhalandji", + "depth": 4, "iso_1_code": null, "iso_3_code": "dhl", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "980", "native_tokenizers": [], @@ -3324,15 +3970,18 @@ }, { "name": "Pinigura", + "depth": 4, "iso_1_code": null, "iso_3_code": "pnv", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "981", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "979", "native_tokenizers": [], @@ -3340,14 +3989,17 @@ }, { "name": "Inland Ngayarda", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dhargari", + "depth": 4, "iso_1_code": null, "iso_3_code": "dhr", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "983", "native_tokenizers": [], @@ -3355,9 +4007,11 @@ }, { "name": "Nyamal", + "depth": 4, "iso_1_code": null, "iso_3_code": "nly", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "984", "native_tokenizers": [], @@ -3365,9 +4019,11 @@ }, { "name": "Ngarla", + "depth": 4, "iso_1_code": null, "iso_3_code": "nrk", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "985", "native_tokenizers": [], @@ -3375,9 +4031,11 @@ }, { "name": "Banyjima", + "depth": 4, "iso_1_code": null, "iso_3_code": "pnw", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "986", "native_tokenizers": [], @@ -3385,9 +4043,11 @@ }, { "name": "Tjurruru", + "depth": 4, "iso_1_code": null, "iso_3_code": "tju", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "987", "native_tokenizers": [], @@ -3395,9 +4055,11 @@ }, { "name": "Wariyangga", + "depth": 4, "iso_1_code": null, "iso_3_code": "wri", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "988", "native_tokenizers": [], @@ -3405,15 +4067,18 @@ }, { "name": "Yinhawangka", + "depth": 4, "iso_1_code": null, "iso_3_code": "ywg", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "989", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "982", "native_tokenizers": [], @@ -3421,14 +4086,17 @@ }, { "name": "Kanyara", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bayungu", + "depth": 4, "iso_1_code": null, "iso_3_code": "bxj", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "991", "native_tokenizers": [], @@ -3436,15 +4104,18 @@ }, { "name": "Burduna", + "depth": 4, "iso_1_code": null, "iso_3_code": "bxn", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "992", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "990", "native_tokenizers": [], @@ -3452,20 +4123,24 @@ }, { "name": "Malgana", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Malgana", + "depth": 4, "iso_1_code": null, "iso_3_code": "vml", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "994", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "993", "native_tokenizers": [], @@ -3473,20 +4148,24 @@ }, { "name": "Mangala", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mangala", + "depth": 4, "iso_1_code": null, "iso_3_code": "mem", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "996", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "995", "native_tokenizers": [], @@ -3494,14 +4173,17 @@ }, { "name": "Marngu", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Karajarri", + "depth": 4, "iso_1_code": null, "iso_3_code": "gbd", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "998", "native_tokenizers": [], @@ -3509,15 +4191,18 @@ }, { "name": "Nyangumarta", + "depth": 4, "iso_1_code": null, "iso_3_code": "nna", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "999", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "997", "native_tokenizers": [], @@ -3525,14 +4210,17 @@ }, { "name": "Mirning", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mirning", + "depth": 4, "iso_1_code": null, "iso_3_code": "gmr", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1001", "native_tokenizers": [], @@ -3540,9 +4228,11 @@ }, { "name": "Kalarko", + "depth": 4, "iso_1_code": null, "iso_3_code": "kba", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1002", "native_tokenizers": [], @@ -3550,15 +4240,18 @@ }, { "name": "Ngadjunmaya", + "depth": 4, "iso_1_code": null, "iso_3_code": "nju", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1003", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "1000", "native_tokenizers": [], @@ -3566,14 +4259,17 @@ }, { "name": "Ngarga", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Warlpiri", + "depth": 4, "iso_1_code": null, "iso_3_code": "wbp", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1005", "native_tokenizers": [], @@ -3583,15 +4279,18 @@ }, { "name": "Warlmanpa", + "depth": 4, "iso_1_code": null, "iso_3_code": "wrl", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1006", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "1004", "native_tokenizers": [], @@ -3599,14 +4298,17 @@ }, { "name": "Ngumbin", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Jaru", + "depth": 4, "iso_1_code": null, "iso_3_code": "ddj", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1008", "native_tokenizers": [], @@ -3614,9 +4316,11 @@ }, { "name": "Mudburra", + "depth": 4, "iso_1_code": null, "iso_3_code": "dmw", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1009", "native_tokenizers": [], @@ -3624,9 +4328,11 @@ }, { "name": "Gurindji", + "depth": 4, "iso_1_code": null, "iso_3_code": "gue", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1010", "native_tokenizers": [], @@ -3634,9 +4340,11 @@ }, { "name": "Ngarinyman", + "depth": 4, "iso_1_code": null, "iso_3_code": "nbj", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1011", "native_tokenizers": [], @@ -3644,9 +4352,11 @@ }, { "name": "Ngardi", + "depth": 4, "iso_1_code": null, "iso_3_code": "rxd", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1012", "native_tokenizers": [], @@ -3654,9 +4364,11 @@ }, { "name": "Walmajarri", + "depth": 4, "iso_1_code": null, "iso_3_code": "wmt", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1013", "native_tokenizers": [], @@ -3665,6 +4377,7 @@ ] } ], + "family": "Australian", "tokenizers": {}, "node_i": "1007", "native_tokenizers": [], @@ -3672,14 +4385,17 @@ }, { "name": "Nyungar", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nyungar", + "depth": 4, "iso_1_code": null, "iso_3_code": "nys", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1015", "native_tokenizers": [], @@ -3687,9 +4403,11 @@ }, { "name": "Pinjarup", + "depth": 4, "iso_1_code": null, "iso_3_code": "pnj", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1016", "native_tokenizers": [], @@ -3697,9 +4415,11 @@ }, { "name": "Wardandi", + "depth": 4, "iso_1_code": null, "iso_3_code": "wxw", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1017", "native_tokenizers": [], @@ -3707,9 +4427,11 @@ }, { "name": "Bibbulman", + "depth": 4, "iso_1_code": null, "iso_3_code": "xbp", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1018", "native_tokenizers": [], @@ -3717,9 +4439,11 @@ }, { "name": "Goreng", + "depth": 4, "iso_1_code": null, "iso_3_code": "xgg", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1019", "native_tokenizers": [], @@ -3727,9 +4451,11 @@ }, { "name": "Nganakarti", + "depth": 4, "iso_1_code": null, "iso_3_code": "xnk", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1020", "native_tokenizers": [], @@ -3737,9 +4463,11 @@ }, { "name": "Minang", + "depth": 4, "iso_1_code": null, "iso_3_code": "xrg", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1021", "native_tokenizers": [], @@ -3747,15 +4475,18 @@ }, { "name": "Wajuk", + "depth": 4, "iso_1_code": null, "iso_3_code": "xwj", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1022", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "1014", "native_tokenizers": [], @@ -3763,14 +4494,17 @@ }, { "name": "Wadjari", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Badimaya", + "depth": 4, "iso_1_code": null, "iso_3_code": "bia", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1024", "native_tokenizers": [], @@ -3778,15 +4512,18 @@ }, { "name": "Wajarri", + "depth": 4, "iso_1_code": null, "iso_3_code": "wbv", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1025", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "1023", "native_tokenizers": [], @@ -3794,14 +4531,17 @@ }, { "name": "Wati", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Antikarinya", + "depth": 4, "iso_1_code": null, "iso_3_code": "ant", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1027", "native_tokenizers": [], @@ -3809,9 +4549,11 @@ }, { "name": "Yankunytjatjara", + "depth": 4, "iso_1_code": null, "iso_3_code": "kdd", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1028", "native_tokenizers": [], @@ -3819,9 +4561,11 @@ }, { "name": "Kokata", + "depth": 4, "iso_1_code": null, "iso_3_code": "ktd", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1029", "native_tokenizers": [], @@ -3829,9 +4573,11 @@ }, { "name": "Kukatja", + "depth": 4, "iso_1_code": null, "iso_3_code": "kux", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1030", "native_tokenizers": [], @@ -3839,9 +4585,11 @@ }, { "name": "Martu Wangka", + "depth": 4, "iso_1_code": null, "iso_3_code": "mpj", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1031", "native_tokenizers": [], @@ -3849,9 +4597,11 @@ }, { "name": "Ngaanyatjarra", + "depth": 4, "iso_1_code": null, "iso_3_code": "ntj", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1032", "native_tokenizers": [], @@ -3859,9 +4609,11 @@ }, { "name": "Pintupi-Luritja", + "depth": 4, "iso_1_code": null, "iso_3_code": "piu", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1033", "native_tokenizers": [], @@ -3869,9 +4621,11 @@ }, { "name": "Pitjantjatjara", + "depth": 4, "iso_1_code": null, "iso_3_code": "pjt", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1034", "native_tokenizers": [], @@ -3881,9 +4635,11 @@ }, { "name": "Pintiini", + "depth": 4, "iso_1_code": null, "iso_3_code": "pti", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1035", "native_tokenizers": [], @@ -3891,9 +4647,11 @@ }, { "name": "Tjupany", + "depth": 4, "iso_1_code": null, "iso_3_code": "tjp", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1036", "native_tokenizers": [], @@ -3901,9 +4659,11 @@ }, { "name": "Warnman", + "depth": 4, "iso_1_code": null, "iso_3_code": "wbt", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1037", "native_tokenizers": [], @@ -3911,15 +4671,18 @@ }, { "name": "Nyiyaparli", + "depth": 4, "iso_1_code": null, "iso_3_code": "xny", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1038", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "1026", "native_tokenizers": [], @@ -3927,14 +4690,17 @@ }, { "name": "Yinggarda", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nhanda", + "depth": 4, "iso_1_code": null, "iso_3_code": "nha", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1040", "native_tokenizers": [], @@ -3942,15 +4708,18 @@ }, { "name": "Yinggarda", + "depth": 4, "iso_1_code": null, "iso_3_code": "yia", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1041", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "1039", "native_tokenizers": [], @@ -3958,14 +4727,17 @@ }, { "name": "Yura", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Adnyamathanha", + "depth": 4, "iso_1_code": null, "iso_3_code": "adt", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1043", "native_tokenizers": [], @@ -3973,9 +4745,11 @@ }, { "name": "Barngarla", + "depth": 4, "iso_1_code": null, "iso_3_code": "bjb", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1044", "native_tokenizers": [], @@ -3983,9 +4757,11 @@ }, { "name": "Guyani", + "depth": 4, "iso_1_code": null, "iso_3_code": "gvy", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1045", "native_tokenizers": [], @@ -3993,9 +4769,11 @@ }, { "name": "Ngadjuri", + "depth": 4, "iso_1_code": null, "iso_3_code": "jui", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1046", "native_tokenizers": [], @@ -4003,9 +4781,11 @@ }, { "name": "Narungga", + "depth": 4, "iso_1_code": null, "iso_3_code": "nnr", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1047", "native_tokenizers": [], @@ -4013,9 +4793,11 @@ }, { "name": "Nugunu", + "depth": 4, "iso_1_code": null, "iso_3_code": "nnv", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1048", "native_tokenizers": [], @@ -4023,9 +4805,11 @@ }, { "name": "Nauo", + "depth": 4, "iso_1_code": null, "iso_3_code": "nwo", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1049", "native_tokenizers": [], @@ -4033,9 +4817,11 @@ }, { "name": "Wirangu", + "depth": 4, "iso_1_code": null, "iso_3_code": "wgu", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1050", "native_tokenizers": [], @@ -4043,21 +4829,25 @@ }, { "name": "Kaurna", + "depth": 4, "iso_1_code": null, "iso_3_code": "zku", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1051", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "1042", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "967", "native_tokenizers": [], @@ -4065,19 +4855,23 @@ }, { "name": "Wagaya-Warluwaric", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Warluwara-Thawa", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Wagaya", + "depth": 4, "iso_1_code": null, "iso_3_code": "wga", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1054", "native_tokenizers": [], @@ -4085,9 +4879,11 @@ }, { "name": "Waluwarra", + "depth": 4, "iso_1_code": null, "iso_3_code": "wrb", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1055", "native_tokenizers": [], @@ -4095,21 +4891,25 @@ }, { "name": "Yindjilandji", + "depth": 4, "iso_1_code": null, "iso_3_code": "yil", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1056", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "1053", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "1052", "native_tokenizers": [], @@ -4117,14 +4917,17 @@ }, { "name": "Waka-Kabic", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Gabi-Gabi", + "depth": 3, "iso_1_code": null, "iso_3_code": "gbw", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1058", "native_tokenizers": [], @@ -4132,9 +4935,11 @@ }, { "name": "Batjala", + "depth": 3, "iso_1_code": null, "iso_3_code": "xby", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1059", "native_tokenizers": [], @@ -4142,20 +4947,24 @@ }, { "name": "Kingkel", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bayali", + "depth": 4, "iso_1_code": null, "iso_3_code": "bjy", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1061", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "1060", "native_tokenizers": [], @@ -4163,14 +4972,17 @@ }, { "name": "Miyan", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Wakawaka", + "depth": 4, "iso_1_code": null, "iso_3_code": "wkw", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1063", "native_tokenizers": [], @@ -4178,15 +4990,18 @@ }, { "name": "Wuliwuli", + "depth": 4, "iso_1_code": null, "iso_3_code": "wlu", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1064", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "1062", "native_tokenizers": [], @@ -4194,26 +5009,31 @@ }, { "name": "Than", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Gureng Gureng", + "depth": 4, "iso_1_code": null, "iso_3_code": "gnr", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1066", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "1065", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "1057", "native_tokenizers": [], @@ -4221,20 +5041,24 @@ }, { "name": "Warumungic", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Warumungu", + "depth": 3, "iso_1_code": null, "iso_3_code": "wrm", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1068", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "1067", "native_tokenizers": [], @@ -4242,14 +5066,17 @@ }, { "name": "Wiradhuric", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Gamilaraay", + "depth": 3, "iso_1_code": null, "iso_3_code": "kld", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1070", "native_tokenizers": [], @@ -4257,9 +5084,11 @@ }, { "name": "Wiradjuri", + "depth": 3, "iso_1_code": null, "iso_3_code": "wrh", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1071", "native_tokenizers": [], @@ -4267,15 +5096,18 @@ }, { "name": "Wangaaybuwan-Ngiyambaa", + "depth": 3, "iso_1_code": null, "iso_3_code": "wyb", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1072", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "1069", "native_tokenizers": [], @@ -4283,14 +5115,17 @@ }, { "name": "Worimi", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Awabakal", + "depth": 3, "iso_1_code": null, "iso_3_code": "awk", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1074", "native_tokenizers": [], @@ -4298,15 +5133,18 @@ }, { "name": "Worimi", + "depth": 3, "iso_1_code": null, "iso_3_code": "kda", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1075", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "1073", "native_tokenizers": [], @@ -4314,14 +5152,17 @@ }, { "name": "Yalandyic", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Djangun", + "depth": 3, "iso_1_code": null, "iso_3_code": "djf", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1077", "native_tokenizers": [], @@ -4329,9 +5170,11 @@ }, { "name": "Kuku-Yalanji", + "depth": 3, "iso_1_code": null, "iso_3_code": "gvn", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1078", "native_tokenizers": [], @@ -4341,15 +5184,18 @@ }, { "name": "Muluridyi", + "depth": 3, "iso_1_code": null, "iso_3_code": "vmu", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1079", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "1076", "native_tokenizers": [], @@ -4357,20 +5203,24 @@ }, { "name": "Yanyuwan", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Yanyuwa", + "depth": 3, "iso_1_code": null, "iso_3_code": "jao", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1081", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "1080", "native_tokenizers": [], @@ -4378,14 +5228,17 @@ }, { "name": "Yarli", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Wadikali", + "depth": 3, "iso_1_code": null, "iso_3_code": "wdk", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1083", "native_tokenizers": [], @@ -4393,9 +5246,11 @@ }, { "name": "Malyangapa", + "depth": 3, "iso_1_code": null, "iso_3_code": "yga", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1084", "native_tokenizers": [], @@ -4403,15 +5258,18 @@ }, { "name": "Yardliyawarra", + "depth": 3, "iso_1_code": null, "iso_3_code": "yxl", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1085", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "1082", "native_tokenizers": [], @@ -4419,14 +5277,17 @@ }, { "name": "Yidinic", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Djabugay", + "depth": 3, "iso_1_code": null, "iso_3_code": "dyy", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1087", "native_tokenizers": [], @@ -4434,15 +5295,18 @@ }, { "name": "Yidiny", + "depth": 3, "iso_1_code": null, "iso_3_code": "yii", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1088", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "1086", "native_tokenizers": [], @@ -4450,14 +5314,17 @@ }, { "name": "Yotayotic", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Yorta Yorta", + "depth": 3, "iso_1_code": null, "iso_3_code": "xyy", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1090", "native_tokenizers": [], @@ -4465,15 +5332,18 @@ }, { "name": "Yabula Yabula", + "depth": 3, "iso_1_code": null, "iso_3_code": "yxy", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1091", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "1089", "native_tokenizers": [], @@ -4481,20 +5351,24 @@ }, { "name": "Yugambal", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Yugambal", + "depth": 3, "iso_1_code": null, "iso_3_code": "yub", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1093", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "1092", "native_tokenizers": [], @@ -4502,14 +5376,17 @@ }, { "name": "Yuin", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dhurga", + "depth": 3, "iso_1_code": null, "iso_3_code": "dhu", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1095", "native_tokenizers": [], @@ -4517,9 +5394,11 @@ }, { "name": "Dharawal", + "depth": 3, "iso_1_code": null, "iso_3_code": "tbh", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1096", "native_tokenizers": [], @@ -4527,9 +5406,11 @@ }, { "name": "Birrpayi", + "depth": 3, "iso_1_code": null, "iso_3_code": "xbj", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1097", "native_tokenizers": [], @@ -4537,9 +5418,11 @@ }, { "name": "Darkinyung", + "depth": 3, "iso_1_code": null, "iso_3_code": "xda", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1098", "native_tokenizers": [], @@ -4547,9 +5430,11 @@ }, { "name": "Dharuk", + "depth": 3, "iso_1_code": null, "iso_3_code": "xdk", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1099", "native_tokenizers": [], @@ -4557,9 +5442,11 @@ }, { "name": "Jaitmatang", + "depth": 3, "iso_1_code": null, "iso_3_code": "xjt", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1100", "native_tokenizers": [], @@ -4567,9 +5454,11 @@ }, { "name": "Ngarigu", + "depth": 3, "iso_1_code": null, "iso_3_code": "xni", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1101", "native_tokenizers": [], @@ -4577,9 +5466,11 @@ }, { "name": "Gundungurra", + "depth": 3, "iso_1_code": null, "iso_3_code": "xrd", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1102", "native_tokenizers": [], @@ -4587,9 +5478,11 @@ }, { "name": "Thawa", + "depth": 3, "iso_1_code": null, "iso_3_code": "xtv", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1103", "native_tokenizers": [], @@ -4597,15 +5490,18 @@ }, { "name": "Ngunawal", + "depth": 3, "iso_1_code": null, "iso_3_code": "xul", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1104", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "1094", "native_tokenizers": [], @@ -4613,14 +5509,17 @@ }, { "name": "Yuulngu", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Golpa", + "depth": 3, "iso_1_code": null, "iso_3_code": "lja", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1106", "native_tokenizers": [], @@ -4628,14 +5527,17 @@ }, { "name": "Dhangu", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dhangu-Djangu", + "depth": 4, "iso_1_code": null, "iso_3_code": "dhg", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1108", "native_tokenizers": [], @@ -4645,15 +5547,18 @@ }, { "name": "Yan-nhangu", + "depth": 4, "iso_1_code": null, "iso_3_code": "jay", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1109", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "1107", "native_tokenizers": [], @@ -4661,14 +5566,17 @@ }, { "name": "Dhuwal", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dayi", + "depth": 4, "iso_1_code": null, "iso_3_code": "dax", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1111", "native_tokenizers": [], @@ -4676,9 +5584,11 @@ }, { "name": "Djambarrpuyngu", + "depth": 4, "iso_1_code": null, "iso_3_code": "djr", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1112", "native_tokenizers": [], @@ -4688,9 +5598,11 @@ }, { "name": "Dhuwal", + "depth": 4, "iso_1_code": null, "iso_3_code": "dwu", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1113", "native_tokenizers": [], @@ -4698,9 +5610,11 @@ }, { "name": "Dhuwaya", + "depth": 4, "iso_1_code": null, "iso_3_code": "dwy", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1114", "native_tokenizers": [], @@ -4708,9 +5622,11 @@ }, { "name": "Gumatj", + "depth": 4, "iso_1_code": null, "iso_3_code": "gnn", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1115", "native_tokenizers": [], @@ -4720,9 +5636,11 @@ }, { "name": "Gupapuyngu", + "depth": 4, "iso_1_code": null, "iso_3_code": "guf", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1116", "native_tokenizers": [], @@ -4730,15 +5648,18 @@ }, { "name": "Ritharrngu", + "depth": 4, "iso_1_code": null, "iso_3_code": "rit", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1117", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "1110", "native_tokenizers": [], @@ -4746,14 +5667,17 @@ }, { "name": "Djinang", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Djinba", + "depth": 4, "iso_1_code": null, "iso_3_code": "djb", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1119", "native_tokenizers": [], @@ -4761,27 +5685,32 @@ }, { "name": "Djinang", + "depth": 4, "iso_1_code": null, "iso_3_code": "dji", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1120", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "1118", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "1105", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "757", "native_tokenizers": [], @@ -4789,14 +5718,17 @@ }, { "name": "Tangic", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ganggalida", + "depth": 2, "iso_1_code": null, "iso_3_code": "gcd", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1122", "native_tokenizers": [], @@ -4804,9 +5736,11 @@ }, { "name": "Kayardild", + "depth": 2, "iso_1_code": null, "iso_3_code": "gyd", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1123", "native_tokenizers": [], @@ -4814,9 +5748,11 @@ }, { "name": "Nyangga", + "depth": 2, "iso_1_code": null, "iso_3_code": "nny", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1124", "native_tokenizers": [], @@ -4824,15 +5760,18 @@ }, { "name": "Minkin", + "depth": 2, "iso_1_code": null, "iso_3_code": "xxm", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1125", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "1121", "native_tokenizers": [], @@ -4840,20 +5779,24 @@ }, { "name": "Tiwian", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tiwi", + "depth": 2, "iso_1_code": null, "iso_3_code": "tiw", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1127", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "1126", "native_tokenizers": [], @@ -4861,14 +5804,17 @@ }, { "name": "Umbugarla-Ngumbur", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ngurmbur", + "depth": 2, "iso_1_code": null, "iso_3_code": "nrx", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1129", "native_tokenizers": [], @@ -4876,15 +5822,18 @@ }, { "name": "Umbugarla", + "depth": 2, "iso_1_code": null, "iso_3_code": "umr", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1130", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "1128", "native_tokenizers": [], @@ -4892,14 +5841,17 @@ }, { "name": "West Barkly", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Jingulu", + "depth": 2, "iso_1_code": null, "iso_3_code": "jig", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1132", "native_tokenizers": [], @@ -4907,9 +5859,11 @@ }, { "name": "Gudanji", + "depth": 2, "iso_1_code": null, "iso_3_code": "nji", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1133", "native_tokenizers": [], @@ -4917,15 +5871,18 @@ }, { "name": "Wambaya", + "depth": 2, "iso_1_code": null, "iso_3_code": "wmb", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1134", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "1131", "native_tokenizers": [], @@ -4933,14 +5890,17 @@ }, { "name": "Worrorran", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Gambera", + "depth": 2, "iso_1_code": null, "iso_3_code": "gma", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1136", "native_tokenizers": [], @@ -4948,9 +5908,11 @@ }, { "name": "Kwini", + "depth": 2, "iso_1_code": null, "iso_3_code": "gww", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1137", "native_tokenizers": [], @@ -4958,9 +5920,11 @@ }, { "name": "Ngarinyin", + "depth": 2, "iso_1_code": null, "iso_3_code": "ung", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1138", "native_tokenizers": [], @@ -4968,9 +5932,11 @@ }, { "name": "Miwa", + "depth": 2, "iso_1_code": null, "iso_3_code": "vmi", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1139", "native_tokenizers": [], @@ -4978,9 +5944,11 @@ }, { "name": "Wilawila", + "depth": 2, "iso_1_code": null, "iso_3_code": "wil", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1140", "native_tokenizers": [], @@ -4988,9 +5956,11 @@ }, { "name": "Wunambal", + "depth": 2, "iso_1_code": null, "iso_3_code": "wub", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1141", "native_tokenizers": [], @@ -4998,20 +5968,24 @@ }, { "name": "Ngarinyinic", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Andajin", + "depth": 3, "iso_1_code": null, "iso_3_code": "ajn", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1143", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "1142", "native_tokenizers": [], @@ -5019,14 +5993,17 @@ }, { "name": "Western Worrorran", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Yawijibaya", + "depth": 3, "iso_1_code": null, "iso_3_code": "jbw", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1145", "native_tokenizers": [], @@ -5034,9 +6011,11 @@ }, { "name": "Worrorra", + "depth": 3, "iso_1_code": null, "iso_3_code": "wro", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1146", "native_tokenizers": [], @@ -5044,9 +6023,11 @@ }, { "name": "Unggumi", + "depth": 3, "iso_1_code": null, "iso_3_code": "xgu", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1147", "native_tokenizers": [], @@ -5054,9 +6035,11 @@ }, { "name": "Umiida", + "depth": 3, "iso_1_code": null, "iso_3_code": "xud", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1148", "native_tokenizers": [], @@ -5064,21 +6047,25 @@ }, { "name": "Unggaranggu", + "depth": 3, "iso_1_code": null, "iso_3_code": "xun", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1149", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "1144", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "1135", "native_tokenizers": [], @@ -5086,14 +6073,17 @@ }, { "name": "Yanyi", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Waanyi", + "depth": 2, "iso_1_code": null, "iso_3_code": "wny", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1151", "native_tokenizers": [], @@ -5101,9 +6091,11 @@ }, { "name": "Garrwa", + "depth": 2, "iso_1_code": null, "iso_3_code": "wrk", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1152", "native_tokenizers": [], @@ -5112,6 +6104,7 @@ ] } ], + "family": "Australian", "tokenizers": {}, "node_i": "1150", "native_tokenizers": [], @@ -5119,25 +6112,30 @@ }, { "name": "Yiwaidjan", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Amaragic", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Amurdak", + "depth": 3, "iso_1_code": null, "iso_3_code": "amg", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1155", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "1154", "native_tokenizers": [], @@ -5145,20 +6143,24 @@ }, { "name": "Margic", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Margu", + "depth": 3, "iso_1_code": null, "iso_3_code": "mhg", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1157", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "1156", "native_tokenizers": [], @@ -5166,14 +6168,17 @@ }, { "name": "Yiwaidjic", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Iwaidja", + "depth": 3, "iso_1_code": null, "iso_3_code": "ibd", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1159", "native_tokenizers": [], @@ -5181,9 +6186,11 @@ }, { "name": "Garig-Ilgar", + "depth": 3, "iso_1_code": null, "iso_3_code": "ilg", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1160", "native_tokenizers": [], @@ -5191,9 +6198,11 @@ }, { "name": "Maung", + "depth": 3, "iso_1_code": null, "iso_3_code": "mph", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1161", "native_tokenizers": [], @@ -5203,27 +6212,32 @@ }, { "name": "Manangkari", + "depth": 3, "iso_1_code": null, "iso_3_code": "znk", "children": [], + "family": "Australian", "tokenizers": {}, "node_i": "1162", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "1158", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "1153", "native_tokenizers": [], "scripts": [] } ], + "family": "Australian", "tokenizers": {}, "node_i": "656", "native_tokenizers": [], diff --git a/data/Austro-Asiatic.json b/data/Austro-Asiatic.json index 68513102e28fb22ec5bbb702faf280872063161e..54a2db1331efe5a928b79a416b6a58d297aafa28 100644 --- a/data/Austro-Asiatic.json +++ b/data/Austro-Asiatic.json @@ -1,34 +1,41 @@ { "name": "Austro-Asiatic", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mon-Khmer", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Aslian", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Jah Hut", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Jah Hut", + "depth": 4, "iso_1_code": null, "iso_3_code": "jah", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1167", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1166", "native_tokenizers": [], @@ -36,25 +43,30 @@ }, { "name": "North Aslian", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chewong", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Cheq Wong", + "depth": 5, "iso_1_code": null, "iso_3_code": "cwg", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1170", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1169", "native_tokenizers": [], @@ -62,14 +74,17 @@ }, { "name": "Eastern", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Batek", + "depth": 5, "iso_1_code": null, "iso_3_code": "btq", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1172", "native_tokenizers": [], @@ -77,9 +92,11 @@ }, { "name": "Jehai", + "depth": 5, "iso_1_code": null, "iso_3_code": "jhi", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1173", "native_tokenizers": [], @@ -87,9 +104,11 @@ }, { "name": "Minriq", + "depth": 5, "iso_1_code": null, "iso_3_code": "mnq", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1174", "native_tokenizers": [], @@ -97,15 +116,18 @@ }, { "name": "Mintil", + "depth": 5, "iso_1_code": null, "iso_3_code": "mzt", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1175", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1171", "native_tokenizers": [], @@ -113,20 +135,24 @@ }, { "name": "Tonga", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ten\u2019edn", + "depth": 5, "iso_1_code": null, "iso_3_code": "tnz", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1177", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1176", "native_tokenizers": [], @@ -134,14 +160,17 @@ }, { "name": "Western", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kintaq", + "depth": 5, "iso_1_code": null, "iso_3_code": "knq", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1179", "native_tokenizers": [], @@ -149,21 +178,25 @@ }, { "name": "Kensiu", + "depth": 5, "iso_1_code": null, "iso_3_code": "kns", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1180", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1178", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1168", "native_tokenizers": [], @@ -171,14 +204,17 @@ }, { "name": "Senoic", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Lanoh", + "depth": 4, "iso_1_code": null, "iso_3_code": "lnh", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1182", "native_tokenizers": [], @@ -186,9 +222,11 @@ }, { "name": "Sab\u00fcm", + "depth": 4, "iso_1_code": null, "iso_3_code": "sbo", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1183", "native_tokenizers": [], @@ -196,9 +234,11 @@ }, { "name": "Semai", + "depth": 4, "iso_1_code": null, "iso_3_code": "sea", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1184", "native_tokenizers": [], @@ -206,9 +246,11 @@ }, { "name": "Semnam", + "depth": 4, "iso_1_code": null, "iso_3_code": "ssm", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1185", "native_tokenizers": [], @@ -216,15 +258,18 @@ }, { "name": "Temiar", + "depth": 4, "iso_1_code": null, "iso_3_code": "tea", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1186", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1181", "native_tokenizers": [], @@ -232,14 +277,17 @@ }, { "name": "South Aslian", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mah Meri", + "depth": 4, "iso_1_code": null, "iso_3_code": "mhe", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1188", "native_tokenizers": [], @@ -247,9 +295,11 @@ }, { "name": "Semelai", + "depth": 4, "iso_1_code": null, "iso_3_code": "sza", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1189", "native_tokenizers": [], @@ -257,9 +307,11 @@ }, { "name": "Semaq Beri", + "depth": 4, "iso_1_code": null, "iso_3_code": "szc", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1190", "native_tokenizers": [], @@ -267,21 +319,25 @@ }, { "name": "Temoq", + "depth": 4, "iso_1_code": null, "iso_3_code": "tmo", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1191", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1187", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1165", "native_tokenizers": [], @@ -289,24 +345,29 @@ }, { "name": "Eastern Mon-Khmer", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bahnaric", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Central Bahnaric", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Alak", + "depth": 5, "iso_1_code": null, "iso_3_code": "alk", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1195", "native_tokenizers": [], @@ -314,9 +375,11 @@ }, { "name": "Bahnar", + "depth": 5, "iso_1_code": null, "iso_3_code": "bdq", "children": [], + "family": "Austro-Asiatic", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"vi\")", @@ -334,9 +397,11 @@ }, { "name": "Romam", + "depth": 5, "iso_1_code": null, "iso_3_code": "rmx", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1197", "native_tokenizers": [], @@ -344,15 +409,18 @@ }, { "name": "Tampuan", + "depth": 5, "iso_1_code": null, "iso_3_code": "tpu", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1198", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"vi\")", @@ -368,20 +436,24 @@ }, { "name": "East Bahnaric", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Cua", + "depth": 5, "iso_1_code": null, "iso_3_code": "cua", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1200", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1199", "native_tokenizers": [], @@ -389,14 +461,17 @@ }, { "name": "North Bahnaric", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Katua", + "depth": 5, "iso_1_code": null, "iso_3_code": "kta", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1202", "native_tokenizers": [], @@ -404,9 +479,11 @@ }, { "name": "Kachok", + "depth": 5, "iso_1_code": null, "iso_3_code": "xkk", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1203", "native_tokenizers": [], @@ -414,14 +491,17 @@ }, { "name": "East", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kayong", + "depth": 6, "iso_1_code": null, "iso_3_code": "kxy", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1205", "native_tokenizers": [], @@ -429,15 +509,18 @@ }, { "name": "Takua", + "depth": 6, "iso_1_code": null, "iso_3_code": "tkz", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1206", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1204", "native_tokenizers": [], @@ -445,14 +528,17 @@ }, { "name": "West", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Trieng", + "depth": 6, "iso_1_code": null, "iso_3_code": "stg", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1208", "native_tokenizers": [], @@ -460,9 +546,11 @@ }, { "name": "Talieng", + "depth": 6, "iso_1_code": null, "iso_3_code": "tdf", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1209", "native_tokenizers": [], @@ -470,20 +558,24 @@ }, { "name": "Duan", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Halang Doan", + "depth": 7, "iso_1_code": null, "iso_3_code": "hld", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1211", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1210", "native_tokenizers": [], @@ -491,14 +583,17 @@ }, { "name": "Jeh-Halang", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Halang", + "depth": 7, "iso_1_code": null, "iso_3_code": "hal", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1213", "native_tokenizers": [], @@ -506,15 +601,18 @@ }, { "name": "Jeh", + "depth": 7, "iso_1_code": null, "iso_3_code": "jeh", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1214", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1212", "native_tokenizers": [], @@ -522,20 +620,24 @@ }, { "name": "Rengao", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Rengao", + "depth": 7, "iso_1_code": null, "iso_3_code": "ren", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1216", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1215", "native_tokenizers": [], @@ -543,19 +645,23 @@ }, { "name": "Sedang-Todrah", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Sedang", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Hre", + "depth": 8, "iso_1_code": null, "iso_3_code": "hre", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1219", "native_tokenizers": [], @@ -563,15 +669,18 @@ }, { "name": "Sedang", + "depth": 8, "iso_1_code": null, "iso_3_code": "sed", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1220", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1218", "native_tokenizers": [], @@ -579,14 +688,17 @@ }, { "name": "Todrah-Monom", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Monom", + "depth": 8, "iso_1_code": null, "iso_3_code": "moo", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1222", "native_tokenizers": [], @@ -594,33 +706,39 @@ }, { "name": "Todrah", + "depth": 8, "iso_1_code": null, "iso_3_code": "tdr", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1223", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1221", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1217", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1207", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1201", "native_tokenizers": [], @@ -628,14 +746,17 @@ }, { "name": "South Bahnaric", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Stieng, Budeh", + "depth": 5, "iso_1_code": null, "iso_3_code": "stt", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1225", "native_tokenizers": [], @@ -643,30 +764,36 @@ }, { "name": "Sre-Mnong", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mnong", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Eastern Mnong", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mnong, Eastern", + "depth": 8, "iso_1_code": null, "iso_3_code": "mng", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1229", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1228", "native_tokenizers": [], @@ -674,14 +801,17 @@ }, { "name": "Southern-Central Mnong", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mnong, Central", + "depth": 8, "iso_1_code": null, "iso_3_code": "cmo", "children": [], + "family": "Austro-Asiatic", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"vi\")", @@ -700,9 +830,11 @@ }, { "name": "Mnong, Southern", + "depth": 8, "iso_1_code": null, "iso_3_code": "mnn", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1232", "native_tokenizers": [], @@ -710,15 +842,18 @@ }, { "name": "Kraol", + "depth": 8, "iso_1_code": null, "iso_3_code": "rka", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1233", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"vi\")", @@ -733,6 +868,7 @@ "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"vi\")", @@ -748,14 +884,17 @@ }, { "name": "Sre", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Maa", + "depth": 7, "iso_1_code": null, "iso_3_code": "cma", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1235", "native_tokenizers": [], @@ -763,21 +902,25 @@ }, { "name": "Koho", + "depth": 7, "iso_1_code": null, "iso_3_code": "kpm", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1236", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1234", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"vi\")", @@ -793,14 +936,17 @@ }, { "name": "Stieng-Chrau", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chrau", + "depth": 6, "iso_1_code": null, "iso_3_code": "crw", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1238", "native_tokenizers": [], @@ -808,9 +954,11 @@ }, { "name": "Mel-Khaonh", + "depth": 6, "iso_1_code": null, "iso_3_code": "hkn", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1239", "native_tokenizers": [], @@ -818,21 +966,25 @@ }, { "name": "Stieng, Bulo", + "depth": 6, "iso_1_code": null, "iso_3_code": "sti", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1240", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1237", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"vi\")", @@ -848,14 +1000,17 @@ }, { "name": "West Bahnaric", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Lavi", + "depth": 5, "iso_1_code": null, "iso_3_code": "lvi", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1242", "native_tokenizers": [], @@ -863,14 +1018,17 @@ }, { "name": "Brao-Kravet", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Brao", + "depth": 6, "iso_1_code": null, "iso_3_code": "brb", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1244", "native_tokenizers": [], @@ -878,9 +1036,11 @@ }, { "name": "Krung", + "depth": 6, "iso_1_code": null, "iso_3_code": "krr", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1245", "native_tokenizers": [], @@ -888,9 +1048,11 @@ }, { "name": "Kavet", + "depth": 6, "iso_1_code": null, "iso_3_code": "krv", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1246", "native_tokenizers": [], @@ -898,15 +1060,18 @@ }, { "name": "Sou", + "depth": 6, "iso_1_code": null, "iso_3_code": "sqq", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1247", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1243", "native_tokenizers": [], @@ -914,20 +1079,24 @@ }, { "name": "Laven", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Laven", + "depth": 6, "iso_1_code": null, "iso_3_code": "lbo", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1249", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1248", "native_tokenizers": [], @@ -935,20 +1104,24 @@ }, { "name": "Nyaheun", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nyaheun", + "depth": 6, "iso_1_code": null, "iso_3_code": "nev", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1251", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1250", "native_tokenizers": [], @@ -956,14 +1129,17 @@ }, { "name": "Oi-The", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Oy", + "depth": 6, "iso_1_code": null, "iso_3_code": "oyb", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1253", "native_tokenizers": [], @@ -971,27 +1147,32 @@ }, { "name": "Sapuan", + "depth": 6, "iso_1_code": null, "iso_3_code": "spu", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1254", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1252", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1241", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"vi\")", @@ -1007,24 +1188,29 @@ }, { "name": "Katuic", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Central Katuic", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ta\u2019oih", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ir", + "depth": 6, "iso_1_code": null, "iso_3_code": "irr", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1258", "native_tokenizers": [], @@ -1032,9 +1218,11 @@ }, { "name": "Ong", + "depth": 6, "iso_1_code": null, "iso_3_code": "oog", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1259", "native_tokenizers": [], @@ -1042,9 +1230,11 @@ }, { "name": "Ta\u2019oih, Upper", + "depth": 6, "iso_1_code": null, "iso_3_code": "tth", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1260", "native_tokenizers": [], @@ -1052,21 +1242,25 @@ }, { "name": "Ta\u2019oih, Lower", + "depth": 6, "iso_1_code": null, "iso_3_code": "tto", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1261", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1257", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1256", "native_tokenizers": [], @@ -1074,19 +1268,23 @@ }, { "name": "East Katuic", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Katu-Pacoh", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Katu, Eastern", + "depth": 6, "iso_1_code": null, "iso_3_code": "ktv", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1264", "native_tokenizers": [], @@ -1094,9 +1292,11 @@ }, { "name": "Katu, Western", + "depth": 6, "iso_1_code": null, "iso_3_code": "kuf", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1265", "native_tokenizers": [], @@ -1104,9 +1304,11 @@ }, { "name": "Pacoh", + "depth": 6, "iso_1_code": null, "iso_3_code": "pac", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1266", "native_tokenizers": [], @@ -1114,9 +1316,11 @@ }, { "name": "Phuong", + "depth": 6, "iso_1_code": null, "iso_3_code": "phg", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1267", "native_tokenizers": [], @@ -1124,15 +1328,18 @@ }, { "name": "Tareng", + "depth": 6, "iso_1_code": null, "iso_3_code": "tgr", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1268", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1263", "native_tokenizers": [], @@ -1140,26 +1347,31 @@ }, { "name": "Ngeq-Nkriang", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kriang", + "depth": 6, "iso_1_code": null, "iso_3_code": "ngt", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1270", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1269", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1262", "native_tokenizers": [], @@ -1167,19 +1379,23 @@ }, { "name": "West Katuic", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bru", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bru, Eastern", + "depth": 6, "iso_1_code": null, "iso_3_code": "bru", "children": [], + "family": "Austro-Asiatic", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"vi\")", @@ -1197,9 +1413,11 @@ }, { "name": "Bru, Western", + "depth": 6, "iso_1_code": null, "iso_3_code": "brv", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1274", "native_tokenizers": [], @@ -1207,9 +1425,11 @@ }, { "name": "Katang, Northern", + "depth": 6, "iso_1_code": null, "iso_3_code": "ncq", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1275", "native_tokenizers": [], @@ -1219,9 +1439,11 @@ }, { "name": "Katang, Southern", + "depth": 6, "iso_1_code": null, "iso_3_code": "sct", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1276", "native_tokenizers": [], @@ -1229,9 +1451,11 @@ }, { "name": "So", + "depth": 6, "iso_1_code": null, "iso_3_code": "sss", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1277", "native_tokenizers": [], @@ -1239,15 +1463,18 @@ }, { "name": "Khua", + "depth": 6, "iso_1_code": null, "iso_3_code": "xhv", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1278", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"vi\")", @@ -1263,14 +1490,17 @@ }, { "name": "Kuay", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kuay", + "depth": 6, "iso_1_code": null, "iso_3_code": "kdt", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1280", "native_tokenizers": [], @@ -1278,21 +1508,25 @@ }, { "name": "Nyeu", + "depth": 6, "iso_1_code": null, "iso_3_code": "nyl", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1281", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1279", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"vi\")", @@ -1307,6 +1541,7 @@ "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"vi\")", @@ -1322,14 +1557,17 @@ }, { "name": "Khmer", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Khmer", + "depth": 4, "iso_1_code": "km", "iso_3_code": "khm", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1283", "native_tokenizers": [], @@ -1339,9 +1577,11 @@ }, { "name": "Khmer, Northern", + "depth": 4, "iso_1_code": null, "iso_3_code": "kxm", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1284", "native_tokenizers": [], @@ -1350,6 +1590,7 @@ ] } ], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1282", "native_tokenizers": [], @@ -1357,25 +1598,30 @@ }, { "name": "Pearic", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Eastern", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Pear", + "depth": 5, "iso_1_code": null, "iso_3_code": "pcb", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1287", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1286", "native_tokenizers": [], @@ -1383,19 +1629,23 @@ }, { "name": "Western", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chong", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chong", + "depth": 6, "iso_1_code": null, "iso_3_code": "cog", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1290", "native_tokenizers": [], @@ -1403,15 +1653,18 @@ }, { "name": "Chung", + "depth": 6, "iso_1_code": null, "iso_3_code": "scq", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1291", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1289", "native_tokenizers": [], @@ -1419,14 +1672,17 @@ }, { "name": "Samre", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Somray", + "depth": 6, "iso_1_code": null, "iso_3_code": "smu", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1293", "native_tokenizers": [], @@ -1434,15 +1690,18 @@ }, { "name": "Samre", + "depth": 6, "iso_1_code": null, "iso_3_code": "sxm", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1294", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1292", "native_tokenizers": [], @@ -1450,38 +1709,45 @@ }, { "name": "Suoy", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Su\u2019ung", + "depth": 6, "iso_1_code": null, "iso_3_code": "syo", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1296", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1295", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1288", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1285", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"vi\")", @@ -1497,14 +1763,17 @@ }, { "name": "Monic", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mon", + "depth": 3, "iso_1_code": null, "iso_3_code": "mnw", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1298", "native_tokenizers": [], @@ -1513,6 +1782,7 @@ ] } ], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1297", "native_tokenizers": [], @@ -1520,19 +1790,23 @@ }, { "name": "Nicobar", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Car", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nicobarese, Car", + "depth": 4, "iso_1_code": null, "iso_3_code": "caq", "children": [], + "family": "Austro-Asiatic", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"vi\")", @@ -1549,6 +1823,7 @@ ] } ], + "family": "Austro-Asiatic", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"vi\")", @@ -1564,14 +1839,17 @@ }, { "name": "Chowra-Teressa", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chaura", + "depth": 4, "iso_1_code": null, "iso_3_code": "crv", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1303", "native_tokenizers": [], @@ -1579,15 +1857,18 @@ }, { "name": "Teressa", + "depth": 4, "iso_1_code": null, "iso_3_code": "tef", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1304", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1302", "native_tokenizers": [], @@ -1595,20 +1876,24 @@ }, { "name": "Great Nicobar", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nicobarese, Southern", + "depth": 4, "iso_1_code": null, "iso_3_code": "nik", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1306", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1305", "native_tokenizers": [], @@ -1616,20 +1901,24 @@ }, { "name": "Nancowry", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nicobarese, Central", + "depth": 4, "iso_1_code": null, "iso_3_code": "ncb", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1308", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1307", "native_tokenizers": [], @@ -1637,26 +1926,31 @@ }, { "name": "Shom Peng", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Shom Peng", + "depth": 4, "iso_1_code": null, "iso_3_code": "sii", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1310", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1309", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"vi\")", @@ -1672,19 +1966,23 @@ }, { "name": "Northern Mon-Khmer", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Khasian", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "War-Jaintia", + "depth": 4, "iso_1_code": null, "iso_3_code": "aml", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1313", "native_tokenizers": [], @@ -1692,9 +1990,11 @@ }, { "name": "Khasi", + "depth": 4, "iso_1_code": null, "iso_3_code": "kha", "children": [], + "family": "Austro-Asiatic", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"vi\")", @@ -1712,9 +2012,11 @@ }, { "name": "Lyngngam", + "depth": 4, "iso_1_code": null, "iso_3_code": "lyg", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1315", "native_tokenizers": [], @@ -1722,15 +2024,18 @@ }, { "name": "Pnar", + "depth": 4, "iso_1_code": null, "iso_3_code": "pbv", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1316", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"vi\")", @@ -1746,25 +2051,30 @@ }, { "name": "Khmuic", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Khao", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Khao", + "depth": 5, "iso_1_code": null, "iso_3_code": "xao", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1319", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1318", "native_tokenizers": [], @@ -1772,19 +2082,23 @@ }, { "name": "Mal-Khmu\u2019", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Khmu\u2019", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Khuen", + "depth": 6, "iso_1_code": null, "iso_3_code": "khf", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1322", "native_tokenizers": [], @@ -1792,9 +2106,11 @@ }, { "name": "Khmu", + "depth": 6, "iso_1_code": null, "iso_3_code": "kjg", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1323", "native_tokenizers": [], @@ -1802,15 +2118,18 @@ }, { "name": "O\u2019du", + "depth": 6, "iso_1_code": null, "iso_3_code": "tyh", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1324", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1321", "native_tokenizers": [], @@ -1818,14 +2137,17 @@ }, { "name": "Mal-Prai", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mal", + "depth": 6, "iso_1_code": null, "iso_3_code": "mlf", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1326", "native_tokenizers": [], @@ -1833,21 +2155,25 @@ }, { "name": "Prai", + "depth": 6, "iso_1_code": null, "iso_3_code": "prt", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1327", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1325", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1320", "native_tokenizers": [], @@ -1855,20 +2181,24 @@ }, { "name": "Mlabri", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mlabri", + "depth": 5, "iso_1_code": null, "iso_3_code": "mra", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1329", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1328", "native_tokenizers": [], @@ -1876,14 +2206,17 @@ }, { "name": "Xinh Mul", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Phong-Kniang", + "depth": 5, "iso_1_code": null, "iso_3_code": "pnx", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1331", "native_tokenizers": [], @@ -1891,21 +2224,25 @@ }, { "name": "Puoc", + "depth": 5, "iso_1_code": null, "iso_3_code": "puo", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1332", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1330", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1317", "native_tokenizers": [], @@ -1913,20 +2250,24 @@ }, { "name": "Mang", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mang", + "depth": 4, "iso_1_code": null, "iso_3_code": "zng", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1334", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1333", "native_tokenizers": [], @@ -1934,24 +2275,29 @@ }, { "name": "Palaungic", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Eastern Palaungic", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Angkuic", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Hu", + "depth": 6, "iso_1_code": null, "iso_3_code": "huo", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1338", "native_tokenizers": [], @@ -1959,9 +2305,11 @@ }, { "name": "Kon Keu", + "depth": 6, "iso_1_code": null, "iso_3_code": "kkn", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1339", "native_tokenizers": [], @@ -1969,9 +2317,11 @@ }, { "name": "Man Met", + "depth": 6, "iso_1_code": null, "iso_3_code": "mml", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1340", "native_tokenizers": [], @@ -1979,9 +2329,11 @@ }, { "name": "Mok", + "depth": 6, "iso_1_code": null, "iso_3_code": "mqt", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1341", "native_tokenizers": [], @@ -1989,9 +2341,11 @@ }, { "name": "Samtao", + "depth": 6, "iso_1_code": null, "iso_3_code": "stu", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1342", "native_tokenizers": [], @@ -1999,9 +2353,11 @@ }, { "name": "Tai Loi", + "depth": 6, "iso_1_code": null, "iso_3_code": "tlq", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1343", "native_tokenizers": [], @@ -2009,9 +2365,11 @@ }, { "name": "Muak Sa-aak", + "depth": 6, "iso_1_code": null, "iso_3_code": "ukk", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1344", "native_tokenizers": [], @@ -2019,9 +2377,11 @@ }, { "name": "U", + "depth": 6, "iso_1_code": null, "iso_3_code": "uuu", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1345", "native_tokenizers": [], @@ -2029,15 +2389,18 @@ }, { "name": "Kiorr", + "depth": 6, "iso_1_code": null, "iso_3_code": "xko", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1346", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1337", "native_tokenizers": [], @@ -2045,14 +2408,17 @@ }, { "name": "Bit-Khang", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bit", + "depth": 6, "iso_1_code": null, "iso_3_code": "bgk", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1348", "native_tokenizers": [], @@ -2060,9 +2426,11 @@ }, { "name": "Bumang", + "depth": 6, "iso_1_code": null, "iso_3_code": "bvp", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1349", "native_tokenizers": [], @@ -2070,15 +2438,18 @@ }, { "name": "Kh\u00e1ng", + "depth": 6, "iso_1_code": null, "iso_3_code": "kjm", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1350", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1347", "native_tokenizers": [], @@ -2086,14 +2457,17 @@ }, { "name": "Lametic", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Con", + "depth": 6, "iso_1_code": null, "iso_3_code": "cno", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1352", "native_tokenizers": [], @@ -2101,15 +2475,18 @@ }, { "name": "Rmeet", + "depth": 6, "iso_1_code": null, "iso_3_code": "lbn", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1353", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1351", "native_tokenizers": [], @@ -2117,25 +2494,30 @@ }, { "name": "Waic", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bulang", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Blang", + "depth": 7, "iso_1_code": null, "iso_3_code": "blr", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1356", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1355", "native_tokenizers": [], @@ -2143,14 +2525,17 @@ }, { "name": "Lawa", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Lawa, Western", + "depth": 7, "iso_1_code": null, "iso_3_code": "lcp", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1358", "native_tokenizers": [], @@ -2160,15 +2545,18 @@ }, { "name": "Lawa, Eastern", + "depth": 7, "iso_1_code": null, "iso_3_code": "lwl", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1359", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1357", "native_tokenizers": [], @@ -2176,14 +2564,17 @@ }, { "name": "Wa", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Wa, Parauk", + "depth": 7, "iso_1_code": null, "iso_3_code": "prk", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1361", "native_tokenizers": [], @@ -2191,9 +2582,11 @@ }, { "name": "Awa", + "depth": 7, "iso_1_code": null, "iso_3_code": "vwa", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1362", "native_tokenizers": [], @@ -2201,9 +2594,11 @@ }, { "name": "Wa, Vo", + "depth": 7, "iso_1_code": null, "iso_3_code": "wbm", "children": [], + "family": "Austro-Asiatic", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"vi\")", @@ -2220,6 +2615,7 @@ ] } ], + "family": "Austro-Asiatic", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"vi\")", @@ -2234,6 +2630,7 @@ "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"vi\")", @@ -2248,6 +2645,7 @@ "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"vi\")", @@ -2263,25 +2661,30 @@ }, { "name": "Western Palaungic", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Danau", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Danau", + "depth": 6, "iso_1_code": null, "iso_3_code": "dnu", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1366", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1365", "native_tokenizers": [], @@ -2289,14 +2692,17 @@ }, { "name": "Palaung", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Palaung, Ruching", + "depth": 6, "iso_1_code": null, "iso_3_code": "pce", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1368", "native_tokenizers": [], @@ -2304,9 +2710,11 @@ }, { "name": "Palaung, Shwe", + "depth": 6, "iso_1_code": null, "iso_3_code": "pll", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1369", "native_tokenizers": [], @@ -2314,15 +2722,18 @@ }, { "name": "Palaung, Rumai", + "depth": 6, "iso_1_code": null, "iso_3_code": "rbb", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1370", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1367", "native_tokenizers": [], @@ -2330,14 +2741,17 @@ }, { "name": "Riang", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Riang Lang", + "depth": 6, "iso_1_code": null, "iso_3_code": "ril", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1372", "native_tokenizers": [], @@ -2345,27 +2759,32 @@ }, { "name": "Riang Lai", + "depth": 6, "iso_1_code": null, "iso_3_code": "yin", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1373", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1371", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1364", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"vi\")", @@ -2380,6 +2799,7 @@ "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"vi\")", @@ -2395,14 +2815,17 @@ }, { "name": "Palyu", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bugan", + "depth": 3, "iso_1_code": null, "iso_3_code": "bbh", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1375", "native_tokenizers": [], @@ -2410,15 +2833,18 @@ }, { "name": "Bolyu", + "depth": 3, "iso_1_code": null, "iso_3_code": "ply", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1376", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1374", "native_tokenizers": [], @@ -2426,20 +2852,24 @@ }, { "name": "Southern Monic", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nyahkur", + "depth": 3, "iso_1_code": null, "iso_3_code": "cbn", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1378", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1377", "native_tokenizers": [], @@ -2447,14 +2877,17 @@ }, { "name": "Unclassified", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kemiehua", + "depth": 3, "iso_1_code": null, "iso_3_code": "kfj", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1380", "native_tokenizers": [], @@ -2462,15 +2895,18 @@ }, { "name": "Kuanhua", + "depth": 3, "iso_1_code": null, "iso_3_code": "xnh", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1381", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1379", "native_tokenizers": [], @@ -2478,19 +2914,23 @@ }, { "name": "Viet-Muong", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chut", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Arem", + "depth": 4, "iso_1_code": null, "iso_3_code": "aem", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1384", "native_tokenizers": [], @@ -2498,9 +2938,11 @@ }, { "name": "Maleng", + "depth": 4, "iso_1_code": null, "iso_3_code": "pkt", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1385", "native_tokenizers": [], @@ -2508,15 +2950,18 @@ }, { "name": "Chut", + "depth": 4, "iso_1_code": null, "iso_3_code": "scb", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1386", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1383", "native_tokenizers": [], @@ -2524,14 +2969,17 @@ }, { "name": "Cuoi", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Hung", + "depth": 4, "iso_1_code": null, "iso_3_code": "hnu", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1388", "native_tokenizers": [], @@ -2539,15 +2987,18 @@ }, { "name": "Tho", + "depth": 4, "iso_1_code": null, "iso_3_code": "tou", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1389", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1387", "native_tokenizers": [], @@ -2555,14 +3006,17 @@ }, { "name": "Muong", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bo", + "depth": 4, "iso_1_code": null, "iso_3_code": "bgl", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1391", "native_tokenizers": [], @@ -2570,9 +3024,11 @@ }, { "name": "Muong", + "depth": 4, "iso_1_code": null, "iso_3_code": "mtq", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1392", "native_tokenizers": [], @@ -2580,15 +3036,18 @@ }, { "name": "Ngu\u00f4n", + "depth": 4, "iso_1_code": null, "iso_3_code": "nuo", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1393", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1390", "native_tokenizers": [], @@ -2596,20 +3055,24 @@ }, { "name": "Thavung", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Aheu", + "depth": 4, "iso_1_code": null, "iso_3_code": "thm", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1395", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1394", "native_tokenizers": [], @@ -2617,14 +3080,17 @@ }, { "name": "Vietnamese", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Vietnamese", + "depth": 4, "iso_1_code": "vi", "iso_3_code": "vie", "children": [], + "family": "Austro-Asiatic", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"vi\")", @@ -2643,6 +3109,7 @@ ] } ], + "family": "Austro-Asiatic", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"vi\")", @@ -2657,6 +3124,7 @@ "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"vi\")", @@ -2671,6 +3139,7 @@ "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"vi\")", @@ -2686,24 +3155,29 @@ }, { "name": "Munda", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "North Munda", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kherwari", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Agariya", + "depth": 4, "iso_1_code": null, "iso_3_code": "agi", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1401", "native_tokenizers": [], @@ -2711,9 +3185,11 @@ }, { "name": "Bijori", + "depth": 4, "iso_1_code": null, "iso_3_code": "bix", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1402", "native_tokenizers": [], @@ -2721,9 +3197,11 @@ }, { "name": "Kodaku", + "depth": 4, "iso_1_code": null, "iso_3_code": "ksz", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1403", "native_tokenizers": [], @@ -2731,14 +3209,17 @@ }, { "name": "Mundari", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Asuri", + "depth": 5, "iso_1_code": null, "iso_3_code": "asr", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1405", "native_tokenizers": [], @@ -2746,9 +3227,11 @@ }, { "name": "Birhor", + "depth": 5, "iso_1_code": null, "iso_3_code": "biy", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1406", "native_tokenizers": [], @@ -2756,9 +3239,11 @@ }, { "name": "Koda", + "depth": 5, "iso_1_code": null, "iso_3_code": "cdz", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1407", "native_tokenizers": [], @@ -2766,9 +3251,11 @@ }, { "name": "Kol", + "depth": 5, "iso_1_code": null, "iso_3_code": "ekl", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1408", "native_tokenizers": [], @@ -2776,18 +3263,12 @@ }, { "name": "Ho", + "depth": 5, "iso_1_code": null, "iso_3_code": "hoc", "children": [], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"vi\")", - "original_lang_name": "vietnamese", - "original_lang_code": "vie", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Austro-Asiatic", + "tokenizers": {}, "node_i": "1409", "native_tokenizers": [], "scripts": [ @@ -2797,9 +3278,11 @@ }, { "name": "Korwa", + "depth": 5, "iso_1_code": null, "iso_3_code": "kfp", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1410", "native_tokenizers": [], @@ -2807,9 +3290,11 @@ }, { "name": "Mundari", + "depth": 5, "iso_1_code": null, "iso_3_code": "unr", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1411", "native_tokenizers": [], @@ -2817,38 +3302,36 @@ }, { "name": "Munda", + "depth": 5, "iso_1_code": null, "iso_3_code": "unx", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1412", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"vi\")", - "original_lang_name": "vietnamese", - "original_lang_code": "vie", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Austro-Asiatic", + "tokenizers": {}, "node_i": "1404", "native_tokenizers": [], "scripts": [] }, { "name": "Santali", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mahali", + "depth": 5, "iso_1_code": null, "iso_3_code": "mjx", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1414", "native_tokenizers": [], @@ -2856,18 +3339,12 @@ }, { "name": "Santhali", + "depth": 5, "iso_1_code": null, "iso_3_code": "sat", "children": [], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"vi\")", - "original_lang_name": "vietnamese", - "original_lang_code": "vie", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Austro-Asiatic", + "tokenizers": {}, "node_i": "1415", "native_tokenizers": [], "scripts": [ @@ -2877,92 +3354,81 @@ }, { "name": "Turi", + "depth": 5, "iso_1_code": null, "iso_3_code": "trd", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1416", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"vi\")", - "original_lang_name": "vietnamese", - "original_lang_code": "vie", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Austro-Asiatic", + "tokenizers": {}, "node_i": "1413", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"vi\")", - "original_lang_name": "vietnamese", - "original_lang_code": "vie", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Austro-Asiatic", + "tokenizers": {}, "node_i": "1400", "native_tokenizers": [], "scripts": [] }, { "name": "Korku", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Korku", + "depth": 4, "iso_1_code": null, "iso_3_code": "kfq", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1418", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1417", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"vi\")", - "original_lang_name": "vietnamese", - "original_lang_code": "vie", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Austro-Asiatic", + "tokenizers": {}, "node_i": "1399", "native_tokenizers": [], "scripts": [] }, { "name": "South Munda", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kharia-Juang", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Juang", + "depth": 4, "iso_1_code": null, "iso_3_code": "jun", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1421", "native_tokenizers": [], @@ -2972,15 +3438,18 @@ }, { "name": "Kharia", + "depth": 4, "iso_1_code": null, "iso_3_code": "khr", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1422", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1420", "native_tokenizers": [], @@ -2988,30 +3457,36 @@ }, { "name": "Koraput Munda", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Gutob-Remo-Geta\u2019", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Geta\u2019", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Gata\u2019", + "depth": 6, "iso_1_code": null, "iso_3_code": "gaq", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1426", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1425", "native_tokenizers": [], @@ -3019,14 +3494,17 @@ }, { "name": "Gutob-Remo", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bondo", + "depth": 6, "iso_1_code": null, "iso_3_code": "bfw", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1428", "native_tokenizers": [], @@ -3034,21 +3512,25 @@ }, { "name": "Gadaba, Bodo", + "depth": 6, "iso_1_code": null, "iso_3_code": "gbj", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1429", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1427", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1424", "native_tokenizers": [], @@ -3056,25 +3538,30 @@ }, { "name": "Sora-Juray-Gorum", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Gorum", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Parenga", + "depth": 6, "iso_1_code": null, "iso_3_code": "pcj", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1432", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1431", "native_tokenizers": [], @@ -3082,14 +3569,17 @@ }, { "name": "Sora-Juray", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Juray", + "depth": 6, "iso_1_code": null, "iso_3_code": "juy", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1434", "native_tokenizers": [], @@ -3097,62 +3587,54 @@ }, { "name": "Sora", + "depth": 6, "iso_1_code": null, "iso_3_code": "srb", "children": [], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1435", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1433", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1430", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1423", "native_tokenizers": [], "scripts": [] } ], + "family": "Austro-Asiatic", "tokenizers": {}, "node_i": "1419", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"vi\")", - "original_lang_name": "vietnamese", - "original_lang_code": "vie", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Austro-Asiatic", + "tokenizers": {}, "node_i": "1398", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"vi\")", - "original_lang_name": "vietnamese", - "original_lang_code": "vie", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Austro-Asiatic", + "tokenizers": {}, "node_i": "1163", "native_tokenizers": [], "scripts": [] diff --git a/data/Austronesian.json b/data/Austronesian.json index 9c96b72ce4bcb33694bc0c74912e23694bd3ac40..ed39c9fb03958cce60b22c76d3de2cf56195be34 100644 --- a/data/Austronesian.json +++ b/data/Austronesian.json @@ -1,27 +1,23 @@ { "name": "Austronesian", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Atayalic", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Atayal", + "depth": 2, "iso_1_code": null, "iso_3_code": "tay", "children": [], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"ms\")", - "original_lang_name": "malay", - "original_lang_code": "msa", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Austronesian", + "tokenizers": {}, "node_i": "1438", "native_tokenizers": [], "scripts": [ @@ -30,18 +26,12 @@ }, { "name": "Sediq", + "depth": 2, "iso_1_code": null, "iso_3_code": "trv", "children": [], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"ms\")", - "original_lang_name": "malay", - "original_lang_code": "msa", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Austronesian", + "tokenizers": {}, "node_i": "1439", "native_tokenizers": [], "scripts": [ @@ -49,35 +39,32 @@ ] } ], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"ms\")", - "original_lang_name": "malay", - "original_lang_code": "msa", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Austronesian", + "tokenizers": {}, "node_i": "1437", "native_tokenizers": [], "scripts": [] }, { "name": "Bunun", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bunun", + "depth": 2, "iso_1_code": null, "iso_3_code": "bnn", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1441", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "1440", "native_tokenizers": [], @@ -85,28 +72,24 @@ }, { "name": "East Formosan", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Central", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Amis", + "depth": 3, "iso_1_code": null, "iso_3_code": "ami", "children": [], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"ms\")", - "original_lang_name": "malay", - "original_lang_code": "msa", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Austronesian", + "tokenizers": {}, "node_i": "1444", "native_tokenizers": [], "scripts": [ @@ -115,18 +98,12 @@ }, { "name": "Sakizaya", + "depth": 3, "iso_1_code": null, "iso_3_code": "szy", "children": [], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"ms\")", - "original_lang_name": "malay", - "original_lang_code": "msa", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Austronesian", + "tokenizers": {}, "node_i": "1445", "native_tokenizers": [], "scripts": [ @@ -134,29 +111,25 @@ ] } ], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"ms\")", - "original_lang_name": "malay", - "original_lang_code": "msa", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Austronesian", + "tokenizers": {}, "node_i": "1443", "native_tokenizers": [], "scripts": [] }, { "name": "Northern", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Basay", + "depth": 3, "iso_1_code": null, "iso_3_code": "byq", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1447", "native_tokenizers": [], @@ -164,15 +137,18 @@ }, { "name": "Kavalan", + "depth": 3, "iso_1_code": null, "iso_3_code": "ckv", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1448", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "1446", "native_tokenizers": [], @@ -180,14 +156,17 @@ }, { "name": "Southwest", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Siraya", + "depth": 3, "iso_1_code": null, "iso_3_code": "fos", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1450", "native_tokenizers": [], @@ -195,44 +174,43 @@ }, { "name": "Taivoan", + "depth": 3, "iso_1_code": null, "iso_3_code": "tvx", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1451", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "1449", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"ms\")", - "original_lang_name": "malay", - "original_lang_code": "msa", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Austronesian", + "tokenizers": {}, "node_i": "1442", "native_tokenizers": [], "scripts": [] }, { "name": "Malayo-Polynesian", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Agta, Villa Viciosa", + "depth": 2, "iso_1_code": null, "iso_3_code": "dyg", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1453", "native_tokenizers": [], @@ -240,14 +218,17 @@ }, { "name": "Bali-Sasak-Sumbawa", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bali", + "depth": 3, "iso_1_code": null, "iso_3_code": "ban", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -265,14 +246,17 @@ }, { "name": "Sasak-Sumbawa", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Sasak", + "depth": 4, "iso_1_code": null, "iso_3_code": "sas", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -290,15 +274,18 @@ }, { "name": "Sumbawa", + "depth": 4, "iso_1_code": null, "iso_3_code": "smw", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1458", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -313,6 +300,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -328,19 +316,23 @@ }, { "name": "Bashiic", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ivatan", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ibatan", + "depth": 4, "iso_1_code": null, "iso_3_code": "ivb", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -358,9 +350,11 @@ }, { "name": "Ivatan", + "depth": 4, "iso_1_code": null, "iso_3_code": "ivv", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -377,6 +371,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -392,26 +387,31 @@ }, { "name": "Yami", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Yami", + "depth": 4, "iso_1_code": null, "iso_3_code": "tao", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1464", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "1463", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -427,14 +427,17 @@ }, { "name": "Bilic", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bagobo-Klata", + "depth": 3, "iso_1_code": null, "iso_3_code": "bgi", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1466", "native_tokenizers": [], @@ -442,9 +445,11 @@ }, { "name": "Teduray", + "depth": 3, "iso_1_code": null, "iso_3_code": "tiy", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -462,14 +467,17 @@ }, { "name": "Blaan", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Blaan, Koronadal", + "depth": 4, "iso_1_code": null, "iso_3_code": "bpr", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -487,9 +495,11 @@ }, { "name": "Blaan, Sarangani", + "depth": 4, "iso_1_code": null, "iso_3_code": "bps", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -506,6 +516,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -521,14 +532,17 @@ }, { "name": "Tboli", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tboli", + "depth": 4, "iso_1_code": null, "iso_3_code": "tbl", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -545,6 +559,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -559,6 +574,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -574,29 +590,35 @@ }, { "name": "Celebic", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Eastern", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Saluan-Banggai", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Eastern", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Banggai", + "depth": 6, "iso_1_code": null, "iso_3_code": "bgz", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -614,9 +636,11 @@ }, { "name": "Balantak", + "depth": 6, "iso_1_code": null, "iso_3_code": "blz", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -633,6 +657,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -648,14 +673,17 @@ }, { "name": "Western", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Andio", + "depth": 6, "iso_1_code": null, "iso_3_code": "bzb", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1480", "native_tokenizers": [], @@ -663,14 +691,17 @@ }, { "name": "Saluanic", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bobongko", + "depth": 7, "iso_1_code": null, "iso_3_code": "bgb", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1482", "native_tokenizers": [], @@ -678,9 +709,11 @@ }, { "name": "Saluan", + "depth": 7, "iso_1_code": null, "iso_3_code": "loe", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -698,15 +731,18 @@ }, { "name": "Batui", + "depth": 7, "iso_1_code": null, "iso_3_code": "zbt", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1484", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -721,6 +757,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -735,6 +772,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -750,29 +788,35 @@ }, { "name": "Southeastern", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bungku-Tolaki", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Eastern", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "East Coast", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bungku", + "depth": 8, "iso_1_code": null, "iso_3_code": "bkz", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1489", "native_tokenizers": [], @@ -780,9 +824,11 @@ }, { "name": "Bahonsuai", + "depth": 8, "iso_1_code": null, "iso_3_code": "bsu", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1490", "native_tokenizers": [], @@ -790,9 +836,11 @@ }, { "name": "Wawonii", + "depth": 8, "iso_1_code": null, "iso_3_code": "wow", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1491", "native_tokenizers": [], @@ -800,9 +848,11 @@ }, { "name": "Mori Bawah", + "depth": 8, "iso_1_code": null, "iso_3_code": "xmz", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1492", "native_tokenizers": [], @@ -810,14 +860,17 @@ }, { "name": "Kulisusu", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Taloki", + "depth": 9, "iso_1_code": null, "iso_3_code": "tlk", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1494", "native_tokenizers": [], @@ -825,9 +878,11 @@ }, { "name": "Kulisusu", + "depth": 9, "iso_1_code": null, "iso_3_code": "vkl", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1495", "native_tokenizers": [], @@ -835,21 +890,25 @@ }, { "name": "Koroni", + "depth": 9, "iso_1_code": null, "iso_3_code": "xkq", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1496", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "1493", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "1488", "native_tokenizers": [], @@ -857,26 +916,31 @@ }, { "name": "Southwest", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Moronene", + "depth": 8, "iso_1_code": null, "iso_3_code": "mqn", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1498", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "1497", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "1487", "native_tokenizers": [], @@ -884,19 +948,23 @@ }, { "name": "Western", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Interior", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mori Atas", + "depth": 8, "iso_1_code": null, "iso_3_code": "mzq", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1501", "native_tokenizers": [], @@ -904,9 +972,11 @@ }, { "name": "Padoe", + "depth": 8, "iso_1_code": null, "iso_3_code": "pdo", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1502", "native_tokenizers": [], @@ -914,15 +984,18 @@ }, { "name": "Tomadino", + "depth": 8, "iso_1_code": null, "iso_3_code": "tdi", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1503", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "1500", "native_tokenizers": [], @@ -930,14 +1003,17 @@ }, { "name": "West Coast", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tolaki", + "depth": 8, "iso_1_code": null, "iso_3_code": "lbw", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1505", "native_tokenizers": [], @@ -945,9 +1021,11 @@ }, { "name": "Rahambuu", + "depth": 8, "iso_1_code": null, "iso_3_code": "raz", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1506", "native_tokenizers": [], @@ -955,9 +1033,11 @@ }, { "name": "Kodeoha", + "depth": 8, "iso_1_code": null, "iso_3_code": "vko", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1507", "native_tokenizers": [], @@ -965,27 +1045,32 @@ }, { "name": "Waru", + "depth": 8, "iso_1_code": null, "iso_3_code": "wru", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1508", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "1504", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "1499", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "1486", "native_tokenizers": [], @@ -993,29 +1078,35 @@ }, { "name": "Muna-Buton", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nuclear Muna-Buton", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Buton", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "East Buton", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Lasalimu", + "depth": 9, "iso_1_code": null, "iso_3_code": "llm", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1513", "native_tokenizers": [], @@ -1023,15 +1114,18 @@ }, { "name": "Kumbewaha", + "depth": 9, "iso_1_code": null, "iso_3_code": "xks", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1514", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "1512", "native_tokenizers": [], @@ -1039,26 +1133,31 @@ }, { "name": "West Buton", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Cia-Cia", + "depth": 9, "iso_1_code": null, "iso_3_code": "cia", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1516", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "1515", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "1511", "native_tokenizers": [], @@ -1066,14 +1165,17 @@ }, { "name": "Munan", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Busoa", + "depth": 8, "iso_1_code": null, "iso_3_code": "bup", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1518", "native_tokenizers": [], @@ -1081,14 +1183,17 @@ }, { "name": "Munic", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kaimbulawa", + "depth": 9, "iso_1_code": null, "iso_3_code": "zka", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1520", "native_tokenizers": [], @@ -1096,14 +1201,17 @@ }, { "name": "Western", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Liabuku", + "depth": 10, "iso_1_code": null, "iso_3_code": "lix", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1522", "native_tokenizers": [], @@ -1111,9 +1219,11 @@ }, { "name": "Muna", + "depth": 10, "iso_1_code": null, "iso_3_code": "mnb", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -1131,9 +1241,11 @@ }, { "name": "Pancana", + "depth": 10, "iso_1_code": null, "iso_3_code": "pnp", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1524", "native_tokenizers": [], @@ -1141,15 +1253,18 @@ }, { "name": "Kioko", + "depth": 10, "iso_1_code": null, "iso_3_code": "ues", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1525", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -1164,6 +1279,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -1178,6 +1294,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -1192,6 +1309,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -1207,14 +1325,17 @@ }, { "name": "Tukangbesi-Bonerate", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tukang Besi South", + "depth": 7, "iso_1_code": null, "iso_3_code": "bhq", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1527", "native_tokenizers": [], @@ -1222,9 +1343,11 @@ }, { "name": "Bonerate", + "depth": 7, "iso_1_code": null, "iso_3_code": "bna", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1528", "native_tokenizers": [], @@ -1232,21 +1355,25 @@ }, { "name": "Tukang Besi North", + "depth": 7, "iso_1_code": null, "iso_3_code": "khc", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1529", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "1526", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -1261,6 +1388,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -1275,6 +1403,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -1290,24 +1419,29 @@ }, { "name": "Kaili-Pamona", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Northern", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kaili", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Baras", + "depth": 6, "iso_1_code": null, "iso_3_code": "brs", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1533", "native_tokenizers": [], @@ -1315,9 +1449,11 @@ }, { "name": "Tado", + "depth": 6, "iso_1_code": null, "iso_3_code": "klw", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1534", "native_tokenizers": [], @@ -1325,9 +1461,11 @@ }, { "name": "Kaili, Da\u2019a", + "depth": 6, "iso_1_code": null, "iso_3_code": "kzf", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -1345,9 +1483,11 @@ }, { "name": "Kaili, Ledo", + "depth": 6, "iso_1_code": null, "iso_3_code": "lew", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -1365,9 +1505,11 @@ }, { "name": "Moma", + "depth": 6, "iso_1_code": null, "iso_3_code": "myl", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1537", "native_tokenizers": [], @@ -1375,9 +1517,11 @@ }, { "name": "Topoiyo", + "depth": 6, "iso_1_code": null, "iso_3_code": "toy", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1538", "native_tokenizers": [], @@ -1385,9 +1529,11 @@ }, { "name": "Sedoa", + "depth": 6, "iso_1_code": null, "iso_3_code": "tvw", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1539", "native_tokenizers": [], @@ -1395,15 +1541,18 @@ }, { "name": "Kaili, Unde", + "depth": 6, "iso_1_code": null, "iso_3_code": "unz", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1540", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -1419,14 +1568,17 @@ }, { "name": "Pamona", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Pamona", + "depth": 6, "iso_1_code": null, "iso_3_code": "pmf", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -1444,15 +1596,18 @@ }, { "name": "Tombelala", + "depth": 6, "iso_1_code": null, "iso_3_code": "ttp", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1543", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -1467,6 +1622,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -1482,14 +1638,17 @@ }, { "name": "Southern", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Rampi", + "depth": 5, "iso_1_code": null, "iso_3_code": "lje", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1545", "native_tokenizers": [], @@ -1497,9 +1656,11 @@ }, { "name": "Uma", + "depth": 5, "iso_1_code": null, "iso_3_code": "ppk", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -1517,9 +1678,11 @@ }, { "name": "Sarudu", + "depth": 5, "iso_1_code": null, "iso_3_code": "sdu", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1547", "native_tokenizers": [], @@ -1527,14 +1690,17 @@ }, { "name": "Badaic", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Behoa", + "depth": 6, "iso_1_code": null, "iso_3_code": "bep", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1549", "native_tokenizers": [], @@ -1542,9 +1708,11 @@ }, { "name": "Bada", + "depth": 6, "iso_1_code": null, "iso_3_code": "bhz", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -1562,9 +1730,11 @@ }, { "name": "Napu", + "depth": 6, "iso_1_code": null, "iso_3_code": "npy", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -1581,6 +1751,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -1595,6 +1766,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -1609,6 +1781,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -1624,19 +1797,23 @@ }, { "name": "Tomini-Tolitoli", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tolitoli", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Boano", + "depth": 5, "iso_1_code": null, "iso_3_code": "bzl", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1554", "native_tokenizers": [], @@ -1644,15 +1821,18 @@ }, { "name": "Totoli", + "depth": 5, "iso_1_code": null, "iso_3_code": "txe", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1555", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "1553", "native_tokenizers": [], @@ -1660,19 +1840,23 @@ }, { "name": "Tomini", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Northern", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dondo", + "depth": 6, "iso_1_code": null, "iso_3_code": "dok", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1558", "native_tokenizers": [], @@ -1680,9 +1864,11 @@ }, { "name": "Lauje", + "depth": 6, "iso_1_code": null, "iso_3_code": "law", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -1700,15 +1886,18 @@ }, { "name": "Tomini", + "depth": 6, "iso_1_code": null, "iso_3_code": "txm", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1560", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -1724,14 +1913,17 @@ }, { "name": "Southern", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Balaesang", + "depth": 6, "iso_1_code": null, "iso_3_code": "bls", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1562", "native_tokenizers": [], @@ -1739,9 +1931,11 @@ }, { "name": "Dampelas", + "depth": 6, "iso_1_code": null, "iso_3_code": "dms", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1563", "native_tokenizers": [], @@ -1749,9 +1943,11 @@ }, { "name": "Taje", + "depth": 6, "iso_1_code": null, "iso_3_code": "pee", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1564", "native_tokenizers": [], @@ -1759,9 +1955,11 @@ }, { "name": "Tajio", + "depth": 6, "iso_1_code": null, "iso_3_code": "tdj", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1565", "native_tokenizers": [], @@ -1769,21 +1967,25 @@ }, { "name": "Pendau", + "depth": 6, "iso_1_code": null, "iso_3_code": "ums", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1566", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "1561", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -1798,6 +2000,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -1813,14 +2016,17 @@ }, { "name": "Wotu-Wolio", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Wotu", + "depth": 4, "iso_1_code": null, "iso_3_code": "wtw", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1568", "native_tokenizers": [], @@ -1828,14 +2034,17 @@ }, { "name": "Kalao", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kalao", + "depth": 5, "iso_1_code": null, "iso_3_code": "kly", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1570", "native_tokenizers": [], @@ -1843,15 +2052,18 @@ }, { "name": "Laiyolo", + "depth": 5, "iso_1_code": null, "iso_3_code": "lji", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1571", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "1569", "native_tokenizers": [], @@ -1859,14 +2071,17 @@ }, { "name": "Wolio-Kamaru", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kamaru", + "depth": 5, "iso_1_code": null, "iso_3_code": "kgx", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1573", "native_tokenizers": [], @@ -1874,27 +2089,32 @@ }, { "name": "Wolio", + "depth": 5, "iso_1_code": null, "iso_3_code": "wlo", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1574", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "1572", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "1567", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -1910,19 +2130,23 @@ }, { "name": "Central Luzon", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Pampangan", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kapampangan", + "depth": 4, "iso_1_code": null, "iso_3_code": "pam", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -1939,6 +2163,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -1954,14 +2179,17 @@ }, { "name": "Sambalic", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ayta, Ambala", + "depth": 4, "iso_1_code": null, "iso_3_code": "abc", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1579", "native_tokenizers": [], @@ -1969,9 +2197,11 @@ }, { "name": "Ayta, Abellen", + "depth": 4, "iso_1_code": null, "iso_3_code": "abp", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1580", "native_tokenizers": [], @@ -1979,9 +2209,11 @@ }, { "name": "Ayta, Magbukun", + "depth": 4, "iso_1_code": null, "iso_3_code": "ayt", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1581", "native_tokenizers": [], @@ -1989,9 +2221,11 @@ }, { "name": "Ayta, Mag-Indi", + "depth": 4, "iso_1_code": null, "iso_3_code": "blx", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1582", "native_tokenizers": [], @@ -1999,9 +2233,11 @@ }, { "name": "Sambal, Botolan", + "depth": 4, "iso_1_code": null, "iso_3_code": "sbl", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -2019,9 +2255,11 @@ }, { "name": "Ayta, Mag-antsi", + "depth": 4, "iso_1_code": null, "iso_3_code": "sgb", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -2039,9 +2277,11 @@ }, { "name": "Bolinao", + "depth": 4, "iso_1_code": null, "iso_3_code": "smk", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -2059,9 +2299,11 @@ }, { "name": "Sambal", + "depth": 4, "iso_1_code": null, "iso_3_code": "xsb", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -2078,6 +2320,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -2093,26 +2336,31 @@ }, { "name": "Sinauna", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dumagat, Remontado", + "depth": 4, "iso_1_code": null, "iso_3_code": "agv", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1588", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "1587", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -2128,19 +2376,23 @@ }, { "name": "Central-Eastern Malayo-Polynesian", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Aru", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Barakai", + "depth": 4, "iso_1_code": null, "iso_3_code": "baj", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1591", "native_tokenizers": [], @@ -2148,9 +2400,11 @@ }, { "name": "Gwatlelir", + "depth": 4, "iso_1_code": null, "iso_3_code": "bay", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1592", "native_tokenizers": [], @@ -2158,9 +2412,11 @@ }, { "name": "Koba", + "depth": 4, "iso_1_code": null, "iso_3_code": "kpd", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1593", "native_tokenizers": [], @@ -2168,9 +2424,11 @@ }, { "name": "Dobel", + "depth": 4, "iso_1_code": null, "iso_3_code": "kvo", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1594", "native_tokenizers": [], @@ -2178,9 +2436,11 @@ }, { "name": "Kompane", + "depth": 4, "iso_1_code": null, "iso_3_code": "kvp", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1595", "native_tokenizers": [], @@ -2188,9 +2448,11 @@ }, { "name": "Kola", + "depth": 4, "iso_1_code": null, "iso_3_code": "kvv", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1596", "native_tokenizers": [], @@ -2198,9 +2460,11 @@ }, { "name": "Karey", + "depth": 4, "iso_1_code": null, "iso_3_code": "kyd", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1597", "native_tokenizers": [], @@ -2208,9 +2472,11 @@ }, { "name": "Lola", + "depth": 4, "iso_1_code": null, "iso_3_code": "lcd", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1598", "native_tokenizers": [], @@ -2218,9 +2484,11 @@ }, { "name": "Lorang", + "depth": 4, "iso_1_code": null, "iso_3_code": "lrn", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1599", "native_tokenizers": [], @@ -2228,9 +2496,11 @@ }, { "name": "Mariri", + "depth": 4, "iso_1_code": null, "iso_3_code": "mqi", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1600", "native_tokenizers": [], @@ -2238,9 +2508,11 @@ }, { "name": "Tarangan, East", + "depth": 4, "iso_1_code": null, "iso_3_code": "tre", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1601", "native_tokenizers": [], @@ -2248,9 +2520,11 @@ }, { "name": "Tarangan, West", + "depth": 4, "iso_1_code": null, "iso_3_code": "txn", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1602", "native_tokenizers": [], @@ -2258,9 +2532,11 @@ }, { "name": "Ujir", + "depth": 4, "iso_1_code": null, "iso_3_code": "udj", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1603", "native_tokenizers": [], @@ -2268,15 +2544,18 @@ }, { "name": "Manombai", + "depth": 4, "iso_1_code": null, "iso_3_code": "woo", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1604", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "1590", "native_tokenizers": [], @@ -2284,19 +2563,23 @@ }, { "name": "Babar", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "North", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Babar, North", + "depth": 5, "iso_1_code": null, "iso_3_code": "bcd", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1607", "native_tokenizers": [], @@ -2304,9 +2587,11 @@ }, { "name": "Dawera-Daweloor", + "depth": 5, "iso_1_code": null, "iso_3_code": "ddw", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1608", "native_tokenizers": [], @@ -2314,15 +2599,18 @@ }, { "name": "Dai", + "depth": 5, "iso_1_code": null, "iso_3_code": "dij", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1609", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "1606", "native_tokenizers": [], @@ -2330,19 +2618,23 @@ }, { "name": "South", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Masela-South Babar", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Masela, West", + "depth": 6, "iso_1_code": null, "iso_3_code": "mss", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1612", "native_tokenizers": [], @@ -2350,9 +2642,11 @@ }, { "name": "Masela, Central", + "depth": 6, "iso_1_code": null, "iso_3_code": "mxz", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1613", "native_tokenizers": [], @@ -2360,9 +2654,11 @@ }, { "name": "Serili", + "depth": 6, "iso_1_code": null, "iso_3_code": "sve", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1614", "native_tokenizers": [], @@ -2370,9 +2666,11 @@ }, { "name": "Babar, Southeast", + "depth": 6, "iso_1_code": null, "iso_3_code": "vbb", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1615", "native_tokenizers": [], @@ -2380,15 +2678,18 @@ }, { "name": "Masela, East", + "depth": 6, "iso_1_code": null, "iso_3_code": "vme", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1616", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "1611", "native_tokenizers": [], @@ -2396,14 +2697,17 @@ }, { "name": "Southwest Babar", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Emplawas", + "depth": 6, "iso_1_code": null, "iso_3_code": "emw", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1618", "native_tokenizers": [], @@ -2411,9 +2715,11 @@ }, { "name": "Imroing", + "depth": 6, "iso_1_code": null, "iso_3_code": "imr", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1619", "native_tokenizers": [], @@ -2421,27 +2727,32 @@ }, { "name": "Tela-Masbuar", + "depth": 6, "iso_1_code": null, "iso_3_code": "tvm", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1620", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "1617", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "1610", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "1605", "native_tokenizers": [], @@ -2449,14 +2760,17 @@ }, { "name": "Bima-Lembata", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Adonara", + "depth": 4, "iso_1_code": null, "iso_3_code": "adr", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1622", "native_tokenizers": [], @@ -2464,9 +2778,11 @@ }, { "name": "Alor", + "depth": 4, "iso_1_code": null, "iso_3_code": "aol", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1623", "native_tokenizers": [], @@ -2474,9 +2790,11 @@ }, { "name": "Bima", + "depth": 4, "iso_1_code": null, "iso_3_code": "bhp", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -2494,9 +2812,11 @@ }, { "name": "Ende", + "depth": 4, "iso_1_code": null, "iso_3_code": "end", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1625", "native_tokenizers": [], @@ -2504,9 +2824,11 @@ }, { "name": "Ile Ape", + "depth": 4, "iso_1_code": null, "iso_3_code": "ila", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1626", "native_tokenizers": [], @@ -2514,9 +2836,11 @@ }, { "name": "Kedang", + "depth": 4, "iso_1_code": null, "iso_3_code": "ksx", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1627", "native_tokenizers": [], @@ -2524,9 +2848,11 @@ }, { "name": "Kepo\u2019", + "depth": 4, "iso_1_code": null, "iso_3_code": "kuk", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1628", "native_tokenizers": [], @@ -2534,9 +2860,11 @@ }, { "name": "Komodo", + "depth": 4, "iso_1_code": null, "iso_3_code": "kvh", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1629", "native_tokenizers": [], @@ -2544,9 +2872,11 @@ }, { "name": "Li\u2019o", + "depth": 4, "iso_1_code": null, "iso_3_code": "ljl", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1630", "native_tokenizers": [], @@ -2554,9 +2884,11 @@ }, { "name": "Painara", + "depth": 4, "iso_1_code": null, "iso_3_code": "lmf", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1631", "native_tokenizers": [], @@ -2564,9 +2896,11 @@ }, { "name": "Labalekan-Mingar", + "depth": 4, "iso_1_code": null, "iso_3_code": "lmj", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1632", "native_tokenizers": [], @@ -2574,9 +2908,11 @@ }, { "name": "Lamatuka", + "depth": 4, "iso_1_code": null, "iso_3_code": "lmq", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1633", "native_tokenizers": [], @@ -2584,9 +2920,11 @@ }, { "name": "Lamalera", + "depth": 4, "iso_1_code": null, "iso_3_code": "lmr", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1634", "native_tokenizers": [], @@ -2594,9 +2932,11 @@ }, { "name": "Levuka", + "depth": 4, "iso_1_code": null, "iso_3_code": "lvu", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1635", "native_tokenizers": [], @@ -2604,9 +2944,11 @@ }, { "name": "Lewoeleng", + "depth": 4, "iso_1_code": null, "iso_3_code": "lwe", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1636", "native_tokenizers": [], @@ -2614,9 +2956,11 @@ }, { "name": "Lewotobi", + "depth": 4, "iso_1_code": null, "iso_3_code": "lwt", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1637", "native_tokenizers": [], @@ -2624,9 +2968,11 @@ }, { "name": "Manggarai", + "depth": 4, "iso_1_code": null, "iso_3_code": "mqy", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -2644,9 +2990,11 @@ }, { "name": "Ngad\u2019a, Eastern", + "depth": 4, "iso_1_code": null, "iso_3_code": "nea", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1639", "native_tokenizers": [], @@ -2654,9 +3002,11 @@ }, { "name": "Nage", + "depth": 4, "iso_1_code": null, "iso_3_code": "nxe", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1640", "native_tokenizers": [], @@ -2664,9 +3014,11 @@ }, { "name": "Ngad\u2019a", + "depth": 4, "iso_1_code": null, "iso_3_code": "nxg", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1641", "native_tokenizers": [], @@ -2674,9 +3026,11 @@ }, { "name": "Palu\u2019e", + "depth": 4, "iso_1_code": null, "iso_3_code": "ple", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1642", "native_tokenizers": [], @@ -2684,9 +3038,11 @@ }, { "name": "Rembong", + "depth": 4, "iso_1_code": null, "iso_3_code": "reb", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1643", "native_tokenizers": [], @@ -2694,9 +3050,11 @@ }, { "name": "Riung", + "depth": 4, "iso_1_code": null, "iso_3_code": "riu", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1644", "native_tokenizers": [], @@ -2704,9 +3062,11 @@ }, { "name": "Rajong", + "depth": 4, "iso_1_code": null, "iso_3_code": "rjg", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1645", "native_tokenizers": [], @@ -2714,9 +3074,11 @@ }, { "name": "Rongga", + "depth": 4, "iso_1_code": null, "iso_3_code": "ror", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1646", "native_tokenizers": [], @@ -2724,9 +3086,11 @@ }, { "name": "Sika", + "depth": 4, "iso_1_code": null, "iso_3_code": "ski", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1647", "native_tokenizers": [], @@ -2734,9 +3098,11 @@ }, { "name": "Lamaholot", + "depth": 4, "iso_1_code": null, "iso_3_code": "slp", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1648", "native_tokenizers": [], @@ -2744,9 +3110,11 @@ }, { "name": "So\u2019a", + "depth": 4, "iso_1_code": null, "iso_3_code": "ssq", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1649", "native_tokenizers": [], @@ -2754,9 +3122,11 @@ }, { "name": "Wae Rana", + "depth": 4, "iso_1_code": null, "iso_3_code": "wrx", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1650", "native_tokenizers": [], @@ -2764,15 +3134,18 @@ }, { "name": "Ke\u2019o", + "depth": 4, "iso_1_code": null, "iso_3_code": "xxk", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1651", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -2788,25 +3161,30 @@ }, { "name": "Central Maluku", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ambelau", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ambelau", + "depth": 5, "iso_1_code": null, "iso_3_code": "amv", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1654", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "1653", "native_tokenizers": [], @@ -2814,14 +3192,17 @@ }, { "name": "Buru", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Lisela", + "depth": 5, "iso_1_code": null, "iso_3_code": "lcl", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1656", "native_tokenizers": [], @@ -2829,9 +3210,11 @@ }, { "name": "Buru", + "depth": 5, "iso_1_code": null, "iso_3_code": "mhs", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1657", "native_tokenizers": [], @@ -2839,15 +3222,18 @@ }, { "name": "Moksela", + "depth": 5, "iso_1_code": null, "iso_3_code": "vms", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1658", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "1655", "native_tokenizers": [], @@ -2855,14 +3241,17 @@ }, { "name": "East", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Manipa", + "depth": 5, "iso_1_code": null, "iso_3_code": "mqp", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1660", "native_tokenizers": [], @@ -2870,14 +3259,17 @@ }, { "name": "Banda-Geser", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Banda", + "depth": 6, "iso_1_code": null, "iso_3_code": "bnd", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1662", "native_tokenizers": [], @@ -2885,14 +3277,17 @@ }, { "name": "Geser-Gorom", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bati", + "depth": 7, "iso_1_code": null, "iso_3_code": "bvt", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1664", "native_tokenizers": [], @@ -2900,9 +3295,11 @@ }, { "name": "Geser-Gorom", + "depth": 7, "iso_1_code": null, "iso_3_code": "ges", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1665", "native_tokenizers": [], @@ -2910,21 +3307,25 @@ }, { "name": "Watubela", + "depth": 7, "iso_1_code": null, "iso_3_code": "wah", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1666", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "1663", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "1661", "native_tokenizers": [], @@ -2932,25 +3333,30 @@ }, { "name": "Seram", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bobot", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bobot", + "depth": 7, "iso_1_code": null, "iso_3_code": "bty", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1669", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "1668", "native_tokenizers": [], @@ -2958,20 +3364,24 @@ }, { "name": "East Seram", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Hoti", + "depth": 7, "iso_1_code": null, "iso_3_code": "hti", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1671", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "1670", "native_tokenizers": [], @@ -2979,14 +3389,17 @@ }, { "name": "Manusela-Seti", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Benggoi", + "depth": 7, "iso_1_code": null, "iso_3_code": "bgy", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1673", "native_tokenizers": [], @@ -2994,9 +3407,11 @@ }, { "name": "Huaulu", + "depth": 7, "iso_1_code": null, "iso_3_code": "hud", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1674", "native_tokenizers": [], @@ -3004,9 +3419,11 @@ }, { "name": "Salas", + "depth": 7, "iso_1_code": null, "iso_3_code": "sgu", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1675", "native_tokenizers": [], @@ -3014,9 +3431,11 @@ }, { "name": "Liana-Seti", + "depth": 7, "iso_1_code": null, "iso_3_code": "ste", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1676", "native_tokenizers": [], @@ -3024,15 +3443,18 @@ }, { "name": "Sou Upaa", + "depth": 7, "iso_1_code": null, "iso_3_code": "wha", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1677", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "1672", "native_tokenizers": [], @@ -3040,20 +3462,24 @@ }, { "name": "Masiwang", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Masiwang", + "depth": 7, "iso_1_code": null, "iso_3_code": "bnf", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1679", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "1678", "native_tokenizers": [], @@ -3061,25 +3487,30 @@ }, { "name": "Nunusaku", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kayeli", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kayeli", + "depth": 8, "iso_1_code": null, "iso_3_code": "kzl", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1682", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "1681", "native_tokenizers": [], @@ -3087,14 +3518,17 @@ }, { "name": "Piru Bay", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Haruku", + "depth": 8, "iso_1_code": null, "iso_3_code": "hrk", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1684", "native_tokenizers": [], @@ -3102,14 +3536,17 @@ }, { "name": "East", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kaibobo", + "depth": 9, "iso_1_code": null, "iso_3_code": "kzb", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1686", "native_tokenizers": [], @@ -3117,9 +3554,11 @@ }, { "name": "Sepa", + "depth": 9, "iso_1_code": null, "iso_3_code": "spb", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1687", "native_tokenizers": [], @@ -3127,9 +3566,11 @@ }, { "name": "Sou Nama", + "depth": 9, "iso_1_code": null, "iso_3_code": "tlt", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1688", "native_tokenizers": [], @@ -3137,19 +3578,23 @@ }, { "name": "Seram Straits", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ambon", + "depth": 10, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Hitu", + "depth": 11, "iso_1_code": null, "iso_3_code": "htu", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1691", "native_tokenizers": [], @@ -3157,9 +3602,11 @@ }, { "name": "Laha", + "depth": 11, "iso_1_code": null, "iso_3_code": "lhh", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1692", "native_tokenizers": [], @@ -3167,15 +3614,18 @@ }, { "name": "Tulehu", + "depth": 11, "iso_1_code": null, "iso_3_code": "tlu", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1693", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "1690", "native_tokenizers": [], @@ -3183,20 +3633,24 @@ }, { "name": "Solehua", + "depth": 10, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Paulohi", + "depth": 11, "iso_1_code": null, "iso_3_code": "plh", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1695", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "1694", "native_tokenizers": [], @@ -3204,24 +3658,29 @@ }, { "name": "Uliase", + "depth": 10, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Hatuhaha", + "depth": 11, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Elpaputi", + "depth": 12, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Amahai", + "depth": 13, "iso_1_code": null, "iso_3_code": "amq", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1699", "native_tokenizers": [], @@ -3229,15 +3688,18 @@ }, { "name": "Nusa Laut", + "depth": 13, "iso_1_code": null, "iso_3_code": "nul", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1700", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "1698", "native_tokenizers": [], @@ -3245,14 +3707,17 @@ }, { "name": "Saparua", + "depth": 12, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Latu", + "depth": 13, "iso_1_code": null, "iso_3_code": "ltu", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1702", "native_tokenizers": [], @@ -3260,21 +3725,25 @@ }, { "name": "Saparua", + "depth": 13, "iso_1_code": null, "iso_3_code": "spr", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1703", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "1701", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "1697", "native_tokenizers": [], @@ -3282,38 +3751,45 @@ }, { "name": "Kamarian", + "depth": 11, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kamarian", + "depth": 12, "iso_1_code": null, "iso_3_code": "kzx", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1705", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "1704", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "1696", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "1689", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "1685", "native_tokenizers": [], @@ -3321,19 +3797,23 @@ }, { "name": "West", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Asilulu", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Asilulu", + "depth": 10, "iso_1_code": null, "iso_3_code": "asl", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1708", "native_tokenizers": [], @@ -3341,15 +3821,18 @@ }, { "name": "Seit-Kaitetu", + "depth": 10, "iso_1_code": null, "iso_3_code": "hik", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1709", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "1707", "native_tokenizers": [], @@ -3357,14 +3840,17 @@ }, { "name": "Hoamoal", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Larike-Wakasihu", + "depth": 10, "iso_1_code": null, "iso_3_code": "alo", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1711", "native_tokenizers": [], @@ -3372,27 +3858,32 @@ }, { "name": "Boano", + "depth": 10, "iso_1_code": null, "iso_3_code": "bzn", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1712", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "1710", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "1706", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "1683", "native_tokenizers": [], @@ -3400,14 +3891,17 @@ }, { "name": "Three Rivers", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Yalahatan", + "depth": 8, "iso_1_code": null, "iso_3_code": "jal", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1714", "native_tokenizers": [], @@ -3415,19 +3909,23 @@ }, { "name": "Amalumute", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Northwest Seram", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Luhu", + "depth": 10, "iso_1_code": null, "iso_3_code": "lcq", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1717", "native_tokenizers": [], @@ -3435,9 +3933,11 @@ }, { "name": "Lisabata-Nuniali", + "depth": 10, "iso_1_code": null, "iso_3_code": "lcs", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1718", "native_tokenizers": [], @@ -3445,20 +3945,24 @@ }, { "name": "Hulung", + "depth": 10, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Hulung", + "depth": 11, "iso_1_code": null, "iso_3_code": "huk", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1720", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "1719", "native_tokenizers": [], @@ -3466,20 +3970,24 @@ }, { "name": "Loun", + "depth": 10, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Loun", + "depth": 11, "iso_1_code": null, "iso_3_code": "lox", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1722", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "1721", "native_tokenizers": [], @@ -3487,14 +3995,17 @@ }, { "name": "Ulat Inai", + "depth": 10, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Alune", + "depth": 11, "iso_1_code": null, "iso_3_code": "alp", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -3512,15 +4023,18 @@ }, { "name": "Naka\u2019ela", + "depth": 11, "iso_1_code": null, "iso_3_code": "nae", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1725", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -3535,6 +4049,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -3549,6 +4064,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -3564,26 +4080,31 @@ }, { "name": "Wemale", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Wemale", + "depth": 9, "iso_1_code": null, "iso_3_code": "weo", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1727", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "1726", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -3598,6 +4119,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -3613,14 +4135,17 @@ }, { "name": "Sawai-Nuaulu", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nuaulu, North", + "depth": 7, "iso_1_code": null, "iso_3_code": "nni", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1729", "native_tokenizers": [], @@ -3628,9 +4153,11 @@ }, { "name": "Nuaulu, South", + "depth": 7, "iso_1_code": null, "iso_3_code": "nxl", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1730", "native_tokenizers": [], @@ -3638,21 +4165,25 @@ }, { "name": "Saleman", + "depth": 7, "iso_1_code": null, "iso_3_code": "sau", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1731", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "1728", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -3667,6 +4198,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -3682,14 +4214,17 @@ }, { "name": "Sula", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mangole", + "depth": 5, "iso_1_code": null, "iso_3_code": "mqc", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1733", "native_tokenizers": [], @@ -3697,9 +4232,11 @@ }, { "name": "Sula", + "depth": 5, "iso_1_code": null, "iso_3_code": "szn", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1734", "native_tokenizers": [], @@ -3707,14 +4244,17 @@ }, { "name": "Taliabo", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kadai", + "depth": 6, "iso_1_code": null, "iso_3_code": "kzd", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1736", "native_tokenizers": [], @@ -3722,27 +4262,32 @@ }, { "name": "Taliabu", + "depth": 6, "iso_1_code": null, "iso_3_code": "tlv", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1737", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "1735", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "1732", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -3758,39 +4303,47 @@ }, { "name": "Eastern Malayo-Polynesian", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Oceanic", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Admiralty Islands", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Eastern", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Manus", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "East", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Andra-Hus", + "depth": 9, "iso_1_code": null, "iso_3_code": "anx", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1744", "native_tokenizers": [], @@ -3798,9 +4351,11 @@ }, { "name": "Elu", + "depth": 9, "iso_1_code": null, "iso_3_code": "elu", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1745", "native_tokenizers": [], @@ -3808,9 +4363,11 @@ }, { "name": "Kurti", + "depth": 9, "iso_1_code": null, "iso_3_code": "ktm", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -3828,9 +4385,11 @@ }, { "name": "Koro", + "depth": 9, "iso_1_code": null, "iso_3_code": "kxr", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1747", "native_tokenizers": [], @@ -3838,9 +4397,11 @@ }, { "name": "Leipon", + "depth": 9, "iso_1_code": null, "iso_3_code": "lek", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1748", "native_tokenizers": [], @@ -3848,9 +4409,11 @@ }, { "name": "Lele", + "depth": 9, "iso_1_code": null, "iso_3_code": "lle", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1749", "native_tokenizers": [], @@ -3858,9 +4421,11 @@ }, { "name": "Ponam", + "depth": 9, "iso_1_code": null, "iso_3_code": "ncc", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1750", "native_tokenizers": [], @@ -3868,9 +4433,11 @@ }, { "name": "Nali", + "depth": 9, "iso_1_code": null, "iso_3_code": "nss", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -3888,9 +4455,11 @@ }, { "name": "Kele", + "depth": 9, "iso_1_code": null, "iso_3_code": "sbc", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1752", "native_tokenizers": [], @@ -3898,9 +4467,11 @@ }, { "name": "Titan", + "depth": 9, "iso_1_code": null, "iso_3_code": "ttv", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1753", "native_tokenizers": [], @@ -3908,15 +4479,18 @@ }, { "name": "Ere", + "depth": 9, "iso_1_code": null, "iso_3_code": "twp", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1754", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -3932,14 +4506,17 @@ }, { "name": "Mokoreng-Loniu", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Loniu", + "depth": 9, "iso_1_code": null, "iso_3_code": "los", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1756", "native_tokenizers": [], @@ -3947,15 +4524,18 @@ }, { "name": "Idio", + "depth": 9, "iso_1_code": null, "iso_3_code": "mft", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1757", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "1755", "native_tokenizers": [], @@ -3963,14 +4543,17 @@ }, { "name": "West", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bipi", + "depth": 9, "iso_1_code": null, "iso_3_code": "biq", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1759", "native_tokenizers": [], @@ -3978,9 +4561,11 @@ }, { "name": "Likum", + "depth": 9, "iso_1_code": null, "iso_3_code": "lib", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1760", "native_tokenizers": [], @@ -3988,9 +4573,11 @@ }, { "name": "Nyindrou", + "depth": 9, "iso_1_code": null, "iso_3_code": "lid", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -4008,9 +4595,11 @@ }, { "name": "Hermit", + "depth": 9, "iso_1_code": null, "iso_3_code": "llf", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1762", "native_tokenizers": [], @@ -4018,9 +4607,11 @@ }, { "name": "Mondropolon", + "depth": 9, "iso_1_code": null, "iso_3_code": "npn", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1763", "native_tokenizers": [], @@ -4028,9 +4619,11 @@ }, { "name": "Tulu-Bohuai", + "depth": 9, "iso_1_code": null, "iso_3_code": "rak", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1764", "native_tokenizers": [], @@ -4038,9 +4631,11 @@ }, { "name": "Sori-Harengan", + "depth": 9, "iso_1_code": null, "iso_3_code": "sbh", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1765", "native_tokenizers": [], @@ -4048,15 +4643,18 @@ }, { "name": "Khehek", + "depth": 9, "iso_1_code": null, "iso_3_code": "tlx", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1766", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -4071,6 +4669,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -4086,20 +4685,24 @@ }, { "name": "Pak-Tong", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Pak-Tong", + "depth": 8, "iso_1_code": null, "iso_3_code": "pkg", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1768", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "1767", "native_tokenizers": [], @@ -4107,14 +4710,17 @@ }, { "name": "Southeast Islands", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Paluai", + "depth": 8, "iso_1_code": null, "iso_3_code": "blq", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1770", "native_tokenizers": [], @@ -4122,9 +4728,11 @@ }, { "name": "Lenkau", + "depth": 8, "iso_1_code": null, "iso_3_code": "ler", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1771", "native_tokenizers": [], @@ -4132,9 +4740,11 @@ }, { "name": "Lou", + "depth": 8, "iso_1_code": null, "iso_3_code": "loj", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1772", "native_tokenizers": [], @@ -4142,9 +4752,11 @@ }, { "name": "Neherneh", + "depth": 8, "iso_1_code": null, "iso_3_code": "ncn", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1773", "native_tokenizers": [], @@ -4152,21 +4764,25 @@ }, { "name": "Penchal", + "depth": 8, "iso_1_code": null, "iso_3_code": "pek", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1774", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "1769", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -4182,14 +4798,17 @@ }, { "name": "Western", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kaniet", + "depth": 7, "iso_1_code": null, "iso_3_code": "ktk", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1776", "native_tokenizers": [], @@ -4197,9 +4816,11 @@ }, { "name": "Seimat", + "depth": 7, "iso_1_code": null, "iso_3_code": "ssg", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -4217,9 +4838,11 @@ }, { "name": "Wuvulu-Aua", + "depth": 7, "iso_1_code": null, "iso_3_code": "wuv", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -4236,6 +4859,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -4250,6 +4874,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -4265,34 +4890,41 @@ }, { "name": "Central-Eastern Oceanic", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Remote Oceanic", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Central Pacific", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "East Fijian-Polynesian", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "East Fijian", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Fijian", + "depth": 10, "iso_1_code": "fj", "iso_3_code": "fij", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -4310,9 +4942,11 @@ }, { "name": "Gone Dau", + "depth": 10, "iso_1_code": null, "iso_3_code": "goo", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1785", "native_tokenizers": [], @@ -4320,9 +4954,11 @@ }, { "name": "Lauan", + "depth": 10, "iso_1_code": null, "iso_3_code": "llx", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1786", "native_tokenizers": [], @@ -4330,15 +4966,18 @@ }, { "name": "Lomaiviti", + "depth": 10, "iso_1_code": null, "iso_3_code": "lmv", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1787", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -4354,29 +4993,35 @@ }, { "name": "Polynesian", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nuclear", + "depth": 10, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "East", + "depth": 11, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Central", + "depth": 12, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Rapa", + "depth": 13, "iso_1_code": null, "iso_3_code": "ray", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1792", "native_tokenizers": [], @@ -4384,14 +5029,17 @@ }, { "name": "Marquesic", + "depth": 13, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Hawaiian", + "depth": 14, "iso_1_code": null, "iso_3_code": "haw", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -4409,9 +5057,11 @@ }, { "name": "Marquesan, South", + "depth": 14, "iso_1_code": null, "iso_3_code": "mqm", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1795", "native_tokenizers": [], @@ -4419,9 +5069,11 @@ }, { "name": "Marquesan, North", + "depth": 14, "iso_1_code": null, "iso_3_code": "mrq", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -4439,9 +5091,11 @@ }, { "name": "Mangareva", + "depth": 14, "iso_1_code": null, "iso_3_code": "mrv", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -4458,6 +5112,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -4473,14 +5128,17 @@ }, { "name": "Tahitic", + "depth": 13, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Austral", + "depth": 14, "iso_1_code": null, "iso_3_code": "aut", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1799", "native_tokenizers": [], @@ -4488,9 +5146,11 @@ }, { "name": "Maori", + "depth": 14, "iso_1_code": "mi", "iso_3_code": "mri", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -4508,9 +5168,11 @@ }, { "name": "Tuamotuan", + "depth": 14, "iso_1_code": null, "iso_3_code": "pmt", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1801", "native_tokenizers": [], @@ -4518,9 +5180,11 @@ }, { "name": "Penrhyn", + "depth": 14, "iso_1_code": null, "iso_3_code": "pnh", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1802", "native_tokenizers": [], @@ -4528,9 +5192,11 @@ }, { "name": "Cook Islands Maori", + "depth": 14, "iso_1_code": null, "iso_3_code": "rar", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -4548,9 +5214,11 @@ }, { "name": "Rakahanga-Manihiki", + "depth": 14, "iso_1_code": null, "iso_3_code": "rkh", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1804", "native_tokenizers": [], @@ -4558,9 +5226,11 @@ }, { "name": "Moriori", + "depth": 14, "iso_1_code": null, "iso_3_code": "rrm", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1805", "native_tokenizers": [], @@ -4568,9 +5238,11 @@ }, { "name": "Tahitian", + "depth": 14, "iso_1_code": "ty", "iso_3_code": "tah", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -4587,6 +5259,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -4601,6 +5274,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -4616,14 +5290,17 @@ }, { "name": "Rapanui", + "depth": 12, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Rapa Nui", + "depth": 13, "iso_1_code": null, "iso_3_code": "rap", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -4640,6 +5317,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -4654,6 +5332,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -4669,19 +5348,23 @@ }, { "name": "Samoic-Outlier", + "depth": 11, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "East Uvean-Niuafo\u2019ou", + "depth": 12, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Niuatoputapu", + "depth": 13, "iso_1_code": null, "iso_3_code": "nkp", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1811", "native_tokenizers": [], @@ -4689,9 +5372,11 @@ }, { "name": "Niuafo\u2019ou", + "depth": 13, "iso_1_code": null, "iso_3_code": "num", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1812", "native_tokenizers": [], @@ -4699,9 +5384,11 @@ }, { "name": "Wallisian", + "depth": 13, "iso_1_code": null, "iso_3_code": "wls", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -4718,6 +5405,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -4733,14 +5421,17 @@ }, { "name": "Ellicean", + "depth": 12, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kapingamarangi", + "depth": 13, "iso_1_code": null, "iso_3_code": "kpg", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -4758,9 +5449,11 @@ }, { "name": "Takuu", + "depth": 13, "iso_1_code": null, "iso_3_code": "nho", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -4778,9 +5471,11 @@ }, { "name": "Nukuoro", + "depth": 13, "iso_1_code": null, "iso_3_code": "nkr", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1817", "native_tokenizers": [], @@ -4788,9 +5483,11 @@ }, { "name": "Nukumanu", + "depth": 13, "iso_1_code": null, "iso_3_code": "nuq", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1818", "native_tokenizers": [], @@ -4798,9 +5495,11 @@ }, { "name": "Nukeria", + "depth": 13, "iso_1_code": null, "iso_3_code": "nur", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1819", "native_tokenizers": [], @@ -4808,9 +5507,11 @@ }, { "name": "Ontong Java", + "depth": 13, "iso_1_code": null, "iso_3_code": "ojv", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1820", "native_tokenizers": [], @@ -4818,9 +5519,11 @@ }, { "name": "Sikaiana", + "depth": 13, "iso_1_code": null, "iso_3_code": "sky", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1821", "native_tokenizers": [], @@ -4828,9 +5531,11 @@ }, { "name": "Tuvaluan", + "depth": 13, "iso_1_code": null, "iso_3_code": "tvl", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -4847,6 +5552,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -4862,14 +5568,17 @@ }, { "name": "Futunic", + "depth": 12, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Anuta", + "depth": 13, "iso_1_code": null, "iso_3_code": "aud", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1824", "native_tokenizers": [], @@ -4877,9 +5586,11 @@ }, { "name": "Futuna, East", + "depth": 13, "iso_1_code": null, "iso_3_code": "fud", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -4897,9 +5608,11 @@ }, { "name": "Futuna-Aniwa", + "depth": 13, "iso_1_code": null, "iso_3_code": "fut", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1826", "native_tokenizers": [], @@ -4907,9 +5620,11 @@ }, { "name": "Emae", + "depth": 13, "iso_1_code": null, "iso_3_code": "mmw", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1827", "native_tokenizers": [], @@ -4917,9 +5632,11 @@ }, { "name": "Rennell-Bellona", + "depth": 13, "iso_1_code": null, "iso_3_code": "mnv", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1828", "native_tokenizers": [], @@ -4927,9 +5644,11 @@ }, { "name": "Mele-Fila", + "depth": 13, "iso_1_code": null, "iso_3_code": "mxe", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1829", "native_tokenizers": [], @@ -4937,9 +5656,11 @@ }, { "name": "Vaeakau-Taumako", + "depth": 13, "iso_1_code": null, "iso_3_code": "piv", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1830", "native_tokenizers": [], @@ -4947,9 +5668,11 @@ }, { "name": "Tikopia", + "depth": 13, "iso_1_code": null, "iso_3_code": "tkp", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1831", "native_tokenizers": [], @@ -4957,15 +5680,18 @@ }, { "name": "Fagauvea", + "depth": 13, "iso_1_code": null, "iso_3_code": "uve", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1832", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -4981,20 +5707,24 @@ }, { "name": "Pukapuka", + "depth": 12, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Pukapuka", + "depth": 13, "iso_1_code": null, "iso_3_code": "pkp", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1834", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "1833", "native_tokenizers": [], @@ -5002,14 +5732,17 @@ }, { "name": "Samoan", + "depth": 12, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Samoan", + "depth": 13, "iso_1_code": "sm", "iso_3_code": "smo", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -5026,6 +5759,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -5041,14 +5775,17 @@ }, { "name": "Tokelauan", + "depth": 12, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tokelauan", + "depth": 13, "iso_1_code": null, "iso_3_code": "tkl", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -5065,6 +5802,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -5079,6 +5817,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -5093,6 +5832,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -5108,14 +5848,17 @@ }, { "name": "Tongic", + "depth": 10, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Niue", + "depth": 11, "iso_1_code": null, "iso_3_code": "niu", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -5133,9 +5876,11 @@ }, { "name": "Tongan", + "depth": 11, "iso_1_code": "to", "iso_3_code": "ton", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -5152,6 +5897,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -5166,6 +5912,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -5180,6 +5927,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -5195,19 +5943,23 @@ }, { "name": "West Fijian-Rotuman", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Rotuman", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Rotuman", + "depth": 10, "iso_1_code": null, "iso_3_code": "rtm", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -5224,6 +5976,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -5239,14 +5992,17 @@ }, { "name": "West Fijian", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Namosi-Naitasiri-Serua", + "depth": 10, "iso_1_code": null, "iso_3_code": "bwb", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1846", "native_tokenizers": [], @@ -5254,21 +6010,25 @@ }, { "name": "Fijian, Western", + "depth": 10, "iso_1_code": null, "iso_3_code": "wyy", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1847", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "1845", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -5283,6 +6043,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -5298,14 +6059,17 @@ }, { "name": "Loyalty Islands", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Drehu", + "depth": 8, "iso_1_code": null, "iso_3_code": "dhv", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -5323,9 +6087,11 @@ }, { "name": "Iaai", + "depth": 8, "iso_1_code": null, "iso_3_code": "iai", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1850", "native_tokenizers": [], @@ -5333,15 +6099,18 @@ }, { "name": "Nengone", + "depth": 8, "iso_1_code": null, "iso_3_code": "nen", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1851", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -5357,24 +6126,29 @@ }, { "name": "Micronesian", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Micronesian Proper", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ikiribati", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kiribati", + "depth": 10, "iso_1_code": null, "iso_3_code": "gil", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -5391,6 +6165,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -5406,14 +6181,17 @@ }, { "name": "Kusaiean", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kosraean", + "depth": 10, "iso_1_code": null, "iso_3_code": "kos", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -5430,6 +6208,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -5445,14 +6224,17 @@ }, { "name": "Marshallese", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Marshallese", + "depth": 10, "iso_1_code": "mh", "iso_3_code": "mah", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -5469,6 +6251,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -5484,19 +6267,23 @@ }, { "name": "Pohnpeic-Chuukic", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chuukic", + "depth": 10, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Carolinian", + "depth": 11, "iso_1_code": null, "iso_3_code": "cal", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1862", "native_tokenizers": [], @@ -5504,9 +6291,11 @@ }, { "name": "Chuukese", + "depth": 11, "iso_1_code": null, "iso_3_code": "chk", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -5524,9 +6313,11 @@ }, { "name": "Mapia", + "depth": 11, "iso_1_code": null, "iso_3_code": "mpy", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1864", "native_tokenizers": [], @@ -5534,9 +6325,11 @@ }, { "name": "Mortlockese", + "depth": 11, "iso_1_code": null, "iso_3_code": "mrl", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1865", "native_tokenizers": [], @@ -5544,9 +6337,11 @@ }, { "name": "Namonuito", + "depth": 11, "iso_1_code": null, "iso_3_code": "nmt", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1866", "native_tokenizers": [], @@ -5554,9 +6349,11 @@ }, { "name": "P\u00e1\u00e1fang", + "depth": 11, "iso_1_code": null, "iso_3_code": "pfa", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1867", "native_tokenizers": [], @@ -5564,9 +6361,11 @@ }, { "name": "Puluwatese", + "depth": 11, "iso_1_code": null, "iso_3_code": "puw", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1868", "native_tokenizers": [], @@ -5574,9 +6373,11 @@ }, { "name": "Sonsorolese", + "depth": 11, "iso_1_code": null, "iso_3_code": "sov", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1869", "native_tokenizers": [], @@ -5584,9 +6385,11 @@ }, { "name": "Satawalese", + "depth": 11, "iso_1_code": null, "iso_3_code": "stw", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1870", "native_tokenizers": [], @@ -5594,9 +6397,11 @@ }, { "name": "Tobian", + "depth": 11, "iso_1_code": null, "iso_3_code": "tox", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1871", "native_tokenizers": [], @@ -5604,9 +6409,11 @@ }, { "name": "Tanapag", + "depth": 11, "iso_1_code": null, "iso_3_code": "tpv", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1872", "native_tokenizers": [], @@ -5614,9 +6421,11 @@ }, { "name": "Ulithian", + "depth": 11, "iso_1_code": null, "iso_3_code": "uli", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1873", "native_tokenizers": [], @@ -5624,15 +6433,18 @@ }, { "name": "Woleaian", + "depth": 11, "iso_1_code": null, "iso_3_code": "woe", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1874", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -5648,14 +6460,17 @@ }, { "name": "Pohnpeic", + "depth": 10, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mokilese", + "depth": 11, "iso_1_code": null, "iso_3_code": "mkj", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1876", "native_tokenizers": [], @@ -5663,9 +6478,11 @@ }, { "name": "Pingelapese", + "depth": 11, "iso_1_code": null, "iso_3_code": "pif", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1877", "native_tokenizers": [], @@ -5673,9 +6490,11 @@ }, { "name": "Pohnpeian", + "depth": 11, "iso_1_code": null, "iso_3_code": "pon", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -5692,6 +6511,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -5706,6 +6526,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -5720,6 +6541,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -5735,26 +6557,31 @@ }, { "name": "Nauruan", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nauruan", + "depth": 9, "iso_1_code": "na", "iso_3_code": "nau", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1880", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "1879", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -5770,25 +6597,30 @@ }, { "name": "New Caledonian", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Haekic", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Haeke", + "depth": 9, "iso_1_code": null, "iso_3_code": "aek", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1883", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "1882", "native_tokenizers": [], @@ -5796,14 +6628,17 @@ }, { "name": "Northern", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Haveke", + "depth": 9, "iso_1_code": null, "iso_3_code": "hvk", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1885", "native_tokenizers": [], @@ -5811,9 +6646,11 @@ }, { "name": "Vamale", + "depth": 9, "iso_1_code": null, "iso_3_code": "mkt", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1886", "native_tokenizers": [], @@ -5821,14 +6658,17 @@ }, { "name": "Central", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Cemuh\u00ee", + "depth": 10, "iso_1_code": null, "iso_3_code": "cam", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1888", "native_tokenizers": [], @@ -5836,9 +6676,11 @@ }, { "name": "Paic\u00ee", + "depth": 10, "iso_1_code": null, "iso_3_code": "pri", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -5855,6 +6697,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -5870,14 +6713,17 @@ }, { "name": "Extreme Northern", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Caac", + "depth": 10, "iso_1_code": null, "iso_3_code": "msq", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1891", "native_tokenizers": [], @@ -5885,9 +6731,11 @@ }, { "name": "N\u00eal\u00eamwa-Nixumwak", + "depth": 10, "iso_1_code": null, "iso_3_code": "nee", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1892", "native_tokenizers": [], @@ -5895,9 +6743,11 @@ }, { "name": "Yuanga", + "depth": 10, "iso_1_code": null, "iso_3_code": "nua", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1893", "native_tokenizers": [], @@ -5905,15 +6755,18 @@ }, { "name": "Nyel\u00e2yu", + "depth": 10, "iso_1_code": null, "iso_3_code": "yly", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1894", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "1890", "native_tokenizers": [], @@ -5921,14 +6774,17 @@ }, { "name": "North", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Pwaamei", + "depth": 10, "iso_1_code": null, "iso_3_code": "pme", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1896", "native_tokenizers": [], @@ -5936,9 +6792,11 @@ }, { "name": "Pwapw\u00e2", + "depth": 10, "iso_1_code": null, "iso_3_code": "pop", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1897", "native_tokenizers": [], @@ -5946,14 +6804,17 @@ }, { "name": "Hmwaveke", + "depth": 10, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bwatoo", + "depth": 11, "iso_1_code": null, "iso_3_code": "bwa", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1899", "native_tokenizers": [], @@ -5961,9 +6822,11 @@ }, { "name": "Hmwaveke", + "depth": 11, "iso_1_code": null, "iso_3_code": "mrk", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1900", "native_tokenizers": [], @@ -5971,15 +6834,18 @@ }, { "name": "Waamwang", + "depth": 11, "iso_1_code": null, "iso_3_code": "wmn", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1901", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "1898", "native_tokenizers": [], @@ -5987,14 +6853,17 @@ }, { "name": "Nemi", + "depth": 10, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Fw\u00e2i", + "depth": 11, "iso_1_code": null, "iso_3_code": "fwa", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1903", "native_tokenizers": [], @@ -6002,9 +6871,11 @@ }, { "name": "Jawe", + "depth": 11, "iso_1_code": null, "iso_3_code": "jaz", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1904", "native_tokenizers": [], @@ -6012,9 +6883,11 @@ }, { "name": "Nemi", + "depth": 11, "iso_1_code": null, "iso_3_code": "nem", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1905", "native_tokenizers": [], @@ -6022,27 +6895,32 @@ }, { "name": "Pije", + "depth": 11, "iso_1_code": null, "iso_3_code": "piz", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1906", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "1902", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "1895", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -6058,19 +6936,23 @@ }, { "name": "Southern", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Extreme Southern", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Drubea", + "depth": 10, "iso_1_code": null, "iso_3_code": "duf", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1909", "native_tokenizers": [], @@ -6078,15 +6960,18 @@ }, { "name": "Num\u00e8\u00e8", + "depth": 10, "iso_1_code": null, "iso_3_code": "kdk", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1910", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "1908", "native_tokenizers": [], @@ -6094,19 +6979,23 @@ }, { "name": "South", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Wailic", + "depth": 10, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Aji\u00eb", + "depth": 11, "iso_1_code": null, "iso_3_code": "aji", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -6124,9 +7013,11 @@ }, { "name": "Arh\u00f6", + "depth": 11, "iso_1_code": null, "iso_3_code": "aok", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1914", "native_tokenizers": [], @@ -6134,9 +7025,11 @@ }, { "name": "Arh\u00e2", + "depth": 11, "iso_1_code": null, "iso_3_code": "aqr", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1915", "native_tokenizers": [], @@ -6144,9 +7037,11 @@ }, { "name": "Orowe", + "depth": 11, "iso_1_code": null, "iso_3_code": "bpk", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1916", "native_tokenizers": [], @@ -6154,15 +7049,18 @@ }, { "name": "Neku", + "depth": 11, "iso_1_code": null, "iso_3_code": "nek", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1917", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -6178,14 +7076,17 @@ }, { "name": "Xaracuu-Xaragure", + "depth": 10, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "X\u00e2r\u00e2c\u00f9\u00f9", + "depth": 11, "iso_1_code": null, "iso_3_code": "ane", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1919", "native_tokenizers": [], @@ -6193,15 +7094,18 @@ }, { "name": "X\u00e2r\u00e2gur\u00e8", + "depth": 11, "iso_1_code": null, "iso_3_code": "axx", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1920", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "1918", "native_tokenizers": [], @@ -6209,14 +7113,17 @@ }, { "name": "Zire-Tiri", + "depth": 10, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "T\u00eer\u00ee", + "depth": 11, "iso_1_code": null, "iso_3_code": "cir", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1922", "native_tokenizers": [], @@ -6224,21 +7131,25 @@ }, { "name": "S\u00eesh\u00eb\u00eb", + "depth": 11, "iso_1_code": null, "iso_3_code": "sih", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1923", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "1921", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -6253,6 +7164,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -6267,6 +7179,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -6282,30 +7195,36 @@ }, { "name": "North and Central Vanuatu", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "East Santo", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "North", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "N\u2019kep", + "depth": 10, "iso_1_code": null, "iso_3_code": "sku", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1927", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "1926", "native_tokenizers": [], @@ -6313,14 +7232,17 @@ }, { "name": "South", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Butmas-Tur", + "depth": 10, "iso_1_code": null, "iso_3_code": "bnr", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1929", "native_tokenizers": [], @@ -6328,9 +7250,11 @@ }, { "name": "Lorediakarkar", + "depth": 10, "iso_1_code": null, "iso_3_code": "lnn", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1930", "native_tokenizers": [], @@ -6338,9 +7262,11 @@ }, { "name": "Atin", + "depth": 10, "iso_1_code": null, "iso_3_code": "plb", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1931", "native_tokenizers": [], @@ -6348,21 +7274,25 @@ }, { "name": "Ngen", + "depth": 10, "iso_1_code": null, "iso_3_code": "ssv", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1932", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "1928", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "1925", "native_tokenizers": [], @@ -6370,25 +7300,30 @@ }, { "name": "Malekula Interior", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Labo", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ninde", + "depth": 10, "iso_1_code": null, "iso_3_code": "mwi", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1935", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "1934", "native_tokenizers": [], @@ -6396,14 +7331,17 @@ }, { "name": "Malekula Central", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Neverver", + "depth": 10, "iso_1_code": null, "iso_3_code": "lgk", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1937", "native_tokenizers": [], @@ -6411,9 +7349,11 @@ }, { "name": "Larevat", + "depth": 10, "iso_1_code": null, "iso_3_code": "lrv", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1938", "native_tokenizers": [], @@ -6421,9 +7361,11 @@ }, { "name": "Litzlitz", + "depth": 10, "iso_1_code": null, "iso_3_code": "lzl", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1939", "native_tokenizers": [], @@ -6431,9 +7373,11 @@ }, { "name": "Maragus", + "depth": 10, "iso_1_code": null, "iso_3_code": "mrs", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1940", "native_tokenizers": [], @@ -6441,9 +7385,11 @@ }, { "name": "V\u2019\u00ebnen Taut", + "depth": 10, "iso_1_code": null, "iso_3_code": "nmb", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1941", "native_tokenizers": [], @@ -6451,9 +7397,11 @@ }, { "name": "Nasarian", + "depth": 10, "iso_1_code": null, "iso_3_code": "nvh", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1942", "native_tokenizers": [], @@ -6461,9 +7409,11 @@ }, { "name": "Avava", + "depth": 10, "iso_1_code": null, "iso_3_code": "tmb", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1943", "native_tokenizers": [], @@ -6471,15 +7421,18 @@ }, { "name": "Neve\u2019ei", + "depth": 10, "iso_1_code": null, "iso_3_code": "vnm", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1944", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "1936", "native_tokenizers": [], @@ -6487,14 +7440,17 @@ }, { "name": "Small Nambas", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dixon Reef", + "depth": 10, "iso_1_code": null, "iso_3_code": "dix", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1946", "native_tokenizers": [], @@ -6502,9 +7458,11 @@ }, { "name": "Letemboi", + "depth": 10, "iso_1_code": null, "iso_3_code": "nms", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1947", "native_tokenizers": [], @@ -6512,21 +7470,25 @@ }, { "name": "Repanbitip", + "depth": 10, "iso_1_code": null, "iso_3_code": "rpn", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1948", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "1945", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "1933", "native_tokenizers": [], @@ -6534,19 +7496,23 @@ }, { "name": "Northeast Vanuatu-Banks Islands", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Central Vanuatu", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Efate, South", + "depth": 10, "iso_1_code": null, "iso_3_code": "erk", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1951", "native_tokenizers": [], @@ -6554,9 +7520,11 @@ }, { "name": "Eton", + "depth": 10, "iso_1_code": null, "iso_3_code": "etn", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1952", "native_tokenizers": [], @@ -6564,9 +7532,11 @@ }, { "name": "Efate, North", + "depth": 10, "iso_1_code": null, "iso_3_code": "llp", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1953", "native_tokenizers": [], @@ -6574,9 +7544,11 @@ }, { "name": "Lelepa", + "depth": 10, "iso_1_code": null, "iso_3_code": "lpa", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1954", "native_tokenizers": [], @@ -6584,15 +7556,18 @@ }, { "name": "Namakura", + "depth": 10, "iso_1_code": null, "iso_3_code": "nmk", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1955", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "1950", "native_tokenizers": [], @@ -6600,14 +7575,17 @@ }, { "name": "East Vanuatu", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Apma", + "depth": 10, "iso_1_code": null, "iso_3_code": "app", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1957", "native_tokenizers": [], @@ -6615,9 +7593,11 @@ }, { "name": "Daakaka", + "depth": 10, "iso_1_code": null, "iso_3_code": "bpa", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1958", "native_tokenizers": [], @@ -6625,9 +7605,11 @@ }, { "name": "Baetora", + "depth": 10, "iso_1_code": null, "iso_3_code": "btr", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1959", "native_tokenizers": [], @@ -6635,9 +7617,11 @@ }, { "name": "Lonwolwol", + "depth": 10, "iso_1_code": null, "iso_3_code": "crc", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1960", "native_tokenizers": [], @@ -6645,9 +7629,11 @@ }, { "name": "Fanbak", + "depth": 10, "iso_1_code": null, "iso_3_code": "fnb", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1961", "native_tokenizers": [], @@ -6655,9 +7641,11 @@ }, { "name": "Hiw", + "depth": 10, "iso_1_code": null, "iso_3_code": "hiw", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1962", "native_tokenizers": [], @@ -6665,9 +7653,11 @@ }, { "name": "Koro", + "depth": 10, "iso_1_code": null, "iso_3_code": "krf", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1963", "native_tokenizers": [], @@ -6675,9 +7665,11 @@ }, { "name": "Lo-Toga", + "depth": 10, "iso_1_code": null, "iso_3_code": "lht", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1964", "native_tokenizers": [], @@ -6685,9 +7677,11 @@ }, { "name": "Lakon", + "depth": 10, "iso_1_code": null, "iso_3_code": "lkn", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1965", "native_tokenizers": [], @@ -6695,9 +7689,11 @@ }, { "name": "Hano", + "depth": 10, "iso_1_code": null, "iso_3_code": "lml", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1966", "native_tokenizers": [], @@ -6705,9 +7701,11 @@ }, { "name": "Lemerig", + "depth": 10, "iso_1_code": null, "iso_3_code": "lrz", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1967", "native_tokenizers": [], @@ -6715,9 +7713,11 @@ }, { "name": "Mwotlap", + "depth": 10, "iso_1_code": null, "iso_3_code": "mlv", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1968", "native_tokenizers": [], @@ -6725,9 +7725,11 @@ }, { "name": "Ambrym, North", + "depth": 10, "iso_1_code": null, "iso_3_code": "mmg", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1969", "native_tokenizers": [], @@ -6735,9 +7737,11 @@ }, { "name": "Marino", + "depth": 10, "iso_1_code": null, "iso_3_code": "mrb", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1970", "native_tokenizers": [], @@ -6745,9 +7749,11 @@ }, { "name": "Mwerlap", + "depth": 10, "iso_1_code": null, "iso_3_code": "mrm", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1971", "native_tokenizers": [], @@ -6755,9 +7761,11 @@ }, { "name": "Vur\u00ebs", + "depth": 10, "iso_1_code": null, "iso_3_code": "msn", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1972", "native_tokenizers": [], @@ -6765,9 +7773,11 @@ }, { "name": "Mota", + "depth": 10, "iso_1_code": null, "iso_3_code": "mtt", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1973", "native_tokenizers": [], @@ -6775,9 +7785,11 @@ }, { "name": "Maewo, Central", + "depth": 10, "iso_1_code": null, "iso_3_code": "mwo", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1974", "native_tokenizers": [], @@ -6785,9 +7797,11 @@ }, { "name": "Ambae, West", + "depth": 10, "iso_1_code": null, "iso_3_code": "nnd", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1975", "native_tokenizers": [], @@ -6795,9 +7809,11 @@ }, { "name": "Olrat", + "depth": 10, "iso_1_code": null, "iso_3_code": "olr", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1976", "native_tokenizers": [], @@ -6805,9 +7821,11 @@ }, { "name": "Ambae, East", + "depth": 10, "iso_1_code": null, "iso_3_code": "omb", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -6825,9 +7843,11 @@ }, { "name": "Paama", + "depth": 10, "iso_1_code": null, "iso_3_code": "pma", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -6845,9 +7865,11 @@ }, { "name": "Port Vato", + "depth": 10, "iso_1_code": null, "iso_3_code": "ptv", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1979", "native_tokenizers": [], @@ -6855,9 +7877,11 @@ }, { "name": "Sa", + "depth": 10, "iso_1_code": null, "iso_3_code": "sax", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1980", "native_tokenizers": [], @@ -6865,9 +7889,11 @@ }, { "name": "Ske", + "depth": 10, "iso_1_code": null, "iso_3_code": "ske", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1981", "native_tokenizers": [], @@ -6875,9 +7901,11 @@ }, { "name": "Sowa", + "depth": 10, "iso_1_code": null, "iso_3_code": "sww", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1982", "native_tokenizers": [], @@ -6885,9 +7913,11 @@ }, { "name": "Nume", + "depth": 10, "iso_1_code": null, "iso_3_code": "tgs", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1983", "native_tokenizers": [], @@ -6895,9 +7925,11 @@ }, { "name": "Lehali", + "depth": 10, "iso_1_code": null, "iso_3_code": "tql", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1984", "native_tokenizers": [], @@ -6905,9 +7937,11 @@ }, { "name": "Ambrym, Southeast", + "depth": 10, "iso_1_code": null, "iso_3_code": "tvk", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -6925,9 +7959,11 @@ }, { "name": "L\u00f6y\u00f6p", + "depth": 10, "iso_1_code": null, "iso_3_code": "urr", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1986", "native_tokenizers": [], @@ -6935,9 +7971,11 @@ }, { "name": "Vera\u2019a", + "depth": 10, "iso_1_code": null, "iso_3_code": "vra", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1987", "native_tokenizers": [], @@ -6945,15 +7983,18 @@ }, { "name": "Dorig", + "depth": 10, "iso_1_code": null, "iso_3_code": "wwo", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1988", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -6969,19 +8010,23 @@ }, { "name": "Epi", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bieria-Maii", + "depth": 10, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bieria", + "depth": 11, "iso_1_code": null, "iso_3_code": "brj", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1991", "native_tokenizers": [], @@ -6989,15 +8034,18 @@ }, { "name": "Maii", + "depth": 11, "iso_1_code": null, "iso_3_code": "mmm", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1992", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "1990", "native_tokenizers": [], @@ -7005,19 +8053,23 @@ }, { "name": "Lamenu-Baki", + "depth": 10, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Baki-Bierebo", + "depth": 11, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Baki", + "depth": 12, "iso_1_code": null, "iso_3_code": "bki", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1995", "native_tokenizers": [], @@ -7025,15 +8077,18 @@ }, { "name": "Bierebo", + "depth": 12, "iso_1_code": null, "iso_3_code": "bnk", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1996", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "1994", "native_tokenizers": [], @@ -7041,14 +8096,17 @@ }, { "name": "Lamenu-Lewo", + "depth": 11, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Lamenu", + "depth": 12, "iso_1_code": null, "iso_3_code": "lmu", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "1998", "native_tokenizers": [], @@ -7056,9 +8114,11 @@ }, { "name": "Lewo", + "depth": 12, "iso_1_code": null, "iso_3_code": "lww", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -7075,6 +8135,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -7089,6 +8150,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -7103,6 +8165,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -7118,14 +8181,17 @@ }, { "name": "Malekula Coastal", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Axamb", + "depth": 10, "iso_1_code": null, "iso_3_code": "ahb", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2001", "native_tokenizers": [], @@ -7133,9 +8199,11 @@ }, { "name": "Aulua", + "depth": 10, "iso_1_code": null, "iso_3_code": "aul", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2002", "native_tokenizers": [], @@ -7143,9 +8211,11 @@ }, { "name": "Maskelynes", + "depth": 10, "iso_1_code": null, "iso_3_code": "klv", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -7163,9 +8233,11 @@ }, { "name": "Malua Bay", + "depth": 10, "iso_1_code": null, "iso_3_code": "mll", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2004", "native_tokenizers": [], @@ -7173,9 +8245,11 @@ }, { "name": "Na\u2019ahai", + "depth": 10, "iso_1_code": null, "iso_3_code": "mlx", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2005", "native_tokenizers": [], @@ -7183,9 +8257,11 @@ }, { "name": "Mae", + "depth": 10, "iso_1_code": null, "iso_3_code": "mme", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2006", "native_tokenizers": [], @@ -7193,9 +8269,11 @@ }, { "name": "Mpotovoro", + "depth": 10, "iso_1_code": null, "iso_3_code": "mvt", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2007", "native_tokenizers": [], @@ -7203,9 +8281,11 @@ }, { "name": "Unua", + "depth": 10, "iso_1_code": null, "iso_3_code": "onu", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2008", "native_tokenizers": [], @@ -7213,9 +8293,11 @@ }, { "name": "Rerep", + "depth": 10, "iso_1_code": null, "iso_3_code": "pgk", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2009", "native_tokenizers": [], @@ -7223,9 +8305,11 @@ }, { "name": "Port Sandwich", + "depth": 10, "iso_1_code": null, "iso_3_code": "psw", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2010", "native_tokenizers": [], @@ -7233,9 +8317,11 @@ }, { "name": "Nahavaq", + "depth": 10, "iso_1_code": null, "iso_3_code": "sns", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2011", "native_tokenizers": [], @@ -7243,9 +8329,11 @@ }, { "name": "Uripiv-Wala-Rano-Atchin", + "depth": 10, "iso_1_code": null, "iso_3_code": "upv", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -7263,9 +8351,11 @@ }, { "name": "Vao", + "depth": 10, "iso_1_code": null, "iso_3_code": "vao", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2013", "native_tokenizers": [], @@ -7273,15 +8363,18 @@ }, { "name": "Banam Bay", + "depth": 10, "iso_1_code": null, "iso_3_code": "vrt", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2014", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -7297,14 +8390,17 @@ }, { "name": "West Santo", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Soro-n Raki", + "depth": 10, "iso_1_code": null, "iso_3_code": "akr", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2016", "native_tokenizers": [], @@ -7312,9 +8408,11 @@ }, { "name": "Amblong", + "depth": 10, "iso_1_code": null, "iso_3_code": "alm", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2017", "native_tokenizers": [], @@ -7322,9 +8420,11 @@ }, { "name": "Aore", + "depth": 10, "iso_1_code": null, "iso_3_code": "aor", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2018", "native_tokenizers": [], @@ -7332,9 +8432,11 @@ }, { "name": "Kiae", + "depth": 10, "iso_1_code": null, "iso_3_code": "frt", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2019", "native_tokenizers": [], @@ -7342,9 +8444,11 @@ }, { "name": "Merei", + "depth": 10, "iso_1_code": null, "iso_3_code": "lmb", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2020", "native_tokenizers": [], @@ -7352,9 +8456,11 @@ }, { "name": "Mafea", + "depth": 10, "iso_1_code": null, "iso_3_code": "mkv", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2021", "native_tokenizers": [], @@ -7362,9 +8468,11 @@ }, { "name": "Malo", + "depth": 10, "iso_1_code": null, "iso_3_code": "mla", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2022", "native_tokenizers": [], @@ -7372,9 +8480,11 @@ }, { "name": "Tiale", + "depth": 10, "iso_1_code": null, "iso_3_code": "mnl", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2023", "native_tokenizers": [], @@ -7382,9 +8492,11 @@ }, { "name": "Morouas", + "depth": 10, "iso_1_code": null, "iso_3_code": "mrp", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2024", "native_tokenizers": [], @@ -7392,9 +8504,11 @@ }, { "name": "Tanokuku", + "depth": 10, "iso_1_code": null, "iso_3_code": "nkk", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2025", "native_tokenizers": [], @@ -7402,9 +8516,11 @@ }, { "name": "Varsaf", + "depth": 10, "iso_1_code": null, "iso_3_code": "nrg", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2026", "native_tokenizers": [], @@ -7412,9 +8528,11 @@ }, { "name": "Balen", + "depth": 10, "iso_1_code": null, "iso_3_code": "nsw", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2027", "native_tokenizers": [], @@ -7422,9 +8540,11 @@ }, { "name": "Tapiafaru", + "depth": 10, "iso_1_code": null, "iso_3_code": "ptr", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2028", "native_tokenizers": [], @@ -7432,9 +8552,11 @@ }, { "name": "Mores", + "depth": 10, "iso_1_code": null, "iso_3_code": "rga", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2029", "native_tokenizers": [], @@ -7442,9 +8564,11 @@ }, { "name": "Tangoa", + "depth": 10, "iso_1_code": null, "iso_3_code": "tgp", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -7462,9 +8586,11 @@ }, { "name": "Tolomako", + "depth": 10, "iso_1_code": null, "iso_3_code": "tlm", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2031", "native_tokenizers": [], @@ -7472,9 +8598,11 @@ }, { "name": "Tambotalo", + "depth": 10, "iso_1_code": null, "iso_3_code": "tls", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2032", "native_tokenizers": [], @@ -7482,9 +8610,11 @@ }, { "name": "Vinekula", + "depth": 10, "iso_1_code": null, "iso_3_code": "tmi", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2033", "native_tokenizers": [], @@ -7492,9 +8622,11 @@ }, { "name": "Oa", + "depth": 10, "iso_1_code": null, "iso_3_code": "tmt", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2034", "native_tokenizers": [], @@ -7502,9 +8634,11 @@ }, { "name": "Akei", + "depth": 10, "iso_1_code": null, "iso_3_code": "tsr", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2035", "native_tokenizers": [], @@ -7512,9 +8646,11 @@ }, { "name": "Tavanlav", + "depth": 10, "iso_1_code": null, "iso_3_code": "vlp", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2036", "native_tokenizers": [], @@ -7522,9 +8658,11 @@ }, { "name": "Tapesena", + "depth": 10, "iso_1_code": null, "iso_3_code": "vnp", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2037", "native_tokenizers": [], @@ -7532,9 +8670,11 @@ }, { "name": "Moiso", + "depth": 10, "iso_1_code": null, "iso_3_code": "wlr", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2038", "native_tokenizers": [], @@ -7542,15 +8682,18 @@ }, { "name": "Jo", + "depth": 10, "iso_1_code": null, "iso_3_code": "wsi", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2039", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -7565,6 +8708,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -7579,6 +8723,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -7593,6 +8738,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -7608,25 +8754,30 @@ }, { "name": "South Vanuatu", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Aneityum", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Aneityum", + "depth": 8, "iso_1_code": null, "iso_3_code": "aty", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2042", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2041", "native_tokenizers": [], @@ -7634,14 +8785,17 @@ }, { "name": "Erromanga", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Sie", + "depth": 8, "iso_1_code": null, "iso_3_code": "erg", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2044", "native_tokenizers": [], @@ -7649,9 +8803,11 @@ }, { "name": "Ifo", + "depth": 8, "iso_1_code": null, "iso_3_code": "iff", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2045", "native_tokenizers": [], @@ -7659,15 +8815,18 @@ }, { "name": "Ura", + "depth": 8, "iso_1_code": null, "iso_3_code": "uur", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2046", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2043", "native_tokenizers": [], @@ -7675,14 +8834,17 @@ }, { "name": "Tanna", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tanna, Southwest", + "depth": 8, "iso_1_code": null, "iso_3_code": "nwi", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -7700,9 +8862,11 @@ }, { "name": "Kwamera", + "depth": 8, "iso_1_code": null, "iso_3_code": "tnk", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -7720,9 +8884,11 @@ }, { "name": "Lenakel", + "depth": 8, "iso_1_code": null, "iso_3_code": "tnl", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2050", "native_tokenizers": [], @@ -7730,9 +8896,11 @@ }, { "name": "Tanna, North", + "depth": 8, "iso_1_code": null, "iso_3_code": "tnn", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -7750,9 +8918,11 @@ }, { "name": "Whitesands", + "depth": 8, "iso_1_code": null, "iso_3_code": "tnp", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -7769,6 +8939,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -7783,6 +8954,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -7798,24 +8970,29 @@ }, { "name": "Southeast Solomonic", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Gela-Guadalcanal", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bughotu", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bughotu", + "depth": 9, "iso_1_code": null, "iso_3_code": "bgt", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -7832,6 +9009,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -7847,14 +9025,17 @@ }, { "name": "Gela", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Lengo", + "depth": 9, "iso_1_code": null, "iso_3_code": "lgr", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2058", "native_tokenizers": [], @@ -7862,9 +9043,11 @@ }, { "name": "Gela", + "depth": 9, "iso_1_code": null, "iso_3_code": "nlg", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -7881,6 +9064,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -7896,14 +9080,17 @@ }, { "name": "Guadalcanal", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Birao", + "depth": 9, "iso_1_code": null, "iso_3_code": "brr", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2061", "native_tokenizers": [], @@ -7911,9 +9098,11 @@ }, { "name": "Ghari", + "depth": 9, "iso_1_code": null, "iso_3_code": "gri", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2062", "native_tokenizers": [], @@ -7921,9 +9110,11 @@ }, { "name": "Malango", + "depth": 9, "iso_1_code": null, "iso_3_code": "mln", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2063", "native_tokenizers": [], @@ -7931,21 +9122,25 @@ }, { "name": "Talise", + "depth": 9, "iso_1_code": null, "iso_3_code": "tlr", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2064", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2060", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -7961,30 +9156,36 @@ }, { "name": "Malaita-San Cristobal", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Malaita", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Longgu", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Longgu", + "depth": 10, "iso_1_code": null, "iso_3_code": "lgu", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2068", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2067", "native_tokenizers": [], @@ -7992,14 +9193,17 @@ }, { "name": "Northern", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Baelelea", + "depth": 10, "iso_1_code": null, "iso_3_code": "bvc", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -8017,9 +9221,11 @@ }, { "name": "Baeggu", + "depth": 10, "iso_1_code": null, "iso_3_code": "bvd", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -8037,9 +9243,11 @@ }, { "name": "Fataleka", + "depth": 10, "iso_1_code": null, "iso_3_code": "far", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -8057,9 +9265,11 @@ }, { "name": "Gula\u2019alaa", + "depth": 10, "iso_1_code": null, "iso_3_code": "gmb", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2073", "native_tokenizers": [], @@ -8067,9 +9277,11 @@ }, { "name": "Kwaio", + "depth": 10, "iso_1_code": null, "iso_3_code": "kwd", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -8087,9 +9299,11 @@ }, { "name": "Kwara\u2019ae", + "depth": 10, "iso_1_code": null, "iso_3_code": "kwf", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -8107,9 +9321,11 @@ }, { "name": "Wala", + "depth": 10, "iso_1_code": null, "iso_3_code": "lgl", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -8127,9 +9343,11 @@ }, { "name": "Lau", + "depth": 10, "iso_1_code": null, "iso_3_code": "llu", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2077", "native_tokenizers": [], @@ -8137,9 +9355,11 @@ }, { "name": "To\u2019abaita", + "depth": 10, "iso_1_code": null, "iso_3_code": "mlu", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -8156,6 +9376,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -8171,14 +9392,17 @@ }, { "name": "Southern", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "\u2019Are\u2019are", + "depth": 10, "iso_1_code": null, "iso_3_code": "alu", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2080", "native_tokenizers": [], @@ -8186,9 +9410,11 @@ }, { "name": "Sa\ua78ca", + "depth": 10, "iso_1_code": null, "iso_3_code": "apb", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -8206,9 +9432,11 @@ }, { "name": "Dori\u2019o", + "depth": 10, "iso_1_code": null, "iso_3_code": "dor", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2082", "native_tokenizers": [], @@ -8216,15 +9444,18 @@ }, { "name": "Oroha", + "depth": 10, "iso_1_code": null, "iso_3_code": "ora", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2083", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -8239,6 +9470,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -8254,14 +9486,17 @@ }, { "name": "San Cristobal", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kahua", + "depth": 9, "iso_1_code": null, "iso_3_code": "agw", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -8279,9 +9514,11 @@ }, { "name": "Arosi", + "depth": 9, "iso_1_code": null, "iso_3_code": "aia", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -8299,9 +9536,11 @@ }, { "name": "Bauro", + "depth": 9, "iso_1_code": null, "iso_3_code": "bxa", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2087", "native_tokenizers": [], @@ -8309,9 +9548,11 @@ }, { "name": "Fagani", + "depth": 9, "iso_1_code": null, "iso_3_code": "faf", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2088", "native_tokenizers": [], @@ -8319,9 +9560,11 @@ }, { "name": "Owa", + "depth": 9, "iso_1_code": null, "iso_3_code": "stn", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -8338,6 +9581,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -8352,6 +9596,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -8366,6 +9611,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -8380,6 +9626,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -8395,14 +9642,17 @@ }, { "name": "St. Matthias", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mussau-Emira", + "depth": 6, "iso_1_code": null, "iso_3_code": "emi", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -8420,15 +9670,18 @@ }, { "name": "Tenis", + "depth": 6, "iso_1_code": null, "iso_3_code": "tns", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2092", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -8444,19 +9697,23 @@ }, { "name": "Temotu", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Reefs-Santa Cruz", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "\u00c4iwoo", + "depth": 7, "iso_1_code": null, "iso_3_code": "nfl", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2095", "native_tokenizers": [], @@ -8464,9 +9721,11 @@ }, { "name": "Engdewu", + "depth": 7, "iso_1_code": null, "iso_3_code": "ngr", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2096", "native_tokenizers": [], @@ -8474,9 +9733,11 @@ }, { "name": "Nal\u00f6go", + "depth": 7, "iso_1_code": null, "iso_3_code": "nlz", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2097", "native_tokenizers": [], @@ -8484,9 +9745,11 @@ }, { "name": "Noip\u00e4", + "depth": 7, "iso_1_code": null, "iso_3_code": "npx", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2098", "native_tokenizers": [], @@ -8494,9 +9757,11 @@ }, { "name": "Nat\u00fcgu", + "depth": 7, "iso_1_code": null, "iso_3_code": "ntu", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -8513,6 +9778,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -8528,14 +9794,17 @@ }, { "name": "Utupua-Vanikoro", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Teanu", + "depth": 7, "iso_1_code": null, "iso_3_code": "tkw", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2101", "native_tokenizers": [], @@ -8543,9 +9812,11 @@ }, { "name": "Tanema", + "depth": 7, "iso_1_code": null, "iso_3_code": "tnx", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2102", "native_tokenizers": [], @@ -8553,9 +9824,11 @@ }, { "name": "Lovono", + "depth": 7, "iso_1_code": null, "iso_3_code": "vnk", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2103", "native_tokenizers": [], @@ -8563,14 +9836,17 @@ }, { "name": "Utupua", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Asumboa", + "depth": 8, "iso_1_code": null, "iso_3_code": "aua", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2105", "native_tokenizers": [], @@ -8578,9 +9854,11 @@ }, { "name": "Tanibili", + "depth": 8, "iso_1_code": null, "iso_3_code": "tbe", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2106", "native_tokenizers": [], @@ -8588,27 +9866,32 @@ }, { "name": "Amba", + "depth": 8, "iso_1_code": null, "iso_3_code": "utp", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2107", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2104", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2100", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -8624,24 +9907,29 @@ }, { "name": "Western Oceanic", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Meso Melanesian", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bali-Vitu", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Uneapa", + "depth": 8, "iso_1_code": null, "iso_3_code": "bbn", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2111", "native_tokenizers": [], @@ -8649,15 +9937,18 @@ }, { "name": "Vitu", + "depth": 8, "iso_1_code": null, "iso_3_code": "wiv", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2112", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2110", "native_tokenizers": [], @@ -8665,19 +9956,23 @@ }, { "name": "New Ireland", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Lavongai-Nalik", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tungag", + "depth": 9, "iso_1_code": null, "iso_3_code": "lcm", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -8695,9 +9990,11 @@ }, { "name": "Kara", + "depth": 9, "iso_1_code": null, "iso_3_code": "leu", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -8715,9 +10012,11 @@ }, { "name": "Lakurumau", + "depth": 9, "iso_1_code": null, "iso_3_code": "lxm", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2117", "native_tokenizers": [], @@ -8725,9 +10024,11 @@ }, { "name": "Nalik", + "depth": 9, "iso_1_code": null, "iso_3_code": "nal", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2118", "native_tokenizers": [], @@ -8735,9 +10036,11 @@ }, { "name": "Mandara", + "depth": 9, "iso_1_code": null, "iso_3_code": "tbf", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2119", "native_tokenizers": [], @@ -8745,9 +10048,11 @@ }, { "name": "Tiang", + "depth": 9, "iso_1_code": null, "iso_3_code": "tbj", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2120", "native_tokenizers": [], @@ -8755,15 +10060,18 @@ }, { "name": "Tigak", + "depth": 9, "iso_1_code": null, "iso_3_code": "tgc", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2121", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -8779,14 +10087,17 @@ }, { "name": "Madak", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Barok", + "depth": 9, "iso_1_code": null, "iso_3_code": "bjk", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2123", "native_tokenizers": [], @@ -8794,9 +10105,11 @@ }, { "name": "Lavatbura-Lamusong", + "depth": 9, "iso_1_code": null, "iso_3_code": "lbv", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2124", "native_tokenizers": [], @@ -8804,9 +10117,11 @@ }, { "name": "Madak", + "depth": 9, "iso_1_code": null, "iso_3_code": "mmx", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -8823,6 +10138,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -8838,14 +10154,17 @@ }, { "name": "South New Ireland-Northwest Solomonic", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Minigir", + "depth": 9, "iso_1_code": null, "iso_3_code": "bxf", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2127", "native_tokenizers": [], @@ -8853,14 +10172,17 @@ }, { "name": "Choiseul", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Babatana", + "depth": 10, "iso_1_code": null, "iso_3_code": "baa", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2129", "native_tokenizers": [], @@ -8868,9 +10190,11 @@ }, { "name": "Ririo", + "depth": 10, "iso_1_code": null, "iso_3_code": "rri", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2130", "native_tokenizers": [], @@ -8878,9 +10202,11 @@ }, { "name": "Vaghua", + "depth": 10, "iso_1_code": null, "iso_3_code": "tva", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2131", "native_tokenizers": [], @@ -8888,15 +10214,18 @@ }, { "name": "Varisi", + "depth": 10, "iso_1_code": null, "iso_3_code": "vrs", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2132", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2128", "native_tokenizers": [], @@ -8904,14 +10233,17 @@ }, { "name": "Mono-Uruava", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mono", + "depth": 10, "iso_1_code": null, "iso_3_code": "mte", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2134", "native_tokenizers": [], @@ -8919,9 +10251,11 @@ }, { "name": "Torau", + "depth": 10, "iso_1_code": null, "iso_3_code": "ttu", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2135", "native_tokenizers": [], @@ -8929,9 +10263,11 @@ }, { "name": "Uruava", + "depth": 10, "iso_1_code": null, "iso_3_code": "urv", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2136", "native_tokenizers": [], @@ -8939,15 +10275,18 @@ }, { "name": "Vinitiri", + "depth": 10, "iso_1_code": null, "iso_3_code": "vmg", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2137", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2133", "native_tokenizers": [], @@ -8955,19 +10294,23 @@ }, { "name": "Nehan-North Bougainville", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Buka", + "depth": 10, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Petats", + "depth": 11, "iso_1_code": null, "iso_3_code": "pex", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2140", "native_tokenizers": [], @@ -8975,14 +10318,17 @@ }, { "name": "Halia", + "depth": 11, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Hak\u00f6", + "depth": 12, "iso_1_code": null, "iso_3_code": "hao", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2142", "native_tokenizers": [], @@ -8990,9 +10336,11 @@ }, { "name": "Halia", + "depth": 12, "iso_1_code": null, "iso_3_code": "hla", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -9009,6 +10357,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -9023,6 +10372,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -9038,14 +10388,17 @@ }, { "name": "Nehan", + "depth": 10, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nehan", + "depth": 11, "iso_1_code": null, "iso_3_code": "nsn", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -9062,6 +10415,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -9077,20 +10431,24 @@ }, { "name": "Papapana", + "depth": 10, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Papapana", + "depth": 11, "iso_1_code": null, "iso_3_code": "ppn", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2147", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2146", "native_tokenizers": [], @@ -9098,14 +10456,17 @@ }, { "name": "Saposa-Tinputz", + "depth": 10, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Hahon", + "depth": 11, "iso_1_code": null, "iso_3_code": "hah", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2149", "native_tokenizers": [], @@ -9113,9 +10474,11 @@ }, { "name": "Saposa", + "depth": 11, "iso_1_code": null, "iso_3_code": "sps", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -9133,9 +10496,11 @@ }, { "name": "Teop", + "depth": 11, "iso_1_code": null, "iso_3_code": "tio", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2151", "native_tokenizers": [], @@ -9143,9 +10508,11 @@ }, { "name": "Tinputz", + "depth": 11, "iso_1_code": null, "iso_3_code": "tpz", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -9162,6 +10529,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -9177,26 +10545,31 @@ }, { "name": "Solos", + "depth": 10, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Solos", + "depth": 11, "iso_1_code": null, "iso_3_code": "sol", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2154", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2153", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -9212,19 +10585,23 @@ }, { "name": "New Georgia", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "East", + "depth": 10, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Vangunu", + "depth": 11, "iso_1_code": null, "iso_3_code": "mpr", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2157", "native_tokenizers": [], @@ -9232,15 +10609,18 @@ }, { "name": "Marovo", + "depth": 11, "iso_1_code": null, "iso_3_code": "mvo", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2158", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2156", "native_tokenizers": [], @@ -9248,14 +10628,17 @@ }, { "name": "West", + "depth": 10, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ghanongga", + "depth": 11, "iso_1_code": null, "iso_3_code": "ghn", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2160", "native_tokenizers": [], @@ -9263,9 +10646,11 @@ }, { "name": "Hoava", + "depth": 11, "iso_1_code": null, "iso_3_code": "hoa", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2161", "native_tokenizers": [], @@ -9273,9 +10658,11 @@ }, { "name": "Kusaghe", + "depth": 11, "iso_1_code": null, "iso_3_code": "ksg", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2162", "native_tokenizers": [], @@ -9283,9 +10670,11 @@ }, { "name": "Kazukuru", + "depth": 11, "iso_1_code": null, "iso_3_code": "kzk", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2163", "native_tokenizers": [], @@ -9293,9 +10682,11 @@ }, { "name": "Lungga", + "depth": 11, "iso_1_code": null, "iso_3_code": "lga", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2164", "native_tokenizers": [], @@ -9303,9 +10694,11 @@ }, { "name": "Dughore", + "depth": 11, "iso_1_code": null, "iso_3_code": "nke", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2165", "native_tokenizers": [], @@ -9313,9 +10706,11 @@ }, { "name": "Roviana", + "depth": 11, "iso_1_code": null, "iso_3_code": "rug", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -9333,9 +10728,11 @@ }, { "name": "Simbo", + "depth": 11, "iso_1_code": null, "iso_3_code": "sbb", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2167", "native_tokenizers": [], @@ -9343,15 +10740,18 @@ }, { "name": "Ughele", + "depth": 11, "iso_1_code": null, "iso_3_code": "uge", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2168", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -9366,6 +10766,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -9381,14 +10782,17 @@ }, { "name": "Patpatar-Tolai", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Fanamaket", + "depth": 10, "iso_1_code": null, "iso_3_code": "bjp", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -9406,9 +10810,11 @@ }, { "name": "Patpatar", + "depth": 10, "iso_1_code": null, "iso_3_code": "gfk", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -9426,9 +10832,11 @@ }, { "name": "Guramalum", + "depth": 10, "iso_1_code": null, "iso_3_code": "grz", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2172", "native_tokenizers": [], @@ -9436,9 +10844,11 @@ }, { "name": "Niwer Mil", + "depth": 10, "iso_1_code": null, "iso_3_code": "hrc", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2173", "native_tokenizers": [], @@ -9446,9 +10856,11 @@ }, { "name": "Warwar Feni", + "depth": 10, "iso_1_code": null, "iso_3_code": "hrw", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2174", "native_tokenizers": [], @@ -9456,9 +10868,11 @@ }, { "name": "Konomala", + "depth": 10, "iso_1_code": null, "iso_3_code": "koa", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2175", "native_tokenizers": [], @@ -9466,9 +10880,11 @@ }, { "name": "Kandas", + "depth": 10, "iso_1_code": null, "iso_3_code": "kqw", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -9486,9 +10902,11 @@ }, { "name": "Kuanua", + "depth": 10, "iso_1_code": null, "iso_3_code": "ksd", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -9506,9 +10924,11 @@ }, { "name": "Label", + "depth": 10, "iso_1_code": null, "iso_3_code": "lbb", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -9526,9 +10946,11 @@ }, { "name": "Ramoaaina", + "depth": 10, "iso_1_code": null, "iso_3_code": "rai", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -9546,9 +10968,11 @@ }, { "name": "Sursurunga", + "depth": 10, "iso_1_code": null, "iso_3_code": "sgz", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -9566,15 +10990,18 @@ }, { "name": "Siar-Lak", + "depth": 10, "iso_1_code": null, "iso_3_code": "sjr", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2181", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -9590,14 +11017,17 @@ }, { "name": "Piva-Banoni", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bannoni", + "depth": 10, "iso_1_code": null, "iso_3_code": "bcm", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2183", "native_tokenizers": [], @@ -9605,15 +11035,18 @@ }, { "name": "Lawunuia", + "depth": 10, "iso_1_code": null, "iso_3_code": "tgi", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2184", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2182", "native_tokenizers": [], @@ -9621,19 +11054,23 @@ }, { "name": "Santa Isabel", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Central", + "depth": 10, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Blablanga", + "depth": 11, "iso_1_code": null, "iso_3_code": "blp", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2187", "native_tokenizers": [], @@ -9641,9 +11078,11 @@ }, { "name": "Zazao", + "depth": 11, "iso_1_code": null, "iso_3_code": "jaj", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2188", "native_tokenizers": [], @@ -9651,15 +11090,18 @@ }, { "name": "Kokota", + "depth": 11, "iso_1_code": null, "iso_3_code": "kkk", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2189", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2186", "native_tokenizers": [], @@ -9667,14 +11109,17 @@ }, { "name": "East", + "depth": 10, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Gao", + "depth": 11, "iso_1_code": null, "iso_3_code": "gga", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2191", "native_tokenizers": [], @@ -9682,15 +11127,18 @@ }, { "name": "Cheke Holo", + "depth": 11, "iso_1_code": null, "iso_3_code": "mrn", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2192", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2190", "native_tokenizers": [], @@ -9698,14 +11146,17 @@ }, { "name": "West", + "depth": 10, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Zabana", + "depth": 11, "iso_1_code": null, "iso_3_code": "kji", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2194", "native_tokenizers": [], @@ -9713,27 +11164,32 @@ }, { "name": "Laghu", + "depth": 11, "iso_1_code": null, "iso_3_code": "lgb", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2195", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2193", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2185", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -9749,14 +11205,17 @@ }, { "name": "Tabar", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Lihir", + "depth": 9, "iso_1_code": null, "iso_3_code": "lih", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2197", "native_tokenizers": [], @@ -9764,15 +11223,18 @@ }, { "name": "Notsi", + "depth": 9, "iso_1_code": null, "iso_3_code": "ncf", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2198", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2196", "native_tokenizers": [], @@ -9780,26 +11242,31 @@ }, { "name": "Tomoip", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tomoip", + "depth": 9, "iso_1_code": null, "iso_3_code": "tqp", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2200", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2199", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -9815,14 +11282,17 @@ }, { "name": "Willaumez", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bulu", + "depth": 8, "iso_1_code": null, "iso_3_code": "bjl", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2202", "native_tokenizers": [], @@ -9830,9 +11300,11 @@ }, { "name": "Bola", + "depth": 8, "iso_1_code": null, "iso_3_code": "bnp", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -9850,9 +11322,11 @@ }, { "name": "Meramera", + "depth": 8, "iso_1_code": null, "iso_3_code": "mxm", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2204", "native_tokenizers": [], @@ -9860,9 +11334,11 @@ }, { "name": "Nakanai", + "depth": 8, "iso_1_code": null, "iso_3_code": "nak", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -9879,6 +11355,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -9893,6 +11370,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -9908,34 +11386,41 @@ }, { "name": "North New Guinea", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Huon Gulf", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Markham", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Lower", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Busu", + "depth": 10, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Duwet", + "depth": 11, "iso_1_code": null, "iso_3_code": "gve", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2211", "native_tokenizers": [], @@ -9943,9 +11428,11 @@ }, { "name": "Aribwatsa", + "depth": 11, "iso_1_code": null, "iso_3_code": "laz", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2212", "native_tokenizers": [], @@ -9953,9 +11440,11 @@ }, { "name": "Musom", + "depth": 11, "iso_1_code": null, "iso_3_code": "msu", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2213", "native_tokenizers": [], @@ -9963,9 +11452,11 @@ }, { "name": "Nafi", + "depth": 11, "iso_1_code": null, "iso_3_code": "srf", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2214", "native_tokenizers": [], @@ -9973,15 +11464,18 @@ }, { "name": "Aribwaung", + "depth": 11, "iso_1_code": null, "iso_3_code": "ylu", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2215", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2210", "native_tokenizers": [], @@ -9989,20 +11483,24 @@ }, { "name": "Labu", + "depth": 10, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Labu", + "depth": 11, "iso_1_code": null, "iso_3_code": "lbu", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2217", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2216", "native_tokenizers": [], @@ -10010,26 +11508,31 @@ }, { "name": "Wampar", + "depth": 10, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Wampar", + "depth": 11, "iso_1_code": null, "iso_3_code": "lbq", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2219", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2218", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2209", "native_tokenizers": [], @@ -10037,14 +11540,17 @@ }, { "name": "Upper", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Adzera", + "depth": 10, "iso_1_code": null, "iso_3_code": "adz", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -10062,14 +11568,17 @@ }, { "name": "Mountain", + "depth": 10, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mari", + "depth": 11, "iso_1_code": null, "iso_3_code": "hob", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2223", "native_tokenizers": [], @@ -10077,9 +11586,11 @@ }, { "name": "Wampur", + "depth": 11, "iso_1_code": null, "iso_3_code": "waz", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2224", "native_tokenizers": [], @@ -10087,9 +11598,11 @@ }, { "name": "Sarasira", + "depth": 11, "iso_1_code": null, "iso_3_code": "zsa", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2225", "native_tokenizers": [], @@ -10097,21 +11610,25 @@ }, { "name": "Sukurum", + "depth": 11, "iso_1_code": null, "iso_3_code": "zsu", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2226", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2222", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -10127,14 +11644,17 @@ }, { "name": "Watut", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kodut, South", + "depth": 10, "iso_1_code": null, "iso_3_code": "mcy", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2228", "native_tokenizers": [], @@ -10142,9 +11662,11 @@ }, { "name": "Kodut, Middle", + "depth": 10, "iso_1_code": null, "iso_3_code": "mpl", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2229", "native_tokenizers": [], @@ -10152,21 +11674,25 @@ }, { "name": "Kodut, North", + "depth": 10, "iso_1_code": null, "iso_3_code": "una", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2230", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2227", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -10182,14 +11708,17 @@ }, { "name": "North", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bugawac", + "depth": 9, "iso_1_code": null, "iso_3_code": "buk", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -10207,9 +11736,11 @@ }, { "name": "Yabem", + "depth": 9, "iso_1_code": null, "iso_3_code": "jae", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -10227,15 +11758,18 @@ }, { "name": "Kala", + "depth": 9, "iso_1_code": null, "iso_3_code": "kcl", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2234", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -10251,20 +11785,24 @@ }, { "name": "Numbami", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Numbami", + "depth": 9, "iso_1_code": null, "iso_3_code": "sij", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2236", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2235", "native_tokenizers": [], @@ -10272,24 +11810,29 @@ }, { "name": "South", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Hote-Buang", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Buang", + "depth": 10, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Buang, Central", + "depth": 11, "iso_1_code": null, "iso_3_code": "bzh", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -10307,9 +11850,11 @@ }, { "name": "Buang, Mangga", + "depth": 11, "iso_1_code": null, "iso_3_code": "mmo", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -10327,9 +11872,11 @@ }, { "name": "Piu", + "depth": 11, "iso_1_code": null, "iso_3_code": "pix", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2242", "native_tokenizers": [], @@ -10337,9 +11884,11 @@ }, { "name": "Kapin", + "depth": 11, "iso_1_code": null, "iso_3_code": "tbx", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2243", "native_tokenizers": [], @@ -10347,9 +11896,11 @@ }, { "name": "Vehes", + "depth": 11, "iso_1_code": null, "iso_3_code": "val", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2244", "native_tokenizers": [], @@ -10357,14 +11908,17 @@ }, { "name": "Mumeng", + "depth": 11, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dambi", + "depth": 12, "iso_1_code": null, "iso_3_code": "dac", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2246", "native_tokenizers": [], @@ -10372,9 +11926,11 @@ }, { "name": "Gorakor", + "depth": 12, "iso_1_code": null, "iso_3_code": "goc", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2247", "native_tokenizers": [], @@ -10382,9 +11938,11 @@ }, { "name": "Kumalu", + "depth": 12, "iso_1_code": null, "iso_3_code": "ksl", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2248", "native_tokenizers": [], @@ -10392,9 +11950,11 @@ }, { "name": "Patep", + "depth": 12, "iso_1_code": null, "iso_3_code": "ptp", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -10412,15 +11972,18 @@ }, { "name": "Zenag", + "depth": 12, "iso_1_code": null, "iso_3_code": "zeg", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2250", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -10435,6 +11998,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -10450,14 +12014,17 @@ }, { "name": "Hote", + "depth": 10, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Malei", + "depth": 11, "iso_1_code": null, "iso_3_code": "hot", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -10475,15 +12042,18 @@ }, { "name": "Yamap", + "depth": 11, "iso_1_code": null, "iso_3_code": "ymp", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2253", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -10498,6 +12068,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -10513,14 +12084,17 @@ }, { "name": "Kaiwa", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Iwal", + "depth": 10, "iso_1_code": null, "iso_3_code": "kbm", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -10537,6 +12111,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -10551,6 +12126,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -10565,6 +12141,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -10580,24 +12157,29 @@ }, { "name": "Ngero-Vitiaz", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ngero", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bariai", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bariai", + "depth": 10, "iso_1_code": null, "iso_3_code": "bch", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -10615,9 +12197,11 @@ }, { "name": "Lusi", + "depth": 10, "iso_1_code": null, "iso_3_code": "khl", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2260", "native_tokenizers": [], @@ -10625,9 +12209,11 @@ }, { "name": "Kove", + "depth": 10, "iso_1_code": null, "iso_3_code": "kvc", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2261", "native_tokenizers": [], @@ -10635,15 +12221,18 @@ }, { "name": "Mala", + "depth": 10, "iso_1_code": null, "iso_3_code": "mmt", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2262", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -10659,14 +12248,17 @@ }, { "name": "Tuam", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Gitua", + "depth": 10, "iso_1_code": null, "iso_3_code": "ggt", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2264", "native_tokenizers": [], @@ -10674,9 +12266,11 @@ }, { "name": "Mutu", + "depth": 10, "iso_1_code": null, "iso_3_code": "tuc", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -10693,6 +12287,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -10707,6 +12302,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -10722,24 +12318,29 @@ }, { "name": "Vitiaz", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bel", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Astrolabe", + "depth": 10, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Awad Bing", + "depth": 11, "iso_1_code": null, "iso_3_code": "bcu", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2269", "native_tokenizers": [], @@ -10747,9 +12348,11 @@ }, { "name": "Mindiri", + "depth": 11, "iso_1_code": null, "iso_3_code": "mpn", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2270", "native_tokenizers": [], @@ -10757,15 +12360,18 @@ }, { "name": "Yote", + "depth": 11, "iso_1_code": null, "iso_3_code": "wab", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2271", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2268", "native_tokenizers": [], @@ -10773,19 +12379,23 @@ }, { "name": "Nuclear Bel", + "depth": 10, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Northern", + "depth": 11, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bilbil", + "depth": 12, "iso_1_code": null, "iso_3_code": "brz", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2274", "native_tokenizers": [], @@ -10793,9 +12403,11 @@ }, { "name": "Gedaged", + "depth": 12, "iso_1_code": null, "iso_3_code": "gdd", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2275", "native_tokenizers": [], @@ -10803,9 +12415,11 @@ }, { "name": "Matukar Panau", + "depth": 12, "iso_1_code": null, "iso_3_code": "mjk", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2276", "native_tokenizers": [], @@ -10813,9 +12427,11 @@ }, { "name": "Takia", + "depth": 12, "iso_1_code": null, "iso_3_code": "tbc", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -10832,6 +12448,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -10847,14 +12464,17 @@ }, { "name": "Southern", + "depth": 11, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Marik", + "depth": 12, "iso_1_code": null, "iso_3_code": "dad", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -10871,6 +12491,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -10885,6 +12506,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -10899,6 +12521,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -10914,20 +12537,24 @@ }, { "name": "Kilenge-Maleu", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Maleu-Kilenge", + "depth": 10, "iso_1_code": null, "iso_3_code": "mgl", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2281", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2280", "native_tokenizers": [], @@ -10935,14 +12562,17 @@ }, { "name": "Korap", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Arop-Lokep", + "depth": 10, "iso_1_code": null, "iso_3_code": "apr", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -10960,9 +12590,11 @@ }, { "name": "Karnai", + "depth": 10, "iso_1_code": null, "iso_3_code": "bbv", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2284", "native_tokenizers": [], @@ -10970,9 +12602,11 @@ }, { "name": "Pano", + "depth": 10, "iso_1_code": null, "iso_3_code": "mqz", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2285", "native_tokenizers": [], @@ -10980,15 +12614,18 @@ }, { "name": "Mur Pano", + "depth": 10, "iso_1_code": null, "iso_3_code": "tkv", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2286", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -11004,14 +12641,17 @@ }, { "name": "Mangap-Mbula", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mbula", + "depth": 10, "iso_1_code": null, "iso_3_code": "mna", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -11028,6 +12668,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -11043,14 +12684,17 @@ }, { "name": "Mengen", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mamusi", + "depth": 10, "iso_1_code": null, "iso_3_code": "kdf", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2290", "native_tokenizers": [], @@ -11058,9 +12702,11 @@ }, { "name": "Mengen", + "depth": 10, "iso_1_code": null, "iso_3_code": "mee", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -11078,9 +12724,11 @@ }, { "name": "Lote", + "depth": 10, "iso_1_code": null, "iso_3_code": "uvl", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -11097,6 +12745,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -11112,14 +12761,17 @@ }, { "name": "Roinji-Nenaya", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mato", + "depth": 10, "iso_1_code": null, "iso_3_code": "met", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -11137,15 +12789,18 @@ }, { "name": "Uma", + "depth": 10, "iso_1_code": null, "iso_3_code": "roe", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2295", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -11161,14 +12816,17 @@ }, { "name": "Sio", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Sio", + "depth": 10, "iso_1_code": null, "iso_3_code": "xsi", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -11185,6 +12843,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -11200,25 +12859,30 @@ }, { "name": "Southwest New Britain", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Amara", + "depth": 10, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Amara", + "depth": 11, "iso_1_code": null, "iso_3_code": "aie", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2300", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2299", "native_tokenizers": [], @@ -11226,19 +12890,23 @@ }, { "name": "Arawe-Pasismanua", + "depth": 10, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Arawe", + "depth": 11, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mangseng", + "depth": 12, "iso_1_code": null, "iso_3_code": "mbh", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -11256,14 +12924,17 @@ }, { "name": "East Arawe", + "depth": 12, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Akolet", + "depth": 13, "iso_1_code": null, "iso_3_code": "akt", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2305", "native_tokenizers": [], @@ -11271,9 +12942,11 @@ }, { "name": "Avau", + "depth": 13, "iso_1_code": null, "iso_3_code": "avb", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2306", "native_tokenizers": [], @@ -11281,9 +12954,11 @@ }, { "name": "Bebeli", + "depth": 13, "iso_1_code": null, "iso_3_code": "bek", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2307", "native_tokenizers": [], @@ -11291,15 +12966,18 @@ }, { "name": "Amio-Gelimi", + "depth": 13, "iso_1_code": null, "iso_3_code": "let", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2308", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2304", "native_tokenizers": [], @@ -11307,14 +12985,17 @@ }, { "name": "West Arawe", + "depth": 12, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Solong", + "depth": 13, "iso_1_code": null, "iso_3_code": "aaw", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2310", "native_tokenizers": [], @@ -11322,9 +13003,11 @@ }, { "name": "Ambul", + "depth": 13, "iso_1_code": null, "iso_3_code": "apo", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2311", "native_tokenizers": [], @@ -11332,9 +13015,11 @@ }, { "name": "Gimi", + "depth": 13, "iso_1_code": null, "iso_3_code": "gip", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2312", "native_tokenizers": [], @@ -11342,21 +13027,25 @@ }, { "name": "Aiklep", + "depth": 13, "iso_1_code": null, "iso_3_code": "mwg", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2313", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2309", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -11372,14 +13061,17 @@ }, { "name": "Pasismanua", + "depth": 11, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Aighon", + "depth": 12, "iso_1_code": null, "iso_3_code": "aix", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2315", "native_tokenizers": [], @@ -11387,9 +13079,11 @@ }, { "name": "Miu", + "depth": 12, "iso_1_code": null, "iso_3_code": "mpo", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2316", "native_tokenizers": [], @@ -11397,9 +13091,11 @@ }, { "name": "Kaulong", + "depth": 12, "iso_1_code": null, "iso_3_code": "pss", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -11417,9 +13113,11 @@ }, { "name": "Sengseng", + "depth": 12, "iso_1_code": null, "iso_3_code": "ssz", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2318", "native_tokenizers": [], @@ -11427,15 +13125,18 @@ }, { "name": "Karore", + "depth": 12, "iso_1_code": null, "iso_3_code": "xkx", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2319", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -11450,6 +13151,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -11465,14 +13167,17 @@ }, { "name": "Bibling", + "depth": 10, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Lamogai", + "depth": 11, "iso_1_code": null, "iso_3_code": "lmg", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2321", "native_tokenizers": [], @@ -11480,21 +13185,25 @@ }, { "name": "Mouk-Aria", + "depth": 11, "iso_1_code": null, "iso_3_code": "mwh", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2322", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2320", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -11510,26 +13219,31 @@ }, { "name": "Tami", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tami", + "depth": 10, "iso_1_code": null, "iso_3_code": "tmy", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2324", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2323", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -11544,6 +13258,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -11559,19 +13274,23 @@ }, { "name": "Sarmi-Jayapura Bay", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Jayapura Bay", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kayupulau", + "depth": 9, "iso_1_code": null, "iso_3_code": "kzu", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2327", "native_tokenizers": [], @@ -11579,9 +13298,11 @@ }, { "name": "Ormu", + "depth": 9, "iso_1_code": null, "iso_3_code": "orz", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2328", "native_tokenizers": [], @@ -11589,15 +13310,18 @@ }, { "name": "Tobati", + "depth": 9, "iso_1_code": null, "iso_3_code": "tti", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2329", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2326", "native_tokenizers": [], @@ -11605,14 +13329,17 @@ }, { "name": "Sarmi", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Anus", + "depth": 9, "iso_1_code": null, "iso_3_code": "auq", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2331", "native_tokenizers": [], @@ -11620,9 +13347,11 @@ }, { "name": "Bonggo", + "depth": 9, "iso_1_code": null, "iso_3_code": "bpg", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2332", "native_tokenizers": [], @@ -11630,9 +13359,11 @@ }, { "name": "Masimasi", + "depth": 9, "iso_1_code": null, "iso_3_code": "ism", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2333", "native_tokenizers": [], @@ -11640,9 +13371,11 @@ }, { "name": "Kaptiau", + "depth": 9, "iso_1_code": null, "iso_3_code": "kbi", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2334", "native_tokenizers": [], @@ -11650,9 +13383,11 @@ }, { "name": "Liki", + "depth": 9, "iso_1_code": null, "iso_3_code": "lio", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2335", "native_tokenizers": [], @@ -11660,9 +13395,11 @@ }, { "name": "Fedan", + "depth": 9, "iso_1_code": null, "iso_3_code": "pdn", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2336", "native_tokenizers": [], @@ -11670,9 +13407,11 @@ }, { "name": "Sobei", + "depth": 9, "iso_1_code": null, "iso_3_code": "sob", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2337", "native_tokenizers": [], @@ -11680,9 +13419,11 @@ }, { "name": "Tarpia", + "depth": 9, "iso_1_code": null, "iso_3_code": "tpf", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2338", "native_tokenizers": [], @@ -11690,9 +13431,11 @@ }, { "name": "Mo", + "depth": 9, "iso_1_code": null, "iso_3_code": "wkd", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2339", "native_tokenizers": [], @@ -11700,9 +13443,11 @@ }, { "name": "Sunum", + "depth": 9, "iso_1_code": null, "iso_3_code": "ymn", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2340", "native_tokenizers": [], @@ -11710,21 +13455,25 @@ }, { "name": "Yarsun", + "depth": 9, "iso_1_code": null, "iso_3_code": "yrs", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2341", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2330", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2325", "native_tokenizers": [], @@ -11732,24 +13481,29 @@ }, { "name": "Schouten", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kairiru-Manam", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kairiru", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kaiep", + "depth": 10, "iso_1_code": null, "iso_3_code": "kbw", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2345", "native_tokenizers": [], @@ -11757,9 +13511,11 @@ }, { "name": "Kairiru", + "depth": 10, "iso_1_code": null, "iso_3_code": "kxa", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2346", "native_tokenizers": [], @@ -11767,15 +13523,18 @@ }, { "name": "Terebu", + "depth": 10, "iso_1_code": null, "iso_3_code": "trb", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2347", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2344", "native_tokenizers": [], @@ -11783,14 +13542,17 @@ }, { "name": "Manam", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Biem", + "depth": 10, "iso_1_code": null, "iso_3_code": "bmc", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2349", "native_tokenizers": [], @@ -11798,9 +13560,11 @@ }, { "name": "Kis", + "depth": 10, "iso_1_code": null, "iso_3_code": "kis", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2350", "native_tokenizers": [], @@ -11808,9 +13572,11 @@ }, { "name": "Medebur", + "depth": 10, "iso_1_code": null, "iso_3_code": "mjm", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2351", "native_tokenizers": [], @@ -11818,9 +13584,11 @@ }, { "name": "Manam", + "depth": 10, "iso_1_code": null, "iso_3_code": "mva", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -11838,9 +13606,11 @@ }, { "name": "Sepa", + "depth": 10, "iso_1_code": null, "iso_3_code": "spe", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2353", "native_tokenizers": [], @@ -11848,15 +13618,18 @@ }, { "name": "Wogeo", + "depth": 10, "iso_1_code": null, "iso_3_code": "woc", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2354", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -11871,6 +13644,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -11886,14 +13660,17 @@ }, { "name": "Siau", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Orop", + "depth": 9, "iso_1_code": null, "iso_3_code": "aps", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2356", "native_tokenizers": [], @@ -11901,9 +13678,11 @@ }, { "name": "Malol", + "depth": 9, "iso_1_code": null, "iso_3_code": "mbk", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2357", "native_tokenizers": [], @@ -11911,9 +13690,11 @@ }, { "name": "Sera", + "depth": 9, "iso_1_code": null, "iso_3_code": "sry", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2358", "native_tokenizers": [], @@ -11921,9 +13702,11 @@ }, { "name": "Essono", + "depth": 9, "iso_1_code": null, "iso_3_code": "sso", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2359", "native_tokenizers": [], @@ -11931,9 +13714,11 @@ }, { "name": "Ulau-Suain", + "depth": 9, "iso_1_code": null, "iso_3_code": "svb", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2360", "native_tokenizers": [], @@ -11941,9 +13726,11 @@ }, { "name": "Tumleo", + "depth": 9, "iso_1_code": null, "iso_3_code": "tmq", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2361", "native_tokenizers": [], @@ -11951,21 +13738,25 @@ }, { "name": "Kap", + "depth": 9, "iso_1_code": null, "iso_3_code": "ykm", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2362", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2355", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -11980,6 +13771,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -11995,30 +13787,36 @@ }, { "name": "Papuan Tip", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nuclear", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Maisin", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Maisin", + "depth": 9, "iso_1_code": null, "iso_3_code": "mbq", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2366", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2365", "native_tokenizers": [], @@ -12026,19 +13824,23 @@ }, { "name": "North Papuan Mainland-D\u2019Entrecasteaux", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Anuki", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Anuki", + "depth": 10, "iso_1_code": null, "iso_3_code": "aui", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -12055,6 +13857,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -12070,19 +13873,23 @@ }, { "name": "Are-Taupota", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Are", + "depth": 10, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Miniafia Oyan", + "depth": 11, "iso_1_code": null, "iso_3_code": "aai", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -12100,9 +13907,11 @@ }, { "name": "Ghayavi", + "depth": 11, "iso_1_code": null, "iso_3_code": "bmk", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -12120,9 +13929,11 @@ }, { "name": "Doga", + "depth": 11, "iso_1_code": null, "iso_3_code": "dgg", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2374", "native_tokenizers": [], @@ -12130,9 +13941,11 @@ }, { "name": "Are", + "depth": 11, "iso_1_code": null, "iso_3_code": "mwc", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -12150,9 +13963,11 @@ }, { "name": "Gapapaiwa", + "depth": 11, "iso_1_code": null, "iso_3_code": "pwg", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -12170,9 +13985,11 @@ }, { "name": "Ubir", + "depth": 11, "iso_1_code": null, "iso_3_code": "ubr", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -12190,9 +14007,11 @@ }, { "name": "Kaninuwa", + "depth": 11, "iso_1_code": null, "iso_3_code": "wat", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -12209,6 +14028,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -12224,14 +14044,17 @@ }, { "name": "Taupota", + "depth": 10, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Gweda", + "depth": 11, "iso_1_code": null, "iso_3_code": "grw", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2380", "native_tokenizers": [], @@ -12239,9 +14062,11 @@ }, { "name": "Haigwai", + "depth": 11, "iso_1_code": null, "iso_3_code": "hgw", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2381", "native_tokenizers": [], @@ -12249,9 +14074,11 @@ }, { "name": "Maiwala", + "depth": 11, "iso_1_code": null, "iso_3_code": "mum", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2382", "native_tokenizers": [], @@ -12259,9 +14086,11 @@ }, { "name": "Minaveha", + "depth": 11, "iso_1_code": null, "iso_3_code": "mvn", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -12279,9 +14108,11 @@ }, { "name": "Tawala", + "depth": 11, "iso_1_code": null, "iso_3_code": "tbo", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -12299,9 +14130,11 @@ }, { "name": "Taupota", + "depth": 11, "iso_1_code": null, "iso_3_code": "tpa", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -12319,9 +14152,11 @@ }, { "name": "Wa\u2019ema", + "depth": 11, "iso_1_code": null, "iso_3_code": "wag", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2386", "native_tokenizers": [], @@ -12329,9 +14164,11 @@ }, { "name": "Wedau", + "depth": 11, "iso_1_code": null, "iso_3_code": "wed", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -12349,15 +14186,18 @@ }, { "name": "Yakaikeke", + "depth": 11, "iso_1_code": null, "iso_3_code": "ykk", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2388", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -12372,6 +14212,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -12387,14 +14228,17 @@ }, { "name": "Bwaidoga", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bwaidoka", + "depth": 10, "iso_1_code": null, "iso_3_code": "bwd", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -12412,9 +14256,11 @@ }, { "name": "Goodenough, West", + "depth": 10, "iso_1_code": null, "iso_3_code": "ddi", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2391", "native_tokenizers": [], @@ -12422,9 +14268,11 @@ }, { "name": "Koluwawa", + "depth": 10, "iso_1_code": null, "iso_3_code": "klx", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2392", "native_tokenizers": [], @@ -12432,9 +14280,11 @@ }, { "name": "Molima", + "depth": 10, "iso_1_code": null, "iso_3_code": "mox", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -12452,9 +14302,11 @@ }, { "name": "Maiadomu", + "depth": 10, "iso_1_code": null, "iso_3_code": "mzz", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -12472,9 +14324,11 @@ }, { "name": "Iduna", + "depth": 10, "iso_1_code": null, "iso_3_code": "viv", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -12492,9 +14346,11 @@ }, { "name": "Iamalele", + "depth": 10, "iso_1_code": null, "iso_3_code": "yml", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -12511,6 +14367,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -12526,14 +14383,17 @@ }, { "name": "Dobu-Duau", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bunama", + "depth": 10, "iso_1_code": null, "iso_3_code": "bdd", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -12551,9 +14411,11 @@ }, { "name": "Boselewa", + "depth": 10, "iso_1_code": null, "iso_3_code": "bwf", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2399", "native_tokenizers": [], @@ -12561,9 +14423,11 @@ }, { "name": "Dobu", + "depth": 10, "iso_1_code": null, "iso_3_code": "dob", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -12581,9 +14445,11 @@ }, { "name": "Duau", + "depth": 10, "iso_1_code": null, "iso_3_code": "dva", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2401", "native_tokenizers": [], @@ -12591,9 +14457,11 @@ }, { "name": "Galeya", + "depth": 10, "iso_1_code": null, "iso_3_code": "gar", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2402", "native_tokenizers": [], @@ -12601,9 +14469,11 @@ }, { "name": "Mwatebu", + "depth": 10, "iso_1_code": null, "iso_3_code": "mwa", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2403", "native_tokenizers": [], @@ -12611,15 +14481,18 @@ }, { "name": "Sewa Bay", + "depth": 10, "iso_1_code": null, "iso_3_code": "sew", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2404", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -12635,20 +14508,24 @@ }, { "name": "Gumawana", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Gumawana", + "depth": 10, "iso_1_code": null, "iso_3_code": "gvs", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2406", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2405", "native_tokenizers": [], @@ -12656,14 +14533,17 @@ }, { "name": "Kakabai", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dawawa", + "depth": 10, "iso_1_code": null, "iso_3_code": "dww", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -12681,9 +14561,11 @@ }, { "name": "Kakabai", + "depth": 10, "iso_1_code": null, "iso_3_code": "kqf", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -12700,6 +14582,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -12714,6 +14597,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -12729,14 +14613,17 @@ }, { "name": "Suauic", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Buhutu", + "depth": 9, "iso_1_code": null, "iso_3_code": "bxh", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -12754,9 +14641,11 @@ }, { "name": "\u2019Auhelawa", + "depth": 9, "iso_1_code": null, "iso_3_code": "kud", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -12774,9 +14663,11 @@ }, { "name": "Oya\u2019oya", + "depth": 9, "iso_1_code": null, "iso_3_code": "oyy", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2413", "native_tokenizers": [], @@ -12784,9 +14675,11 @@ }, { "name": "Saliba", + "depth": 9, "iso_1_code": null, "iso_3_code": "sbe", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -12804,9 +14697,11 @@ }, { "name": "Suau", + "depth": 9, "iso_1_code": null, "iso_3_code": "swp", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -12824,9 +14719,11 @@ }, { "name": "Bwanabwana", + "depth": 9, "iso_1_code": null, "iso_3_code": "tte", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -12844,9 +14741,11 @@ }, { "name": "Unubahe", + "depth": 9, "iso_1_code": null, "iso_3_code": "unu", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2417", "native_tokenizers": [], @@ -12854,9 +14753,11 @@ }, { "name": "Wagawaga", + "depth": 9, "iso_1_code": null, "iso_3_code": "wgb", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2418", "native_tokenizers": [], @@ -12864,15 +14765,18 @@ }, { "name": "Yaleba", + "depth": 9, "iso_1_code": null, "iso_3_code": "ylb", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2419", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -12887,6 +14791,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -12902,24 +14807,29 @@ }, { "name": "Peripheral", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Central Papuan", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Oumic", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ouma", + "depth": 10, "iso_1_code": null, "iso_3_code": "oum", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2423", "native_tokenizers": [], @@ -12927,14 +14837,17 @@ }, { "name": "Magoric", + "depth": 10, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bina", + "depth": 11, "iso_1_code": null, "iso_3_code": "bmn", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2425", "native_tokenizers": [], @@ -12942,9 +14855,11 @@ }, { "name": "Yoba", + "depth": 11, "iso_1_code": null, "iso_3_code": "yob", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2426", "native_tokenizers": [], @@ -12952,21 +14867,25 @@ }, { "name": "Magori", + "depth": 11, "iso_1_code": null, "iso_3_code": "zgr", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2427", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2424", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2422", "native_tokenizers": [], @@ -12974,14 +14893,17 @@ }, { "name": "Sinagoro-Keapara", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Vula\u2019a", + "depth": 10, "iso_1_code": null, "iso_3_code": "hul", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2429", "native_tokenizers": [], @@ -12989,9 +14911,11 @@ }, { "name": "Keapara", + "depth": 10, "iso_1_code": null, "iso_3_code": "khz", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -13009,9 +14933,11 @@ }, { "name": "Motu", + "depth": 10, "iso_1_code": null, "iso_3_code": "meu", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -13029,9 +14955,11 @@ }, { "name": "Sinaugoro", + "depth": 10, "iso_1_code": null, "iso_3_code": "snc", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -13048,6 +14976,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -13063,25 +14992,30 @@ }, { "name": "West Central Papuan", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Gabadi", + "depth": 10, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Abadi", + "depth": 11, "iso_1_code": null, "iso_3_code": "kbt", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2435", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2434", "native_tokenizers": [], @@ -13089,14 +15023,17 @@ }, { "name": "Nuclear", + "depth": 10, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Toura", + "depth": 11, "iso_1_code": null, "iso_3_code": "don", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2437", "native_tokenizers": [], @@ -13104,9 +15041,11 @@ }, { "name": "Kuni", + "depth": 11, "iso_1_code": null, "iso_3_code": "kse", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2438", "native_tokenizers": [], @@ -13114,9 +15053,11 @@ }, { "name": "Mekeo", + "depth": 11, "iso_1_code": null, "iso_3_code": "mek", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -13134,9 +15075,11 @@ }, { "name": "Lala", + "depth": 11, "iso_1_code": null, "iso_3_code": "nrz", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2440", "native_tokenizers": [], @@ -13144,9 +15087,11 @@ }, { "name": "Waima", + "depth": 11, "iso_1_code": null, "iso_3_code": "rro", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -13163,6 +15108,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -13177,6 +15123,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -13191,6 +15138,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -13206,19 +15154,23 @@ }, { "name": "Kilivila-Louisiades", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kilivila", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Budibud", + "depth": 10, "iso_1_code": null, "iso_3_code": "btp", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2444", "native_tokenizers": [], @@ -13226,9 +15178,11 @@ }, { "name": "Kilivila", + "depth": 10, "iso_1_code": null, "iso_3_code": "kij", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -13246,9 +15200,11 @@ }, { "name": "Muyuw", + "depth": 10, "iso_1_code": null, "iso_3_code": "myw", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -13265,6 +15221,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -13280,14 +15237,17 @@ }, { "name": "Misima", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Misima-Panaeati", + "depth": 10, "iso_1_code": null, "iso_3_code": "mpx", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -13304,6 +15264,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -13319,14 +15280,17 @@ }, { "name": "Nimoa-Sudest", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Rifao", + "depth": 10, "iso_1_code": null, "iso_3_code": "nmw", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -13344,9 +15308,11 @@ }, { "name": "Sudest", + "depth": 10, "iso_1_code": null, "iso_3_code": "tgo", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -13363,6 +15329,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -13377,6 +15344,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -13391,6 +15359,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -13405,6 +15374,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -13419,6 +15389,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -13434,14 +15405,17 @@ }, { "name": "Yapese", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Yapese", + "depth": 6, "iso_1_code": null, "iso_3_code": "yap", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -13458,6 +15432,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -13472,6 +15447,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -13487,19 +15463,23 @@ }, { "name": "South Halmahera-West New Guinea", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "South Halmahera", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Irarutu", + "depth": 6, "iso_1_code": null, "iso_3_code": "irh", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2456", "native_tokenizers": [], @@ -13507,14 +15487,17 @@ }, { "name": "East Makian-Gane", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Gane", + "depth": 7, "iso_1_code": null, "iso_3_code": "gzn", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2458", "native_tokenizers": [], @@ -13522,15 +15505,18 @@ }, { "name": "Makian, East", + "depth": 7, "iso_1_code": null, "iso_3_code": "mky", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2459", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2457", "native_tokenizers": [], @@ -13538,14 +15524,17 @@ }, { "name": "Southeast", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Buli", + "depth": 7, "iso_1_code": null, "iso_3_code": "bzq", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2461", "native_tokenizers": [], @@ -13553,9 +15542,11 @@ }, { "name": "Maba", + "depth": 7, "iso_1_code": null, "iso_3_code": "mqa", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2462", "native_tokenizers": [], @@ -13563,9 +15554,11 @@ }, { "name": "Patani", + "depth": 7, "iso_1_code": null, "iso_3_code": "ptn", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2463", "native_tokenizers": [], @@ -13573,21 +15566,25 @@ }, { "name": "Sawai", + "depth": 7, "iso_1_code": null, "iso_3_code": "szw", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2464", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2460", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2455", "native_tokenizers": [], @@ -13595,19 +15592,23 @@ }, { "name": "West New Guinea", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bomberai", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bedoanas", + "depth": 7, "iso_1_code": null, "iso_3_code": "bed", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2467", "native_tokenizers": [], @@ -13615,15 +15616,18 @@ }, { "name": "Erokwanas", + "depth": 7, "iso_1_code": null, "iso_3_code": "erw", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2468", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2466", "native_tokenizers": [], @@ -13631,19 +15635,23 @@ }, { "name": "Cenderawasih Bay", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Biakic", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Biak", + "depth": 8, "iso_1_code": null, "iso_3_code": "bhw", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -13661,9 +15669,11 @@ }, { "name": "Dusner", + "depth": 8, "iso_1_code": null, "iso_3_code": "dsn", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2472", "native_tokenizers": [], @@ -13671,15 +15681,18 @@ }, { "name": "Meoswar", + "depth": 8, "iso_1_code": null, "iso_3_code": "mvx", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2473", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -13695,20 +15708,24 @@ }, { "name": "Iresim", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Yeresiam", + "depth": 8, "iso_1_code": null, "iso_3_code": "ire", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2475", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2474", "native_tokenizers": [], @@ -13716,20 +15733,24 @@ }, { "name": "Mor", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mor", + "depth": 8, "iso_1_code": null, "iso_3_code": "mhz", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2477", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2476", "native_tokenizers": [], @@ -13737,14 +15758,17 @@ }, { "name": "Raja Ampat", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "As", + "depth": 8, "iso_1_code": null, "iso_3_code": "asz", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2479", "native_tokenizers": [], @@ -13752,9 +15776,11 @@ }, { "name": "Biga", + "depth": 8, "iso_1_code": null, "iso_3_code": "bhc", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2480", "native_tokenizers": [], @@ -13762,9 +15788,11 @@ }, { "name": "Gebe", + "depth": 8, "iso_1_code": null, "iso_3_code": "gei", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2481", "native_tokenizers": [], @@ -13772,9 +15800,11 @@ }, { "name": "Kawe", + "depth": 8, "iso_1_code": null, "iso_3_code": "kgb", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2482", "native_tokenizers": [], @@ -13782,9 +15812,11 @@ }, { "name": "Legenyem", + "depth": 8, "iso_1_code": null, "iso_3_code": "lcc", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2483", "native_tokenizers": [], @@ -13792,9 +15824,11 @@ }, { "name": "Ma\u2019ya", + "depth": 8, "iso_1_code": null, "iso_3_code": "slz", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2484", "native_tokenizers": [], @@ -13802,9 +15836,11 @@ }, { "name": "Ambel", + "depth": 8, "iso_1_code": null, "iso_3_code": "wgo", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2485", "native_tokenizers": [], @@ -13812,9 +15848,11 @@ }, { "name": "Wauyai", + "depth": 8, "iso_1_code": null, "iso_3_code": "wuy", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2486", "native_tokenizers": [], @@ -13822,9 +15860,11 @@ }, { "name": "Matbat", + "depth": 8, "iso_1_code": null, "iso_3_code": "xmt", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2487", "native_tokenizers": [], @@ -13832,15 +15872,18 @@ }, { "name": "Salawati", + "depth": 8, "iso_1_code": null, "iso_3_code": "xmx", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2488", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2478", "native_tokenizers": [], @@ -13848,20 +15891,24 @@ }, { "name": "Tandia", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tandia", + "depth": 8, "iso_1_code": null, "iso_3_code": "tni", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2490", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2489", "native_tokenizers": [], @@ -13869,20 +15916,24 @@ }, { "name": "Waropen", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Waropen", + "depth": 8, "iso_1_code": null, "iso_3_code": "wrp", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2492", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2491", "native_tokenizers": [], @@ -13890,19 +15941,23 @@ }, { "name": "Yapen", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Central-Western", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ambai", + "depth": 9, "iso_1_code": null, "iso_3_code": "amk", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -13920,9 +15975,11 @@ }, { "name": "Ansus", + "depth": 9, "iso_1_code": null, "iso_3_code": "and", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2496", "native_tokenizers": [], @@ -13930,9 +15987,11 @@ }, { "name": "Busami", + "depth": 9, "iso_1_code": null, "iso_3_code": "bsm", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2497", "native_tokenizers": [], @@ -13940,9 +15999,11 @@ }, { "name": "Munggui", + "depth": 9, "iso_1_code": null, "iso_3_code": "mth", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2498", "native_tokenizers": [], @@ -13950,9 +16011,11 @@ }, { "name": "Marau", + "depth": 9, "iso_1_code": null, "iso_3_code": "mvr", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2499", "native_tokenizers": [], @@ -13960,9 +16023,11 @@ }, { "name": "Pom", + "depth": 9, "iso_1_code": null, "iso_3_code": "pmo", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2500", "native_tokenizers": [], @@ -13970,9 +16035,11 @@ }, { "name": "Papuma", + "depth": 9, "iso_1_code": null, "iso_3_code": "ppm", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2501", "native_tokenizers": [], @@ -13980,9 +16047,11 @@ }, { "name": "Roon", + "depth": 9, "iso_1_code": null, "iso_3_code": "rnn", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2502", "native_tokenizers": [], @@ -13990,9 +16059,11 @@ }, { "name": "Serui-Laut", + "depth": 9, "iso_1_code": null, "iso_3_code": "seu", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2503", "native_tokenizers": [], @@ -14000,9 +16071,11 @@ }, { "name": "Wamesa", + "depth": 9, "iso_1_code": null, "iso_3_code": "wad", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2504", "native_tokenizers": [], @@ -14010,15 +16083,18 @@ }, { "name": "Woi", + "depth": 9, "iso_1_code": null, "iso_3_code": "wbw", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2505", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -14034,14 +16110,17 @@ }, { "name": "East", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kurudu", + "depth": 9, "iso_1_code": null, "iso_3_code": "kjr", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2507", "native_tokenizers": [], @@ -14049,21 +16128,25 @@ }, { "name": "Wabo", + "depth": 9, "iso_1_code": null, "iso_3_code": "wbb", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2508", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2506", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -14079,20 +16162,24 @@ }, { "name": "Yaur", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Yaur", + "depth": 8, "iso_1_code": null, "iso_3_code": "jau", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2510", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2509", "native_tokenizers": [], @@ -14100,26 +16187,31 @@ }, { "name": "Yeretuar", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Yeretuar", + "depth": 8, "iso_1_code": null, "iso_3_code": "gop", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2512", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2511", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -14134,6 +16226,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -14148,6 +16241,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -14162,6 +16256,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -14177,20 +16272,24 @@ }, { "name": "Hukumina", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Hukumina", + "depth": 4, "iso_1_code": null, "iso_3_code": "huw", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2514", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2513", "native_tokenizers": [], @@ -14198,14 +16297,17 @@ }, { "name": "North Bomberai", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Arguni", + "depth": 4, "iso_1_code": null, "iso_3_code": "agf", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2516", "native_tokenizers": [], @@ -14213,9 +16315,11 @@ }, { "name": "Onin", + "depth": 4, "iso_1_code": null, "iso_3_code": "oni", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2517", "native_tokenizers": [], @@ -14223,9 +16327,11 @@ }, { "name": "Sekar", + "depth": 4, "iso_1_code": null, "iso_3_code": "skz", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2518", "native_tokenizers": [], @@ -14233,15 +16339,18 @@ }, { "name": "Uruangnirin", + "depth": 4, "iso_1_code": null, "iso_3_code": "urn", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2519", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2515", "native_tokenizers": [], @@ -14249,20 +16358,24 @@ }, { "name": "South Bomberai", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kowiai", + "depth": 4, "iso_1_code": null, "iso_3_code": "kwh", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2521", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2520", "native_tokenizers": [], @@ -14270,24 +16383,29 @@ }, { "name": "Southeast Maluku", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kei-Tanimbar", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kei-Fordata", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Fordata", + "depth": 6, "iso_1_code": null, "iso_3_code": "frd", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -14305,9 +16423,11 @@ }, { "name": "Kei", + "depth": 6, "iso_1_code": null, "iso_3_code": "kei", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -14324,6 +16444,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -14339,26 +16460,31 @@ }, { "name": "Yamdena", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Yamdena", + "depth": 6, "iso_1_code": null, "iso_3_code": "jmd", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2528", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2527", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -14374,14 +16500,17 @@ }, { "name": "Southern", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Selaru", + "depth": 5, "iso_1_code": null, "iso_3_code": "slu", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2530", "native_tokenizers": [], @@ -14389,21 +16518,25 @@ }, { "name": "Seluwasan", + "depth": 5, "iso_1_code": null, "iso_3_code": "sws", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2531", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2529", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -14419,19 +16552,23 @@ }, { "name": "Sumba-Hawu", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Hawu-Dhao", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Hawu", + "depth": 5, "iso_1_code": null, "iso_3_code": "hvn", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -14449,9 +16586,11 @@ }, { "name": "Dhao", + "depth": 5, "iso_1_code": null, "iso_3_code": "nfa", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -14468,6 +16607,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -14483,14 +16623,17 @@ }, { "name": "Sumba", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Anakalangu", + "depth": 5, "iso_1_code": null, "iso_3_code": "akg", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2537", "native_tokenizers": [], @@ -14498,9 +16641,11 @@ }, { "name": "Kodi", + "depth": 5, "iso_1_code": null, "iso_3_code": "kod", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2538", "native_tokenizers": [], @@ -14508,9 +16653,11 @@ }, { "name": "Lamboya", + "depth": 5, "iso_1_code": null, "iso_3_code": "lmy", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2539", "native_tokenizers": [], @@ -14518,9 +16665,11 @@ }, { "name": "Loura", + "depth": 5, "iso_1_code": null, "iso_3_code": "lur", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2540", "native_tokenizers": [], @@ -14528,9 +16677,11 @@ }, { "name": "Mamboru", + "depth": 5, "iso_1_code": null, "iso_3_code": "mvd", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2541", "native_tokenizers": [], @@ -14538,9 +16689,11 @@ }, { "name": "Wejewa", + "depth": 5, "iso_1_code": null, "iso_3_code": "wew", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -14558,9 +16711,11 @@ }, { "name": "Wanukaka", + "depth": 5, "iso_1_code": null, "iso_3_code": "wnk", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2543", "native_tokenizers": [], @@ -14568,9 +16723,11 @@ }, { "name": "Kambera", + "depth": 5, "iso_1_code": null, "iso_3_code": "xbr", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -14587,6 +16744,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -14601,6 +16759,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -14616,14 +16775,17 @@ }, { "name": "Teor-Kur", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kur", + "depth": 4, "iso_1_code": null, "iso_3_code": "kuv", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2546", "native_tokenizers": [], @@ -14631,15 +16793,18 @@ }, { "name": "Teor", + "depth": 4, "iso_1_code": null, "iso_3_code": "tev", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2547", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2545", "native_tokenizers": [], @@ -14647,19 +16812,23 @@ }, { "name": "Timor-Babar", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nuclear Timor", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Galolen", + "depth": 5, "iso_1_code": null, "iso_3_code": "gal", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2550", "native_tokenizers": [], @@ -14667,9 +16836,11 @@ }, { "name": "Habun", + "depth": 5, "iso_1_code": null, "iso_3_code": "hbu", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2551", "native_tokenizers": [], @@ -14677,9 +16848,11 @@ }, { "name": "Helong", + "depth": 5, "iso_1_code": null, "iso_3_code": "heg", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -14697,9 +16870,11 @@ }, { "name": "Idat\u00e9", + "depth": 5, "iso_1_code": null, "iso_3_code": "idt", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2553", "native_tokenizers": [], @@ -14707,9 +16882,11 @@ }, { "name": "Kemak", + "depth": 5, "iso_1_code": null, "iso_3_code": "kem", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2554", "native_tokenizers": [], @@ -14717,9 +16894,11 @@ }, { "name": "Kairui-Midiki", + "depth": 5, "iso_1_code": null, "iso_3_code": "krd", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2555", "native_tokenizers": [], @@ -14727,9 +16906,11 @@ }, { "name": "Lakalei", + "depth": 5, "iso_1_code": null, "iso_3_code": "lka", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2556", "native_tokenizers": [], @@ -14737,9 +16918,11 @@ }, { "name": "Makuva", + "depth": 5, "iso_1_code": null, "iso_3_code": "lva", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2557", "native_tokenizers": [], @@ -14747,9 +16930,11 @@ }, { "name": "Mambae", + "depth": 5, "iso_1_code": null, "iso_3_code": "mgm", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -14767,9 +16952,11 @@ }, { "name": "Nauete", + "depth": 5, "iso_1_code": null, "iso_3_code": "nxa", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2559", "native_tokenizers": [], @@ -14777,9 +16964,11 @@ }, { "name": "Tetun", + "depth": 5, "iso_1_code": null, "iso_3_code": "tet", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -14797,9 +16986,11 @@ }, { "name": "Tukudede", + "depth": 5, "iso_1_code": null, "iso_3_code": "tkd", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2561", "native_tokenizers": [], @@ -14807,9 +16998,11 @@ }, { "name": "Welaun", + "depth": 5, "iso_1_code": null, "iso_3_code": "wlh", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2562", "native_tokenizers": [], @@ -14817,9 +17010,11 @@ }, { "name": "Waima\u2019a", + "depth": 5, "iso_1_code": null, "iso_3_code": "wmh", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2563", "native_tokenizers": [], @@ -14827,14 +17022,17 @@ }, { "name": "Rote", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bilba", + "depth": 6, "iso_1_code": null, "iso_3_code": "bpz", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2565", "native_tokenizers": [], @@ -14842,9 +17040,11 @@ }, { "name": "Dengka", + "depth": 6, "iso_1_code": null, "iso_3_code": "dnk", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2566", "native_tokenizers": [], @@ -14852,9 +17052,11 @@ }, { "name": "Lole", + "depth": 6, "iso_1_code": null, "iso_3_code": "llg", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -14872,9 +17074,11 @@ }, { "name": "Rikou", + "depth": 6, "iso_1_code": null, "iso_3_code": "rgu", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -14892,9 +17096,11 @@ }, { "name": "Dela-Oenale", + "depth": 6, "iso_1_code": null, "iso_3_code": "row", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -14912,9 +17118,11 @@ }, { "name": "Termanu", + "depth": 6, "iso_1_code": null, "iso_3_code": "twu", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -14932,9 +17140,11 @@ }, { "name": "Tii", + "depth": 6, "iso_1_code": null, "iso_3_code": "txq", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -14951,6 +17161,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -14966,14 +17177,17 @@ }, { "name": "Uab Meto", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Amarasi", + "depth": 6, "iso_1_code": null, "iso_3_code": "aaz", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -14991,9 +17205,11 @@ }, { "name": "Uab Meto", + "depth": 6, "iso_1_code": null, "iso_3_code": "aoz", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -15011,15 +17227,18 @@ }, { "name": "Baikeno", + "depth": 6, "iso_1_code": null, "iso_3_code": "bkx", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2575", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -15034,6 +17253,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -15049,25 +17269,30 @@ }, { "name": "Southwest Maluku", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "East Damar", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Damar, East", + "depth": 6, "iso_1_code": null, "iso_3_code": "dmr", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2578", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2577", "native_tokenizers": [], @@ -15075,14 +17300,17 @@ }, { "name": "Kisar-Roma", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kisar", + "depth": 6, "iso_1_code": null, "iso_3_code": "kje", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -15100,15 +17328,18 @@ }, { "name": "Roma", + "depth": 6, "iso_1_code": null, "iso_3_code": "rmm", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2581", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -15124,14 +17355,17 @@ }, { "name": "Luang", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Luang", + "depth": 6, "iso_1_code": null, "iso_3_code": "lex", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -15149,15 +17383,18 @@ }, { "name": "Leti", + "depth": 6, "iso_1_code": null, "iso_3_code": "lti", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2584", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -15173,19 +17410,23 @@ }, { "name": "Teun-Nila-Serua", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nila-Serua", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nila", + "depth": 7, "iso_1_code": null, "iso_3_code": "nil", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2587", "native_tokenizers": [], @@ -15193,15 +17434,18 @@ }, { "name": "Serua", + "depth": 7, "iso_1_code": null, "iso_3_code": "srw", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2588", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2586", "native_tokenizers": [], @@ -15209,26 +17453,31 @@ }, { "name": "Teun", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Te\u2019un", + "depth": 7, "iso_1_code": null, "iso_3_code": "tve", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2590", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2589", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2585", "native_tokenizers": [], @@ -15236,14 +17485,17 @@ }, { "name": "Wetar", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Atauran", + "depth": 6, "iso_1_code": null, "iso_3_code": "adb", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2592", "native_tokenizers": [], @@ -15251,9 +17503,11 @@ }, { "name": "Aputai", + "depth": 6, "iso_1_code": null, "iso_3_code": "apx", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2593", "native_tokenizers": [], @@ -15261,9 +17515,11 @@ }, { "name": "Ili\u2019uun", + "depth": 6, "iso_1_code": null, "iso_3_code": "ilu", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2594", "native_tokenizers": [], @@ -15271,9 +17527,11 @@ }, { "name": "Tugun", + "depth": 6, "iso_1_code": null, "iso_3_code": "tzn", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2595", "native_tokenizers": [], @@ -15281,21 +17539,25 @@ }, { "name": "Perai", + "depth": 6, "iso_1_code": null, "iso_3_code": "wet", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2596", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2591", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -15310,6 +17572,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -15325,20 +17588,24 @@ }, { "name": "Unclassified", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kuri", + "depth": 4, "iso_1_code": null, "iso_3_code": "nbn", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2598", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2597", "native_tokenizers": [], @@ -15346,26 +17613,31 @@ }, { "name": "West Damar", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Damar, West", + "depth": 4, "iso_1_code": null, "iso_3_code": "drn", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2600", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2599", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -15381,14 +17653,17 @@ }, { "name": "Chamorro", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chamorro", + "depth": 3, "iso_1_code": "ch", "iso_3_code": "cha", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -15405,6 +17680,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -15420,19 +17696,23 @@ }, { "name": "Greater Barito", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Barito-Mahakam", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ampanang", + "depth": 4, "iso_1_code": null, "iso_3_code": "apg", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2605", "native_tokenizers": [], @@ -15440,15 +17720,18 @@ }, { "name": "Tunjung", + "depth": 4, "iso_1_code": null, "iso_3_code": "tjg", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2606", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2604", "native_tokenizers": [], @@ -15456,30 +17739,36 @@ }, { "name": "East", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Central-South", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Central", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dusun Deyah", + "depth": 6, "iso_1_code": null, "iso_3_code": "dun", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2610", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2609", "native_tokenizers": [], @@ -15487,14 +17776,17 @@ }, { "name": "South", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dusun Malang", + "depth": 6, "iso_1_code": null, "iso_3_code": "duq", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2612", "native_tokenizers": [], @@ -15502,9 +17794,11 @@ }, { "name": "Dusun Witu", + "depth": 6, "iso_1_code": null, "iso_3_code": "duw", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2613", "native_tokenizers": [], @@ -15512,9 +17806,11 @@ }, { "name": "Ma\u2019anyan", + "depth": 6, "iso_1_code": null, "iso_3_code": "mhy", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -15532,15 +17828,18 @@ }, { "name": "Paku", + "depth": 6, "iso_1_code": null, "iso_3_code": "pku", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2615", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -15555,6 +17854,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -15570,14 +17870,17 @@ }, { "name": "Malagasy", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Malagasy, Bara", + "depth": 5, "iso_1_code": "mg", "iso_3_code": "bhr", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2617", "native_tokenizers": [], @@ -15585,9 +17888,11 @@ }, { "name": "Malagasy, Northern Betsimisaraka", + "depth": 5, "iso_1_code": "mg", "iso_3_code": "bmm", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2618", "native_tokenizers": [], @@ -15595,9 +17900,11 @@ }, { "name": "Bushi", + "depth": 5, "iso_1_code": null, "iso_3_code": "buc", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2619", "native_tokenizers": [], @@ -15605,9 +17912,11 @@ }, { "name": "Malagasy, Southern Betsimisaraka", + "depth": 5, "iso_1_code": "mg", "iso_3_code": "bzc", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2620", "native_tokenizers": [], @@ -15615,9 +17924,11 @@ }, { "name": "Malagasy, Masikoro", + "depth": 5, "iso_1_code": "mg", "iso_3_code": "msh", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2621", "native_tokenizers": [], @@ -15625,9 +17936,11 @@ }, { "name": "Malagasy, Merina", + "depth": 5, "iso_1_code": "mg", "iso_3_code": "plt", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -15645,9 +17958,11 @@ }, { "name": "Malagasy, Sakalava", + "depth": 5, "iso_1_code": "mg", "iso_3_code": "skg", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -15665,9 +17980,11 @@ }, { "name": "Malagasy, Tandroy-Mahafaly", + "depth": 5, "iso_1_code": "mg", "iso_3_code": "tdx", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -15685,9 +18002,11 @@ }, { "name": "Malagasy, Tesaka", + "depth": 5, "iso_1_code": "mg", "iso_3_code": "tkg", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2625", "native_tokenizers": [], @@ -15695,9 +18014,11 @@ }, { "name": "Malagasy, Tanosy", + "depth": 5, "iso_1_code": "mg", "iso_3_code": "txy", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2626", "native_tokenizers": [], @@ -15705,9 +18026,11 @@ }, { "name": "Malagasy, Antankarana", + "depth": 5, "iso_1_code": "mg", "iso_3_code": "xmv", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -15725,15 +18048,18 @@ }, { "name": "Malagasy, Tsimihety", + "depth": 5, "iso_1_code": "mg", "iso_3_code": "xmw", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2628", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -15749,14 +18075,17 @@ }, { "name": "North", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Lawangan", + "depth": 5, "iso_1_code": null, "iso_3_code": "lbx", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2630", "native_tokenizers": [], @@ -15764,21 +18093,25 @@ }, { "name": "Tawoyan", + "depth": 5, "iso_1_code": null, "iso_3_code": "twy", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2631", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2629", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -15794,14 +18127,17 @@ }, { "name": "Sama-Bajaw", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Yakan", + "depth": 4, "iso_1_code": null, "iso_3_code": "yka", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -15819,14 +18155,17 @@ }, { "name": "Abaknon", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Inabaknon", + "depth": 5, "iso_1_code": null, "iso_3_code": "abx", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -15843,6 +18182,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -15858,19 +18198,23 @@ }, { "name": "Sulu-Borneo", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Borneo Coast Bajaw", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bajau, Indonesian", + "depth": 6, "iso_1_code": null, "iso_3_code": "bdl", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2638", "native_tokenizers": [], @@ -15878,9 +18222,11 @@ }, { "name": "Bajau, West Coast", + "depth": 6, "iso_1_code": null, "iso_3_code": "bdr", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2639", "native_tokenizers": [], @@ -15888,15 +18234,18 @@ }, { "name": "Mapun", + "depth": 6, "iso_1_code": null, "iso_3_code": "sjm", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2640", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2637", "native_tokenizers": [], @@ -15904,14 +18253,17 @@ }, { "name": "Inner Sulu Sama", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Sama, Central", + "depth": 6, "iso_1_code": null, "iso_3_code": "sml", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -15929,9 +18281,11 @@ }, { "name": "Sama, Southern", + "depth": 6, "iso_1_code": null, "iso_3_code": "ssb", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2643", "native_tokenizers": [], @@ -15939,15 +18293,18 @@ }, { "name": "Sama, Balangingih", + "depth": 6, "iso_1_code": null, "iso_3_code": "sse", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2644", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -15963,26 +18320,31 @@ }, { "name": "Western Sulu Sama", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Sama, Pangutaran", + "depth": 6, "iso_1_code": null, "iso_3_code": "slm", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2646", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2645", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -15997,6 +18359,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -16012,19 +18375,23 @@ }, { "name": "West", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "North", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kohin", + "depth": 5, "iso_1_code": null, "iso_3_code": "kkx", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2649", "native_tokenizers": [], @@ -16032,9 +18399,11 @@ }, { "name": "Ot Danum", + "depth": 5, "iso_1_code": null, "iso_3_code": "otd", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -16052,15 +18421,18 @@ }, { "name": "Siang", + "depth": 5, "iso_1_code": null, "iso_3_code": "sya", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2651", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -16076,14 +18448,17 @@ }, { "name": "South", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bakumpai", + "depth": 5, "iso_1_code": null, "iso_3_code": "bkr", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2653", "native_tokenizers": [], @@ -16091,9 +18466,11 @@ }, { "name": "Ngaju", + "depth": 5, "iso_1_code": null, "iso_3_code": "nij", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -16110,6 +18487,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -16124,6 +18502,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -16138,6 +18517,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -16153,19 +18533,23 @@ }, { "name": "Greater Central Philippine", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Central Philippine", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ata", + "depth": 4, "iso_1_code": null, "iso_3_code": "atm", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2657", "native_tokenizers": [], @@ -16173,9 +18557,11 @@ }, { "name": "Ayta, Sorsogon", + "depth": 4, "iso_1_code": null, "iso_3_code": "ays", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2658", "native_tokenizers": [], @@ -16183,9 +18569,11 @@ }, { "name": "Binukidnon, Northern", + "depth": 4, "iso_1_code": null, "iso_3_code": "kyn", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2659", "native_tokenizers": [], @@ -16193,9 +18581,11 @@ }, { "name": "Binukidnon, Southern", + "depth": 4, "iso_1_code": null, "iso_3_code": "mtw", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2660", "native_tokenizers": [], @@ -16203,9 +18593,11 @@ }, { "name": "Sulod", + "depth": 4, "iso_1_code": null, "iso_3_code": "srg", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2661", "native_tokenizers": [], @@ -16213,24 +18605,29 @@ }, { "name": "Bikol", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Coastal", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Naga", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Agta, Katubung", + "depth": 7, "iso_1_code": null, "iso_3_code": "agk", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2665", "native_tokenizers": [], @@ -16238,9 +18635,11 @@ }, { "name": "Agta, Mt. Iraya", + "depth": 7, "iso_1_code": null, "iso_3_code": "atl", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2666", "native_tokenizers": [], @@ -16248,9 +18647,11 @@ }, { "name": "Bikol, Central", + "depth": 7, "iso_1_code": null, "iso_3_code": "bcl", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tl\")", @@ -16267,6 +18668,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tl\")", @@ -16282,26 +18684,31 @@ }, { "name": "Virac", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bikol, Southern Catanduanes", + "depth": 7, "iso_1_code": null, "iso_3_code": "bln", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2669", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2668", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tl\")", @@ -16317,14 +18724,17 @@ }, { "name": "Inland", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Agta, Mt. Iriga", + "depth": 6, "iso_1_code": null, "iso_3_code": "agz", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2671", "native_tokenizers": [], @@ -16332,9 +18742,11 @@ }, { "name": "Bikol, West Albay", + "depth": 6, "iso_1_code": null, "iso_3_code": "fbl", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2672", "native_tokenizers": [], @@ -16342,9 +18754,11 @@ }, { "name": "Bikol, Libon", + "depth": 6, "iso_1_code": null, "iso_3_code": "lbl", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2673", "native_tokenizers": [], @@ -16352,9 +18766,11 @@ }, { "name": "Bikol, Miraya", + "depth": 6, "iso_1_code": null, "iso_3_code": "rbl", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2674", "native_tokenizers": [], @@ -16362,9 +18778,11 @@ }, { "name": "Bikol, Buhi\u2019non", + "depth": 6, "iso_1_code": null, "iso_3_code": "ubl", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2675", "native_tokenizers": [], @@ -16372,26 +18790,31 @@ }, { "name": "Iriga", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bikol, Rinconada", + "depth": 7, "iso_1_code": null, "iso_3_code": "bto", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2677", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2676", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2670", "native_tokenizers": [], @@ -16399,26 +18822,31 @@ }, { "name": "Pandan", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bikol, Northern Catanduanes", + "depth": 6, "iso_1_code": null, "iso_3_code": "cts", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2679", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2678", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tl\")", @@ -16434,19 +18862,23 @@ }, { "name": "Bisayan", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Banton", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bantoanon", + "depth": 6, "iso_1_code": null, "iso_3_code": "bno", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tl\")", @@ -16463,6 +18895,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tl\")", @@ -16478,14 +18911,17 @@ }, { "name": "Cebuan", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Cebuano", + "depth": 6, "iso_1_code": null, "iso_3_code": "ceb", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tl\")", @@ -16502,6 +18938,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tl\")", @@ -16517,14 +18954,17 @@ }, { "name": "Central", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bantayanon", + "depth": 6, "iso_1_code": null, "iso_3_code": "bfx", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2686", "native_tokenizers": [], @@ -16532,14 +18972,17 @@ }, { "name": "Peripheral", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ati", + "depth": 7, "iso_1_code": null, "iso_3_code": "atk", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2688", "native_tokenizers": [], @@ -16547,9 +18990,11 @@ }, { "name": "Capiznon", + "depth": 7, "iso_1_code": null, "iso_3_code": "cps", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2689", "native_tokenizers": [], @@ -16557,9 +19002,11 @@ }, { "name": "Hiligaynon", + "depth": 7, "iso_1_code": null, "iso_3_code": "hil", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tl\")", @@ -16577,9 +19024,11 @@ }, { "name": "Masbatenyo", + "depth": 7, "iso_1_code": null, "iso_3_code": "msb", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tl\")", @@ -16597,15 +19046,18 @@ }, { "name": "Porohanon", + "depth": 7, "iso_1_code": null, "iso_3_code": "prh", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2692", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tl\")", @@ -16621,20 +19073,24 @@ }, { "name": "Romblon", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Romblomanon", + "depth": 7, "iso_1_code": null, "iso_3_code": "rol", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2694", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2693", "native_tokenizers": [], @@ -16642,14 +19098,17 @@ }, { "name": "Warayan", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Sorsoganon, Northern", + "depth": 7, "iso_1_code": null, "iso_3_code": "bks", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2696", "native_tokenizers": [], @@ -16657,9 +19116,11 @@ }, { "name": "Baybayanon", + "depth": 7, "iso_1_code": null, "iso_3_code": "bvy", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2697", "native_tokenizers": [], @@ -16667,9 +19128,11 @@ }, { "name": "Kinabalian", + "depth": 7, "iso_1_code": null, "iso_3_code": "cbw", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2698", "native_tokenizers": [], @@ -16677,20 +19140,24 @@ }, { "name": "Gubat", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Sorsoganon, Southern", + "depth": 8, "iso_1_code": null, "iso_3_code": "srv", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2700", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2699", "native_tokenizers": [], @@ -16698,14 +19165,17 @@ }, { "name": "Samar-Waray", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Waray-Waray", + "depth": 8, "iso_1_code": null, "iso_3_code": "war", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tl\")", @@ -16722,6 +19192,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tl\")", @@ -16736,6 +19207,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tl\")", @@ -16750,6 +19222,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tl\")", @@ -16765,14 +19238,17 @@ }, { "name": "South", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Surigaonon", + "depth": 6, "iso_1_code": null, "iso_3_code": "sgd", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2704", "native_tokenizers": [], @@ -16780,9 +19256,11 @@ }, { "name": "Tandaganon", + "depth": 6, "iso_1_code": null, "iso_3_code": "tgn", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2705", "native_tokenizers": [], @@ -16790,14 +19268,17 @@ }, { "name": "Butuan-Tausug", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Butuanon", + "depth": 7, "iso_1_code": null, "iso_3_code": "btw", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2707", "native_tokenizers": [], @@ -16805,9 +19286,11 @@ }, { "name": "Tausug", + "depth": 7, "iso_1_code": null, "iso_3_code": "tsg", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tl\")", @@ -16824,6 +19307,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tl\")", @@ -16838,6 +19322,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tl\")", @@ -16853,14 +19338,17 @@ }, { "name": "West", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Caluyanun", + "depth": 6, "iso_1_code": null, "iso_3_code": "clu", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tl\")", @@ -16878,14 +19366,17 @@ }, { "name": "Aklan", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Aklanon", + "depth": 7, "iso_1_code": null, "iso_3_code": "akl", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2712", "native_tokenizers": [], @@ -16893,15 +19384,18 @@ }, { "name": "Malaynon", + "depth": 7, "iso_1_code": null, "iso_3_code": "mlz", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2713", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2711", "native_tokenizers": [], @@ -16909,14 +19403,17 @@ }, { "name": "Kinarayan", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kinaray-a", + "depth": 7, "iso_1_code": null, "iso_3_code": "krj", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tl\")", @@ -16933,6 +19430,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tl\")", @@ -16948,14 +19446,17 @@ }, { "name": "Kuyan", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ratagnon", + "depth": 7, "iso_1_code": null, "iso_3_code": "btn", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2717", "native_tokenizers": [], @@ -16963,15 +19464,18 @@ }, { "name": "Cuyonon", + "depth": 7, "iso_1_code": null, "iso_3_code": "cyo", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2718", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2716", "native_tokenizers": [], @@ -16979,26 +19483,31 @@ }, { "name": "North Central", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Inonhan", + "depth": 7, "iso_1_code": null, "iso_3_code": "loc", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2720", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2719", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tl\")", @@ -17013,6 +19522,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tl\")", @@ -17028,14 +19538,17 @@ }, { "name": "Mamanwa", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Minamanwa", + "depth": 5, "iso_1_code": null, "iso_3_code": "mmn", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tl\")", @@ -17052,6 +19565,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tl\")", @@ -17067,25 +19581,30 @@ }, { "name": "Mansakan", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Davawenyo", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Davawenyo", + "depth": 6, "iso_1_code": null, "iso_3_code": "daw", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2725", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2724", "native_tokenizers": [], @@ -17093,14 +19612,17 @@ }, { "name": "Eastern", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mandaya", + "depth": 6, "iso_1_code": null, "iso_3_code": "mry", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2727", "native_tokenizers": [], @@ -17108,9 +19630,11 @@ }, { "name": "Mansaka", + "depth": 6, "iso_1_code": null, "iso_3_code": "msk", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tl\")", @@ -17127,6 +19651,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tl\")", @@ -17142,20 +19667,24 @@ }, { "name": "Northern", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kamayo", + "depth": 6, "iso_1_code": null, "iso_3_code": "kyk", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2730", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2729", "native_tokenizers": [], @@ -17163,14 +19692,17 @@ }, { "name": "Western", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tagakolu", + "depth": 6, "iso_1_code": null, "iso_3_code": "klg", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2732", "native_tokenizers": [], @@ -17178,9 +19710,11 @@ }, { "name": "Kalagan, Kagan", + "depth": 6, "iso_1_code": null, "iso_3_code": "kll", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2733", "native_tokenizers": [], @@ -17188,9 +19722,11 @@ }, { "name": "Kalagan", + "depth": 6, "iso_1_code": null, "iso_3_code": "kqe", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tl\")", @@ -17207,6 +19743,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tl\")", @@ -17221,6 +19758,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tl\")", @@ -17236,14 +19774,17 @@ }, { "name": "Tagalog", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Filipino", + "depth": 5, "iso_1_code": null, "iso_3_code": "fil", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tl\")", @@ -17263,15 +19804,18 @@ }, { "name": "Tagalog", + "depth": 5, "iso_1_code": "tl", "iso_3_code": "tgl", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2737", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tl\")", @@ -17286,6 +19830,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tl\")", @@ -17301,25 +19846,30 @@ }, { "name": "Danao", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Magindanao", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Maguindanaon", + "depth": 5, "iso_1_code": null, "iso_3_code": "mdh", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2740", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2739", "native_tokenizers": [], @@ -17327,14 +19877,17 @@ }, { "name": "Maranao-Iranon", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Iranun", + "depth": 5, "iso_1_code": null, "iso_3_code": "ilm", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2742", "native_tokenizers": [], @@ -17342,9 +19895,11 @@ }, { "name": "Iranun", + "depth": 5, "iso_1_code": null, "iso_3_code": "ilp", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2743", "native_tokenizers": [], @@ -17352,9 +19907,11 @@ }, { "name": "Maranao", + "depth": 5, "iso_1_code": null, "iso_3_code": "mrw", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tl\")", @@ -17371,6 +19928,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tl\")", @@ -17385,6 +19943,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tl\")", @@ -17400,19 +19959,23 @@ }, { "name": "Gorontalo-Mongondow", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Gorontalic", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bolango", + "depth": 5, "iso_1_code": null, "iso_3_code": "bld", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2747", "native_tokenizers": [], @@ -17420,9 +19983,11 @@ }, { "name": "Buol", + "depth": 5, "iso_1_code": null, "iso_3_code": "blf", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2748", "native_tokenizers": [], @@ -17430,9 +19995,11 @@ }, { "name": "Bintauna", + "depth": 5, "iso_1_code": null, "iso_3_code": "bne", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2749", "native_tokenizers": [], @@ -17440,9 +20007,11 @@ }, { "name": "Gorontalo", + "depth": 5, "iso_1_code": null, "iso_3_code": "gor", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tl\")", @@ -17460,9 +20029,11 @@ }, { "name": "Kaidipang", + "depth": 5, "iso_1_code": null, "iso_3_code": "kzp", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2751", "native_tokenizers": [], @@ -17470,9 +20041,11 @@ }, { "name": "Lolak", + "depth": 5, "iso_1_code": null, "iso_3_code": "llq", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2752", "native_tokenizers": [], @@ -17480,15 +20053,18 @@ }, { "name": "Suwawa", + "depth": 5, "iso_1_code": null, "iso_3_code": "swu", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2753", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tl\")", @@ -17504,14 +20080,17 @@ }, { "name": "Mongondowic", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mongondow", + "depth": 5, "iso_1_code": null, "iso_3_code": "mog", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tl\")", @@ -17529,15 +20108,18 @@ }, { "name": "Ponosakan", + "depth": 5, "iso_1_code": null, "iso_3_code": "pns", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2756", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tl\")", @@ -17552,6 +20134,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tl\")", @@ -17567,24 +20150,29 @@ }, { "name": "Manobo", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Central", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "East", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Manobo, Dibabawon", + "depth": 6, "iso_1_code": null, "iso_3_code": "mbd", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tl\")", @@ -17602,9 +20190,11 @@ }, { "name": "Manobo, Rajah Kabunsuwan", + "depth": 6, "iso_1_code": null, "iso_3_code": "mqk", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2761", "native_tokenizers": [], @@ -17612,9 +20202,11 @@ }, { "name": "Manobo, Agusan", + "depth": 6, "iso_1_code": null, "iso_3_code": "msm", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tl\")", @@ -17631,6 +20223,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tl\")", @@ -17646,19 +20239,23 @@ }, { "name": "South", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ata-Tigwa", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Manobo, Ata", + "depth": 7, "iso_1_code": null, "iso_3_code": "atd", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tl\")", @@ -17676,9 +20273,11 @@ }, { "name": "Manobo, Matigsalug", + "depth": 7, "iso_1_code": null, "iso_3_code": "mbt", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tl\")", @@ -17695,6 +20294,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tl\")", @@ -17710,14 +20310,17 @@ }, { "name": "Obo", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Manobo, Obo", + "depth": 7, "iso_1_code": null, "iso_3_code": "obo", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tl\")", @@ -17734,6 +20337,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tl\")", @@ -17748,6 +20352,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tl\")", @@ -17763,14 +20368,17 @@ }, { "name": "West", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Manobo, Western Bukidnon", + "depth": 6, "iso_1_code": null, "iso_3_code": "mbb", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tl\")", @@ -17788,9 +20396,11 @@ }, { "name": "Manobo, Ilianen", + "depth": 6, "iso_1_code": null, "iso_3_code": "mbi", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tl\")", @@ -17807,6 +20417,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tl\")", @@ -17821,6 +20432,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tl\")", @@ -17836,14 +20448,17 @@ }, { "name": "North", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Binukid", + "depth": 5, "iso_1_code": null, "iso_3_code": "bkd", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tl\")", @@ -17861,9 +20476,11 @@ }, { "name": "Kagayanen", + "depth": 5, "iso_1_code": null, "iso_3_code": "cgc", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tl\")", @@ -17881,9 +20498,11 @@ }, { "name": "Higaonon", + "depth": 5, "iso_1_code": null, "iso_3_code": "mba", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2775", "native_tokenizers": [], @@ -17891,15 +20510,18 @@ }, { "name": "Manobo, Kinamiging", + "depth": 5, "iso_1_code": null, "iso_3_code": "mkx", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2776", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tl\")", @@ -17915,14 +20537,17 @@ }, { "name": "South", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tagabawa", + "depth": 5, "iso_1_code": null, "iso_3_code": "bgs", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tl\")", @@ -17940,9 +20565,11 @@ }, { "name": "Manobo, Sarangani", + "depth": 5, "iso_1_code": null, "iso_3_code": "mbs", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tl\")", @@ -17960,9 +20587,11 @@ }, { "name": "Manobo, Cotabato", + "depth": 5, "iso_1_code": null, "iso_3_code": "mta", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tl\")", @@ -17979,6 +20608,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tl\")", @@ -17993,6 +20623,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tl\")", @@ -18008,14 +20639,17 @@ }, { "name": "Palawanic", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bonggi", + "depth": 4, "iso_1_code": null, "iso_3_code": "bdg", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2782", "native_tokenizers": [], @@ -18023,9 +20657,11 @@ }, { "name": "Batak", + "depth": 4, "iso_1_code": null, "iso_3_code": "bya", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2783", "native_tokenizers": [], @@ -18033,9 +20669,11 @@ }, { "name": "Palawano, Central", + "depth": 4, "iso_1_code": null, "iso_3_code": "plc", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2784", "native_tokenizers": [], @@ -18043,9 +20681,11 @@ }, { "name": "Palawano, Southwest", + "depth": 4, "iso_1_code": null, "iso_3_code": "plv", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2785", "native_tokenizers": [], @@ -18053,9 +20693,11 @@ }, { "name": "Palawano, Brooke\u2019s Point", + "depth": 4, "iso_1_code": null, "iso_3_code": "plw", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tl\")", @@ -18073,9 +20715,11 @@ }, { "name": "Molbog", + "depth": 4, "iso_1_code": null, "iso_3_code": "pwm", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2787", "native_tokenizers": [], @@ -18083,9 +20727,11 @@ }, { "name": "Tagbanwa", + "depth": 4, "iso_1_code": null, "iso_3_code": "tbw", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tl\")", @@ -18103,15 +20749,18 @@ }, { "name": "Tagbanwa, Central", + "depth": 4, "iso_1_code": null, "iso_3_code": "tgt", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2789", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tl\")", @@ -18127,19 +20776,23 @@ }, { "name": "South Mangyan", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Buhid-Taubuid", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Buhid", + "depth": 5, "iso_1_code": null, "iso_3_code": "bku", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tl\")", @@ -18157,9 +20810,11 @@ }, { "name": "Bangon", + "depth": 5, "iso_1_code": null, "iso_3_code": "bnj", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tl\")", @@ -18177,9 +20832,11 @@ }, { "name": "Tawbuid", + "depth": 5, "iso_1_code": null, "iso_3_code": "twb", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tl\")", @@ -18196,6 +20853,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tl\")", @@ -18211,14 +20869,17 @@ }, { "name": "Hanunoo", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Hanunoo", + "depth": 5, "iso_1_code": null, "iso_3_code": "hnn", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tl\")", @@ -18235,6 +20896,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tl\")", @@ -18249,6 +20911,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tl\")", @@ -18264,14 +20927,17 @@ }, { "name": "Subanon", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Subanon, Western", + "depth": 4, "iso_1_code": null, "iso_3_code": "suc", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tl\")", @@ -18289,14 +20955,17 @@ }, { "name": "Eastern", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Subanen, Southern", + "depth": 5, "iso_1_code": null, "iso_3_code": "laa", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2800", "native_tokenizers": [], @@ -18304,9 +20973,11 @@ }, { "name": "Subanen, Eastern", + "depth": 5, "iso_1_code": null, "iso_3_code": "sfe", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2801", "native_tokenizers": [], @@ -18314,9 +20985,11 @@ }, { "name": "Subanon, Kolibugan", + "depth": 5, "iso_1_code": null, "iso_3_code": "skn", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2802", "native_tokenizers": [], @@ -18324,9 +20997,11 @@ }, { "name": "Subanen, Northern", + "depth": 5, "iso_1_code": null, "iso_3_code": "stb", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2803", "native_tokenizers": [], @@ -18334,9 +21009,11 @@ }, { "name": "Subanen, Central", + "depth": 5, "iso_1_code": null, "iso_3_code": "syb", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tl\")", @@ -18353,6 +21030,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tl\")", @@ -18367,6 +21045,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tl\")", @@ -18382,14 +21061,17 @@ }, { "name": "Umiray Dumaget", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Manide", + "depth": 4, "iso_1_code": null, "iso_3_code": "abd", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2806", "native_tokenizers": [], @@ -18397,9 +21079,11 @@ }, { "name": "Agta, Umiray Dumaget", + "depth": 4, "iso_1_code": null, "iso_3_code": "due", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tl\")", @@ -18417,15 +21101,18 @@ }, { "name": "Inagta Alabat", + "depth": 4, "iso_1_code": null, "iso_3_code": "dul", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2808", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tl\")", @@ -18440,6 +21127,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tl\")", @@ -18455,14 +21143,17 @@ }, { "name": "Javanese", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Javanese, New Caledonian", + "depth": 3, "iso_1_code": null, "iso_3_code": "jas", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2810", "native_tokenizers": [], @@ -18470,9 +21161,11 @@ }, { "name": "Javanese", + "depth": 3, "iso_1_code": "jv", "iso_3_code": "jav", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -18491,9 +21184,11 @@ }, { "name": "Javanese, Suriname", + "depth": 3, "iso_1_code": null, "iso_3_code": "jvn", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -18511,9 +21206,11 @@ }, { "name": "Osing", + "depth": 3, "iso_1_code": null, "iso_3_code": "osi", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2813", "native_tokenizers": [], @@ -18521,15 +21218,18 @@ }, { "name": "Tengger", + "depth": 3, "iso_1_code": null, "iso_3_code": "tes", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2814", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -18545,14 +21245,17 @@ }, { "name": "Kalamian", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Agutaynen", + "depth": 3, "iso_1_code": null, "iso_3_code": "agn", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -18570,9 +21273,11 @@ }, { "name": "Tagbanwa, Calamian", + "depth": 3, "iso_1_code": null, "iso_3_code": "tbk", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -18589,6 +21294,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -18604,14 +21310,17 @@ }, { "name": "Lampung", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Lampung Nyo", + "depth": 3, "iso_1_code": null, "iso_3_code": "abl", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2819", "native_tokenizers": [], @@ -18619,9 +21328,11 @@ }, { "name": "Komering", + "depth": 3, "iso_1_code": null, "iso_3_code": "kge", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2820", "native_tokenizers": [], @@ -18629,9 +21340,11 @@ }, { "name": "Lampung Api", + "depth": 3, "iso_1_code": null, "iso_3_code": "ljp", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -18648,6 +21361,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -18663,14 +21377,17 @@ }, { "name": "Land Dayak", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Benyadu\u2019", + "depth": 3, "iso_1_code": null, "iso_3_code": "byd", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2823", "native_tokenizers": [], @@ -18678,9 +21395,11 @@ }, { "name": "Sanggau", + "depth": 3, "iso_1_code": null, "iso_3_code": "scg", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2824", "native_tokenizers": [], @@ -18688,14 +21407,17 @@ }, { "name": "Bakati\u2019", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bakati\u2019", + "depth": 4, "iso_1_code": null, "iso_3_code": "bei", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2826", "native_tokenizers": [], @@ -18703,9 +21425,11 @@ }, { "name": "Bakati\u2019, Rara", + "depth": 4, "iso_1_code": null, "iso_3_code": "lra", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2827", "native_tokenizers": [], @@ -18713,15 +21437,18 @@ }, { "name": "Bakati\u2019, Sara", + "depth": 4, "iso_1_code": null, "iso_3_code": "sre", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2828", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2825", "native_tokenizers": [], @@ -18729,24 +21456,29 @@ }, { "name": "Bidayuh", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Core", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Central", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bidayuh, Biatah", + "depth": 6, "iso_1_code": null, "iso_3_code": "bth", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -18763,6 +21495,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -18778,20 +21511,24 @@ }, { "name": "Sembaan", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bidayuh, Tringgus-Sembaan", + "depth": 6, "iso_1_code": null, "iso_3_code": "trx", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2834", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2833", "native_tokenizers": [], @@ -18799,26 +21536,31 @@ }, { "name": "Western", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bidayuh, Bau", + "depth": 6, "iso_1_code": null, "iso_3_code": "sne", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2836", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2835", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -18834,14 +21576,17 @@ }, { "name": "Eastern", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bidayuh Serian", + "depth": 5, "iso_1_code": null, "iso_3_code": "sdo", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -18858,6 +21603,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -18872,6 +21618,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -18887,14 +21634,17 @@ }, { "name": "Southern", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Jangkang", + "depth": 4, "iso_1_code": null, "iso_3_code": "djo", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2840", "native_tokenizers": [], @@ -18902,9 +21652,11 @@ }, { "name": "Beginci", + "depth": 4, "iso_1_code": null, "iso_3_code": "ebc", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2841", "native_tokenizers": [], @@ -18912,9 +21664,11 @@ }, { "name": "Gerai", + "depth": 4, "iso_1_code": null, "iso_3_code": "gef", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2842", "native_tokenizers": [], @@ -18922,9 +21676,11 @@ }, { "name": "Ribun", + "depth": 4, "iso_1_code": null, "iso_3_code": "rir", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2843", "native_tokenizers": [], @@ -18932,9 +21688,11 @@ }, { "name": "Semandang", + "depth": 4, "iso_1_code": null, "iso_3_code": "sdq", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -18952,15 +21710,18 @@ }, { "name": "Mateq", + "depth": 4, "iso_1_code": null, "iso_3_code": "xem", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2845", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -18975,6 +21736,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -18990,14 +21752,17 @@ }, { "name": "Madurese", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kangean", + "depth": 3, "iso_1_code": null, "iso_3_code": "kkv", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2847", "native_tokenizers": [], @@ -19005,9 +21770,11 @@ }, { "name": "Madura", + "depth": 3, "iso_1_code": null, "iso_3_code": "mad", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -19024,6 +21791,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -19039,24 +21807,29 @@ }, { "name": "Malayo-Chamic", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chamic", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Acehnese", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Aceh", + "depth": 5, "iso_1_code": null, "iso_3_code": "ace", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -19074,6 +21847,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -19089,14 +21863,17 @@ }, { "name": "Coastal", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Haroi", + "depth": 5, "iso_1_code": null, "iso_3_code": "hro", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2854", "native_tokenizers": [], @@ -19104,14 +21881,17 @@ }, { "name": "Cham", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Cham, Western", + "depth": 6, "iso_1_code": null, "iso_3_code": "cja", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2856", "native_tokenizers": [], @@ -19119,21 +21899,25 @@ }, { "name": "Cham, Eastern", + "depth": 6, "iso_1_code": null, "iso_3_code": "cjm", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2857", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2855", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2853", "native_tokenizers": [], @@ -19141,14 +21925,17 @@ }, { "name": "Highlands", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bih", + "depth": 5, "iso_1_code": null, "iso_3_code": "ibh", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2859", "native_tokenizers": [], @@ -19156,9 +21943,11 @@ }, { "name": "Jarai", + "depth": 5, "iso_1_code": null, "iso_3_code": "jra", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -19176,9 +21965,11 @@ }, { "name": "Rade", + "depth": 5, "iso_1_code": null, "iso_3_code": "rad", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -19196,14 +21987,17 @@ }, { "name": "Chru-Northern", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chru", + "depth": 6, "iso_1_code": null, "iso_3_code": "cje", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2863", "native_tokenizers": [], @@ -19211,14 +22005,17 @@ }, { "name": "Northern Cham", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tsat", + "depth": 7, "iso_1_code": null, "iso_3_code": "huq", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2865", "native_tokenizers": [], @@ -19226,9 +22023,11 @@ }, { "name": "Roglai, Southern", + "depth": 7, "iso_1_code": null, "iso_3_code": "rgs", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2866", "native_tokenizers": [], @@ -19236,9 +22035,11 @@ }, { "name": "Roglai, Cacgia", + "depth": 7, "iso_1_code": null, "iso_3_code": "roc", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2867", "native_tokenizers": [], @@ -19246,27 +22047,32 @@ }, { "name": "Roglai, Northern", + "depth": 7, "iso_1_code": null, "iso_3_code": "rog", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2868", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2864", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2862", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -19281,6 +22087,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -19296,14 +22103,17 @@ }, { "name": "Malayic", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Keninjal", + "depth": 4, "iso_1_code": null, "iso_3_code": "knl", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2870", "native_tokenizers": [], @@ -19311,9 +22121,11 @@ }, { "name": "Kendayan", + "depth": 4, "iso_1_code": null, "iso_3_code": "knx", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -19331,9 +22143,11 @@ }, { "name": "Urak Lawoi\u2019", + "depth": 4, "iso_1_code": "ms", "iso_3_code": "urk", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2872", "native_tokenizers": [], @@ -19343,9 +22157,11 @@ }, { "name": "Malayic Dayak", + "depth": 4, "iso_1_code": null, "iso_3_code": "xdy", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2873", "native_tokenizers": [], @@ -19353,14 +22169,17 @@ }, { "name": "Ibanic", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Iban", + "depth": 5, "iso_1_code": null, "iso_3_code": "iba", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -19378,9 +22197,11 @@ }, { "name": "Remun", + "depth": 5, "iso_1_code": null, "iso_3_code": "lkj", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2876", "native_tokenizers": [], @@ -19388,9 +22209,11 @@ }, { "name": "Mualang", + "depth": 5, "iso_1_code": null, "iso_3_code": "mtd", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2877", "native_tokenizers": [], @@ -19398,15 +22221,18 @@ }, { "name": "Seberuang", + "depth": 5, "iso_1_code": null, "iso_3_code": "sbx", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2878", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -19422,14 +22248,17 @@ }, { "name": "Malay", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Banjar", + "depth": 5, "iso_1_code": "ms", "iso_3_code": "bjn", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -19450,9 +22279,11 @@ }, { "name": "Malay, Bacanese", + "depth": 5, "iso_1_code": "ms", "iso_3_code": "btj", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2881", "native_tokenizers": [], @@ -19460,9 +22291,11 @@ }, { "name": "Malay, Berau", + "depth": 5, "iso_1_code": "ms", "iso_3_code": "bve", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2882", "native_tokenizers": [], @@ -19470,9 +22303,11 @@ }, { "name": "Malay, Bukit", + "depth": 5, "iso_1_code": "ms", "iso_3_code": "bvu", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2883", "native_tokenizers": [], @@ -19480,9 +22315,11 @@ }, { "name": "Duano", + "depth": 5, "iso_1_code": "ms", "iso_3_code": "dup", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2884", "native_tokenizers": [], @@ -19490,9 +22327,11 @@ }, { "name": "Haji", + "depth": 5, "iso_1_code": "ms", "iso_3_code": "hji", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2885", "native_tokenizers": [], @@ -19500,9 +22339,11 @@ }, { "name": "Indonesian", + "depth": 5, "iso_1_code": "id", "iso_3_code": "ind", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"id\")", @@ -19522,9 +22363,11 @@ }, { "name": "Jakun", + "depth": 5, "iso_1_code": "ms", "iso_3_code": "jak", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2887", "native_tokenizers": [], @@ -19532,9 +22375,11 @@ }, { "name": "Malay, Jambi", + "depth": 5, "iso_1_code": "ms", "iso_3_code": "jax", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2888", "native_tokenizers": [], @@ -19542,9 +22387,11 @@ }, { "name": "Kubu", + "depth": 5, "iso_1_code": "ms", "iso_3_code": "kvb", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2889", "native_tokenizers": [], @@ -19552,9 +22399,11 @@ }, { "name": "Kerinci", + "depth": 5, "iso_1_code": "ms", "iso_3_code": "kvr", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2890", "native_tokenizers": [], @@ -19562,9 +22411,11 @@ }, { "name": "Brunei", + "depth": 5, "iso_1_code": "ms", "iso_3_code": "kxd", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2891", "native_tokenizers": [], @@ -19572,9 +22423,11 @@ }, { "name": "Sekak", + "depth": 5, "iso_1_code": "ms", "iso_3_code": "lce", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2892", "native_tokenizers": [], @@ -19582,9 +22435,11 @@ }, { "name": "Lubu", + "depth": 5, "iso_1_code": "ms", "iso_3_code": "lcf", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2893", "native_tokenizers": [], @@ -19592,9 +22447,11 @@ }, { "name": "Col", + "depth": 5, "iso_1_code": "ms", "iso_3_code": "liw", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2894", "native_tokenizers": [], @@ -19602,9 +22459,11 @@ }, { "name": "Malay, Kedah", + "depth": 5, "iso_1_code": "ms", "iso_3_code": "meo", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2895", "native_tokenizers": [], @@ -19612,9 +22471,11 @@ }, { "name": "Malay, Pattani", + "depth": 5, "iso_1_code": "ms", "iso_3_code": "mfa", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2896", "native_tokenizers": [], @@ -19622,9 +22483,11 @@ }, { "name": "Bangka", + "depth": 5, "iso_1_code": "ms", "iso_3_code": "mfb", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2897", "native_tokenizers": [], @@ -19632,9 +22495,11 @@ }, { "name": "Indonesian, Makassar", + "depth": 5, "iso_1_code": null, "iso_3_code": "mfp", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2898", "native_tokenizers": [], @@ -19642,9 +22507,11 @@ }, { "name": "Minangkabau", + "depth": 5, "iso_1_code": "ms", "iso_3_code": "min", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -19665,9 +22532,11 @@ }, { "name": "Malay, Kota Bangun Kutai", + "depth": 5, "iso_1_code": "ms", "iso_3_code": "mqg", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2900", "native_tokenizers": [], @@ -19675,9 +22544,11 @@ }, { "name": "Malay, Sabah", + "depth": 5, "iso_1_code": "ms", "iso_3_code": "msi", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2901", "native_tokenizers": [], @@ -19685,9 +22556,11 @@ }, { "name": "Musi", + "depth": 5, "iso_1_code": "ms", "iso_3_code": "mui", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -19707,9 +22580,11 @@ }, { "name": "Orang Kanaq", + "depth": 5, "iso_1_code": "ms", "iso_3_code": "orn", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2903", "native_tokenizers": [], @@ -19717,9 +22592,11 @@ }, { "name": "Orang Seletar", + "depth": 5, "iso_1_code": "ms", "iso_3_code": "ors", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2904", "native_tokenizers": [], @@ -19727,9 +22604,11 @@ }, { "name": "Pekal", + "depth": 5, "iso_1_code": "ms", "iso_3_code": "pel", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2905", "native_tokenizers": [], @@ -19737,9 +22616,11 @@ }, { "name": "Malay, Central", + "depth": 5, "iso_1_code": "ms", "iso_3_code": "pse", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -19759,9 +22640,11 @@ }, { "name": "Temuan", + "depth": 5, "iso_1_code": "ms", "iso_3_code": "tmw", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2907", "native_tokenizers": [], @@ -19769,9 +22652,11 @@ }, { "name": "Kaur", + "depth": 5, "iso_1_code": "ms", "iso_3_code": "vkk", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2908", "native_tokenizers": [], @@ -19779,9 +22664,11 @@ }, { "name": "Malay, Tenggarong Kutai", + "depth": 5, "iso_1_code": "ms", "iso_3_code": "vkt", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2909", "native_tokenizers": [], @@ -19789,9 +22676,11 @@ }, { "name": "Malay", + "depth": 5, "iso_1_code": "ms", "iso_3_code": "zlm", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2910", "native_tokenizers": [], @@ -19799,9 +22688,11 @@ }, { "name": "Negeri Sembilan Malay", + "depth": 5, "iso_1_code": "ms", "iso_3_code": "zmi", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2911", "native_tokenizers": [], @@ -19809,9 +22700,11 @@ }, { "name": "Malay, Standard", + "depth": 5, "iso_1_code": "ms", "iso_3_code": "zsm", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -19831,6 +22724,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -19845,6 +22739,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -19859,6 +22754,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -19874,14 +22770,17 @@ }, { "name": "Minahasan", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tonsawang", + "depth": 3, "iso_1_code": null, "iso_3_code": "tnw", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2914", "native_tokenizers": [], @@ -19889,14 +22788,17 @@ }, { "name": "North", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tontemboan", + "depth": 4, "iso_1_code": null, "iso_3_code": "tnt", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2916", "native_tokenizers": [], @@ -19904,14 +22806,17 @@ }, { "name": "Northeast", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tondano", + "depth": 5, "iso_1_code": null, "iso_3_code": "tdn", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2918", "native_tokenizers": [], @@ -19919,9 +22824,11 @@ }, { "name": "Tombulu", + "depth": 5, "iso_1_code": null, "iso_3_code": "tom", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2919", "native_tokenizers": [], @@ -19929,27 +22836,32 @@ }, { "name": "Tonsea", + "depth": 5, "iso_1_code": null, "iso_3_code": "txs", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2920", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2917", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2915", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2913", "native_tokenizers": [], @@ -19957,14 +22869,17 @@ }, { "name": "Moklen", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Moklen", + "depth": 3, "iso_1_code": null, "iso_3_code": "mkm", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2922", "native_tokenizers": [], @@ -19972,15 +22887,18 @@ }, { "name": "Moken", + "depth": 3, "iso_1_code": null, "iso_3_code": "mwt", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2923", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2921", "native_tokenizers": [], @@ -19988,20 +22906,24 @@ }, { "name": "Nasal", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nasal", + "depth": 3, "iso_1_code": null, "iso_3_code": "nsy", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2925", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2924", "native_tokenizers": [], @@ -20009,24 +22931,29 @@ }, { "name": "North Borneo", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Melanau-Kajang", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kajang", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bukitan", + "depth": 5, "iso_1_code": null, "iso_3_code": "bkn", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2929", "native_tokenizers": [], @@ -20034,9 +22961,11 @@ }, { "name": "Kajaman", + "depth": 5, "iso_1_code": null, "iso_3_code": "kag", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2930", "native_tokenizers": [], @@ -20044,9 +22973,11 @@ }, { "name": "Lahanan", + "depth": 5, "iso_1_code": null, "iso_3_code": "lhn", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2931", "native_tokenizers": [], @@ -20054,9 +22985,11 @@ }, { "name": "Punan Batu", + "depth": 5, "iso_1_code": null, "iso_3_code": "pnm", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2932", "native_tokenizers": [], @@ -20064,9 +22997,11 @@ }, { "name": "Sekapan", + "depth": 5, "iso_1_code": null, "iso_3_code": "skp", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2933", "native_tokenizers": [], @@ -20074,9 +23009,11 @@ }, { "name": "Sihan", + "depth": 5, "iso_1_code": null, "iso_3_code": "spg", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2934", "native_tokenizers": [], @@ -20084,15 +23021,18 @@ }, { "name": "Ukit", + "depth": 5, "iso_1_code": null, "iso_3_code": "umi", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2935", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2928", "native_tokenizers": [], @@ -20100,14 +23040,17 @@ }, { "name": "Melanau", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Melanau, Daro-Matu", + "depth": 5, "iso_1_code": null, "iso_3_code": "dro", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2937", "native_tokenizers": [], @@ -20115,9 +23058,11 @@ }, { "name": "Melanau, Kanowit-Tanjong", + "depth": 5, "iso_1_code": null, "iso_3_code": "kxn", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2938", "native_tokenizers": [], @@ -20125,9 +23070,11 @@ }, { "name": "Melanau, Central", + "depth": 5, "iso_1_code": null, "iso_3_code": "mel", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2939", "native_tokenizers": [], @@ -20135,21 +23082,25 @@ }, { "name": "Melanau, Sibu", + "depth": 5, "iso_1_code": null, "iso_3_code": "sdx", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2940", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2936", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2927", "native_tokenizers": [], @@ -20157,24 +23108,29 @@ }, { "name": "North Sarawakan", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Berawan-Lower Baram", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Berawan", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Berawan, West", + "depth": 6, "iso_1_code": null, "iso_3_code": "zbw", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2944", "native_tokenizers": [], @@ -20182,14 +23138,17 @@ }, { "name": "Central-East Berawan", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Berawan, Central", + "depth": 7, "iso_1_code": null, "iso_3_code": "zbc", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2946", "native_tokenizers": [], @@ -20197,21 +23156,25 @@ }, { "name": "Berawan, East", + "depth": 7, "iso_1_code": null, "iso_3_code": "zbe", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2947", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2945", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2943", "native_tokenizers": [], @@ -20219,24 +23182,29 @@ }, { "name": "Lower Baram", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Central", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "A", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Belait", + "depth": 8, "iso_1_code": null, "iso_3_code": "beg", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2951", "native_tokenizers": [], @@ -20244,15 +23212,18 @@ }, { "name": "Kiput", + "depth": 8, "iso_1_code": null, "iso_3_code": "kyi", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2952", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2950", "native_tokenizers": [], @@ -20260,14 +23231,17 @@ }, { "name": "B", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Lelak", + "depth": 8, "iso_1_code": null, "iso_3_code": "llk", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2954", "native_tokenizers": [], @@ -20275,9 +23249,11 @@ }, { "name": "Narom", + "depth": 8, "iso_1_code": null, "iso_3_code": "nrm", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -20295,15 +23271,18 @@ }, { "name": "Tutong", + "depth": 8, "iso_1_code": null, "iso_3_code": "ttg", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2956", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -20318,6 +23297,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -20332,6 +23312,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -20346,6 +23327,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -20361,20 +23343,24 @@ }, { "name": "Bintulu", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Vaie", + "depth": 5, "iso_1_code": null, "iso_3_code": "bny", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2958", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2957", "native_tokenizers": [], @@ -20382,19 +23368,23 @@ }, { "name": "Dayic", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kelabitic", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kelabit", + "depth": 6, "iso_1_code": null, "iso_3_code": "kzi", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2961", "native_tokenizers": [], @@ -20402,9 +23392,11 @@ }, { "name": "Lengilu", + "depth": 6, "iso_1_code": null, "iso_3_code": "lgi", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2962", "native_tokenizers": [], @@ -20412,9 +23404,11 @@ }, { "name": "Lundayeh", + "depth": 6, "iso_1_code": null, "iso_3_code": "lnd", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -20432,9 +23426,11 @@ }, { "name": "Putoh", + "depth": 6, "iso_1_code": null, "iso_3_code": "put", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2964", "native_tokenizers": [], @@ -20442,9 +23438,11 @@ }, { "name": "Sa\u2019ban", + "depth": 6, "iso_1_code": null, "iso_3_code": "snv", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2965", "native_tokenizers": [], @@ -20452,15 +23450,18 @@ }, { "name": "Tring", + "depth": 6, "iso_1_code": null, "iso_3_code": "tgq", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2966", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -20475,6 +23476,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -20490,24 +23492,29 @@ }, { "name": "Kayan-Kenyah", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kayanic", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kayan Proper", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kayan, Busang", + "depth": 7, "iso_1_code": null, "iso_3_code": "bfg", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2970", "native_tokenizers": [], @@ -20515,9 +23522,11 @@ }, { "name": "Bahau", + "depth": 7, "iso_1_code": null, "iso_3_code": "bhv", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2971", "native_tokenizers": [], @@ -20525,9 +23534,11 @@ }, { "name": "Kayan, Baram", + "depth": 7, "iso_1_code": null, "iso_3_code": "kys", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2972", "native_tokenizers": [], @@ -20535,9 +23546,11 @@ }, { "name": "Kayan, Rejang", + "depth": 7, "iso_1_code": null, "iso_3_code": "ree", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2973", "native_tokenizers": [], @@ -20545,9 +23558,11 @@ }, { "name": "Kayan, Wahau", + "depth": 7, "iso_1_code": null, "iso_3_code": "whu", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2974", "native_tokenizers": [], @@ -20555,9 +23570,11 @@ }, { "name": "Kayan Mahakam", + "depth": 7, "iso_1_code": null, "iso_3_code": "xay", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2975", "native_tokenizers": [], @@ -20565,9 +23582,11 @@ }, { "name": "Kayan, Mendalam", + "depth": 7, "iso_1_code": null, "iso_3_code": "xkd", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2976", "native_tokenizers": [], @@ -20575,15 +23594,18 @@ }, { "name": "Kayan, Kayan River", + "depth": 7, "iso_1_code": null, "iso_3_code": "xkn", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2977", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2969", "native_tokenizers": [], @@ -20591,14 +23613,17 @@ }, { "name": "Modang", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Modang", + "depth": 7, "iso_1_code": null, "iso_3_code": "mxd", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2979", "native_tokenizers": [], @@ -20606,15 +23631,18 @@ }, { "name": "Segai", + "depth": 7, "iso_1_code": null, "iso_3_code": "sge", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2980", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2978", "native_tokenizers": [], @@ -20622,14 +23650,17 @@ }, { "name": "Muller-Schwaner \u2018Punan\u2019", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bukat", + "depth": 7, "iso_1_code": null, "iso_3_code": "bvk", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2982", "native_tokenizers": [], @@ -20637,9 +23668,11 @@ }, { "name": "Hovongan", + "depth": 7, "iso_1_code": null, "iso_3_code": "hov", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2983", "native_tokenizers": [], @@ -20647,9 +23680,11 @@ }, { "name": "Aoheng", + "depth": 7, "iso_1_code": null, "iso_3_code": "pni", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2984", "native_tokenizers": [], @@ -20657,9 +23692,11 @@ }, { "name": "Punan Aput", + "depth": 7, "iso_1_code": null, "iso_3_code": "pud", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2985", "native_tokenizers": [], @@ -20667,9 +23704,11 @@ }, { "name": "Punan Merah", + "depth": 7, "iso_1_code": null, "iso_3_code": "puf", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2986", "native_tokenizers": [], @@ -20677,15 +23716,18 @@ }, { "name": "Kereho", + "depth": 7, "iso_1_code": null, "iso_3_code": "xke", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2987", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2981", "native_tokenizers": [], @@ -20693,26 +23735,31 @@ }, { "name": "Murik Kayan", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Murik", + "depth": 7, "iso_1_code": null, "iso_3_code": "mxr", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2989", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2988", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2968", "native_tokenizers": [], @@ -20720,14 +23767,17 @@ }, { "name": "Kenyah", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kenyah, Mainstream", + "depth": 6, "iso_1_code": null, "iso_3_code": "xkl", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2991", "native_tokenizers": [], @@ -20735,14 +23785,17 @@ }, { "name": "Kayanic Kenyah", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Sebop", + "depth": 7, "iso_1_code": null, "iso_3_code": "sib", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2993", "native_tokenizers": [], @@ -20750,9 +23803,11 @@ }, { "name": "Long Wat", + "depth": 7, "iso_1_code": null, "iso_3_code": "ttw", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2994", "native_tokenizers": [], @@ -20760,9 +23815,11 @@ }, { "name": "Kenyah, Wahau", + "depth": 7, "iso_1_code": null, "iso_3_code": "whk", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -20779,6 +23836,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -20794,14 +23852,17 @@ }, { "name": "Upper Pujungan", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Uma\u2019 Lung", + "depth": 7, "iso_1_code": null, "iso_3_code": "ulu", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2997", "native_tokenizers": [], @@ -20809,21 +23870,25 @@ }, { "name": "Uma\u2019 Lasan", + "depth": 7, "iso_1_code": null, "iso_3_code": "xky", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "2998", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "2996", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -20839,14 +23904,17 @@ }, { "name": "Penan", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Penan, Eastern", + "depth": 6, "iso_1_code": null, "iso_3_code": "pez", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3000", "native_tokenizers": [], @@ -20854,9 +23922,11 @@ }, { "name": "Penan, Western", + "depth": 6, "iso_1_code": null, "iso_3_code": "pne", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -20873,6 +23943,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -20887,6 +23958,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -20902,26 +23974,31 @@ }, { "name": "Punan Tubu", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Punan Tubu", + "depth": 5, "iso_1_code": null, "iso_3_code": "puj", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3003", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "3002", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -20937,14 +24014,17 @@ }, { "name": "Rejang-Sajau", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Basap", + "depth": 4, "iso_1_code": null, "iso_3_code": "bdb", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3005", "native_tokenizers": [], @@ -20952,9 +24032,11 @@ }, { "name": "Burusu", + "depth": 4, "iso_1_code": null, "iso_3_code": "bqr", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3006", "native_tokenizers": [], @@ -20962,9 +24044,11 @@ }, { "name": "Punan Bah-Biau", + "depth": 4, "iso_1_code": null, "iso_3_code": "pna", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3007", "native_tokenizers": [], @@ -20972,9 +24056,11 @@ }, { "name": "Punan Merap", + "depth": 4, "iso_1_code": null, "iso_3_code": "puc", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3008", "native_tokenizers": [], @@ -20982,15 +24068,18 @@ }, { "name": "Sajau Basap", + "depth": 4, "iso_1_code": null, "iso_3_code": "sjb", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3009", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "3004", "native_tokenizers": [], @@ -20998,24 +24087,29 @@ }, { "name": "Sabahan", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dusunic", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bisaya-Lotud", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bisaya, Sabah", + "depth": 6, "iso_1_code": null, "iso_3_code": "bsy", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3013", "native_tokenizers": [], @@ -21023,9 +24117,11 @@ }, { "name": "Lotud", + "depth": 6, "iso_1_code": null, "iso_3_code": "dtr", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3014", "native_tokenizers": [], @@ -21033,26 +24129,31 @@ }, { "name": "Southern", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bisaya, Brunei", + "depth": 7, "iso_1_code": null, "iso_3_code": "bsb", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3016", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "3015", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "3012", "native_tokenizers": [], @@ -21060,14 +24161,17 @@ }, { "name": "Dusun", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kuijau", + "depth": 6, "iso_1_code": null, "iso_3_code": "dkr", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3018", "native_tokenizers": [], @@ -21075,9 +24179,11 @@ }, { "name": "Rungus", + "depth": 6, "iso_1_code": null, "iso_3_code": "drg", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -21095,9 +24201,11 @@ }, { "name": "Kota Marudu Talantang", + "depth": 6, "iso_1_code": null, "iso_3_code": "grm", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3020", "native_tokenizers": [], @@ -21105,9 +24213,11 @@ }, { "name": "Kimaragang", + "depth": 6, "iso_1_code": null, "iso_3_code": "kqr", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3021", "native_tokenizers": [], @@ -21115,9 +24225,11 @@ }, { "name": "Kadazan, Klias River", + "depth": 6, "iso_1_code": null, "iso_3_code": "kqt", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3022", "native_tokenizers": [], @@ -21125,9 +24237,11 @@ }, { "name": "Tobilung", + "depth": 6, "iso_1_code": null, "iso_3_code": "tgb", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3023", "native_tokenizers": [], @@ -21135,14 +24249,17 @@ }, { "name": "Central", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kadazan Dusun", + "depth": 7, "iso_1_code": null, "iso_3_code": "dtp", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -21160,9 +24277,11 @@ }, { "name": "Sugut Dusun", + "depth": 7, "iso_1_code": null, "iso_3_code": "kzs", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3026", "native_tokenizers": [], @@ -21170,15 +24289,18 @@ }, { "name": "Minokok", + "depth": 7, "iso_1_code": null, "iso_3_code": "mqq", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3027", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -21194,14 +24316,17 @@ }, { "name": "Eastern", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kadazan, Labuk-Kinabatangan", + "depth": 7, "iso_1_code": null, "iso_3_code": "dtb", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -21218,6 +24343,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -21232,6 +24358,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -21247,26 +24374,31 @@ }, { "name": "Unclassified", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dumpas", + "depth": 6, "iso_1_code": null, "iso_3_code": "dmv", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3031", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "3030", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -21282,20 +24414,24 @@ }, { "name": "Ida\u2019an", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ida\u2019an", + "depth": 5, "iso_1_code": null, "iso_3_code": "dbj", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3033", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "3032", "native_tokenizers": [], @@ -21303,19 +24439,23 @@ }, { "name": "Murutic", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Murut", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Okolod", + "depth": 6, "iso_1_code": null, "iso_3_code": "kqv", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3036", "native_tokenizers": [], @@ -21323,9 +24463,11 @@ }, { "name": "Murut, Keningau", + "depth": 6, "iso_1_code": null, "iso_3_code": "kxi", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3037", "native_tokenizers": [], @@ -21333,9 +24475,11 @@ }, { "name": "Murut, Tahol", + "depth": 6, "iso_1_code": null, "iso_3_code": "mvv", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3038", "native_tokenizers": [], @@ -21343,9 +24487,11 @@ }, { "name": "Murut, Paluan", + "depth": 6, "iso_1_code": null, "iso_3_code": "plz", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3039", "native_tokenizers": [], @@ -21353,9 +24499,11 @@ }, { "name": "Murut, Selungai", + "depth": 6, "iso_1_code": null, "iso_3_code": "slg", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3040", "native_tokenizers": [], @@ -21363,9 +24511,11 @@ }, { "name": "Murut, Timugon", + "depth": 6, "iso_1_code": null, "iso_3_code": "tih", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -21382,6 +24532,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -21397,20 +24548,24 @@ }, { "name": "Northern", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Murut, Bookan", + "depth": 6, "iso_1_code": null, "iso_3_code": "bnb", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3043", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "3042", "native_tokenizers": [], @@ -21418,14 +24573,17 @@ }, { "name": "Southern", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Murut, Kalabakan", + "depth": 6, "iso_1_code": null, "iso_3_code": "kve", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3045", "native_tokenizers": [], @@ -21433,15 +24591,18 @@ }, { "name": "Murut, Sembakung", + "depth": 6, "iso_1_code": null, "iso_3_code": "sbr", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3046", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "3044", "native_tokenizers": [], @@ -21449,14 +24610,17 @@ }, { "name": "Tidung", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tidung, Southern", + "depth": 6, "iso_1_code": null, "iso_3_code": "itd", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3048", "native_tokenizers": [], @@ -21464,9 +24628,11 @@ }, { "name": "Tidung, Northern", + "depth": 6, "iso_1_code": null, "iso_3_code": "ntd", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3049", "native_tokenizers": [], @@ -21474,15 +24640,18 @@ }, { "name": "Murut, Serudung", + "depth": 6, "iso_1_code": null, "iso_3_code": "srk", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3050", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "3047", "native_tokenizers": [], @@ -21490,14 +24659,17 @@ }, { "name": "Unclassified", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Papar", + "depth": 6, "iso_1_code": null, "iso_3_code": "dpp", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3052", "native_tokenizers": [], @@ -21505,21 +24677,25 @@ }, { "name": "Gana", + "depth": 6, "iso_1_code": null, "iso_3_code": "gnq", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3053", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "3051", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -21535,14 +24711,17 @@ }, { "name": "Paitanic", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Abai Sungai", + "depth": 5, "iso_1_code": null, "iso_3_code": "abf", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3055", "native_tokenizers": [], @@ -21550,9 +24729,11 @@ }, { "name": "Tombonuo", + "depth": 5, "iso_1_code": null, "iso_3_code": "txa", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3056", "native_tokenizers": [], @@ -21560,14 +24741,17 @@ }, { "name": "Upper Kinabatangan", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kinabatangan, Upper", + "depth": 6, "iso_1_code": null, "iso_3_code": "dmg", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3058", "native_tokenizers": [], @@ -21575,9 +24759,11 @@ }, { "name": "Lobu, Tampias", + "depth": 6, "iso_1_code": null, "iso_3_code": "low", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3059", "native_tokenizers": [], @@ -21585,21 +24771,25 @@ }, { "name": "Lobu, Lanas", + "depth": 6, "iso_1_code": null, "iso_3_code": "ruu", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3060", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "3057", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "3054", "native_tokenizers": [], @@ -21607,26 +24797,31 @@ }, { "name": "Unclassified", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tatana", + "depth": 5, "iso_1_code": null, "iso_3_code": "txx", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3062", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "3061", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -21641,6 +24836,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -21656,14 +24852,17 @@ }, { "name": "North Mangyan", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Alangan", + "depth": 3, "iso_1_code": null, "iso_3_code": "alj", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -21681,9 +24880,11 @@ }, { "name": "Iraya", + "depth": 3, "iso_1_code": null, "iso_3_code": "iry", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -21701,15 +24902,18 @@ }, { "name": "Tadyawan", + "depth": 3, "iso_1_code": null, "iso_3_code": "tdy", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3066", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -21725,25 +24929,30 @@ }, { "name": "Northern Luzon", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Arta", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Arta", + "depth": 4, "iso_1_code": null, "iso_3_code": "atz", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3069", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "3068", "native_tokenizers": [], @@ -21751,14 +24960,17 @@ }, { "name": "Ilocano", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ilocano", + "depth": 4, "iso_1_code": null, "iso_3_code": "ilo", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -21775,6 +24987,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -21790,19 +25003,23 @@ }, { "name": "Meso-Cordilleran", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Alta", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Alta, Southern", + "depth": 5, "iso_1_code": null, "iso_3_code": "agy", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3074", "native_tokenizers": [], @@ -21810,15 +25027,18 @@ }, { "name": "Alta, Northern", + "depth": 5, "iso_1_code": null, "iso_3_code": "aqn", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3075", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "3073", "native_tokenizers": [], @@ -21826,30 +25046,36 @@ }, { "name": "South-Central Cordilleran", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Central Cordilleran", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Isinai", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Isinay", + "depth": 7, "iso_1_code": null, "iso_3_code": "inn", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3079", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "3078", "native_tokenizers": [], @@ -21857,24 +25083,29 @@ }, { "name": "North Central Cordilleran", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kalinga-Itneg", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Itneg", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Itneg, Binongan", + "depth": 9, "iso_1_code": null, "iso_3_code": "itb", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3083", "native_tokenizers": [], @@ -21882,9 +25113,11 @@ }, { "name": "Itneg, Inlaud", + "depth": 9, "iso_1_code": null, "iso_3_code": "iti", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3084", "native_tokenizers": [], @@ -21892,9 +25125,11 @@ }, { "name": "Itneg, Maeng", + "depth": 9, "iso_1_code": null, "iso_3_code": "itt", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3085", "native_tokenizers": [], @@ -21902,9 +25137,11 @@ }, { "name": "Itneg, Moyadan", + "depth": 9, "iso_1_code": null, "iso_3_code": "ity", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3086", "native_tokenizers": [], @@ -21912,15 +25149,18 @@ }, { "name": "Itneg, Masadiit", + "depth": 9, "iso_1_code": null, "iso_3_code": "tis", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3087", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "3082", "native_tokenizers": [], @@ -21928,14 +25168,17 @@ }, { "name": "Kalinga", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kalinga, Vanaw", + "depth": 9, "iso_1_code": null, "iso_3_code": "bjx", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3089", "native_tokenizers": [], @@ -21943,9 +25186,11 @@ }, { "name": "Kalinga, Mabaka Valley", + "depth": 9, "iso_1_code": null, "iso_3_code": "kkg", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3090", "native_tokenizers": [], @@ -21953,9 +25198,11 @@ }, { "name": "Kalinga, Majukayang", + "depth": 9, "iso_1_code": null, "iso_3_code": "kmd", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -21973,9 +25220,11 @@ }, { "name": "Kalinga, Limos", + "depth": 9, "iso_1_code": null, "iso_3_code": "kmk", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -21993,9 +25242,11 @@ }, { "name": "Kalinga, Tanudan", + "depth": 9, "iso_1_code": null, "iso_3_code": "kml", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3093", "native_tokenizers": [], @@ -22003,9 +25254,11 @@ }, { "name": "Kalinga, Lubuagan", + "depth": 9, "iso_1_code": null, "iso_3_code": "knb", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3094", "native_tokenizers": [], @@ -22013,9 +25266,11 @@ }, { "name": "Kalinga, Southern", + "depth": 9, "iso_1_code": null, "iso_3_code": "ksc", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -22033,15 +25288,18 @@ }, { "name": "Kalinga, Butbut", + "depth": 9, "iso_1_code": null, "iso_3_code": "kyb", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3096", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -22056,6 +25314,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -22071,19 +25330,23 @@ }, { "name": "Nuclear Cordilleran", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Balangaw", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Balangao", + "depth": 9, "iso_1_code": null, "iso_3_code": "blw", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -22100,6 +25363,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -22115,19 +25379,23 @@ }, { "name": "Bontok-Kankanay", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bontok", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bontok, Eastern", + "depth": 10, "iso_1_code": null, "iso_3_code": "ebk", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -22145,9 +25413,11 @@ }, { "name": "Bontok, Central", + "depth": 10, "iso_1_code": null, "iso_3_code": "lbk", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -22165,9 +25435,11 @@ }, { "name": "Bontok, Southern", + "depth": 10, "iso_1_code": null, "iso_3_code": "obk", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3104", "native_tokenizers": [], @@ -22175,9 +25447,11 @@ }, { "name": "Bontok, Northern", + "depth": 10, "iso_1_code": null, "iso_3_code": "rbk", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3105", "native_tokenizers": [], @@ -22185,15 +25459,18 @@ }, { "name": "Bontok, Southwestern", + "depth": 10, "iso_1_code": null, "iso_3_code": "vbk", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3106", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -22209,14 +25486,17 @@ }, { "name": "Kankanay", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kankanaey", + "depth": 10, "iso_1_code": null, "iso_3_code": "kne", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -22234,9 +25514,11 @@ }, { "name": "Kankanay, Northern", + "depth": 10, "iso_1_code": null, "iso_3_code": "xnn", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -22253,6 +25535,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -22267,6 +25550,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -22282,14 +25566,17 @@ }, { "name": "Ifugaw", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ifugao, Amganad", + "depth": 9, "iso_1_code": null, "iso_3_code": "ifa", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -22307,9 +25594,11 @@ }, { "name": "Ifugao, Batad", + "depth": 9, "iso_1_code": null, "iso_3_code": "ifb", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -22327,9 +25616,11 @@ }, { "name": "Ifugao, Tuwali", + "depth": 9, "iso_1_code": null, "iso_3_code": "ifk", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -22347,9 +25638,11 @@ }, { "name": "Ifugao, Mayoyao", + "depth": 9, "iso_1_code": null, "iso_3_code": "ifu", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -22366,6 +25659,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -22380,6 +25674,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -22394,6 +25689,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -22408,6 +25704,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -22423,25 +25720,30 @@ }, { "name": "Southern Cordilleran", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ilongot", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bogkalot", + "depth": 7, "iso_1_code": null, "iso_3_code": "ilk", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3117", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "3116", "native_tokenizers": [], @@ -22449,14 +25751,17 @@ }, { "name": "West Southern Cordilleran", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Pangasinan", + "depth": 7, "iso_1_code": null, "iso_3_code": "pag", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -22474,19 +25779,23 @@ }, { "name": "Nuclear Southern Cordilleran", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ibaloy", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ibaloi", + "depth": 9, "iso_1_code": null, "iso_3_code": "ibl", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3122", "native_tokenizers": [], @@ -22494,15 +25803,18 @@ }, { "name": "I-wak", + "depth": 9, "iso_1_code": null, "iso_3_code": "iwk", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3123", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "3121", "native_tokenizers": [], @@ -22510,14 +25822,17 @@ }, { "name": "Kallahan", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kallahan, Keley-i", + "depth": 9, "iso_1_code": null, "iso_3_code": "ify", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -22535,9 +25850,11 @@ }, { "name": "Kalanguya", + "depth": 9, "iso_1_code": null, "iso_3_code": "kak", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -22554,6 +25871,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -22569,26 +25887,31 @@ }, { "name": "Karaw", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Karao", + "depth": 9, "iso_1_code": null, "iso_3_code": "kyj", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3128", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "3127", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -22603,6 +25926,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -22617,6 +25941,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -22631,6 +25956,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -22645,6 +25971,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -22660,24 +25987,29 @@ }, { "name": "Northern Cordilleran", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Cagayan Valley", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ibanagic", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Atta, Pudtol", + "depth": 6, "iso_1_code": null, "iso_3_code": "atp", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3132", "native_tokenizers": [], @@ -22685,9 +26017,11 @@ }, { "name": "Atta, Pamplona", + "depth": 6, "iso_1_code": null, "iso_3_code": "att", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -22705,9 +26039,11 @@ }, { "name": "Atta, Faire", + "depth": 6, "iso_1_code": null, "iso_3_code": "azt", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3134", "native_tokenizers": [], @@ -22715,9 +26051,11 @@ }, { "name": "Ibanag", + "depth": 6, "iso_1_code": null, "iso_3_code": "ibg", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -22735,9 +26073,11 @@ }, { "name": "Itawit", + "depth": 6, "iso_1_code": null, "iso_3_code": "itv", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -22755,9 +26095,11 @@ }, { "name": "Yogad", + "depth": 6, "iso_1_code": null, "iso_3_code": "yog", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3137", "native_tokenizers": [], @@ -22765,14 +26107,17 @@ }, { "name": "Gaddangic", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Agta, Central Cagayan", + "depth": 7, "iso_1_code": null, "iso_3_code": "agt", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -22790,9 +26135,11 @@ }, { "name": "Gaddang", + "depth": 7, "iso_1_code": null, "iso_3_code": "gad", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3140", "native_tokenizers": [], @@ -22800,9 +26147,11 @@ }, { "name": "Ga\ua78cdang", + "depth": 7, "iso_1_code": null, "iso_3_code": "gdg", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -22819,6 +26168,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -22833,6 +26183,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -22848,14 +26199,17 @@ }, { "name": "Isnag", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Isnag", + "depth": 6, "iso_1_code": null, "iso_3_code": "isd", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -22873,15 +26227,18 @@ }, { "name": "Adasen", + "depth": 6, "iso_1_code": null, "iso_3_code": "tiu", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3144", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -22896,6 +26253,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -22911,14 +26269,17 @@ }, { "name": "Northeastern Luzon", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Agta, Pahanan", + "depth": 5, "iso_1_code": null, "iso_3_code": "apf", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3146", "native_tokenizers": [], @@ -22926,9 +26287,11 @@ }, { "name": "Paranan", + "depth": 5, "iso_1_code": null, "iso_3_code": "prf", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -22946,14 +26309,17 @@ }, { "name": "Northern", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Agta, Casiguran Dumagat", + "depth": 6, "iso_1_code": null, "iso_3_code": "dgc", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -22971,9 +26337,11 @@ }, { "name": "Agta, Dupaninan", + "depth": 6, "iso_1_code": null, "iso_3_code": "duo", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -22991,9 +26359,11 @@ }, { "name": "Agta, Dicamay", + "depth": 6, "iso_1_code": null, "iso_3_code": "duy", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3151", "native_tokenizers": [], @@ -23001,15 +26371,18 @@ }, { "name": "Kasiguranin", + "depth": 6, "iso_1_code": null, "iso_3_code": "ksn", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3152", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -23024,6 +26397,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -23038,6 +26412,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -23052,6 +26427,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -23067,14 +26443,17 @@ }, { "name": "Northwest Sumatra-Barrier Islands", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Enggano", + "depth": 3, "iso_1_code": null, "iso_3_code": "eno", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3154", "native_tokenizers": [], @@ -23082,9 +26461,11 @@ }, { "name": "Gayo", + "depth": 3, "iso_1_code": null, "iso_3_code": "gay", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3155", "native_tokenizers": [], @@ -23092,9 +26473,11 @@ }, { "name": "Mentawai", + "depth": 3, "iso_1_code": null, "iso_3_code": "mwv", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -23112,9 +26495,11 @@ }, { "name": "Simeulue", + "depth": 3, "iso_1_code": null, "iso_3_code": "smr", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3157", "native_tokenizers": [], @@ -23122,19 +26507,23 @@ }, { "name": "Batak", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Northern", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Batak Dairi", + "depth": 5, "iso_1_code": null, "iso_3_code": "btd", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -23152,9 +26541,11 @@ }, { "name": "Batak Karo", + "depth": 5, "iso_1_code": null, "iso_3_code": "btx", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -23172,15 +26563,18 @@ }, { "name": "Batak Alas-Kluet", + "depth": 5, "iso_1_code": null, "iso_3_code": "btz", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3162", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -23196,14 +26590,17 @@ }, { "name": "Simalungan", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Batak Simalungun", + "depth": 5, "iso_1_code": null, "iso_3_code": "bts", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -23220,6 +26617,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -23235,14 +26633,17 @@ }, { "name": "Southern", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Batak Angkola", + "depth": 5, "iso_1_code": null, "iso_3_code": "akb", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -23260,9 +26661,11 @@ }, { "name": "Batak Toba", + "depth": 5, "iso_1_code": null, "iso_3_code": "bbc", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -23280,15 +26683,18 @@ }, { "name": "Batak Mandailing", + "depth": 5, "iso_1_code": null, "iso_3_code": "btm", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3168", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -23303,6 +26709,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -23318,14 +26725,17 @@ }, { "name": "Nias", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nias", + "depth": 4, "iso_1_code": null, "iso_3_code": "nia", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -23343,15 +26753,18 @@ }, { "name": "Sikule", + "depth": 4, "iso_1_code": null, "iso_3_code": "skh", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3171", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -23366,6 +26779,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -23381,14 +26795,17 @@ }, { "name": "Palauan", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Palauan", + "depth": 3, "iso_1_code": null, "iso_3_code": "pau", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -23405,6 +26822,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -23420,14 +26838,17 @@ }, { "name": "Rejang", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Rejang", + "depth": 3, "iso_1_code": null, "iso_3_code": "rej", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -23444,6 +26865,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -23459,19 +26881,23 @@ }, { "name": "Sangiric", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Northern", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Sangil", + "depth": 4, "iso_1_code": null, "iso_3_code": "snl", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3178", "native_tokenizers": [], @@ -23479,9 +26905,11 @@ }, { "name": "Sangir", + "depth": 4, "iso_1_code": null, "iso_3_code": "sxn", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -23499,15 +26927,18 @@ }, { "name": "Talaud", + "depth": 4, "iso_1_code": null, "iso_3_code": "tld", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3180", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -23523,14 +26954,17 @@ }, { "name": "Southern", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bantik", + "depth": 4, "iso_1_code": null, "iso_3_code": "bnq", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3182", "native_tokenizers": [], @@ -23538,21 +26972,25 @@ }, { "name": "Ratahan", + "depth": 4, "iso_1_code": null, "iso_3_code": "rth", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3183", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "3181", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -23568,19 +27006,23 @@ }, { "name": "South Sulawesi", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bugis", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bugis", + "depth": 4, "iso_1_code": null, "iso_3_code": "bug", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -23598,9 +27040,11 @@ }, { "name": "Koneq-koneq", + "depth": 4, "iso_1_code": null, "iso_3_code": "cml", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3187", "native_tokenizers": [], @@ -23608,14 +27052,17 @@ }, { "name": "Tamanic", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Embaloh", + "depth": 5, "iso_1_code": null, "iso_3_code": "emb", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3189", "native_tokenizers": [], @@ -23623,21 +27070,25 @@ }, { "name": "Taman", + "depth": 5, "iso_1_code": null, "iso_3_code": "tmn", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3190", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "3188", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -23653,20 +27104,24 @@ }, { "name": "Lemolang", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Limola", + "depth": 4, "iso_1_code": null, "iso_3_code": "ley", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3192", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "3191", "native_tokenizers": [], @@ -23674,14 +27129,17 @@ }, { "name": "Makassar", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bentong", + "depth": 4, "iso_1_code": null, "iso_3_code": "bnu", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3194", "native_tokenizers": [], @@ -23689,9 +27147,11 @@ }, { "name": "Konjo, Coastal", + "depth": 4, "iso_1_code": null, "iso_3_code": "kjc", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3195", "native_tokenizers": [], @@ -23699,9 +27159,11 @@ }, { "name": "Konjo, Highland", + "depth": 4, "iso_1_code": null, "iso_3_code": "kjk", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3196", "native_tokenizers": [], @@ -23709,9 +27171,11 @@ }, { "name": "Makasar", + "depth": 4, "iso_1_code": null, "iso_3_code": "mak", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -23729,15 +27193,18 @@ }, { "name": "Selayar", + "depth": 4, "iso_1_code": null, "iso_3_code": "sly", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3198", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -23753,25 +27220,30 @@ }, { "name": "Northern", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mamuju", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mamuju", + "depth": 5, "iso_1_code": null, "iso_3_code": "mqx", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3201", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "3200", "native_tokenizers": [], @@ -23779,20 +27251,24 @@ }, { "name": "Mandar", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mandar", + "depth": 5, "iso_1_code": null, "iso_3_code": "mdr", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3203", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "3202", "native_tokenizers": [], @@ -23800,14 +27276,17 @@ }, { "name": "Masenrempulu", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Malimpung", + "depth": 5, "iso_1_code": null, "iso_3_code": "mli", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3205", "native_tokenizers": [], @@ -23815,9 +27294,11 @@ }, { "name": "Duri", + "depth": 5, "iso_1_code": null, "iso_3_code": "mvp", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -23835,9 +27316,11 @@ }, { "name": "Enrekang", + "depth": 5, "iso_1_code": null, "iso_3_code": "ptt", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3207", "native_tokenizers": [], @@ -23845,15 +27328,18 @@ }, { "name": "Maiwa", + "depth": 5, "iso_1_code": null, "iso_3_code": "wmm", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3208", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -23869,14 +27355,17 @@ }, { "name": "Pitu Ulunna Salu", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Aralle-Tabulahan", + "depth": 5, "iso_1_code": null, "iso_3_code": "atq", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -23894,9 +27383,11 @@ }, { "name": "Dakka", + "depth": 5, "iso_1_code": null, "iso_3_code": "dkk", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3211", "native_tokenizers": [], @@ -23904,9 +27395,11 @@ }, { "name": "Pannei", + "depth": 5, "iso_1_code": null, "iso_3_code": "pnc", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3212", "native_tokenizers": [], @@ -23914,9 +27407,11 @@ }, { "name": "Bambam", + "depth": 5, "iso_1_code": null, "iso_3_code": "ptu", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -23934,15 +27429,18 @@ }, { "name": "Ulumanda\u2019", + "depth": 5, "iso_1_code": null, "iso_3_code": "ulm", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3214", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -23958,14 +27456,17 @@ }, { "name": "Toraja-Sa\u2019dan", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kalumpang", + "depth": 5, "iso_1_code": null, "iso_3_code": "kli", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3216", "native_tokenizers": [], @@ -23973,9 +27474,11 @@ }, { "name": "Mamasa", + "depth": 5, "iso_1_code": null, "iso_3_code": "mqj", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -23993,9 +27496,11 @@ }, { "name": "Tae\u2019", + "depth": 5, "iso_1_code": null, "iso_3_code": "rob", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3218", "native_tokenizers": [], @@ -24003,9 +27508,11 @@ }, { "name": "Toraja-Sa\u2019dan", + "depth": 5, "iso_1_code": null, "iso_3_code": "sda", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -24023,15 +27530,18 @@ }, { "name": "Talondo\u2019", + "depth": 5, "iso_1_code": null, "iso_3_code": "tln", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3220", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -24046,6 +27556,7 @@ "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -24061,14 +27572,17 @@ }, { "name": "Seko", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Seko Tengah", + "depth": 4, "iso_1_code": null, "iso_3_code": "sko", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3222", "native_tokenizers": [], @@ -24076,9 +27590,11 @@ }, { "name": "Seko Padang", + "depth": 4, "iso_1_code": null, "iso_3_code": "skx", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3223", "native_tokenizers": [], @@ -24086,14 +27602,17 @@ }, { "name": "Panasuan", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Budong-Budong", + "depth": 5, "iso_1_code": null, "iso_3_code": "bdx", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3225", "native_tokenizers": [], @@ -24101,27 +27620,32 @@ }, { "name": "Panasuan", + "depth": 5, "iso_1_code": null, "iso_3_code": "psn", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3226", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "3224", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "3221", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -24137,14 +27661,17 @@ }, { "name": "Sundanese", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Badui", + "depth": 3, "iso_1_code": null, "iso_3_code": "bac", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3228", "native_tokenizers": [], @@ -24152,9 +27679,11 @@ }, { "name": "Sunda", + "depth": 3, "iso_1_code": "su", "iso_3_code": "sun", "children": [], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -24171,6 +27700,7 @@ ] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -24186,14 +27716,17 @@ }, { "name": "Unclassified", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bulungan", + "depth": 3, "iso_1_code": null, "iso_3_code": "blj", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3231", "native_tokenizers": [], @@ -24201,21 +27734,25 @@ }, { "name": "Gorap", + "depth": 3, "iso_1_code": null, "iso_3_code": "goq", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3232", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "3230", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -24231,14 +27768,17 @@ }, { "name": "Northwest Formosan", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Pazeh", + "depth": 2, "iso_1_code": null, "iso_3_code": "pzh", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3234", "native_tokenizers": [], @@ -24246,9 +27786,11 @@ }, { "name": "Kulon", + "depth": 2, "iso_1_code": null, "iso_3_code": "uon", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3235", "native_tokenizers": [], @@ -24256,15 +27798,18 @@ }, { "name": "Saisiyat", + "depth": 2, "iso_1_code": null, "iso_3_code": "xsy", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3236", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "3233", "native_tokenizers": [], @@ -24272,23 +27817,18 @@ }, { "name": "Paiwan", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Paiwan", + "depth": 2, "iso_1_code": null, "iso_3_code": "pwn", "children": [], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"ms\")", - "original_lang_name": "malay", - "original_lang_code": "msa", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Austronesian", + "tokenizers": {}, "node_i": "3238", "native_tokenizers": [], "scripts": [ @@ -24296,35 +27836,32 @@ ] } ], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"ms\")", - "original_lang_name": "malay", - "original_lang_code": "msa", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Austronesian", + "tokenizers": {}, "node_i": "3237", "native_tokenizers": [], "scripts": [] }, { "name": "Puyuma", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Puyuma", + "depth": 2, "iso_1_code": null, "iso_3_code": "pyu", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3240", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "3239", "native_tokenizers": [], @@ -24332,23 +27869,18 @@ }, { "name": "Rukai", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Rukai", + "depth": 2, "iso_1_code": null, "iso_3_code": "dru", "children": [], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"ms\")", - "original_lang_name": "malay", - "original_lang_code": "msa", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Austronesian", + "tokenizers": {}, "node_i": "3242", "native_tokenizers": [], "scripts": [ @@ -24356,29 +27888,25 @@ ] } ], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"ms\")", - "original_lang_name": "malay", - "original_lang_code": "msa", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Austronesian", + "tokenizers": {}, "node_i": "3241", "native_tokenizers": [], "scripts": [] }, { "name": "Tsouic", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Saaroa", + "depth": 2, "iso_1_code": null, "iso_3_code": "sxr", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3244", "native_tokenizers": [], @@ -24386,9 +27914,11 @@ }, { "name": "Tsou", + "depth": 2, "iso_1_code": null, "iso_3_code": "tsu", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3245", "native_tokenizers": [], @@ -24396,15 +27926,18 @@ }, { "name": "Kanakanabu", + "depth": 2, "iso_1_code": null, "iso_3_code": "xnb", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3246", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "3243", "native_tokenizers": [], @@ -24412,20 +27945,24 @@ }, { "name": "Unclassified", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ketangalan", + "depth": 2, "iso_1_code": null, "iso_3_code": "kae", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3248", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "3247", "native_tokenizers": [], @@ -24433,19 +27970,23 @@ }, { "name": "Western Plains", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Central Western Plains", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Babuza", + "depth": 3, "iso_1_code": null, "iso_3_code": "bzg", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3251", "native_tokenizers": [], @@ -24453,15 +27994,18 @@ }, { "name": "Papora-Hoanya", + "depth": 3, "iso_1_code": null, "iso_3_code": "ppu", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3252", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "3250", "native_tokenizers": [], @@ -24469,41 +28013,39 @@ }, { "name": "Thao", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Thao", + "depth": 3, "iso_1_code": null, "iso_3_code": "ssf", "children": [], + "family": "Austronesian", "tokenizers": {}, "node_i": "3254", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "3253", "native_tokenizers": [], "scripts": [] } ], + "family": "Austronesian", "tokenizers": {}, "node_i": "3249", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"ms\")", - "original_lang_name": "malay", - "original_lang_code": "msa", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Austronesian", + "tokenizers": {}, "node_i": "1436", "native_tokenizers": [], "scripts": [] diff --git a/data/Aymaran.json b/data/Aymaran.json index 2ccfa4a8043e7a8ee111777c90c4d5560b405065..ad6a23c3e2e7a0f7c5404e09d1a5402664045b3f 100644 --- a/data/Aymaran.json +++ b/data/Aymaran.json @@ -1,18 +1,22 @@ { "name": "Aymaran", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Aymara", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Aymara, Southern", + "depth": 2, "iso_1_code": "ay", "iso_3_code": "ayc", "children": [], + "family": "Aymaran", "tokenizers": {}, "node_i": "3257", "native_tokenizers": [], @@ -20,9 +24,11 @@ }, { "name": "Aymara, Central", + "depth": 2, "iso_1_code": "ay", "iso_3_code": "ayr", "children": [], + "family": "Aymaran", "tokenizers": {}, "node_i": "3258", "native_tokenizers": [], @@ -31,6 +37,7 @@ ] } ], + "family": "Aymaran", "tokenizers": {}, "node_i": "3256", "native_tokenizers": [], @@ -38,26 +45,31 @@ }, { "name": "Tupe", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Jaqaru", + "depth": 2, "iso_1_code": null, "iso_3_code": "jqr", "children": [], + "family": "Aymaran", "tokenizers": {}, "node_i": "3260", "native_tokenizers": [], "scripts": [] } ], + "family": "Aymaran", "tokenizers": {}, "node_i": "3259", "native_tokenizers": [], "scripts": [] } ], + "family": "Aymaran", "tokenizers": {}, "node_i": "3255", "native_tokenizers": [], diff --git a/data/Barbacoan.json b/data/Barbacoan.json index 0002e9a5533cfe614a8f94b6c88c240945b6cde7..2ded14b05af73427c4b717d39082f42841143c82 100644 --- a/data/Barbacoan.json +++ b/data/Barbacoan.json @@ -1,18 +1,22 @@ { "name": "Barbacoan", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Northern", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Awa-Cuaiquer", + "depth": 2, "iso_1_code": null, "iso_3_code": "kwi", "children": [], + "family": "Barbacoan", "tokenizers": {}, "node_i": "3263", "native_tokenizers": [], @@ -21,6 +25,7 @@ ] } ], + "family": "Barbacoan", "tokenizers": {}, "node_i": "3262", "native_tokenizers": [], @@ -28,14 +33,17 @@ }, { "name": "Southern", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chachi", + "depth": 2, "iso_1_code": null, "iso_3_code": "cbi", "children": [], + "family": "Barbacoan", "tokenizers": {}, "node_i": "3265", "native_tokenizers": [], @@ -45,9 +53,11 @@ }, { "name": "Tsafiki", + "depth": 2, "iso_1_code": null, "iso_3_code": "cof", "children": [], + "family": "Barbacoan", "tokenizers": {}, "node_i": "3266", "native_tokenizers": [], @@ -56,12 +66,14 @@ ] } ], + "family": "Barbacoan", "tokenizers": {}, "node_i": "3264", "native_tokenizers": [], "scripts": [] } ], + "family": "Barbacoan", "tokenizers": {}, "node_i": "3261", "native_tokenizers": [], diff --git a/data/Bayono-Awbono.json b/data/Bayono-Awbono.json index 5f49b9f9d1e92b70f2585239b04396553d3bd3b2..c0646c921b09c08d681602ed63e1b96cf4a170bd 100644 --- a/data/Bayono-Awbono.json +++ b/data/Bayono-Awbono.json @@ -1,13 +1,16 @@ { "name": "Bayono-Awbono", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Awbono", + "depth": 1, "iso_1_code": null, "iso_3_code": "awh", "children": [], + "family": "Bayono-Awbono", "tokenizers": {}, "node_i": "3268", "native_tokenizers": [], @@ -15,15 +18,18 @@ }, { "name": "Bayono", + "depth": 1, "iso_1_code": null, "iso_3_code": "byl", "children": [], + "family": "Bayono-Awbono", "tokenizers": {}, "node_i": "3269", "native_tokenizers": [], "scripts": [] } ], + "family": "Bayono-Awbono", "tokenizers": {}, "node_i": "3267", "native_tokenizers": [], diff --git a/data/Border.json b/data/Border.json index 355a04670d30f82533d371732206d7a97910c587..b4f7af7bf77bbd849c6e569c6754156a4a28b9f6 100644 --- a/data/Border.json +++ b/data/Border.json @@ -1,18 +1,22 @@ { "name": "Border", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bewani", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ainbai", + "depth": 2, "iso_1_code": null, "iso_3_code": "aic", "children": [], + "family": "Border", "tokenizers": {}, "node_i": "3272", "native_tokenizers": [], @@ -20,9 +24,11 @@ }, { "name": "Kilmeri", + "depth": 2, "iso_1_code": null, "iso_3_code": "kih", "children": [], + "family": "Border", "tokenizers": {}, "node_i": "3273", "native_tokenizers": [], @@ -30,9 +36,11 @@ }, { "name": "Ningera", + "depth": 2, "iso_1_code": null, "iso_3_code": "nby", "children": [], + "family": "Border", "tokenizers": {}, "node_i": "3274", "native_tokenizers": [], @@ -40,9 +48,11 @@ }, { "name": "Pagi", + "depth": 2, "iso_1_code": null, "iso_3_code": "pgi", "children": [], + "family": "Border", "tokenizers": {}, "node_i": "3275", "native_tokenizers": [], @@ -50,15 +60,18 @@ }, { "name": "Umeda", + "depth": 2, "iso_1_code": null, "iso_3_code": "upi", "children": [], + "family": "Border", "tokenizers": {}, "node_i": "3276", "native_tokenizers": [], "scripts": [] } ], + "family": "Border", "tokenizers": {}, "node_i": "3271", "native_tokenizers": [], @@ -66,14 +79,17 @@ }, { "name": "Taikat", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Taikat", + "depth": 2, "iso_1_code": null, "iso_3_code": "aos", "children": [], + "family": "Border", "tokenizers": {}, "node_i": "3278", "native_tokenizers": [], @@ -81,15 +97,18 @@ }, { "name": "Awyi", + "depth": 2, "iso_1_code": null, "iso_3_code": "auw", "children": [], + "family": "Border", "tokenizers": {}, "node_i": "3279", "native_tokenizers": [], "scripts": [] } ], + "family": "Border", "tokenizers": {}, "node_i": "3277", "native_tokenizers": [], @@ -97,14 +116,17 @@ }, { "name": "Waris", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Amanab", + "depth": 2, "iso_1_code": null, "iso_3_code": "amn", "children": [], + "family": "Border", "tokenizers": {}, "node_i": "3281", "native_tokenizers": [], @@ -114,9 +136,11 @@ }, { "name": "Daonda", + "depth": 2, "iso_1_code": null, "iso_3_code": "dnd", "children": [], + "family": "Border", "tokenizers": {}, "node_i": "3282", "native_tokenizers": [], @@ -124,9 +148,11 @@ }, { "name": "Imonda", + "depth": 2, "iso_1_code": null, "iso_3_code": "imn", "children": [], + "family": "Border", "tokenizers": {}, "node_i": "3283", "native_tokenizers": [], @@ -134,9 +160,11 @@ }, { "name": "Manem", + "depth": 2, "iso_1_code": null, "iso_3_code": "jet", "children": [], + "family": "Border", "tokenizers": {}, "node_i": "3284", "native_tokenizers": [], @@ -144,9 +172,11 @@ }, { "name": "Auwe", + "depth": 2, "iso_1_code": null, "iso_3_code": "smf", "children": [], + "family": "Border", "tokenizers": {}, "node_i": "3285", "native_tokenizers": [], @@ -154,9 +184,11 @@ }, { "name": "Viid", + "depth": 2, "iso_1_code": null, "iso_3_code": "snu", "children": [], + "family": "Border", "tokenizers": {}, "node_i": "3286", "native_tokenizers": [], @@ -164,9 +196,11 @@ }, { "name": "Sowanda", + "depth": 2, "iso_1_code": null, "iso_3_code": "sow", "children": [], + "family": "Border", "tokenizers": {}, "node_i": "3287", "native_tokenizers": [], @@ -174,9 +208,11 @@ }, { "name": "Waris", + "depth": 2, "iso_1_code": null, "iso_3_code": "wrs", "children": [], + "family": "Border", "tokenizers": {}, "node_i": "3288", "native_tokenizers": [], @@ -185,12 +221,14 @@ ] } ], + "family": "Border", "tokenizers": {}, "node_i": "3280", "native_tokenizers": [], "scripts": [] } ], + "family": "Border", "tokenizers": {}, "node_i": "3270", "native_tokenizers": [], diff --git a/data/Bororoan.json b/data/Bororoan.json index 28942fb24a4e010f1d629e0052e83e16045879a1..fc38de4323f8461a119f72108f3922bb1a618ccf 100644 --- a/data/Bororoan.json +++ b/data/Bororoan.json @@ -1,13 +1,16 @@ { "name": "Bororoan", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bor\u00f4ro", + "depth": 1, "iso_1_code": null, "iso_3_code": "bor", "children": [], + "family": "Bororoan", "tokenizers": {}, "node_i": "3290", "native_tokenizers": [], @@ -17,9 +20,11 @@ }, { "name": "Otuke", + "depth": 1, "iso_1_code": null, "iso_3_code": "otu", "children": [], + "family": "Bororoan", "tokenizers": {}, "node_i": "3291", "native_tokenizers": [], @@ -27,15 +32,18 @@ }, { "name": "Umot\u00edna", + "depth": 1, "iso_1_code": null, "iso_3_code": "umo", "children": [], + "family": "Bororoan", "tokenizers": {}, "node_i": "3292", "native_tokenizers": [], "scripts": [] } ], + "family": "Bororoan", "tokenizers": {}, "node_i": "3289", "native_tokenizers": [], diff --git a/data/Botocudoan.json b/data/Botocudoan.json index e368231dd56bab7b37a90befd85039d55ad6bfae..51c879b5c76a569c36a0f79457c820b741223b21 100644 --- a/data/Botocudoan.json +++ b/data/Botocudoan.json @@ -1,19 +1,23 @@ { "name": "Botocudoan", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Krenak", + "depth": 1, "iso_1_code": null, "iso_3_code": "kqq", "children": [], + "family": "Botocudoan", "tokenizers": {}, "node_i": "3294", "native_tokenizers": [], "scripts": [] } ], + "family": "Botocudoan", "tokenizers": {}, "node_i": "3293", "native_tokenizers": [], diff --git a/data/Caddoan.json b/data/Caddoan.json index a57ff5f351b993dc0bf6807bc545b581e7c5d10e..3b8332d701729a40c172a75b8f0c44b7e477cf2a 100644 --- a/data/Caddoan.json +++ b/data/Caddoan.json @@ -1,13 +1,16 @@ { "name": "Caddoan", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Caddo", + "depth": 1, "iso_1_code": null, "iso_3_code": "cad", "children": [], + "family": "Caddoan", "tokenizers": {}, "node_i": "3296", "native_tokenizers": [], @@ -15,14 +18,17 @@ }, { "name": "Northern Caddoan", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Wichita", + "depth": 2, "iso_1_code": null, "iso_3_code": "wic", "children": [], + "family": "Caddoan", "tokenizers": {}, "node_i": "3298", "native_tokenizers": [], @@ -30,14 +36,17 @@ }, { "name": "Kitsai-Proto-Pawnee", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kitsai", + "depth": 3, "iso_1_code": null, "iso_3_code": "kii", "children": [], + "family": "Caddoan", "tokenizers": {}, "node_i": "3300", "native_tokenizers": [], @@ -45,14 +54,17 @@ }, { "name": "Proto-Pawnee", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Arikara", + "depth": 4, "iso_1_code": null, "iso_3_code": "ari", "children": [], + "family": "Caddoan", "tokenizers": {}, "node_i": "3302", "native_tokenizers": [], @@ -60,33 +72,39 @@ }, { "name": "Pawnee", + "depth": 4, "iso_1_code": null, "iso_3_code": "paw", "children": [], + "family": "Caddoan", "tokenizers": {}, "node_i": "3303", "native_tokenizers": [], "scripts": [] } ], + "family": "Caddoan", "tokenizers": {}, "node_i": "3301", "native_tokenizers": [], "scripts": [] } ], + "family": "Caddoan", "tokenizers": {}, "node_i": "3299", "native_tokenizers": [], "scripts": [] } ], + "family": "Caddoan", "tokenizers": {}, "node_i": "3297", "native_tokenizers": [], "scripts": [] } ], + "family": "Caddoan", "tokenizers": {}, "node_i": "3295", "native_tokenizers": [], diff --git a/data/Cahuapanan.json b/data/Cahuapanan.json index 566ccd4384bf7fe8d51c2cd9ce17f0cda8363665..83af661842918ab5e11b45f2b34a33630e579366 100644 --- a/data/Cahuapanan.json +++ b/data/Cahuapanan.json @@ -1,13 +1,16 @@ { "name": "Cahuapanan", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Shawi", + "depth": 1, "iso_1_code": null, "iso_3_code": "cbt", "children": [], + "family": "Cahuapanan", "tokenizers": {}, "node_i": "3305", "native_tokenizers": [], @@ -17,15 +20,18 @@ }, { "name": "Jebero", + "depth": 1, "iso_1_code": null, "iso_3_code": "jeb", "children": [], + "family": "Cahuapanan", "tokenizers": {}, "node_i": "3306", "native_tokenizers": [], "scripts": [] } ], + "family": "Cahuapanan", "tokenizers": {}, "node_i": "3304", "native_tokenizers": [], diff --git a/data/Cariban.json b/data/Cariban.json index a5fa3d4cfcf77f27815dbd17c6331803910e30e3..62569b32582b56385dbb32ac2eb04419fbf2da99 100644 --- a/data/Cariban.json +++ b/data/Cariban.json @@ -1,13 +1,16 @@ { "name": "Cariban", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Carib", + "depth": 1, "iso_1_code": null, "iso_3_code": "car", "children": [], + "family": "Cariban", "tokenizers": {}, "node_i": "3308", "native_tokenizers": [], @@ -17,14 +20,17 @@ }, { "name": "Central", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Apala\u00ed", + "depth": 2, "iso_1_code": null, "iso_3_code": "apy", "children": [], + "family": "Cariban", "tokenizers": {}, "node_i": "3310", "native_tokenizers": [], @@ -34,14 +40,17 @@ }, { "name": "Cuman\u00e1", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chaima", + "depth": 3, "iso_1_code": null, "iso_3_code": "ciy", "children": [], + "family": "Cariban", "tokenizers": {}, "node_i": "3312", "native_tokenizers": [], @@ -49,15 +58,18 @@ }, { "name": "Cumanagoto", + "depth": 3, "iso_1_code": null, "iso_3_code": "cuo", "children": [], + "family": "Cariban", "tokenizers": {}, "node_i": "3313", "native_tokenizers": [], "scripts": [] } ], + "family": "Cariban", "tokenizers": {}, "node_i": "3311", "native_tokenizers": [], @@ -65,20 +77,24 @@ }, { "name": "Makiritare", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Maquiritari", + "depth": 3, "iso_1_code": null, "iso_3_code": "mch", "children": [], + "family": "Cariban", "tokenizers": {}, "node_i": "3315", "native_tokenizers": [], "scripts": [] } ], + "family": "Cariban", "tokenizers": {}, "node_i": "3314", "native_tokenizers": [], @@ -86,14 +102,17 @@ }, { "name": "Mapoyo-Yavarana", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mapoyo", + "depth": 3, "iso_1_code": null, "iso_3_code": "mcg", "children": [], + "family": "Cariban", "tokenizers": {}, "node_i": "3317", "native_tokenizers": [], @@ -101,9 +120,11 @@ }, { "name": "P\u00e9mono", + "depth": 3, "iso_1_code": null, "iso_3_code": "pev", "children": [], + "family": "Cariban", "tokenizers": {}, "node_i": "3318", "native_tokenizers": [], @@ -111,9 +132,11 @@ }, { "name": "Tamanaku", + "depth": 3, "iso_1_code": null, "iso_3_code": "tmz", "children": [], + "family": "Cariban", "tokenizers": {}, "node_i": "3319", "native_tokenizers": [], @@ -121,15 +144,18 @@ }, { "name": "Yabarana", + "depth": 3, "iso_1_code": null, "iso_3_code": "yar", "children": [], + "family": "Cariban", "tokenizers": {}, "node_i": "3320", "native_tokenizers": [], "scripts": [] } ], + "family": "Cariban", "tokenizers": {}, "node_i": "3316", "native_tokenizers": [], @@ -137,14 +163,17 @@ }, { "name": "Wayana", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kaxui\u00e2na", + "depth": 3, "iso_1_code": null, "iso_3_code": "kbb", "children": [], + "family": "Cariban", "tokenizers": {}, "node_i": "3322", "native_tokenizers": [], @@ -152,9 +181,11 @@ }, { "name": "Wayana", + "depth": 3, "iso_1_code": null, "iso_3_code": "way", "children": [], + "family": "Cariban", "tokenizers": {}, "node_i": "3323", "native_tokenizers": [], @@ -163,12 +194,14 @@ ] } ], + "family": "Cariban", "tokenizers": {}, "node_i": "3321", "native_tokenizers": [], "scripts": [] } ], + "family": "Cariban", "tokenizers": {}, "node_i": "3309", "native_tokenizers": [], @@ -176,20 +209,24 @@ }, { "name": "Kashuyana", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Sikiana", + "depth": 2, "iso_1_code": null, "iso_3_code": "sik", "children": [], + "family": "Cariban", "tokenizers": {}, "node_i": "3325", "native_tokenizers": [], "scripts": [] } ], + "family": "Cariban", "tokenizers": {}, "node_i": "3324", "native_tokenizers": [], @@ -197,24 +234,29 @@ }, { "name": "North Amazonian", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Pem\u00f3n", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Pem\u00f3n proper", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Pemon", + "depth": 4, "iso_1_code": null, "iso_3_code": "aoc", "children": [], + "family": "Cariban", "tokenizers": {}, "node_i": "3329", "native_tokenizers": [], @@ -222,9 +264,11 @@ }, { "name": "Macushi", + "depth": 4, "iso_1_code": null, "iso_3_code": "mbc", "children": [], + "family": "Cariban", "tokenizers": {}, "node_i": "3330", "native_tokenizers": [], @@ -234,14 +278,17 @@ }, { "name": "Kapong", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Akawaio", + "depth": 5, "iso_1_code": null, "iso_3_code": "ake", "children": [], + "family": "Cariban", "tokenizers": {}, "node_i": "3332", "native_tokenizers": [], @@ -251,9 +298,11 @@ }, { "name": "Patamona", + "depth": 5, "iso_1_code": null, "iso_3_code": "pbc", "children": [], + "family": "Cariban", "tokenizers": {}, "node_i": "3333", "native_tokenizers": [], @@ -262,18 +311,21 @@ ] } ], + "family": "Cariban", "tokenizers": {}, "node_i": "3331", "native_tokenizers": [], "scripts": [] } ], + "family": "Cariban", "tokenizers": {}, "node_i": "3328", "native_tokenizers": [], "scripts": [] } ], + "family": "Cariban", "tokenizers": {}, "node_i": "3327", "native_tokenizers": [], @@ -281,26 +333,31 @@ }, { "name": "Yawaper\u00ed", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Waimiri-Atroar\u00ed", + "depth": 3, "iso_1_code": null, "iso_3_code": "atr", "children": [], + "family": "Cariban", "tokenizers": {}, "node_i": "3335", "native_tokenizers": [], "scripts": [] } ], + "family": "Cariban", "tokenizers": {}, "node_i": "3334", "native_tokenizers": [], "scripts": [] } ], + "family": "Cariban", "tokenizers": {}, "node_i": "3326", "native_tokenizers": [], @@ -308,14 +365,17 @@ }, { "name": "South Amazonian", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "E\u2019\u00f1apa Woromaipu", + "depth": 2, "iso_1_code": null, "iso_3_code": "pbh", "children": [], + "family": "Cariban", "tokenizers": {}, "node_i": "3337", "native_tokenizers": [], @@ -323,14 +383,17 @@ }, { "name": "Arara", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Arara, Par\u00e1", + "depth": 3, "iso_1_code": null, "iso_3_code": "aap", "children": [], + "family": "Cariban", "tokenizers": {}, "node_i": "3339", "native_tokenizers": [], @@ -338,15 +401,18 @@ }, { "name": "Ikpeng", + "depth": 3, "iso_1_code": null, "iso_3_code": "txi", "children": [], + "family": "Cariban", "tokenizers": {}, "node_i": "3340", "native_tokenizers": [], "scripts": [] } ], + "family": "Cariban", "tokenizers": {}, "node_i": "3338", "native_tokenizers": [], @@ -354,14 +420,17 @@ }, { "name": "Bakair\u00ed", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bakair\u00ed", + "depth": 3, "iso_1_code": null, "iso_3_code": "bkq", "children": [], + "family": "Cariban", "tokenizers": {}, "node_i": "3342", "native_tokenizers": [], @@ -371,14 +440,17 @@ }, { "name": "Amonap", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kuik\u00faro-Kalap\u00e1lo", + "depth": 4, "iso_1_code": null, "iso_3_code": "kui", "children": [], + "family": "Cariban", "tokenizers": {}, "node_i": "3344", "native_tokenizers": [], @@ -386,27 +458,32 @@ }, { "name": "Matipuhy", + "depth": 4, "iso_1_code": null, "iso_3_code": "mzo", "children": [], + "family": "Cariban", "tokenizers": {}, "node_i": "3345", "native_tokenizers": [], "scripts": [] } ], + "family": "Cariban", "tokenizers": {}, "node_i": "3343", "native_tokenizers": [], "scripts": [] } ], + "family": "Cariban", "tokenizers": {}, "node_i": "3341", "native_tokenizers": [], "scripts": [] } ], + "family": "Cariban", "tokenizers": {}, "node_i": "3336", "native_tokenizers": [], @@ -414,14 +491,17 @@ }, { "name": "Tiriy\u00f3", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Salum\u00e1", + "depth": 2, "iso_1_code": null, "iso_3_code": "slj", "children": [], + "family": "Cariban", "tokenizers": {}, "node_i": "3347", "native_tokenizers": [], @@ -429,20 +509,24 @@ }, { "name": "Karihona", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Carijona", + "depth": 3, "iso_1_code": null, "iso_3_code": "cbd", "children": [], + "family": "Cariban", "tokenizers": {}, "node_i": "3349", "native_tokenizers": [], "scripts": [] } ], + "family": "Cariban", "tokenizers": {}, "node_i": "3348", "native_tokenizers": [], @@ -450,14 +534,17 @@ }, { "name": "Tiriy\u00f3", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Akurio", + "depth": 3, "iso_1_code": null, "iso_3_code": "ako", "children": [], + "family": "Cariban", "tokenizers": {}, "node_i": "3351", "native_tokenizers": [], @@ -465,21 +552,25 @@ }, { "name": "Tri\u00f3", + "depth": 3, "iso_1_code": null, "iso_3_code": "tri", "children": [], + "family": "Cariban", "tokenizers": {}, "node_i": "3352", "native_tokenizers": [], "scripts": [] } ], + "family": "Cariban", "tokenizers": {}, "node_i": "3350", "native_tokenizers": [], "scripts": [] } ], + "family": "Cariban", "tokenizers": {}, "node_i": "3346", "native_tokenizers": [], @@ -487,14 +578,17 @@ }, { "name": "Waiwai", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Hixkary\u00e1na", + "depth": 2, "iso_1_code": null, "iso_3_code": "hix", "children": [], + "family": "Cariban", "tokenizers": {}, "node_i": "3354", "native_tokenizers": [], @@ -504,15 +598,18 @@ }, { "name": "Waiwai", + "depth": 2, "iso_1_code": null, "iso_3_code": "waw", "children": [], + "family": "Cariban", "tokenizers": {}, "node_i": "3355", "native_tokenizers": [], "scripts": [] } ], + "family": "Cariban", "tokenizers": {}, "node_i": "3353", "native_tokenizers": [], @@ -520,19 +617,23 @@ }, { "name": "Yukpa", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Yucpa-Yapreria", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Japreria", + "depth": 3, "iso_1_code": null, "iso_3_code": "jru", "children": [], + "family": "Cariban", "tokenizers": {}, "node_i": "3358", "native_tokenizers": [], @@ -540,9 +641,11 @@ }, { "name": "Yukpa", + "depth": 3, "iso_1_code": null, "iso_3_code": "yup", "children": [], + "family": "Cariban", "tokenizers": {}, "node_i": "3359", "native_tokenizers": [], @@ -551,18 +654,21 @@ ] } ], + "family": "Cariban", "tokenizers": {}, "node_i": "3357", "native_tokenizers": [], "scripts": [] } ], + "family": "Cariban", "tokenizers": {}, "node_i": "3356", "native_tokenizers": [], "scripts": [] } ], + "family": "Cariban", "tokenizers": {}, "node_i": "3307", "native_tokenizers": [], diff --git a/data/Central Solomons.json b/data/Central Solomons.json index 1c08122aa7c5423961dfaef8c8b0d386b553a33b..2e00169e1e4fad4a71a7cd2c6418dbbc485496e1 100644 --- a/data/Central Solomons.json +++ b/data/Central Solomons.json @@ -1,13 +1,16 @@ { "name": "Central Solomons", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bilua", + "depth": 1, "iso_1_code": null, "iso_3_code": "blb", "children": [], + "family": "Central Solomons", "tokenizers": {}, "node_i": "3361", "native_tokenizers": [], @@ -15,9 +18,11 @@ }, { "name": "Lavukaleve", + "depth": 1, "iso_1_code": null, "iso_3_code": "lvk", "children": [], + "family": "Central Solomons", "tokenizers": {}, "node_i": "3362", "native_tokenizers": [], @@ -25,9 +30,11 @@ }, { "name": "Savosavo", + "depth": 1, "iso_1_code": null, "iso_3_code": "svs", "children": [], + "family": "Central Solomons", "tokenizers": {}, "node_i": "3363", "native_tokenizers": [], @@ -35,15 +42,18 @@ }, { "name": "Touo", + "depth": 1, "iso_1_code": null, "iso_3_code": "tqu", "children": [], + "family": "Central Solomons", "tokenizers": {}, "node_i": "3364", "native_tokenizers": [], "scripts": [] } ], + "family": "Central Solomons", "tokenizers": {}, "node_i": "3360", "native_tokenizers": [], diff --git a/data/Chapacuran.json b/data/Chapacuran.json index c0332ebf64c1064e30f70f39ac84b775816925b3..65b53de9fd55ee42918e2af05fa52c6a6998bcf6 100644 --- a/data/Chapacuran.json +++ b/data/Chapacuran.json @@ -1,18 +1,22 @@ { "name": "Chapacuran", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Itene", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Itene", + "depth": 2, "iso_1_code": null, "iso_3_code": "ite", "children": [], + "family": "Chapacuran", "tokenizers": {}, "node_i": "3367", "native_tokenizers": [], @@ -20,15 +24,18 @@ }, { "name": "Tor\u00e1", + "depth": 2, "iso_1_code": null, "iso_3_code": "trz", "children": [], + "family": "Chapacuran", "tokenizers": {}, "node_i": "3368", "native_tokenizers": [], "scripts": [] } ], + "family": "Chapacuran", "tokenizers": {}, "node_i": "3366", "native_tokenizers": [], @@ -36,14 +43,17 @@ }, { "name": "Wari", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Oro Win", + "depth": 2, "iso_1_code": null, "iso_3_code": "orw", "children": [], + "family": "Chapacuran", "tokenizers": {}, "node_i": "3370", "native_tokenizers": [], @@ -51,21 +61,25 @@ }, { "name": "Paka\u00e1snovos", + "depth": 2, "iso_1_code": null, "iso_3_code": "pav", "children": [], + "family": "Chapacuran", "tokenizers": {}, "node_i": "3371", "native_tokenizers": [], "scripts": [] } ], + "family": "Chapacuran", "tokenizers": {}, "node_i": "3369", "native_tokenizers": [], "scripts": [] } ], + "family": "Chapacuran", "tokenizers": {}, "node_i": "3365", "native_tokenizers": [], diff --git a/data/Chibchan.json b/data/Chibchan.json index 325a661d39c2007968aa2e8ce9e73df372bf722f..5648aa6e49c21a7ad17faba6f2b8ad15c79f78e9 100644 --- a/data/Chibchan.json +++ b/data/Chibchan.json @@ -1,18 +1,22 @@ { "name": "Chibchan", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chibchan A", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Boruca", + "depth": 2, "iso_1_code": null, "iso_3_code": "brn", "children": [], + "family": "Chibchan", "tokenizers": {}, "node_i": "3374", "native_tokenizers": [], @@ -20,9 +24,11 @@ }, { "name": "Teribe", + "depth": 2, "iso_1_code": null, "iso_3_code": "tfr", "children": [], + "family": "Chibchan", "tokenizers": {}, "node_i": "3375", "native_tokenizers": [], @@ -32,14 +38,17 @@ }, { "name": "Guaymi\u00edc", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ng\u00e4bere", + "depth": 3, "iso_1_code": null, "iso_3_code": "gym", "children": [], + "family": "Chibchan", "tokenizers": {}, "node_i": "3377", "native_tokenizers": [], @@ -49,9 +58,11 @@ }, { "name": "Buglere", + "depth": 3, "iso_1_code": null, "iso_3_code": "sab", "children": [], + "family": "Chibchan", "tokenizers": {}, "node_i": "3378", "native_tokenizers": [], @@ -60,6 +71,7 @@ ] } ], + "family": "Chibchan", "tokenizers": {}, "node_i": "3376", "native_tokenizers": [], @@ -67,14 +79,17 @@ }, { "name": "Viceitic", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bribri", + "depth": 3, "iso_1_code": null, "iso_3_code": "bzd", "children": [], + "family": "Chibchan", "tokenizers": {}, "node_i": "3380", "native_tokenizers": [], @@ -84,9 +99,11 @@ }, { "name": "Cab\u00e9car", + "depth": 3, "iso_1_code": null, "iso_3_code": "cjp", "children": [], + "family": "Chibchan", "tokenizers": {}, "node_i": "3381", "native_tokenizers": [], @@ -95,12 +112,14 @@ ] } ], + "family": "Chibchan", "tokenizers": {}, "node_i": "3379", "native_tokenizers": [], "scripts": [] } ], + "family": "Chibchan", "tokenizers": {}, "node_i": "3373", "native_tokenizers": [], @@ -108,14 +127,17 @@ }, { "name": "Chibchan B", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Pech", + "depth": 2, "iso_1_code": null, "iso_3_code": "pay", "children": [], + "family": "Chibchan", "tokenizers": {}, "node_i": "3383", "native_tokenizers": [], @@ -123,24 +145,29 @@ }, { "name": "Eastern Chibchan", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Colombian", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Northern Colombian", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chimila", + "depth": 5, "iso_1_code": null, "iso_3_code": "cbg", "children": [], + "family": "Chibchan", "tokenizers": {}, "node_i": "3387", "native_tokenizers": [], @@ -148,14 +175,17 @@ }, { "name": "Arhuacan", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kogi", + "depth": 6, "iso_1_code": null, "iso_3_code": "kog", "children": [], + "family": "Chibchan", "tokenizers": {}, "node_i": "3389", "native_tokenizers": [], @@ -165,14 +195,17 @@ }, { "name": "Southern and Eastern Arhuacan", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Arhuaco", + "depth": 7, "iso_1_code": null, "iso_3_code": "arh", "children": [], + "family": "Chibchan", "tokenizers": {}, "node_i": "3391", "native_tokenizers": [], @@ -180,38 +213,45 @@ }, { "name": "Guamaca-Atanque", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Sanka", + "depth": 8, "iso_1_code": null, "iso_3_code": "mbp", "children": [], + "family": "Chibchan", "tokenizers": {}, "node_i": "3393", "native_tokenizers": [], "scripts": [] } ], + "family": "Chibchan", "tokenizers": {}, "node_i": "3392", "native_tokenizers": [], "scripts": [] } ], + "family": "Chibchan", "tokenizers": {}, "node_i": "3390", "native_tokenizers": [], "scripts": [] } ], + "family": "Chibchan", "tokenizers": {}, "node_i": "3388", "native_tokenizers": [], "scripts": [] } ], + "family": "Chibchan", "tokenizers": {}, "node_i": "3386", "native_tokenizers": [], @@ -219,14 +259,17 @@ }, { "name": "Southern Colombian", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bar\u00ed", + "depth": 5, "iso_1_code": null, "iso_3_code": "mot", "children": [], + "family": "Chibchan", "tokenizers": {}, "node_i": "3395", "native_tokenizers": [], @@ -234,14 +277,17 @@ }, { "name": "Cundicocuyese", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chibcha", + "depth": 6, "iso_1_code": null, "iso_3_code": "chb", "children": [], + "family": "Chibchan", "tokenizers": {}, "node_i": "3397", "native_tokenizers": [], @@ -249,9 +295,11 @@ }, { "name": "Tunebo, Barro Negro", + "depth": 6, "iso_1_code": null, "iso_3_code": "tbn", "children": [], + "family": "Chibchan", "tokenizers": {}, "node_i": "3398", "native_tokenizers": [], @@ -259,9 +307,11 @@ }, { "name": "Tunebo, Western", + "depth": 6, "iso_1_code": null, "iso_3_code": "tnb", "children": [], + "family": "Chibchan", "tokenizers": {}, "node_i": "3399", "native_tokenizers": [], @@ -269,9 +319,11 @@ }, { "name": "Tunebo, Angosturas", + "depth": 6, "iso_1_code": null, "iso_3_code": "tnd", "children": [], + "family": "Chibchan", "tokenizers": {}, "node_i": "3400", "native_tokenizers": [], @@ -279,9 +331,11 @@ }, { "name": "Tunebo, Central", + "depth": 6, "iso_1_code": null, "iso_3_code": "tuf", "children": [], + "family": "Chibchan", "tokenizers": {}, "node_i": "3401", "native_tokenizers": [], @@ -290,18 +344,21 @@ ] } ], + "family": "Chibchan", "tokenizers": {}, "node_i": "3396", "native_tokenizers": [], "scripts": [] } ], + "family": "Chibchan", "tokenizers": {}, "node_i": "3394", "native_tokenizers": [], "scripts": [] } ], + "family": "Chibchan", "tokenizers": {}, "node_i": "3385", "native_tokenizers": [], @@ -309,14 +366,17 @@ }, { "name": "Cuna", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kuna, San Blas", + "depth": 4, "iso_1_code": null, "iso_3_code": "cuk", "children": [], + "family": "Chibchan", "tokenizers": {}, "node_i": "3403", "native_tokenizers": [], @@ -326,9 +386,11 @@ }, { "name": "Kuna, Border", + "depth": 4, "iso_1_code": null, "iso_3_code": "kvn", "children": [], + "family": "Chibchan", "tokenizers": {}, "node_i": "3404", "native_tokenizers": [], @@ -337,12 +399,14 @@ ] } ], + "family": "Chibchan", "tokenizers": {}, "node_i": "3402", "native_tokenizers": [], "scripts": [] } ], + "family": "Chibchan", "tokenizers": {}, "node_i": "3384", "native_tokenizers": [], @@ -350,14 +414,17 @@ }, { "name": "Votic", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mal\u00e9ku Ja\u00edka", + "depth": 3, "iso_1_code": null, "iso_3_code": "gut", "children": [], + "family": "Chibchan", "tokenizers": {}, "node_i": "3406", "native_tokenizers": [], @@ -365,27 +432,32 @@ }, { "name": "Rama", + "depth": 3, "iso_1_code": null, "iso_3_code": "rma", "children": [], + "family": "Chibchan", "tokenizers": {}, "node_i": "3407", "native_tokenizers": [], "scripts": [] } ], + "family": "Chibchan", "tokenizers": {}, "node_i": "3405", "native_tokenizers": [], "scripts": [] } ], + "family": "Chibchan", "tokenizers": {}, "node_i": "3382", "native_tokenizers": [], "scripts": [] } ], + "family": "Chibchan", "tokenizers": {}, "node_i": "3372", "native_tokenizers": [], diff --git a/data/Chimakuan.json b/data/Chimakuan.json index 157318ab780469b3f52d927ccc05e2c21b37a9a4..25ba1c4df4371eace969b30abeb7b30f1791c2e1 100644 --- a/data/Chimakuan.json +++ b/data/Chimakuan.json @@ -1,13 +1,16 @@ { "name": "Chimakuan", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Quileute", + "depth": 1, "iso_1_code": null, "iso_3_code": "qui", "children": [], + "family": "Chimakuan", "tokenizers": {}, "node_i": "3409", "native_tokenizers": [], @@ -15,15 +18,18 @@ }, { "name": "Chemakum", + "depth": 1, "iso_1_code": null, "iso_3_code": "xch", "children": [], + "family": "Chimakuan", "tokenizers": {}, "node_i": "3410", "native_tokenizers": [], "scripts": [] } ], + "family": "Chimakuan", "tokenizers": {}, "node_i": "3408", "native_tokenizers": [], diff --git a/data/Chinookan.json b/data/Chinookan.json index bdac0a5b5f6181b5d0667c7de14c77b7475abb89..600e41eaad817b040fb3d5c8f291a94fd3dedc2a 100644 --- a/data/Chinookan.json +++ b/data/Chinookan.json @@ -1,13 +1,16 @@ { "name": "Chinookan", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chinook", + "depth": 1, "iso_1_code": null, "iso_3_code": "chh", "children": [], + "family": "Chinookan", "tokenizers": {}, "node_i": "3412", "native_tokenizers": [], @@ -15,26 +18,31 @@ }, { "name": "Upper Chinookan", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Wasco-Wishram", + "depth": 2, "iso_1_code": null, "iso_3_code": "wac", "children": [], + "family": "Chinookan", "tokenizers": {}, "node_i": "3414", "native_tokenizers": [], "scripts": [] } ], + "family": "Chinookan", "tokenizers": {}, "node_i": "3413", "native_tokenizers": [], "scripts": [] } ], + "family": "Chinookan", "tokenizers": {}, "node_i": "3411", "native_tokenizers": [], diff --git a/data/Chipaya-Uru.json b/data/Chipaya-Uru.json index e7b3fd48d37ea036b56c65f6446a57efda5b6171..18a8eb2c2c5741e4d184b1dc64fe150fc73b5598 100644 --- a/data/Chipaya-Uru.json +++ b/data/Chipaya-Uru.json @@ -1,13 +1,16 @@ { "name": "Chipaya-Uru", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chipaya", + "depth": 1, "iso_1_code": null, "iso_3_code": "cap", "children": [], + "family": "Chipaya-Uru", "tokenizers": {}, "node_i": "3416", "native_tokenizers": [], @@ -17,15 +20,18 @@ }, { "name": "Uru", + "depth": 1, "iso_1_code": null, "iso_3_code": "ure", "children": [], + "family": "Chipaya-Uru", "tokenizers": {}, "node_i": "3417", "native_tokenizers": [], "scripts": [] } ], + "family": "Chipaya-Uru", "tokenizers": {}, "node_i": "3415", "native_tokenizers": [], diff --git a/data/Chocoan.json b/data/Chocoan.json index cb49e5d1bda4fc5f4095f858b2a47e09a10aea2f..42d65511f6b3653c3f5d5fd8277767da47a905bf 100644 --- a/data/Chocoan.json +++ b/data/Chocoan.json @@ -1,13 +1,16 @@ { "name": "Chocoan", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Woun Meu", + "depth": 1, "iso_1_code": null, "iso_3_code": "noa", "children": [], + "family": "Chocoan", "tokenizers": {}, "node_i": "3419", "native_tokenizers": [], @@ -17,19 +20,23 @@ }, { "name": "Ember\u00e1", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Northern Ember\u00e1", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Embera Cat\u00edo", + "depth": 3, "iso_1_code": null, "iso_3_code": "cto", "children": [], + "family": "Chocoan", "tokenizers": {}, "node_i": "3422", "native_tokenizers": [], @@ -39,9 +46,11 @@ }, { "name": "Ember\u00e1, Northern", + "depth": 3, "iso_1_code": null, "iso_3_code": "emp", "children": [], + "family": "Chocoan", "tokenizers": {}, "node_i": "3423", "native_tokenizers": [], @@ -50,6 +59,7 @@ ] } ], + "family": "Chocoan", "tokenizers": {}, "node_i": "3421", "native_tokenizers": [], @@ -57,14 +67,17 @@ }, { "name": "Southern Ember\u00e1", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Embera Baud\u00f3", + "depth": 3, "iso_1_code": null, "iso_3_code": "bdc", "children": [], + "family": "Chocoan", "tokenizers": {}, "node_i": "3425", "native_tokenizers": [], @@ -72,9 +85,11 @@ }, { "name": "Embera Cham\u00ed", + "depth": 3, "iso_1_code": null, "iso_3_code": "cmi", "children": [], + "family": "Chocoan", "tokenizers": {}, "node_i": "3426", "native_tokenizers": [], @@ -82,9 +97,11 @@ }, { "name": "Epena", + "depth": 3, "iso_1_code": null, "iso_3_code": "sja", "children": [], + "family": "Chocoan", "tokenizers": {}, "node_i": "3427", "native_tokenizers": [], @@ -94,27 +111,32 @@ }, { "name": "Embera Tad\u00f3", + "depth": 3, "iso_1_code": null, "iso_3_code": "tdc", "children": [], + "family": "Chocoan", "tokenizers": {}, "node_i": "3428", "native_tokenizers": [], "scripts": [] } ], + "family": "Chocoan", "tokenizers": {}, "node_i": "3424", "native_tokenizers": [], "scripts": [] } ], + "family": "Chocoan", "tokenizers": {}, "node_i": "3420", "native_tokenizers": [], "scripts": [] } ], + "family": "Chocoan", "tokenizers": {}, "node_i": "3418", "native_tokenizers": [], diff --git a/data/Cholonan.json b/data/Cholonan.json index 63bc6f2b380ba07bf84933774845469914696331..696dea5e51656f1082f4180546e9d6cc90c5c8c4 100644 --- a/data/Cholonan.json +++ b/data/Cholonan.json @@ -1,13 +1,16 @@ { "name": "Cholonan", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chol\u00f3n", + "depth": 1, "iso_1_code": null, "iso_3_code": "cht", "children": [], + "family": "Cholonan", "tokenizers": {}, "node_i": "3430", "native_tokenizers": [], @@ -15,15 +18,18 @@ }, { "name": "Hibito", + "depth": 1, "iso_1_code": null, "iso_3_code": "hib", "children": [], + "family": "Cholonan", "tokenizers": {}, "node_i": "3431", "native_tokenizers": [], "scripts": [] } ], + "family": "Cholonan", "tokenizers": {}, "node_i": "3429", "native_tokenizers": [], diff --git a/data/Chon.json b/data/Chon.json index 94c011ffa7119dc225643fd75293efb230b665e2..8d2f381bbb2ad64d7bcd830546c651895fd78cfa 100644 --- a/data/Chon.json +++ b/data/Chon.json @@ -1,13 +1,16 @@ { "name": "Chon", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tehuelche", + "depth": 1, "iso_1_code": null, "iso_3_code": "teh", "children": [], + "family": "Chon", "tokenizers": {}, "node_i": "3433", "native_tokenizers": [], @@ -15,26 +18,31 @@ }, { "name": "Island Chon", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ona", + "depth": 2, "iso_1_code": null, "iso_3_code": "ona", "children": [], + "family": "Chon", "tokenizers": {}, "node_i": "3435", "native_tokenizers": [], "scripts": [] } ], + "family": "Chon", "tokenizers": {}, "node_i": "3434", "native_tokenizers": [], "scripts": [] } ], + "family": "Chon", "tokenizers": {}, "node_i": "3432", "native_tokenizers": [], diff --git a/data/Chukotko-Kamchatkan.json b/data/Chukotko-Kamchatkan.json index 0501f436cedd8d5a10ca94b72065642e3d6053f9..3634c8c6fa83f31d4baae04a7866ff483a9894fa 100644 --- a/data/Chukotko-Kamchatkan.json +++ b/data/Chukotko-Kamchatkan.json @@ -1,23 +1,28 @@ { "name": "Chukotko-Kamchatkan", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Northern", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chukot", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chukchi", + "depth": 3, "iso_1_code": null, "iso_3_code": "ckt", "children": [], + "family": "Chukotko-Kamchatkan", "tokenizers": {}, "node_i": "3439", "native_tokenizers": [], @@ -26,6 +31,7 @@ ] } ], + "family": "Chukotko-Kamchatkan", "tokenizers": {}, "node_i": "3438", "native_tokenizers": [], @@ -33,14 +39,17 @@ }, { "name": "Koryak-Alyutor", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Alutor", + "depth": 3, "iso_1_code": null, "iso_3_code": "alr", "children": [], + "family": "Chukotko-Kamchatkan", "tokenizers": {}, "node_i": "3441", "native_tokenizers": [], @@ -48,9 +57,11 @@ }, { "name": "Koryak", + "depth": 3, "iso_1_code": null, "iso_3_code": "kpy", "children": [], + "family": "Chukotko-Kamchatkan", "tokenizers": {}, "node_i": "3442", "native_tokenizers": [], @@ -58,21 +69,25 @@ }, { "name": "Kerek", + "depth": 3, "iso_1_code": null, "iso_3_code": "krk", "children": [], + "family": "Chukotko-Kamchatkan", "tokenizers": {}, "node_i": "3443", "native_tokenizers": [], "scripts": [] } ], + "family": "Chukotko-Kamchatkan", "tokenizers": {}, "node_i": "3440", "native_tokenizers": [], "scripts": [] } ], + "family": "Chukotko-Kamchatkan", "tokenizers": {}, "node_i": "3437", "native_tokenizers": [], @@ -80,14 +95,17 @@ }, { "name": "Southern", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Itelmen", + "depth": 2, "iso_1_code": null, "iso_3_code": "itl", "children": [], + "family": "Chukotko-Kamchatkan", "tokenizers": {}, "node_i": "3445", "native_tokenizers": [], @@ -96,12 +114,14 @@ ] } ], + "family": "Chukotko-Kamchatkan", "tokenizers": {}, "node_i": "3444", "native_tokenizers": [], "scripts": [] } ], + "family": "Chukotko-Kamchatkan", "tokenizers": {}, "node_i": "3436", "native_tokenizers": [], diff --git a/data/Chumashan.json b/data/Chumashan.json index b0d15d3aa3e9bd94fa06029a1dea910b6b4d557b..1cb3da414643394c5c1a12f258cdd67995d9e5c1 100644 --- a/data/Chumashan.json +++ b/data/Chumashan.json @@ -1,13 +1,16 @@ { "name": "Chumashan", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Obispe\u00f1o", + "depth": 1, "iso_1_code": null, "iso_3_code": "obi", "children": [], + "family": "Chumashan", "tokenizers": {}, "node_i": "3447", "native_tokenizers": [], @@ -15,14 +18,17 @@ }, { "name": "Central Chumash", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Barbare\u00f1o", + "depth": 2, "iso_1_code": null, "iso_3_code": "boi", "children": [], + "family": "Chumashan", "tokenizers": {}, "node_i": "3449", "native_tokenizers": [], @@ -30,9 +36,11 @@ }, { "name": "Inese\u00f1o", + "depth": 2, "iso_1_code": null, "iso_3_code": "inz", "children": [], + "family": "Chumashan", "tokenizers": {}, "node_i": "3450", "native_tokenizers": [], @@ -40,9 +48,11 @@ }, { "name": "Purisime\u00f1o", + "depth": 2, "iso_1_code": null, "iso_3_code": "puy", "children": [], + "family": "Chumashan", "tokenizers": {}, "node_i": "3451", "native_tokenizers": [], @@ -50,15 +60,18 @@ }, { "name": "Venture\u00f1o", + "depth": 2, "iso_1_code": null, "iso_3_code": "veo", "children": [], + "family": "Chumashan", "tokenizers": {}, "node_i": "3452", "native_tokenizers": [], "scripts": [] } ], + "family": "Chumashan", "tokenizers": {}, "node_i": "3448", "native_tokenizers": [], @@ -66,26 +79,31 @@ }, { "name": "Island Chumash", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Cruze\u00f1o", + "depth": 2, "iso_1_code": null, "iso_3_code": "crz", "children": [], + "family": "Chumashan", "tokenizers": {}, "node_i": "3454", "native_tokenizers": [], "scripts": [] } ], + "family": "Chumashan", "tokenizers": {}, "node_i": "3453", "native_tokenizers": [], "scripts": [] } ], + "family": "Chumashan", "tokenizers": {}, "node_i": "3446", "native_tokenizers": [], diff --git "a/data/Cochim\303\255-Yuman.json" "b/data/Cochim\303\255-Yuman.json" index e0803ab716f8780f2636cf82245bcafec2d223dd..5a77599461977dc0f888a67cd52fc9451497703e 100644 --- "a/data/Cochim\303\255-Yuman.json" +++ "b/data/Cochim\303\255-Yuman.json" @@ -1,18 +1,22 @@ { "name": "Cochim\u00ed-Yuman", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Yuman", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Cochimi", + "depth": 2, "iso_1_code": null, "iso_3_code": "coj", "children": [], + "family": "Cochim\u00ed-Yuman", "tokenizers": {}, "node_i": "3457", "native_tokenizers": [], @@ -20,9 +24,11 @@ }, { "name": "Kiliwa", + "depth": 2, "iso_1_code": null, "iso_3_code": "klb", "children": [], + "family": "Cochim\u00ed-Yuman", "tokenizers": {}, "node_i": "3458", "native_tokenizers": [], @@ -30,14 +36,17 @@ }, { "name": "Delta-California", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Cocopa", + "depth": 3, "iso_1_code": null, "iso_3_code": "coc", "children": [], + "family": "Cochim\u00ed-Yuman", "tokenizers": {}, "node_i": "3460", "native_tokenizers": [], @@ -45,15 +54,18 @@ }, { "name": "Kumiai", + "depth": 3, "iso_1_code": null, "iso_3_code": "dih", "children": [], + "family": "Cochim\u00ed-Yuman", "tokenizers": {}, "node_i": "3461", "native_tokenizers": [], "scripts": [] } ], + "family": "Cochim\u00ed-Yuman", "tokenizers": {}, "node_i": "3459", "native_tokenizers": [], @@ -61,14 +73,17 @@ }, { "name": "Pai", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Paipai", + "depth": 3, "iso_1_code": null, "iso_3_code": "ppi", "children": [], + "family": "Cochim\u00ed-Yuman", "tokenizers": {}, "node_i": "3463", "native_tokenizers": [], @@ -76,15 +91,18 @@ }, { "name": "Havasupai-Walapai-Yavapai", + "depth": 3, "iso_1_code": null, "iso_3_code": "yuf", "children": [], + "family": "Cochim\u00ed-Yuman", "tokenizers": {}, "node_i": "3464", "native_tokenizers": [], "scripts": [] } ], + "family": "Cochim\u00ed-Yuman", "tokenizers": {}, "node_i": "3462", "native_tokenizers": [], @@ -92,19 +110,23 @@ }, { "name": "River", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mojave", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mohave", + "depth": 4, "iso_1_code": null, "iso_3_code": "mov", "children": [], + "family": "Cochim\u00ed-Yuman", "tokenizers": {}, "node_i": "3467", "native_tokenizers": [], @@ -112,9 +134,11 @@ }, { "name": "Maricopa", + "depth": 4, "iso_1_code": null, "iso_3_code": "mrc", "children": [], + "family": "Cochim\u00ed-Yuman", "tokenizers": {}, "node_i": "3468", "native_tokenizers": [], @@ -122,33 +146,39 @@ }, { "name": "Quechan", + "depth": 4, "iso_1_code": null, "iso_3_code": "yum", "children": [], + "family": "Cochim\u00ed-Yuman", "tokenizers": {}, "node_i": "3469", "native_tokenizers": [], "scripts": [] } ], + "family": "Cochim\u00ed-Yuman", "tokenizers": {}, "node_i": "3466", "native_tokenizers": [], "scripts": [] } ], + "family": "Cochim\u00ed-Yuman", "tokenizers": {}, "node_i": "3465", "native_tokenizers": [], "scripts": [] } ], + "family": "Cochim\u00ed-Yuman", "tokenizers": {}, "node_i": "3456", "native_tokenizers": [], "scripts": [] } ], + "family": "Cochim\u00ed-Yuman", "tokenizers": {}, "node_i": "3455", "native_tokenizers": [], diff --git a/data/Comecrudan.json b/data/Comecrudan.json index ecb9e8296346a7f114bf400eba790790a03ed57a..b7e1db5a843212d8e2e5c7ed522d8641f2bafc4c 100644 --- a/data/Comecrudan.json +++ b/data/Comecrudan.json @@ -1,13 +1,16 @@ { "name": "Comecrudan", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mamulique", + "depth": 1, "iso_1_code": null, "iso_3_code": "emm", "children": [], + "family": "Comecrudan", "tokenizers": {}, "node_i": "3471", "native_tokenizers": [], @@ -15,9 +18,11 @@ }, { "name": "Comecrudo", + "depth": 1, "iso_1_code": null, "iso_3_code": "xcm", "children": [], + "family": "Comecrudan", "tokenizers": {}, "node_i": "3472", "native_tokenizers": [], @@ -25,9 +30,11 @@ }, { "name": "Cotoname", + "depth": 1, "iso_1_code": null, "iso_3_code": "xcn", "children": [], + "family": "Comecrudan", "tokenizers": {}, "node_i": "3473", "native_tokenizers": [], @@ -35,9 +42,11 @@ }, { "name": "Coahuilteco", + "depth": 1, "iso_1_code": null, "iso_3_code": "xcw", "children": [], + "family": "Comecrudan", "tokenizers": {}, "node_i": "3474", "native_tokenizers": [], @@ -45,15 +54,18 @@ }, { "name": "Garza", + "depth": 1, "iso_1_code": null, "iso_3_code": "xgr", "children": [], + "family": "Comecrudan", "tokenizers": {}, "node_i": "3475", "native_tokenizers": [], "scripts": [] } ], + "family": "Comecrudan", "tokenizers": {}, "node_i": "3470", "native_tokenizers": [], diff --git a/data/Constructed language.json b/data/Constructed language.json index d051f96d89739cab19e7df98fdd4c4219d96ce8e..53fea32d933fd3be6117f53f55c75438d2f7b026 100644 --- a/data/Constructed language.json +++ b/data/Constructed language.json @@ -1,13 +1,16 @@ { "name": "Constructed language", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Esperanto", + "depth": 1, "iso_1_code": "eo", "iso_3_code": "epo", "children": [], + "family": "Constructed language", "tokenizers": {}, "node_i": "3477", "native_tokenizers": [], @@ -16,6 +19,7 @@ ] } ], + "family": "Constructed language", "tokenizers": {}, "node_i": "3476", "native_tokenizers": [], diff --git a/data/Coosan.json b/data/Coosan.json index 9db5231a1ad205f528c5a669b32e3909ad2e9c87..55834c04b9a92de5a0fcbefa8bebe182606ed3c9 100644 --- a/data/Coosan.json +++ b/data/Coosan.json @@ -1,13 +1,16 @@ { "name": "Coosan", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Coos", + "depth": 1, "iso_1_code": null, "iso_3_code": "csz", "children": [], + "family": "Coosan", "tokenizers": {}, "node_i": "3479", "native_tokenizers": [], @@ -15,15 +18,18 @@ }, { "name": "Miluk", + "depth": 1, "iso_1_code": null, "iso_3_code": "iml", "children": [], + "family": "Coosan", "tokenizers": {}, "node_i": "3480", "native_tokenizers": [], "scripts": [] } ], + "family": "Coosan", "tokenizers": {}, "node_i": "3478", "native_tokenizers": [], diff --git a/data/Creole.json b/data/Creole.json index 77376ed0b1b50ea66a550a72af2ea79305123224..0c5f54901a6528198368748f63ffd8f5b40cea9e 100644 --- a/data/Creole.json +++ b/data/Creole.json @@ -1,18 +1,22 @@ { "name": "Creole", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Afrikaans based", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Flaaitaal", + "depth": 2, "iso_1_code": null, "iso_3_code": "fly", "children": [], + "family": "Creole", "tokenizers": {}, "node_i": "3483", "native_tokenizers": [], @@ -20,15 +24,18 @@ }, { "name": "Oorlams", + "depth": 2, "iso_1_code": null, "iso_3_code": "oor", "children": [], + "family": "Creole", "tokenizers": {}, "node_i": "3484", "native_tokenizers": [], "scripts": [] } ], + "family": "Creole", "tokenizers": {}, "node_i": "3482", "native_tokenizers": [], @@ -36,14 +43,17 @@ }, { "name": "Arabic based", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nubi", + "depth": 2, "iso_1_code": null, "iso_3_code": "kcn", "children": [], + "family": "Creole", "tokenizers": {}, "node_i": "3486", "native_tokenizers": [], @@ -51,15 +61,18 @@ }, { "name": "Arabic, Juba", + "depth": 2, "iso_1_code": "ar", "iso_3_code": "pga", "children": [], + "family": "Creole", "tokenizers": {}, "node_i": "3487", "native_tokenizers": [], "scripts": [] } ], + "family": "Creole", "tokenizers": {}, "node_i": "3485", "native_tokenizers": [], @@ -67,20 +80,24 @@ }, { "name": "Assamese based", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nagamese", + "depth": 2, "iso_1_code": null, "iso_3_code": "nag", "children": [], + "family": "Creole", "tokenizers": {}, "node_i": "3489", "native_tokenizers": [], "scripts": [] } ], + "family": "Creole", "tokenizers": {}, "node_i": "3488", "native_tokenizers": [], @@ -88,14 +105,17 @@ }, { "name": "Dutch based", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Berbice Dutch Creole", + "depth": 2, "iso_1_code": null, "iso_3_code": "brc", "children": [], + "family": "Creole", "tokenizers": {}, "node_i": "3491", "native_tokenizers": [], @@ -103,9 +123,11 @@ }, { "name": "Negerhollands", + "depth": 2, "iso_1_code": null, "iso_3_code": "dcr", "children": [], + "family": "Creole", "tokenizers": {}, "node_i": "3492", "native_tokenizers": [], @@ -113,9 +135,11 @@ }, { "name": "Javindo", + "depth": 2, "iso_1_code": null, "iso_3_code": "jvd", "children": [], + "family": "Creole", "tokenizers": {}, "node_i": "3493", "native_tokenizers": [], @@ -123,9 +147,11 @@ }, { "name": "Petjo", + "depth": 2, "iso_1_code": null, "iso_3_code": "pey", "children": [], + "family": "Creole", "tokenizers": {}, "node_i": "3494", "native_tokenizers": [], @@ -133,15 +159,18 @@ }, { "name": "Skepi Dutch Creole", + "depth": 2, "iso_1_code": null, "iso_3_code": "skw", "children": [], + "family": "Creole", "tokenizers": {}, "node_i": "3495", "native_tokenizers": [], "scripts": [] } ], + "family": "Creole", "tokenizers": {}, "node_i": "3490", "native_tokenizers": [], @@ -149,14 +178,17 @@ }, { "name": "English based", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Saramaccan", + "depth": 2, "iso_1_code": null, "iso_3_code": "srm", "children": [], + "family": "Creole", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"pcm\")", @@ -174,19 +206,23 @@ }, { "name": "Atlantic", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Eastern", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Turks and Caicos English Creole", + "depth": 4, "iso_1_code": null, "iso_3_code": "tch", "children": [], + "family": "Creole", "tokenizers": {}, "node_i": "3500", "native_tokenizers": [], @@ -194,14 +230,17 @@ }, { "name": "Northern", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Afro-Seminole Creole", + "depth": 5, "iso_1_code": null, "iso_3_code": "afs", "children": [], + "family": "Creole", "tokenizers": {}, "node_i": "3502", "native_tokenizers": [], @@ -209,9 +248,11 @@ }, { "name": "Bahamas English Creole", + "depth": 5, "iso_1_code": null, "iso_3_code": "bah", "children": [], + "family": "Creole", "tokenizers": {}, "node_i": "3503", "native_tokenizers": [], @@ -219,9 +260,11 @@ }, { "name": "Sea Island English Creole", + "depth": 5, "iso_1_code": null, "iso_3_code": "gul", "children": [], + "family": "Creole", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"pcm\")", @@ -238,6 +281,7 @@ ] } ], + "family": "Creole", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"pcm\")", @@ -253,14 +297,17 @@ }, { "name": "Southern", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Leeward Caribbean English Creole", + "depth": 5, "iso_1_code": null, "iso_3_code": "aig", "children": [], + "family": "Creole", "tokenizers": {}, "node_i": "3506", "native_tokenizers": [], @@ -268,9 +315,11 @@ }, { "name": "Bajan", + "depth": 5, "iso_1_code": null, "iso_3_code": "bjs", "children": [], + "family": "Creole", "tokenizers": {}, "node_i": "3507", "native_tokenizers": [], @@ -278,9 +327,11 @@ }, { "name": "Grenadian English Creole", + "depth": 5, "iso_1_code": null, "iso_3_code": "gcl", "children": [], + "family": "Creole", "tokenizers": {}, "node_i": "3508", "native_tokenizers": [], @@ -288,9 +339,11 @@ }, { "name": "Guyanese English Creole", + "depth": 5, "iso_1_code": null, "iso_3_code": "gyn", "children": [], + "family": "Creole", "tokenizers": {}, "node_i": "3509", "native_tokenizers": [], @@ -298,9 +351,11 @@ }, { "name": "Vincentian English Creole", + "depth": 5, "iso_1_code": null, "iso_3_code": "svc", "children": [], + "family": "Creole", "tokenizers": {}, "node_i": "3510", "native_tokenizers": [], @@ -308,9 +363,11 @@ }, { "name": "Tobagonian English Creole", + "depth": 5, "iso_1_code": null, "iso_3_code": "tgh", "children": [], + "family": "Creole", "tokenizers": {}, "node_i": "3511", "native_tokenizers": [], @@ -318,9 +375,11 @@ }, { "name": "Trinidadian English Creole", + "depth": 5, "iso_1_code": null, "iso_3_code": "trf", "children": [], + "family": "Creole", "tokenizers": {}, "node_i": "3512", "native_tokenizers": [], @@ -328,21 +387,25 @@ }, { "name": "Virgin Islands English Creole", + "depth": 5, "iso_1_code": null, "iso_3_code": "vic", "children": [], + "family": "Creole", "tokenizers": {}, "node_i": "3513", "native_tokenizers": [], "scripts": [] } ], + "family": "Creole", "tokenizers": {}, "node_i": "3505", "native_tokenizers": [], "scripts": [] } ], + "family": "Creole", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"pcm\")", @@ -358,14 +421,17 @@ }, { "name": "Krio", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Equatorial Guinean Pidgin", + "depth": 4, "iso_1_code": null, "iso_3_code": "fpe", "children": [], + "family": "Creole", "tokenizers": {}, "node_i": "3515", "native_tokenizers": [], @@ -373,9 +439,11 @@ }, { "name": "Ghanaian Pidgin English", + "depth": 4, "iso_1_code": null, "iso_3_code": "gpe", "children": [], + "family": "Creole", "tokenizers": {}, "node_i": "3516", "native_tokenizers": [], @@ -383,9 +451,11 @@ }, { "name": "Krio", + "depth": 4, "iso_1_code": null, "iso_3_code": "kri", "children": [], + "family": "Creole", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"pcm\")", @@ -403,9 +473,11 @@ }, { "name": "Pidgin, Nigerian", + "depth": 4, "iso_1_code": null, "iso_3_code": "pcm", "children": [], + "family": "Creole", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"pcm\")", @@ -425,9 +497,11 @@ }, { "name": "Pidgin, Cameroon", + "depth": 4, "iso_1_code": null, "iso_3_code": "wes", "children": [], + "family": "Creole", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"pcm\")", @@ -444,6 +518,7 @@ ] } ], + "family": "Creole", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"pcm\")", @@ -459,14 +534,17 @@ }, { "name": "Suriname", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Sranan Tongo", + "depth": 4, "iso_1_code": null, "iso_3_code": "srn", "children": [], + "family": "Creole", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"pcm\")", @@ -484,14 +562,17 @@ }, { "name": "Ndyuka", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Aukan", + "depth": 5, "iso_1_code": null, "iso_3_code": "djk", "children": [], + "family": "Creole", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"pcm\")", @@ -509,15 +590,18 @@ }, { "name": "Kwinti", + "depth": 5, "iso_1_code": null, "iso_3_code": "kww", "children": [], + "family": "Creole", "tokenizers": {}, "node_i": "3524", "native_tokenizers": [], "scripts": [] } ], + "family": "Creole", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"pcm\")", @@ -532,6 +616,7 @@ "scripts": [] } ], + "family": "Creole", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"pcm\")", @@ -547,14 +632,17 @@ }, { "name": "Western", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Belize English Creole", + "depth": 4, "iso_1_code": null, "iso_3_code": "bzj", "children": [], + "family": "Creole", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"pcm\")", @@ -572,9 +660,11 @@ }, { "name": "Nicaragua English Creole", + "depth": 4, "iso_1_code": null, "iso_3_code": "bzk", "children": [], + "family": "Creole", "tokenizers": {}, "node_i": "3527", "native_tokenizers": [], @@ -582,9 +672,11 @@ }, { "name": "Islander English Creole", + "depth": 4, "iso_1_code": null, "iso_3_code": "icr", "children": [], + "family": "Creole", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"pcm\")", @@ -602,9 +694,11 @@ }, { "name": "Jamaican English Creole", + "depth": 4, "iso_1_code": null, "iso_3_code": "jam", "children": [], + "family": "Creole", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"pcm\")", @@ -621,6 +715,7 @@ ] } ], + "family": "Creole", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"pcm\")", @@ -635,6 +730,7 @@ "scripts": [] } ], + "family": "Creole", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"pcm\")", @@ -650,14 +746,17 @@ }, { "name": "Pacific", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bislama", + "depth": 3, "iso_1_code": "bi", "iso_3_code": "bis", "children": [], + "family": "Creole", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"pcm\")", @@ -675,9 +774,11 @@ }, { "name": "Hawaii Pidgin", + "depth": 3, "iso_1_code": null, "iso_3_code": "hwc", "children": [], + "family": "Creole", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"pcm\")", @@ -695,9 +796,11 @@ }, { "name": "Ngatik Men\u2019s Creole", + "depth": 3, "iso_1_code": null, "iso_3_code": "ngm", "children": [], + "family": "Creole", "tokenizers": {}, "node_i": "3533", "native_tokenizers": [], @@ -705,9 +808,11 @@ }, { "name": "Pitcairn-Norfolk", + "depth": 3, "iso_1_code": null, "iso_3_code": "pih", "children": [], + "family": "Creole", "tokenizers": {}, "node_i": "3534", "native_tokenizers": [], @@ -715,9 +820,11 @@ }, { "name": "Pijin", + "depth": 3, "iso_1_code": null, "iso_3_code": "pis", "children": [], + "family": "Creole", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"pcm\")", @@ -735,9 +842,11 @@ }, { "name": "Kriol", + "depth": 3, "iso_1_code": null, "iso_3_code": "rop", "children": [], + "family": "Creole", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"pcm\")", @@ -755,9 +864,11 @@ }, { "name": "Torres Strait Creole", + "depth": 3, "iso_1_code": null, "iso_3_code": "tcs", "children": [], + "family": "Creole", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"pcm\")", @@ -775,9 +886,11 @@ }, { "name": "Tok Pisin", + "depth": 3, "iso_1_code": null, "iso_3_code": "tpi", "children": [], + "family": "Creole", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"pcm\")", @@ -794,6 +907,7 @@ ] } ], + "family": "Creole", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"pcm\")", @@ -808,6 +922,7 @@ "scripts": [] } ], + "family": "Creole", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"pcm\")", @@ -823,23 +938,18 @@ }, { "name": "French based", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Lesser Antillean French Creole", + "depth": 2, "iso_1_code": null, "iso_3_code": "acf", "children": [], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"ms\")", - "original_lang_name": "malay", - "original_lang_code": "msa", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Creole", + "tokenizers": {}, "node_i": "3540", "native_tokenizers": [], "scripts": [ @@ -848,9 +958,11 @@ }, { "name": "Tayo", + "depth": 2, "iso_1_code": null, "iso_3_code": "cks", "children": [], + "family": "Creole", "tokenizers": {}, "node_i": "3541", "native_tokenizers": [], @@ -858,18 +970,12 @@ }, { "name": "Seychelles French Creole", + "depth": 2, "iso_1_code": null, "iso_3_code": "crs", "children": [], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"ms\")", - "original_lang_name": "malay", - "original_lang_code": "msa", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Creole", + "tokenizers": {}, "node_i": "3542", "native_tokenizers": [], "scripts": [ @@ -878,18 +984,12 @@ }, { "name": "Guadeloupean French Creole", + "depth": 2, "iso_1_code": null, "iso_3_code": "gcf", "children": [], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"ms\")", - "original_lang_name": "malay", - "original_lang_code": "msa", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Creole", + "tokenizers": {}, "node_i": "3543", "native_tokenizers": [], "scripts": [ @@ -898,18 +998,12 @@ }, { "name": "Guianese French Creole", + "depth": 2, "iso_1_code": null, "iso_3_code": "gcr", "children": [], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"ms\")", - "original_lang_name": "malay", - "original_lang_code": "msa", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Creole", + "tokenizers": {}, "node_i": "3544", "native_tokenizers": [], "scripts": [ @@ -918,18 +1012,12 @@ }, { "name": "Haitian Creole", + "depth": 2, "iso_1_code": "ht", "iso_3_code": "hat", "children": [], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"ms\")", - "original_lang_name": "malay", - "original_lang_code": "msa", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Creole", + "tokenizers": {}, "node_i": "3545", "native_tokenizers": [], "scripts": [ @@ -938,9 +1026,11 @@ }, { "name": "Karipuna French Creole", + "depth": 2, "iso_1_code": null, "iso_3_code": "kmv", "children": [], + "family": "Creole", "tokenizers": {}, "node_i": "3546", "native_tokenizers": [], @@ -948,9 +1038,11 @@ }, { "name": "Louisiana Creole", + "depth": 2, "iso_1_code": null, "iso_3_code": "lou", "children": [], + "family": "Creole", "tokenizers": {}, "node_i": "3547", "native_tokenizers": [], @@ -958,18 +1050,12 @@ }, { "name": "Morisyen", + "depth": 2, "iso_1_code": null, "iso_3_code": "mfe", "children": [], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"ms\")", - "original_lang_name": "malay", - "original_lang_code": "msa", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Creole", + "tokenizers": {}, "node_i": "3548", "native_tokenizers": [], "scripts": [ @@ -978,18 +1064,12 @@ }, { "name": "R\u00e9union French Creole", + "depth": 2, "iso_1_code": null, "iso_3_code": "rcf", "children": [], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"ms\")", - "original_lang_name": "malay", - "original_lang_code": "msa", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Creole", + "tokenizers": {}, "node_i": "3549", "native_tokenizers": [], "scripts": [ @@ -998,44 +1078,43 @@ }, { "name": "San Miguel French Creole", + "depth": 2, "iso_1_code": null, "iso_3_code": "scf", "children": [], + "family": "Creole", "tokenizers": {}, "node_i": "3550", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"ms\")", - "original_lang_name": "malay", - "original_lang_code": "msa", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Creole", + "tokenizers": {}, "node_i": "3539", "native_tokenizers": [], "scripts": [] }, { "name": "German based", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Unserdeutsch", + "depth": 2, "iso_1_code": null, "iso_3_code": "uln", "children": [], + "family": "Creole", "tokenizers": {}, "node_i": "3552", "native_tokenizers": [], "scripts": [] } ], + "family": "Creole", "tokenizers": {}, "node_i": "3551", "native_tokenizers": [], @@ -1043,20 +1122,24 @@ }, { "name": "Hindi based", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Andaman Hindi Creole", + "depth": 2, "iso_1_code": null, "iso_3_code": "hca", "children": [], + "family": "Creole", "tokenizers": {}, "node_i": "3554", "native_tokenizers": [], "scripts": [] } ], + "family": "Creole", "tokenizers": {}, "node_i": "3553", "native_tokenizers": [], @@ -1064,23 +1147,18 @@ }, { "name": "Iberian based", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Papiamentu", + "depth": 2, "iso_1_code": null, "iso_3_code": "pap", "children": [], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"ms\")", - "original_lang_name": "malay", - "original_lang_code": "msa", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Creole", + "tokenizers": {}, "node_i": "3556", "native_tokenizers": [], "scripts": [ @@ -1088,35 +1166,32 @@ ] } ], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"ms\")", - "original_lang_name": "malay", - "original_lang_code": "msa", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Creole", + "tokenizers": {}, "node_i": "3555", "native_tokenizers": [], "scripts": [] }, { "name": "Japanese-based", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Yilan Creole", + "depth": 2, "iso_1_code": null, "iso_3_code": "ycr", "children": [], + "family": "Creole", "tokenizers": {}, "node_i": "3558", "native_tokenizers": [], "scripts": [] } ], + "family": "Creole", "tokenizers": {}, "node_i": "3557", "native_tokenizers": [], @@ -1124,23 +1199,18 @@ }, { "name": "Kongo based", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kituba", + "depth": 2, "iso_1_code": null, "iso_3_code": "ktu", "children": [], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"ms\")", - "original_lang_name": "malay", - "original_lang_code": "msa", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Creole", + "tokenizers": {}, "node_i": "3560", "native_tokenizers": [], "scripts": [ @@ -1149,38 +1219,36 @@ }, { "name": "Kituba", + "depth": 2, "iso_1_code": null, "iso_3_code": "mkw", "children": [], + "family": "Creole", "tokenizers": {}, "node_i": "3561", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"ms\")", - "original_lang_name": "malay", - "original_lang_code": "msa", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Creole", + "tokenizers": {}, "node_i": "3559", "native_tokenizers": [], "scripts": [] }, { "name": "Malay based", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Malay, Ambonese", + "depth": 2, "iso_1_code": null, "iso_3_code": "abs", "children": [], + "family": "Creole", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -1198,9 +1266,11 @@ }, { "name": "Betawi", + "depth": 2, "iso_1_code": null, "iso_3_code": "bew", "children": [], + "family": "Creole", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -1218,9 +1288,11 @@ }, { "name": "Malay, Banda", + "depth": 2, "iso_1_code": null, "iso_3_code": "bpq", "children": [], + "family": "Creole", "tokenizers": {}, "node_i": "3565", "native_tokenizers": [], @@ -1228,9 +1300,11 @@ }, { "name": "Malaccan Malay Creole", + "depth": 2, "iso_1_code": null, "iso_3_code": "ccm", "children": [], + "family": "Creole", "tokenizers": {}, "node_i": "3566", "native_tokenizers": [], @@ -1238,9 +1312,11 @@ }, { "name": "Malay, Cocos Islands", + "depth": 2, "iso_1_code": "ms", "iso_3_code": "coa", "children": [], + "family": "Creole", "tokenizers": {}, "node_i": "3567", "native_tokenizers": [], @@ -1248,9 +1324,11 @@ }, { "name": "Malay, Larantuka", + "depth": 2, "iso_1_code": null, "iso_3_code": "lrt", "children": [], + "family": "Creole", "tokenizers": {}, "node_i": "3568", "native_tokenizers": [], @@ -1258,9 +1336,11 @@ }, { "name": "Malay, North Moluccan", + "depth": 2, "iso_1_code": "ms", "iso_3_code": "max", "children": [], + "family": "Creole", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -1280,9 +1360,11 @@ }, { "name": "Malay, Baba", + "depth": 2, "iso_1_code": null, "iso_3_code": "mbf", "children": [], + "family": "Creole", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -1300,9 +1382,11 @@ }, { "name": "Malay, Balinese", + "depth": 2, "iso_1_code": null, "iso_3_code": "mhp", "children": [], + "family": "Creole", "tokenizers": {}, "node_i": "3571", "native_tokenizers": [], @@ -1310,9 +1394,11 @@ }, { "name": "Malay, Kupang", + "depth": 2, "iso_1_code": null, "iso_3_code": "mkn", "children": [], + "family": "Creole", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -1330,9 +1416,11 @@ }, { "name": "Indonesian, Peranakan", + "depth": 2, "iso_1_code": null, "iso_3_code": "pea", "children": [], + "family": "Creole", "tokenizers": {}, "node_i": "3573", "native_tokenizers": [], @@ -1340,9 +1428,11 @@ }, { "name": "Malay, Papuan", + "depth": 2, "iso_1_code": null, "iso_3_code": "pmy", "children": [], + "family": "Creole", "tokenizers": {}, "node_i": "3574", "native_tokenizers": [], @@ -1350,9 +1440,11 @@ }, { "name": "Sri Lankan Malay Creole", + "depth": 2, "iso_1_code": null, "iso_3_code": "sci", "children": [], + "family": "Creole", "tokenizers": {}, "node_i": "3575", "native_tokenizers": [], @@ -1360,9 +1452,11 @@ }, { "name": "Malay, Manado", + "depth": 2, "iso_1_code": "ms", "iso_3_code": "xmm", "children": [], + "family": "Creole", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -1381,6 +1475,7 @@ ] } ], + "family": "Creole", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ms\")", @@ -1396,23 +1491,18 @@ }, { "name": "Ngbandi based", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Sango", + "depth": 2, "iso_1_code": "sg", "iso_3_code": "sag", "children": [], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"ms\")", - "original_lang_name": "malay", - "original_lang_code": "msa", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Creole", + "tokenizers": {}, "node_i": "3578", "native_tokenizers": [], "scripts": [ @@ -1421,38 +1511,36 @@ }, { "name": "Sango, Riverain", + "depth": 2, "iso_1_code": null, "iso_3_code": "snj", "children": [], + "family": "Creole", "tokenizers": {}, "node_i": "3579", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"ms\")", - "original_lang_name": "malay", - "original_lang_code": "msa", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Creole", + "tokenizers": {}, "node_i": "3577", "native_tokenizers": [], "scripts": [] }, { "name": "Portuguese based", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Angolar", + "depth": 2, "iso_1_code": null, "iso_3_code": "aoa", "children": [], + "family": "Creole", "tokenizers": {}, "node_i": "3581", "native_tokenizers": [], @@ -1460,9 +1548,11 @@ }, { "name": "Cafundo Creole", + "depth": 2, "iso_1_code": null, "iso_3_code": "ccd", "children": [], + "family": "Creole", "tokenizers": {}, "node_i": "3582", "native_tokenizers": [], @@ -1470,18 +1560,12 @@ }, { "name": "S\u00e3otomense", + "depth": 2, "iso_1_code": null, "iso_3_code": "cri", "children": [], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"ms\")", - "original_lang_name": "malay", - "original_lang_code": "msa", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Creole", + "tokenizers": {}, "node_i": "3583", "native_tokenizers": [], "scripts": [ @@ -1490,9 +1574,11 @@ }, { "name": "Fa d\u2019Ambu", + "depth": 2, "iso_1_code": null, "iso_3_code": "fab", "children": [], + "family": "Creole", "tokenizers": {}, "node_i": "3584", "native_tokenizers": [], @@ -1500,9 +1586,11 @@ }, { "name": "Indo-Portuguese", + "depth": 2, "iso_1_code": null, "iso_3_code": "idb", "children": [], + "family": "Creole", "tokenizers": {}, "node_i": "3585", "native_tokenizers": [], @@ -1510,18 +1598,12 @@ }, { "name": "Kabuverdianu", + "depth": 2, "iso_1_code": null, "iso_3_code": "kea", "children": [], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"ms\")", - "original_lang_name": "malay", - "original_lang_code": "msa", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Creole", + "tokenizers": {}, "node_i": "3586", "native_tokenizers": [], "scripts": [ @@ -1530,9 +1612,11 @@ }, { "name": "Malaccan Portuguese Creole", + "depth": 2, "iso_1_code": null, "iso_3_code": "mcm", "children": [], + "family": "Creole", "tokenizers": {}, "node_i": "3587", "native_tokenizers": [], @@ -1540,9 +1624,11 @@ }, { "name": "Macanese", + "depth": 2, "iso_1_code": null, "iso_3_code": "mzs", "children": [], + "family": "Creole", "tokenizers": {}, "node_i": "3588", "native_tokenizers": [], @@ -1550,18 +1636,12 @@ }, { "name": "Guinea-Bissau Creole", + "depth": 2, "iso_1_code": null, "iso_3_code": "pov", "children": [], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"ms\")", - "original_lang_name": "malay", - "original_lang_code": "msa", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Creole", + "tokenizers": {}, "node_i": "3589", "native_tokenizers": [], "scripts": [ @@ -1570,9 +1650,11 @@ }, { "name": "Principense", + "depth": 2, "iso_1_code": null, "iso_3_code": "pre", "children": [], + "family": "Creole", "tokenizers": {}, "node_i": "3590", "native_tokenizers": [], @@ -1580,9 +1662,11 @@ }, { "name": "Ternate\u00f1o", + "depth": 2, "iso_1_code": null, "iso_3_code": "tmg", "children": [], + "family": "Creole", "tokenizers": {}, "node_i": "3591", "native_tokenizers": [], @@ -1590,9 +1674,11 @@ }, { "name": "Pidgin, Timor", + "depth": 2, "iso_1_code": null, "iso_3_code": "tvy", "children": [], + "family": "Creole", "tokenizers": {}, "node_i": "3592", "native_tokenizers": [], @@ -1600,47 +1686,37 @@ }, { "name": "Korlai Portuguese Creole", + "depth": 2, "iso_1_code": null, "iso_3_code": "vkp", "children": [], + "family": "Creole", "tokenizers": {}, "node_i": "3593", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"ms\")", - "original_lang_name": "malay", - "original_lang_code": "msa", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Creole", + "tokenizers": {}, "node_i": "3580", "native_tokenizers": [], "scripts": [] }, { "name": "Spanish based", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chavacano", + "depth": 2, "iso_1_code": null, "iso_3_code": "cbk", "children": [], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"ms\")", - "original_lang_name": "malay", - "original_lang_code": "msa", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Creole", + "tokenizers": {}, "node_i": "3595", "native_tokenizers": [], "scripts": [ @@ -1649,44 +1725,43 @@ }, { "name": "Palenquero", + "depth": 2, "iso_1_code": null, "iso_3_code": "pln", "children": [], + "family": "Creole", "tokenizers": {}, "node_i": "3596", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"ms\")", - "original_lang_name": "malay", - "original_lang_code": "msa", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Creole", + "tokenizers": {}, "node_i": "3594", "native_tokenizers": [], "scripts": [] }, { "name": "Swahili based", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Cutchi-Swahili", + "depth": 2, "iso_1_code": null, "iso_3_code": "ccl", "children": [], + "family": "Creole", "tokenizers": {}, "node_i": "3598", "native_tokenizers": [], "scripts": [] } ], + "family": "Creole", "tokenizers": {}, "node_i": "3597", "native_tokenizers": [], @@ -1694,23 +1769,18 @@ }, { "name": "Tetun based", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tetun Dili", + "depth": 2, "iso_1_code": null, "iso_3_code": "tdt", "children": [], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"ms\")", - "original_lang_name": "malay", - "original_lang_code": "msa", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Creole", + "tokenizers": {}, "node_i": "3600", "native_tokenizers": [], "scripts": [ @@ -1718,29 +1788,15 @@ ] } ], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"ms\")", - "original_lang_name": "malay", - "original_lang_code": "msa", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Creole", + "tokenizers": {}, "node_i": "3599", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"ms\")", - "original_lang_name": "malay", - "original_lang_code": "msa", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Creole", + "tokenizers": {}, "node_i": "3481", "native_tokenizers": [], "scripts": [] diff --git a/data/Dravidian.json b/data/Dravidian.json index 3c16d782148a636cabf8d8c0cb4b7399e11ccbda..3c5a438af811fe539b2870da2e9246b747a0119f 100644 --- a/data/Dravidian.json +++ b/data/Dravidian.json @@ -1,23 +1,28 @@ { "name": "Dravidian", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Central", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kolami-Naiki", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kolami, Northwestern", + "depth": 3, "iso_1_code": null, "iso_3_code": "kfb", "children": [], + "family": "Dravidian", "tokenizers": {}, "node_i": "3604", "native_tokenizers": [], @@ -25,15 +30,18 @@ }, { "name": "Kolami, Southeastern", + "depth": 3, "iso_1_code": null, "iso_3_code": "nit", "children": [], + "family": "Dravidian", "tokenizers": {}, "node_i": "3605", "native_tokenizers": [], "scripts": [] } ], + "family": "Dravidian", "tokenizers": {}, "node_i": "3603", "native_tokenizers": [], @@ -41,14 +49,17 @@ }, { "name": "Parji-Gadaba", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Gadaba, Mudhili", + "depth": 3, "iso_1_code": null, "iso_3_code": "gau", "children": [], + "family": "Dravidian", "tokenizers": {}, "node_i": "3607", "native_tokenizers": [], @@ -56,9 +67,11 @@ }, { "name": "Gadaba, Pottangi Ollar", + "depth": 3, "iso_1_code": null, "iso_3_code": "gdb", "children": [], + "family": "Dravidian", "tokenizers": {}, "node_i": "3608", "native_tokenizers": [], @@ -66,21 +79,25 @@ }, { "name": "Duruwa", + "depth": 3, "iso_1_code": null, "iso_3_code": "pci", "children": [], + "family": "Dravidian", "tokenizers": {}, "node_i": "3609", "native_tokenizers": [], "scripts": [] } ], + "family": "Dravidian", "tokenizers": {}, "node_i": "3606", "native_tokenizers": [], "scripts": [] } ], + "family": "Dravidian", "tokenizers": {}, "node_i": "3602", "native_tokenizers": [], @@ -88,14 +105,17 @@ }, { "name": "Northern", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Brahui", + "depth": 2, "iso_1_code": null, "iso_3_code": "brh", "children": [], + "family": "Dravidian", "tokenizers": {}, "node_i": "3611", "native_tokenizers": [], @@ -105,9 +125,11 @@ }, { "name": "Kumarbhag Paharia", + "depth": 2, "iso_1_code": null, "iso_3_code": "kmj", "children": [], + "family": "Dravidian", "tokenizers": {}, "node_i": "3612", "native_tokenizers": [], @@ -115,9 +137,11 @@ }, { "name": "Kurux", + "depth": 2, "iso_1_code": null, "iso_3_code": "kru", "children": [], + "family": "Dravidian", "tokenizers": {}, "node_i": "3613", "native_tokenizers": [], @@ -127,9 +151,11 @@ }, { "name": "Sauria Paharia", + "depth": 2, "iso_1_code": null, "iso_3_code": "mjt", "children": [], + "family": "Dravidian", "tokenizers": {}, "node_i": "3614", "native_tokenizers": [], @@ -137,15 +163,18 @@ }, { "name": "Kisan", + "depth": 2, "iso_1_code": null, "iso_3_code": "xis", "children": [], + "family": "Dravidian", "tokenizers": {}, "node_i": "3615", "native_tokenizers": [], "scripts": [] } ], + "family": "Dravidian", "tokenizers": {}, "node_i": "3610", "native_tokenizers": [], @@ -153,24 +182,29 @@ }, { "name": "South-Central", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Gondi-Kui", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Gondi", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Maria, Dandami", + "depth": 4, "iso_1_code": null, "iso_3_code": "daq", "children": [], + "family": "Dravidian", "tokenizers": {}, "node_i": "3619", "native_tokenizers": [], @@ -178,9 +212,11 @@ }, { "name": "Muria, Eastern", + "depth": 4, "iso_1_code": null, "iso_3_code": "emu", "children": [], + "family": "Dravidian", "tokenizers": {}, "node_i": "3620", "native_tokenizers": [], @@ -188,9 +224,11 @@ }, { "name": "Gondi, Aheri", + "depth": 4, "iso_1_code": null, "iso_3_code": "esg", "children": [], + "family": "Dravidian", "tokenizers": {}, "node_i": "3621", "native_tokenizers": [], @@ -198,9 +236,11 @@ }, { "name": "Muria, Far Western", + "depth": 4, "iso_1_code": null, "iso_3_code": "fmu", "children": [], + "family": "Dravidian", "tokenizers": {}, "node_i": "3622", "native_tokenizers": [], @@ -210,9 +250,11 @@ }, { "name": "Gondi, Northern", + "depth": 4, "iso_1_code": null, "iso_3_code": "gno", "children": [], + "family": "Dravidian", "tokenizers": {}, "node_i": "3623", "native_tokenizers": [], @@ -220,9 +262,11 @@ }, { "name": "Khirwar", + "depth": 4, "iso_1_code": null, "iso_3_code": "kwx", "children": [], + "family": "Dravidian", "tokenizers": {}, "node_i": "3624", "native_tokenizers": [], @@ -230,9 +274,11 @@ }, { "name": "Maria", + "depth": 4, "iso_1_code": null, "iso_3_code": "mrr", "children": [], + "family": "Dravidian", "tokenizers": {}, "node_i": "3625", "native_tokenizers": [], @@ -240,9 +286,11 @@ }, { "name": "Muria, Western", + "depth": 4, "iso_1_code": null, "iso_3_code": "mut", "children": [], + "family": "Dravidian", "tokenizers": {}, "node_i": "3626", "native_tokenizers": [], @@ -250,9 +298,11 @@ }, { "name": "Nagarchal", + "depth": 4, "iso_1_code": null, "iso_3_code": "nbg", "children": [], + "family": "Dravidian", "tokenizers": {}, "node_i": "3627", "native_tokenizers": [], @@ -260,9 +310,11 @@ }, { "name": "Pardhan", + "depth": 4, "iso_1_code": null, "iso_3_code": "pch", "children": [], + "family": "Dravidian", "tokenizers": {}, "node_i": "3628", "native_tokenizers": [], @@ -270,9 +322,11 @@ }, { "name": "Gondi, Adilabad", + "depth": 4, "iso_1_code": null, "iso_3_code": "wsg", "children": [], + "family": "Dravidian", "tokenizers": { "Telu": { "full_object": "IndicNLPTokenizer(\"te\")", @@ -289,6 +343,7 @@ ] } ], + "family": "Dravidian", "tokenizers": { "Telu": { "full_object": "IndicNLPTokenizer(\"te\")", @@ -304,19 +359,23 @@ }, { "name": "Konda-Kui", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Konda", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Konda-Dora", + "depth": 5, "iso_1_code": null, "iso_3_code": "kfc", "children": [], + "family": "Dravidian", "tokenizers": {}, "node_i": "3632", "native_tokenizers": [], @@ -324,15 +383,18 @@ }, { "name": "Mukha-Dora", + "depth": 5, "iso_1_code": null, "iso_3_code": "mmk", "children": [], + "family": "Dravidian", "tokenizers": {}, "node_i": "3633", "native_tokenizers": [], "scripts": [] } ], + "family": "Dravidian", "tokenizers": {}, "node_i": "3631", "native_tokenizers": [], @@ -340,19 +402,23 @@ }, { "name": "Manda-Kui", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kui-Kuvi", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kui, Dawik", + "depth": 6, "iso_1_code": null, "iso_3_code": "dwk", "children": [], + "family": "Dravidian", "tokenizers": {}, "node_i": "3636", "native_tokenizers": [], @@ -360,9 +426,11 @@ }, { "name": "Koya", + "depth": 6, "iso_1_code": null, "iso_3_code": "kff", "children": [], + "family": "Dravidian", "tokenizers": { "Telu": { "full_object": "IndicNLPTokenizer(\"te\")", @@ -380,9 +448,11 @@ }, { "name": "Kuvi", + "depth": 6, "iso_1_code": null, "iso_3_code": "kxv", "children": [], + "family": "Dravidian", "tokenizers": {}, "node_i": "3638", "native_tokenizers": [], @@ -390,15 +460,18 @@ }, { "name": "Kui", + "depth": 6, "iso_1_code": null, "iso_3_code": "uki", "children": [], + "family": "Dravidian", "tokenizers": {}, "node_i": "3639", "native_tokenizers": [], "scripts": [] } ], + "family": "Dravidian", "tokenizers": { "Telu": { "full_object": "IndicNLPTokenizer(\"te\")", @@ -414,14 +487,17 @@ }, { "name": "Manda-Pengo", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Manda", + "depth": 6, "iso_1_code": null, "iso_3_code": "mha", "children": [], + "family": "Dravidian", "tokenizers": {}, "node_i": "3641", "native_tokenizers": [], @@ -429,21 +505,25 @@ }, { "name": "Pengo", + "depth": 6, "iso_1_code": null, "iso_3_code": "peg", "children": [], + "family": "Dravidian", "tokenizers": {}, "node_i": "3642", "native_tokenizers": [], "scripts": [] } ], + "family": "Dravidian", "tokenizers": {}, "node_i": "3640", "native_tokenizers": [], "scripts": [] } ], + "family": "Dravidian", "tokenizers": { "Telu": { "full_object": "IndicNLPTokenizer(\"te\")", @@ -458,6 +538,7 @@ "scripts": [] } ], + "family": "Dravidian", "tokenizers": { "Telu": { "full_object": "IndicNLPTokenizer(\"te\")", @@ -472,6 +553,7 @@ "scripts": [] } ], + "family": "Dravidian", "tokenizers": { "Telu": { "full_object": "IndicNLPTokenizer(\"te\")", @@ -487,14 +569,17 @@ }, { "name": "Telugu", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chenchu", + "depth": 3, "iso_1_code": null, "iso_3_code": "cde", "children": [], + "family": "Dravidian", "tokenizers": {}, "node_i": "3644", "native_tokenizers": [], @@ -502,9 +587,11 @@ }, { "name": "Manna-Dora", + "depth": 3, "iso_1_code": null, "iso_3_code": "mju", "children": [], + "family": "Dravidian", "tokenizers": {}, "node_i": "3645", "native_tokenizers": [], @@ -512,9 +599,11 @@ }, { "name": "Telugu", + "depth": 3, "iso_1_code": "te", "iso_3_code": "tel", "children": [], + "family": "Dravidian", "tokenizers": { "Telu": { "full_object": "IndicNLPTokenizer(\"te\")", @@ -535,15 +624,18 @@ }, { "name": "Waddar", + "depth": 3, "iso_1_code": null, "iso_3_code": "wbq", "children": [], + "family": "Dravidian", "tokenizers": {}, "node_i": "3647", "native_tokenizers": [], "scripts": [] } ], + "family": "Dravidian", "tokenizers": { "Telu": { "full_object": "IndicNLPTokenizer(\"te\")", @@ -558,6 +650,7 @@ "scripts": [] } ], + "family": "Dravidian", "tokenizers": { "Telu": { "full_object": "IndicNLPTokenizer(\"te\")", @@ -573,14 +666,17 @@ }, { "name": "Southern", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kurichiya", + "depth": 2, "iso_1_code": null, "iso_3_code": "kfh", "children": [], + "family": "Dravidian", "tokenizers": {}, "node_i": "3649", "native_tokenizers": [], @@ -588,9 +684,11 @@ }, { "name": "Kurumba, Attapady", + "depth": 2, "iso_1_code": null, "iso_3_code": "pkr", "children": [], + "family": "Dravidian", "tokenizers": {}, "node_i": "3650", "native_tokenizers": [], @@ -598,9 +696,11 @@ }, { "name": "Pathiya", + "depth": 2, "iso_1_code": null, "iso_3_code": "pty", "children": [], + "family": "Dravidian", "tokenizers": {}, "node_i": "3651", "native_tokenizers": [], @@ -608,9 +708,11 @@ }, { "name": "Muduga", + "depth": 2, "iso_1_code": null, "iso_3_code": "udg", "children": [], + "family": "Dravidian", "tokenizers": {}, "node_i": "3652", "native_tokenizers": [], @@ -618,9 +720,11 @@ }, { "name": "Kumbaran", + "depth": 2, "iso_1_code": null, "iso_3_code": "wkb", "children": [], + "family": "Dravidian", "tokenizers": {}, "node_i": "3653", "native_tokenizers": [], @@ -628,9 +732,11 @@ }, { "name": "Kalanadi", + "depth": 2, "iso_1_code": null, "iso_3_code": "wkl", "children": [], + "family": "Dravidian", "tokenizers": {}, "node_i": "3654", "native_tokenizers": [], @@ -638,9 +744,11 @@ }, { "name": "Kunduvadi", + "depth": 2, "iso_1_code": null, "iso_3_code": "wku", "children": [], + "family": "Dravidian", "tokenizers": {}, "node_i": "3655", "native_tokenizers": [], @@ -648,19 +756,23 @@ }, { "name": "Tamil-Kannada", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kannada", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Badaga", + "depth": 4, "iso_1_code": null, "iso_3_code": "bfq", "children": [], + "family": "Dravidian", "tokenizers": {}, "node_i": "3658", "native_tokenizers": [], @@ -668,9 +780,11 @@ }, { "name": "Holiya", + "depth": 4, "iso_1_code": null, "iso_3_code": "hoy", "children": [], + "family": "Dravidian", "tokenizers": {}, "node_i": "3659", "native_tokenizers": [], @@ -678,9 +792,11 @@ }, { "name": "Kannada", + "depth": 4, "iso_1_code": "kn", "iso_3_code": "kan", "children": [], + "family": "Dravidian", "tokenizers": { "Knda": { "full_object": "IndicNLPTokenizer(\"kn\")", @@ -701,15 +817,18 @@ }, { "name": "Urali", + "depth": 4, "iso_1_code": null, "iso_3_code": "url", "children": [], + "family": "Dravidian", "tokenizers": {}, "node_i": "3661", "native_tokenizers": [], "scripts": [] } ], + "family": "Dravidian", "tokenizers": { "Knda": { "full_object": "IndicNLPTokenizer(\"kn\")", @@ -725,19 +844,23 @@ }, { "name": "Tamil-Kodagu", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kodagu", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kodava", + "depth": 5, "iso_1_code": null, "iso_3_code": "kfa", "children": [], + "family": "Dravidian", "tokenizers": {}, "node_i": "3664", "native_tokenizers": [], @@ -745,9 +868,11 @@ }, { "name": "Kurumba, Kannada", + "depth": 5, "iso_1_code": null, "iso_3_code": "kfi", "children": [], + "family": "Dravidian", "tokenizers": {}, "node_i": "3665", "native_tokenizers": [], @@ -755,9 +880,11 @@ }, { "name": "Kurumba, Mullu", + "depth": 5, "iso_1_code": null, "iso_3_code": "kpb", "children": [], + "family": "Dravidian", "tokenizers": {}, "node_i": "3666", "native_tokenizers": [], @@ -765,9 +892,11 @@ }, { "name": "Kurumba, Alu", + "depth": 5, "iso_1_code": null, "iso_3_code": "xua", "children": [], + "family": "Dravidian", "tokenizers": {}, "node_i": "3667", "native_tokenizers": [], @@ -775,15 +904,18 @@ }, { "name": "Kurumba, Jennu", + "depth": 5, "iso_1_code": null, "iso_3_code": "xuj", "children": [], + "family": "Dravidian", "tokenizers": {}, "node_i": "3668", "native_tokenizers": [], "scripts": [] } ], + "family": "Dravidian", "tokenizers": {}, "node_i": "3663", "native_tokenizers": [], @@ -791,14 +923,17 @@ }, { "name": "Tamil-Malayalam", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mannan", + "depth": 5, "iso_1_code": null, "iso_3_code": "mjv", "children": [], + "family": "Dravidian", "tokenizers": {}, "node_i": "3670", "native_tokenizers": [], @@ -806,14 +941,17 @@ }, { "name": "Malayalam", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Aranadan", + "depth": 6, "iso_1_code": null, "iso_3_code": "aaf", "children": [], + "family": "Dravidian", "tokenizers": {}, "node_i": "3672", "native_tokenizers": [], @@ -821,9 +959,11 @@ }, { "name": "Kadar", + "depth": 6, "iso_1_code": null, "iso_3_code": "kej", "children": [], + "family": "Dravidian", "tokenizers": {}, "node_i": "3673", "native_tokenizers": [], @@ -831,9 +971,11 @@ }, { "name": "Malayalam", + "depth": 6, "iso_1_code": "ml", "iso_3_code": "mal", "children": [], + "family": "Dravidian", "tokenizers": { "Mlym": { "full_object": "IndicNLPTokenizer(\"ml\")", @@ -854,9 +996,11 @@ }, { "name": "Malapandaram", + "depth": 6, "iso_1_code": null, "iso_3_code": "mjp", "children": [], + "family": "Dravidian", "tokenizers": {}, "node_i": "3675", "native_tokenizers": [], @@ -864,9 +1008,11 @@ }, { "name": "Malaryan", + "depth": 6, "iso_1_code": null, "iso_3_code": "mjq", "children": [], + "family": "Dravidian", "tokenizers": {}, "node_i": "3676", "native_tokenizers": [], @@ -874,9 +1020,11 @@ }, { "name": "Malavedan", + "depth": 6, "iso_1_code": null, "iso_3_code": "mjr", "children": [], + "family": "Dravidian", "tokenizers": {}, "node_i": "3677", "native_tokenizers": [], @@ -884,9 +1032,11 @@ }, { "name": "Paliyan", + "depth": 6, "iso_1_code": null, "iso_3_code": "pcf", "children": [], + "family": "Dravidian", "tokenizers": {}, "node_i": "3678", "native_tokenizers": [], @@ -894,9 +1044,11 @@ }, { "name": "Paniya", + "depth": 6, "iso_1_code": null, "iso_3_code": "pcg", "children": [], + "family": "Dravidian", "tokenizers": {}, "node_i": "3679", "native_tokenizers": [], @@ -904,15 +1056,18 @@ }, { "name": "Ravula", + "depth": 6, "iso_1_code": null, "iso_3_code": "yea", "children": [], + "family": "Dravidian", "tokenizers": {}, "node_i": "3680", "native_tokenizers": [], "scripts": [] } ], + "family": "Dravidian", "tokenizers": { "Mlym": { "full_object": "IndicNLPTokenizer(\"ml\")", @@ -928,14 +1083,17 @@ }, { "name": "Tamil", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Eravallan", + "depth": 6, "iso_1_code": null, "iso_3_code": "era", "children": [], + "family": "Dravidian", "tokenizers": {}, "node_i": "3682", "native_tokenizers": [], @@ -943,9 +1101,11 @@ }, { "name": "Irula", + "depth": 6, "iso_1_code": null, "iso_3_code": "iru", "children": [], + "family": "Dravidian", "tokenizers": {}, "node_i": "3683", "native_tokenizers": [], @@ -953,9 +1113,11 @@ }, { "name": "Kaikadi", + "depth": 6, "iso_1_code": null, "iso_3_code": "kep", "children": [], + "family": "Dravidian", "tokenizers": {}, "node_i": "3684", "native_tokenizers": [], @@ -963,9 +1125,11 @@ }, { "name": "Kanikkaran", + "depth": 6, "iso_1_code": null, "iso_3_code": "kev", "children": [], + "family": "Dravidian", "tokenizers": {}, "node_i": "3685", "native_tokenizers": [], @@ -973,9 +1137,11 @@ }, { "name": "Muthuvan", + "depth": 6, "iso_1_code": null, "iso_3_code": "muv", "children": [], + "family": "Dravidian", "tokenizers": {}, "node_i": "3686", "native_tokenizers": [], @@ -983,9 +1149,11 @@ }, { "name": "Sholaga", + "depth": 6, "iso_1_code": null, "iso_3_code": "sle", "children": [], + "family": "Dravidian", "tokenizers": {}, "node_i": "3687", "native_tokenizers": [], @@ -993,9 +1161,11 @@ }, { "name": "Tamil", + "depth": 6, "iso_1_code": "ta", "iso_3_code": "tam", "children": [], + "family": "Dravidian", "tokenizers": { "Taml": { "full_object": "IndicNLPTokenizer(\"ta\")", @@ -1016,9 +1186,11 @@ }, { "name": "Kurumba, Betta", + "depth": 6, "iso_1_code": null, "iso_3_code": "xub", "children": [], + "family": "Dravidian", "tokenizers": {}, "node_i": "3689", "native_tokenizers": [], @@ -1026,15 +1198,18 @@ }, { "name": "Yerukula", + "depth": 6, "iso_1_code": null, "iso_3_code": "yeu", "children": [], + "family": "Dravidian", "tokenizers": {}, "node_i": "3690", "native_tokenizers": [], "scripts": [] } ], + "family": "Dravidian", "tokenizers": { "Taml": { "full_object": "IndicNLPTokenizer(\"ta\")", @@ -1049,6 +1224,7 @@ "scripts": [] } ], + "family": "Dravidian", "tokenizers": { "Mlym": { "full_object": "IndicNLPTokenizer(\"ml\")", @@ -1071,14 +1247,17 @@ }, { "name": "Toda-Kota", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kota", + "depth": 5, "iso_1_code": null, "iso_3_code": "kfe", "children": [], + "family": "Dravidian", "tokenizers": {}, "node_i": "3692", "native_tokenizers": [], @@ -1086,21 +1265,25 @@ }, { "name": "Toda", + "depth": 5, "iso_1_code": null, "iso_3_code": "tcx", "children": [], + "family": "Dravidian", "tokenizers": {}, "node_i": "3693", "native_tokenizers": [], "scripts": [] } ], + "family": "Dravidian", "tokenizers": {}, "node_i": "3691", "native_tokenizers": [], "scripts": [] } ], + "family": "Dravidian", "tokenizers": { "Mlym": { "full_object": "IndicNLPTokenizer(\"ml\")", @@ -1123,26 +1306,31 @@ }, { "name": "Unclassified", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chetti, Wayanad", + "depth": 4, "iso_1_code": null, "iso_3_code": "ctt", "children": [], + "family": "Dravidian", "tokenizers": {}, "node_i": "3695", "native_tokenizers": [], "scripts": [] } ], + "family": "Dravidian", "tokenizers": {}, "node_i": "3694", "native_tokenizers": [], "scripts": [] } ], + "family": "Dravidian", "tokenizers": { "Knda": { "full_object": "IndicNLPTokenizer(\"kn\")", @@ -1172,14 +1360,17 @@ }, { "name": "Tulu", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bellari", + "depth": 3, "iso_1_code": null, "iso_3_code": "brw", "children": [], + "family": "Dravidian", "tokenizers": {}, "node_i": "3697", "native_tokenizers": [], @@ -1187,9 +1378,11 @@ }, { "name": "Kudiya", + "depth": 3, "iso_1_code": null, "iso_3_code": "kfg", "children": [], + "family": "Dravidian", "tokenizers": {}, "node_i": "3698", "native_tokenizers": [], @@ -1197,9 +1390,11 @@ }, { "name": "Tulu", + "depth": 3, "iso_1_code": null, "iso_3_code": "tcy", "children": [], + "family": "Dravidian", "tokenizers": { "Knda": { "full_object": "IndicNLPTokenizer(\"kn\")", @@ -1217,14 +1412,17 @@ }, { "name": "Koraga", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Koraga, Korra", + "depth": 4, "iso_1_code": null, "iso_3_code": "kfd", "children": [], + "family": "Dravidian", "tokenizers": {}, "node_i": "3701", "native_tokenizers": [], @@ -1232,21 +1430,25 @@ }, { "name": "Koraga, Mudu", + "depth": 4, "iso_1_code": null, "iso_3_code": "vmd", "children": [], + "family": "Dravidian", "tokenizers": {}, "node_i": "3702", "native_tokenizers": [], "scripts": [] } ], + "family": "Dravidian", "tokenizers": {}, "node_i": "3700", "native_tokenizers": [], "scripts": [] } ], + "family": "Dravidian", "tokenizers": { "Knda": { "full_object": "IndicNLPTokenizer(\"kn\")", @@ -1262,14 +1464,17 @@ }, { "name": "Unclassified", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mala Malasar", + "depth": 3, "iso_1_code": null, "iso_3_code": "ima", "children": [], + "family": "Dravidian", "tokenizers": {}, "node_i": "3704", "native_tokenizers": [], @@ -1277,9 +1482,11 @@ }, { "name": "Thachanadan", + "depth": 3, "iso_1_code": null, "iso_3_code": "thn", "children": [], + "family": "Dravidian", "tokenizers": {}, "node_i": "3705", "native_tokenizers": [], @@ -1287,9 +1494,11 @@ }, { "name": "Ullatan", + "depth": 3, "iso_1_code": null, "iso_3_code": "ull", "children": [], + "family": "Dravidian", "tokenizers": {}, "node_i": "3706", "native_tokenizers": [], @@ -1297,21 +1506,25 @@ }, { "name": "Malasar", + "depth": 3, "iso_1_code": null, "iso_3_code": "ymr", "children": [], + "family": "Dravidian", "tokenizers": {}, "node_i": "3707", "native_tokenizers": [], "scripts": [] } ], + "family": "Dravidian", "tokenizers": {}, "node_i": "3703", "native_tokenizers": [], "scripts": [] } ], + "family": "Dravidian", "tokenizers": { "Knda": { "full_object": "IndicNLPTokenizer(\"kn\")", @@ -1341,14 +1554,17 @@ }, { "name": "Unclassified", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Allar", + "depth": 2, "iso_1_code": null, "iso_3_code": "all", "children": [], + "family": "Dravidian", "tokenizers": {}, "node_i": "3709", "native_tokenizers": [], @@ -1356,9 +1572,11 @@ }, { "name": "Bharia", + "depth": 2, "iso_1_code": null, "iso_3_code": "bha", "children": [], + "family": "Dravidian", "tokenizers": {}, "node_i": "3710", "native_tokenizers": [], @@ -1366,9 +1584,11 @@ }, { "name": "Malankuravan", + "depth": 2, "iso_1_code": null, "iso_3_code": "mjo", "children": [], + "family": "Dravidian", "tokenizers": {}, "node_i": "3711", "native_tokenizers": [], @@ -1376,9 +1596,11 @@ }, { "name": "Pattapu", + "depth": 2, "iso_1_code": null, "iso_3_code": "ptq", "children": [], + "family": "Dravidian", "tokenizers": {}, "node_i": "3712", "native_tokenizers": [], @@ -1386,51 +1608,26 @@ }, { "name": "Vishavan", + "depth": 2, "iso_1_code": null, "iso_3_code": "vis", "children": [], + "family": "Dravidian", "tokenizers": {}, "node_i": "3713", "native_tokenizers": [], "scripts": [] } ], + "family": "Dravidian", "tokenizers": {}, "node_i": "3708", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Telu": { - "full_object": "IndicNLPTokenizer(\"te\")", - "original_lang_name": "telugu", - "original_lang_code": "tel", - "script": "Telu", - "class_name": "IndicNLPTokenizer" - }, - "Knda": { - "full_object": "IndicNLPTokenizer(\"kn\")", - "original_lang_name": "kannada", - "original_lang_code": "kan", - "script": "Knda", - "class_name": "IndicNLPTokenizer" - }, - "Mlym": { - "full_object": "IndicNLPTokenizer(\"ml\")", - "original_lang_name": "malayalam", - "original_lang_code": "mal", - "script": "Mlym", - "class_name": "IndicNLPTokenizer" - }, - "Taml": { - "full_object": "IndicNLPTokenizer(\"ta\")", - "original_lang_name": "tamil", - "original_lang_code": "tam", - "script": "Taml", - "class_name": "IndicNLPTokenizer" - } - }, + "family": "Dravidian", + "tokenizers": {}, "node_i": "3601", "native_tokenizers": [], "scripts": [] diff --git "a/data/East Bird\342\200\231s Head-Sentani.json" "b/data/East Bird\342\200\231s Head-Sentani.json" index 280aab322670d07da6a2c72292bc99e200c71fb5..7264b9f8bec7c74224eaa1058bdaa1613d69da50 100644 --- "a/data/East Bird\342\200\231s Head-Sentani.json" +++ "b/data/East Bird\342\200\231s Head-Sentani.json" @@ -1,24 +1,29 @@ { "name": "East Bird\u2019s Head-Sentani", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Burmeso", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Burmeso", + "depth": 2, "iso_1_code": null, "iso_3_code": "bzu", "children": [], + "family": "East Bird\u2019s Head-Sentani", "tokenizers": {}, "node_i": "3716", "native_tokenizers": [], "scripts": [] } ], + "family": "East Bird\u2019s Head-Sentani", "tokenizers": {}, "node_i": "3715", "native_tokenizers": [], @@ -26,19 +31,23 @@ }, { "name": "East Bird\u2019s Head", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mantion", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Sougb", + "depth": 3, "iso_1_code": null, "iso_3_code": "mnx", "children": [], + "family": "East Bird\u2019s Head-Sentani", "tokenizers": {}, "node_i": "3719", "native_tokenizers": [], @@ -47,6 +56,7 @@ ] } ], + "family": "East Bird\u2019s Head-Sentani", "tokenizers": {}, "node_i": "3718", "native_tokenizers": [], @@ -54,14 +64,17 @@ }, { "name": "Meax", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Meyah", + "depth": 3, "iso_1_code": null, "iso_3_code": "mej", "children": [], + "family": "East Bird\u2019s Head-Sentani", "tokenizers": {}, "node_i": "3721", "native_tokenizers": [], @@ -71,9 +84,11 @@ }, { "name": "Moskona", + "depth": 3, "iso_1_code": null, "iso_3_code": "mtj", "children": [], + "family": "East Bird\u2019s Head-Sentani", "tokenizers": {}, "node_i": "3722", "native_tokenizers": [], @@ -82,12 +97,14 @@ ] } ], + "family": "East Bird\u2019s Head-Sentani", "tokenizers": {}, "node_i": "3720", "native_tokenizers": [], "scripts": [] } ], + "family": "East Bird\u2019s Head-Sentani", "tokenizers": {}, "node_i": "3717", "native_tokenizers": [], @@ -95,25 +112,30 @@ }, { "name": "Sentani", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Demta", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Sowari", + "depth": 3, "iso_1_code": null, "iso_3_code": "dmy", "children": [], + "family": "East Bird\u2019s Head-Sentani", "tokenizers": {}, "node_i": "3725", "native_tokenizers": [], "scripts": [] } ], + "family": "East Bird\u2019s Head-Sentani", "tokenizers": {}, "node_i": "3724", "native_tokenizers": [], @@ -121,14 +143,17 @@ }, { "name": "Sentani Proper", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nafri", + "depth": 3, "iso_1_code": null, "iso_3_code": "nxx", "children": [], + "family": "East Bird\u2019s Head-Sentani", "tokenizers": {}, "node_i": "3727", "native_tokenizers": [], @@ -136,9 +161,11 @@ }, { "name": "Sentani", + "depth": 3, "iso_1_code": null, "iso_3_code": "set", "children": [], + "family": "East Bird\u2019s Head-Sentani", "tokenizers": {}, "node_i": "3728", "native_tokenizers": [], @@ -146,27 +173,32 @@ }, { "name": "Tabla", + "depth": 3, "iso_1_code": null, "iso_3_code": "tnm", "children": [], + "family": "East Bird\u2019s Head-Sentani", "tokenizers": {}, "node_i": "3729", "native_tokenizers": [], "scripts": [] } ], + "family": "East Bird\u2019s Head-Sentani", "tokenizers": {}, "node_i": "3726", "native_tokenizers": [], "scripts": [] } ], + "family": "East Bird\u2019s Head-Sentani", "tokenizers": {}, "node_i": "3723", "native_tokenizers": [], "scripts": [] } ], + "family": "East Bird\u2019s Head-Sentani", "tokenizers": {}, "node_i": "3714", "native_tokenizers": [], diff --git a/data/East Geelvink Bay.json b/data/East Geelvink Bay.json index ceac33343175b677d014e29c1434680a0174a299..5e2fcc4b8e14b3d3983b5205492d51932bf58c03 100644 --- a/data/East Geelvink Bay.json +++ b/data/East Geelvink Bay.json @@ -1,13 +1,16 @@ { "name": "East Geelvink Bay", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Anasi", + "depth": 1, "iso_1_code": null, "iso_3_code": "bpo", "children": [], + "family": "East Geelvink Bay", "tokenizers": {}, "node_i": "3731", "native_tokenizers": [], @@ -15,9 +18,11 @@ }, { "name": "Barapasi", + "depth": 1, "iso_1_code": null, "iso_3_code": "brp", "children": [], + "family": "East Geelvink Bay", "tokenizers": {}, "node_i": "3732", "native_tokenizers": [], @@ -25,9 +30,11 @@ }, { "name": "Burate", + "depth": 1, "iso_1_code": null, "iso_3_code": "bti", "children": [], + "family": "East Geelvink Bay", "tokenizers": {}, "node_i": "3733", "native_tokenizers": [], @@ -35,9 +42,11 @@ }, { "name": "Kehu", + "depth": 1, "iso_1_code": null, "iso_3_code": "khh", "children": [], + "family": "East Geelvink Bay", "tokenizers": {}, "node_i": "3734", "native_tokenizers": [], @@ -45,9 +54,11 @@ }, { "name": "Kofei", + "depth": 1, "iso_1_code": null, "iso_3_code": "kpi", "children": [], + "family": "East Geelvink Bay", "tokenizers": {}, "node_i": "3735", "native_tokenizers": [], @@ -55,9 +66,11 @@ }, { "name": "Nisa", + "depth": 1, "iso_1_code": null, "iso_3_code": "njs", "children": [], + "family": "East Geelvink Bay", "tokenizers": {}, "node_i": "3736", "native_tokenizers": [], @@ -65,9 +78,11 @@ }, { "name": "Sauri", + "depth": 1, "iso_1_code": null, "iso_3_code": "srt", "children": [], + "family": "East Geelvink Bay", "tokenizers": {}, "node_i": "3737", "native_tokenizers": [], @@ -75,9 +90,11 @@ }, { "name": "Tefaro", + "depth": 1, "iso_1_code": null, "iso_3_code": "tfo", "children": [], + "family": "East Geelvink Bay", "tokenizers": {}, "node_i": "3738", "native_tokenizers": [], @@ -85,9 +102,11 @@ }, { "name": "Tunggare", + "depth": 1, "iso_1_code": null, "iso_3_code": "trt", "children": [], + "family": "East Geelvink Bay", "tokenizers": {}, "node_i": "3739", "native_tokenizers": [], @@ -95,9 +114,11 @@ }, { "name": "Woria", + "depth": 1, "iso_1_code": null, "iso_3_code": "wor", "children": [], + "family": "East Geelvink Bay", "tokenizers": {}, "node_i": "3740", "native_tokenizers": [], @@ -105,14 +126,17 @@ }, { "name": "Bauzi", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bauzi", + "depth": 2, "iso_1_code": null, "iso_3_code": "bvz", "children": [], + "family": "East Geelvink Bay", "tokenizers": {}, "node_i": "3742", "native_tokenizers": [], @@ -122,21 +146,25 @@ }, { "name": "Demisa", + "depth": 2, "iso_1_code": null, "iso_3_code": "dei", "children": [], + "family": "East Geelvink Bay", "tokenizers": {}, "node_i": "3743", "native_tokenizers": [], "scripts": [] } ], + "family": "East Geelvink Bay", "tokenizers": {}, "node_i": "3741", "native_tokenizers": [], "scripts": [] } ], + "family": "East Geelvink Bay", "tokenizers": {}, "node_i": "3730", "native_tokenizers": [], diff --git a/data/East New Britain.json b/data/East New Britain.json index e5ff91418d465e56fdf7c255403bcc138d4e7a46..0250eb5472ece7a8c79e1a72c2e47b44155d3b53 100644 --- a/data/East New Britain.json +++ b/data/East New Britain.json @@ -1,18 +1,22 @@ { "name": "East New Britain", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Baining", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Qaqet", + "depth": 2, "iso_1_code": null, "iso_3_code": "byx", "children": [], + "family": "East New Britain", "tokenizers": {}, "node_i": "3746", "native_tokenizers": [], @@ -22,9 +26,11 @@ }, { "name": "Kairak", + "depth": 2, "iso_1_code": null, "iso_3_code": "ckr", "children": [], + "family": "East New Britain", "tokenizers": {}, "node_i": "3747", "native_tokenizers": [], @@ -32,9 +38,11 @@ }, { "name": "Mali", + "depth": 2, "iso_1_code": null, "iso_3_code": "gcc", "children": [], + "family": "East New Britain", "tokenizers": {}, "node_i": "3748", "native_tokenizers": [], @@ -42,9 +50,11 @@ }, { "name": "Simbali", + "depth": 2, "iso_1_code": null, "iso_3_code": "smg", "children": [], + "family": "East New Britain", "tokenizers": {}, "node_i": "3749", "native_tokenizers": [], @@ -52,9 +62,11 @@ }, { "name": "Ura", + "depth": 2, "iso_1_code": null, "iso_3_code": "uro", "children": [], + "family": "East New Britain", "tokenizers": {}, "node_i": "3750", "native_tokenizers": [], @@ -62,15 +74,18 @@ }, { "name": "Makolkol", + "depth": 2, "iso_1_code": null, "iso_3_code": "zmh", "children": [], + "family": "East New Britain", "tokenizers": {}, "node_i": "3751", "native_tokenizers": [], "scripts": [] } ], + "family": "East New Britain", "tokenizers": {}, "node_i": "3745", "native_tokenizers": [], @@ -78,26 +93,31 @@ }, { "name": "Taulil", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tulil", + "depth": 2, "iso_1_code": null, "iso_3_code": "tuh", "children": [], + "family": "East New Britain", "tokenizers": {}, "node_i": "3753", "native_tokenizers": [], "scripts": [] } ], + "family": "East New Britain", "tokenizers": {}, "node_i": "3752", "native_tokenizers": [], "scripts": [] } ], + "family": "East New Britain", "tokenizers": {}, "node_i": "3744", "native_tokenizers": [], diff --git a/data/Eastern Trans-Fly.json b/data/Eastern Trans-Fly.json index b8241944ee96dd6222a0118bc721b8cf406aeec6..e60d7caace060574bca7768eef2f884dd8149b12 100644 --- a/data/Eastern Trans-Fly.json +++ b/data/Eastern Trans-Fly.json @@ -1,13 +1,16 @@ { "name": "Eastern Trans-Fly", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bine", + "depth": 1, "iso_1_code": null, "iso_3_code": "bon", "children": [], + "family": "Eastern Trans-Fly", "tokenizers": {}, "node_i": "3755", "native_tokenizers": [], @@ -17,9 +20,11 @@ }, { "name": "Wipi", + "depth": 1, "iso_1_code": null, "iso_3_code": "gdr", "children": [], + "family": "Eastern Trans-Fly", "tokenizers": {}, "node_i": "3756", "native_tokenizers": [], @@ -29,9 +34,11 @@ }, { "name": "Gizrra", + "depth": 1, "iso_1_code": null, "iso_3_code": "tof", "children": [], + "family": "Eastern Trans-Fly", "tokenizers": {}, "node_i": "3757", "native_tokenizers": [], @@ -39,15 +46,18 @@ }, { "name": "Meriam Mir", + "depth": 1, "iso_1_code": null, "iso_3_code": "ulk", "children": [], + "family": "Eastern Trans-Fly", "tokenizers": {}, "node_i": "3758", "native_tokenizers": [], "scripts": [] } ], + "family": "Eastern Trans-Fly", "tokenizers": {}, "node_i": "3754", "native_tokenizers": [], diff --git a/data/Eskimo-Aleut.json b/data/Eskimo-Aleut.json index ed382da9be41656535f6ba2164db14c2119bd695..9cf11808c0c5bf09c4a053d1a5de6b8f3bd0f28e 100644 --- a/data/Eskimo-Aleut.json +++ b/data/Eskimo-Aleut.json @@ -1,24 +1,29 @@ { "name": "Eskimo-Aleut", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Aleut", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Aleut", + "depth": 2, "iso_1_code": null, "iso_3_code": "ale", "children": [], + "family": "Eskimo-Aleut", "tokenizers": {}, "node_i": "3761", "native_tokenizers": [], "scripts": [] } ], + "family": "Eskimo-Aleut", "tokenizers": {}, "node_i": "3760", "native_tokenizers": [], @@ -26,19 +31,23 @@ }, { "name": "Eskimo", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Inuit-Inupiaq", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Inupiatun, North Alaskan", + "depth": 3, "iso_1_code": "ik", "iso_3_code": "esi", "children": [], + "family": "Eskimo-Aleut", "tokenizers": {}, "node_i": "3764", "native_tokenizers": [], @@ -48,9 +57,11 @@ }, { "name": "Inupiatun, Northwest Alaska", + "depth": 3, "iso_1_code": "ik", "iso_3_code": "esk", "children": [], + "family": "Eskimo-Aleut", "tokenizers": {}, "node_i": "3765", "native_tokenizers": [], @@ -60,9 +71,11 @@ }, { "name": "Inuktitut, Eastern Canadian", + "depth": 3, "iso_1_code": "iu", "iso_3_code": "ike", "children": [], + "family": "Eskimo-Aleut", "tokenizers": {}, "node_i": "3766", "native_tokenizers": [], @@ -72,9 +85,11 @@ }, { "name": "Inuinnaqtun", + "depth": 3, "iso_1_code": "iu", "iso_3_code": "ikt", "children": [], + "family": "Eskimo-Aleut", "tokenizers": {}, "node_i": "3767", "native_tokenizers": [], @@ -84,9 +99,11 @@ }, { "name": "Greenlandic", + "depth": 3, "iso_1_code": "kl", "iso_3_code": "kal", "children": [], + "family": "Eskimo-Aleut", "tokenizers": {}, "node_i": "3768", "native_tokenizers": [], @@ -95,6 +112,7 @@ ] } ], + "family": "Eskimo-Aleut", "tokenizers": {}, "node_i": "3763", "native_tokenizers": [], @@ -102,14 +120,17 @@ }, { "name": "Yupik", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Yupik, Saint Lawrence Island", + "depth": 3, "iso_1_code": null, "iso_3_code": "ess", "children": [], + "family": "Eskimo-Aleut", "tokenizers": {}, "node_i": "3770", "native_tokenizers": [], @@ -119,9 +140,11 @@ }, { "name": "Yupik, Naukan", + "depth": 3, "iso_1_code": null, "iso_3_code": "ynk", "children": [], + "family": "Eskimo-Aleut", "tokenizers": {}, "node_i": "3771", "native_tokenizers": [], @@ -129,9 +152,11 @@ }, { "name": "Yupik, Sirenik", + "depth": 3, "iso_1_code": null, "iso_3_code": "ysr", "children": [], + "family": "Eskimo-Aleut", "tokenizers": {}, "node_i": "3772", "native_tokenizers": [], @@ -139,14 +164,17 @@ }, { "name": "Alaskan Yupik", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Yupik, Pacific Gulf", + "depth": 4, "iso_1_code": null, "iso_3_code": "ems", "children": [], + "family": "Eskimo-Aleut", "tokenizers": {}, "node_i": "3774", "native_tokenizers": [], @@ -154,9 +182,11 @@ }, { "name": "Yupik, Central", + "depth": 4, "iso_1_code": null, "iso_3_code": "esu", "children": [], + "family": "Eskimo-Aleut", "tokenizers": {}, "node_i": "3775", "native_tokenizers": [], @@ -165,24 +195,28 @@ ] } ], + "family": "Eskimo-Aleut", "tokenizers": {}, "node_i": "3773", "native_tokenizers": [], "scripts": [] } ], + "family": "Eskimo-Aleut", "tokenizers": {}, "node_i": "3769", "native_tokenizers": [], "scripts": [] } ], + "family": "Eskimo-Aleut", "tokenizers": {}, "node_i": "3762", "native_tokenizers": [], "scripts": [] } ], + "family": "Eskimo-Aleut", "tokenizers": {}, "node_i": "3759", "native_tokenizers": [], diff --git a/data/Eyak-Athabaskan.json b/data/Eyak-Athabaskan.json index ab9db9be76e613f0cd68ac30b08dfa12405c1151..321a5f167dd0e1d79eb8f4e6b5b70c39e1c6f57c 100644 --- a/data/Eyak-Athabaskan.json +++ b/data/Eyak-Athabaskan.json @@ -1,13 +1,16 @@ { "name": "Eyak-Athabaskan", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Eyak", + "depth": 1, "iso_1_code": null, "iso_3_code": "eya", "children": [], + "family": "Eyak-Athabaskan", "tokenizers": {}, "node_i": "3777", "native_tokenizers": [], @@ -15,19 +18,23 @@ }, { "name": "Athabaskan", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Apachean", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Navajo", + "depth": 3, "iso_1_code": "nv", "iso_3_code": "nav", "children": [], + "family": "Eyak-Athabaskan", "tokenizers": {}, "node_i": "3780", "native_tokenizers": [], @@ -37,14 +44,17 @@ }, { "name": "Apache", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Apache, Jicarilla", + "depth": 4, "iso_1_code": null, "iso_3_code": "apj", "children": [], + "family": "Eyak-Athabaskan", "tokenizers": {}, "node_i": "3782", "native_tokenizers": [], @@ -52,9 +62,11 @@ }, { "name": "Apache, Kiowa", + "depth": 4, "iso_1_code": null, "iso_3_code": "apk", "children": [], + "family": "Eyak-Athabaskan", "tokenizers": {}, "node_i": "3783", "native_tokenizers": [], @@ -62,9 +74,11 @@ }, { "name": "Apache, Lipan", + "depth": 4, "iso_1_code": null, "iso_3_code": "apl", "children": [], + "family": "Eyak-Athabaskan", "tokenizers": {}, "node_i": "3784", "native_tokenizers": [], @@ -72,9 +86,11 @@ }, { "name": "Apache, Mescalero-Chiricahua", + "depth": 4, "iso_1_code": null, "iso_3_code": "apm", "children": [], + "family": "Eyak-Athabaskan", "tokenizers": {}, "node_i": "3785", "native_tokenizers": [], @@ -82,9 +98,11 @@ }, { "name": "Apache, Western", + "depth": 4, "iso_1_code": null, "iso_3_code": "apw", "children": [], + "family": "Eyak-Athabaskan", "tokenizers": {}, "node_i": "3786", "native_tokenizers": [], @@ -93,12 +111,14 @@ ] } ], + "family": "Eyak-Athabaskan", "tokenizers": {}, "node_i": "3781", "native_tokenizers": [], "scripts": [] } ], + "family": "Eyak-Athabaskan", "tokenizers": {}, "node_i": "3779", "native_tokenizers": [], @@ -106,14 +126,17 @@ }, { "name": "Northern Athabaskan", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ahtena", + "depth": 3, "iso_1_code": null, "iso_3_code": "aht", "children": [], + "family": "Eyak-Athabaskan", "tokenizers": {}, "node_i": "3788", "native_tokenizers": [], @@ -121,9 +144,11 @@ }, { "name": "Babine", + "depth": 3, "iso_1_code": null, "iso_3_code": "bcr", "children": [], + "family": "Eyak-Athabaskan", "tokenizers": {}, "node_i": "3789", "native_tokenizers": [], @@ -131,9 +156,11 @@ }, { "name": "Beaver", + "depth": 3, "iso_1_code": null, "iso_3_code": "bea", "children": [], + "family": "Eyak-Athabaskan", "tokenizers": {}, "node_i": "3790", "native_tokenizers": [], @@ -143,9 +170,11 @@ }, { "name": "Dene", + "depth": 3, "iso_1_code": null, "iso_3_code": "chp", "children": [], + "family": "Eyak-Athabaskan", "tokenizers": {}, "node_i": "3791", "native_tokenizers": [], @@ -153,9 +182,11 @@ }, { "name": "Chilcotin", + "depth": 3, "iso_1_code": null, "iso_3_code": "clc", "children": [], + "family": "Eyak-Athabaskan", "tokenizers": {}, "node_i": "3792", "native_tokenizers": [], @@ -163,9 +194,11 @@ }, { "name": "Tlicho", + "depth": 3, "iso_1_code": null, "iso_3_code": "dgr", "children": [], + "family": "Eyak-Athabaskan", "tokenizers": {}, "node_i": "3793", "native_tokenizers": [], @@ -175,9 +208,11 @@ }, { "name": "Gwich\u2019in", + "depth": 3, "iso_1_code": null, "iso_3_code": "gwi", "children": [], + "family": "Eyak-Athabaskan", "tokenizers": {}, "node_i": "3794", "native_tokenizers": [], @@ -187,9 +222,11 @@ }, { "name": "Han", + "depth": 3, "iso_1_code": null, "iso_3_code": "haa", "children": [], + "family": "Eyak-Athabaskan", "tokenizers": {}, "node_i": "3795", "native_tokenizers": [], @@ -197,9 +234,11 @@ }, { "name": "Holikachuk", + "depth": 3, "iso_1_code": null, "iso_3_code": "hoi", "children": [], + "family": "Eyak-Athabaskan", "tokenizers": {}, "node_i": "3796", "native_tokenizers": [], @@ -207,9 +246,11 @@ }, { "name": "Deg Xinag", + "depth": 3, "iso_1_code": null, "iso_3_code": "ing", "children": [], + "family": "Eyak-Athabaskan", "tokenizers": {}, "node_i": "3797", "native_tokenizers": [], @@ -217,9 +258,11 @@ }, { "name": "Koyukon", + "depth": 3, "iso_1_code": null, "iso_3_code": "koy", "children": [], + "family": "Eyak-Athabaskan", "tokenizers": {}, "node_i": "3798", "native_tokenizers": [], @@ -227,9 +270,11 @@ }, { "name": "Kuskokwim, Upper", + "depth": 3, "iso_1_code": null, "iso_3_code": "kuu", "children": [], + "family": "Eyak-Athabaskan", "tokenizers": {}, "node_i": "3799", "native_tokenizers": [], @@ -237,9 +282,11 @@ }, { "name": "Sekani", + "depth": 3, "iso_1_code": null, "iso_3_code": "sek", "children": [], + "family": "Eyak-Athabaskan", "tokenizers": {}, "node_i": "3800", "native_tokenizers": [], @@ -247,9 +294,11 @@ }, { "name": "Sarsi", + "depth": 3, "iso_1_code": null, "iso_3_code": "srs", "children": [], + "family": "Eyak-Athabaskan", "tokenizers": {}, "node_i": "3801", "native_tokenizers": [], @@ -257,9 +306,11 @@ }, { "name": "Tanana, Lower", + "depth": 3, "iso_1_code": null, "iso_3_code": "taa", "children": [], + "family": "Eyak-Athabaskan", "tokenizers": {}, "node_i": "3802", "native_tokenizers": [], @@ -267,9 +318,11 @@ }, { "name": "Tanana, Upper", + "depth": 3, "iso_1_code": null, "iso_3_code": "tau", "children": [], + "family": "Eyak-Athabaskan", "tokenizers": {}, "node_i": "3803", "native_tokenizers": [], @@ -277,9 +330,11 @@ }, { "name": "Tanacross", + "depth": 3, "iso_1_code": null, "iso_3_code": "tcb", "children": [], + "family": "Eyak-Athabaskan", "tokenizers": {}, "node_i": "3804", "native_tokenizers": [], @@ -287,9 +342,11 @@ }, { "name": "Tanaina", + "depth": 3, "iso_1_code": null, "iso_3_code": "tfn", "children": [], + "family": "Eyak-Athabaskan", "tokenizers": {}, "node_i": "3805", "native_tokenizers": [], @@ -297,9 +354,11 @@ }, { "name": "Tsetsaut", + "depth": 3, "iso_1_code": null, "iso_3_code": "txc", "children": [], + "family": "Eyak-Athabaskan", "tokenizers": {}, "node_i": "3806", "native_tokenizers": [], @@ -307,14 +366,17 @@ }, { "name": "Carrier", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Carrier, Southern", + "depth": 4, "iso_1_code": null, "iso_3_code": "caf", "children": [], + "family": "Eyak-Athabaskan", "tokenizers": {}, "node_i": "3808", "native_tokenizers": [], @@ -324,9 +386,11 @@ }, { "name": "Carrier", + "depth": 4, "iso_1_code": null, "iso_3_code": "crx", "children": [], + "family": "Eyak-Athabaskan", "tokenizers": {}, "node_i": "3809", "native_tokenizers": [], @@ -335,6 +399,7 @@ ] } ], + "family": "Eyak-Athabaskan", "tokenizers": {}, "node_i": "3807", "native_tokenizers": [], @@ -342,14 +407,17 @@ }, { "name": "Slavey-Hare", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Slavey, North", + "depth": 4, "iso_1_code": null, "iso_3_code": "scs", "children": [], + "family": "Eyak-Athabaskan", "tokenizers": {}, "node_i": "3811", "native_tokenizers": [], @@ -357,15 +425,18 @@ }, { "name": "Slavey, South", + "depth": 4, "iso_1_code": null, "iso_3_code": "xsl", "children": [], + "family": "Eyak-Athabaskan", "tokenizers": {}, "node_i": "3812", "native_tokenizers": [], "scripts": [] } ], + "family": "Eyak-Athabaskan", "tokenizers": {}, "node_i": "3810", "native_tokenizers": [], @@ -373,14 +444,17 @@ }, { "name": "Tahltan", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kaska", + "depth": 4, "iso_1_code": null, "iso_3_code": "kkz", "children": [], + "family": "Eyak-Athabaskan", "tokenizers": {}, "node_i": "3814", "native_tokenizers": [], @@ -388,9 +462,11 @@ }, { "name": "Tagish", + "depth": 4, "iso_1_code": null, "iso_3_code": "tgx", "children": [], + "family": "Eyak-Athabaskan", "tokenizers": {}, "node_i": "3815", "native_tokenizers": [], @@ -398,15 +474,18 @@ }, { "name": "Tahltan", + "depth": 4, "iso_1_code": null, "iso_3_code": "tht", "children": [], + "family": "Eyak-Athabaskan", "tokenizers": {}, "node_i": "3816", "native_tokenizers": [], "scripts": [] } ], + "family": "Eyak-Athabaskan", "tokenizers": {}, "node_i": "3813", "native_tokenizers": [], @@ -414,14 +493,17 @@ }, { "name": "Tuchone", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tutchone, Southern", + "depth": 4, "iso_1_code": null, "iso_3_code": "tce", "children": [], + "family": "Eyak-Athabaskan", "tokenizers": {}, "node_i": "3818", "native_tokenizers": [], @@ -429,21 +511,25 @@ }, { "name": "Tutchone, Northern", + "depth": 4, "iso_1_code": null, "iso_3_code": "ttm", "children": [], + "family": "Eyak-Athabaskan", "tokenizers": {}, "node_i": "3819", "native_tokenizers": [], "scripts": [] } ], + "family": "Eyak-Athabaskan", "tokenizers": {}, "node_i": "3817", "native_tokenizers": [], "scripts": [] } ], + "family": "Eyak-Athabaskan", "tokenizers": {}, "node_i": "3787", "native_tokenizers": [], @@ -451,14 +537,17 @@ }, { "name": "Pacific Coast Athabaskan", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kwalhioqua-Tlatskanai", + "depth": 3, "iso_1_code": null, "iso_3_code": "qwt", "children": [], + "family": "Eyak-Athabaskan", "tokenizers": {}, "node_i": "3821", "native_tokenizers": [], @@ -466,14 +555,17 @@ }, { "name": "California Athabaskan", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Hupa", + "depth": 4, "iso_1_code": null, "iso_3_code": "hup", "children": [], + "family": "Eyak-Athabaskan", "tokenizers": {}, "node_i": "3823", "native_tokenizers": [], @@ -481,9 +573,11 @@ }, { "name": "Kato", + "depth": 4, "iso_1_code": null, "iso_3_code": "ktw", "children": [], + "family": "Eyak-Athabaskan", "tokenizers": {}, "node_i": "3824", "native_tokenizers": [], @@ -491,9 +585,11 @@ }, { "name": "Mattole", + "depth": 4, "iso_1_code": null, "iso_3_code": "mvb", "children": [], + "family": "Eyak-Athabaskan", "tokenizers": {}, "node_i": "3825", "native_tokenizers": [], @@ -501,15 +597,18 @@ }, { "name": "Wailaki", + "depth": 4, "iso_1_code": null, "iso_3_code": "wlk", "children": [], + "family": "Eyak-Athabaskan", "tokenizers": {}, "node_i": "3826", "native_tokenizers": [], "scripts": [] } ], + "family": "Eyak-Athabaskan", "tokenizers": {}, "node_i": "3822", "native_tokenizers": [], @@ -517,14 +616,17 @@ }, { "name": "Oregon Athabaskan", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Galice", + "depth": 4, "iso_1_code": null, "iso_3_code": "gce", "children": [], + "family": "Eyak-Athabaskan", "tokenizers": {}, "node_i": "3828", "native_tokenizers": [], @@ -532,9 +634,11 @@ }, { "name": "Upper Umpqua", + "depth": 4, "iso_1_code": null, "iso_3_code": "xup", "children": [], + "family": "Eyak-Athabaskan", "tokenizers": {}, "node_i": "3829", "native_tokenizers": [], @@ -542,14 +646,17 @@ }, { "name": "Tolowa-Chetco", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chetco", + "depth": 5, "iso_1_code": null, "iso_3_code": "ctc", "children": [], + "family": "Eyak-Athabaskan", "tokenizers": {}, "node_i": "3831", "native_tokenizers": [], @@ -557,15 +664,18 @@ }, { "name": "Tolowa", + "depth": 5, "iso_1_code": null, "iso_3_code": "tol", "children": [], + "family": "Eyak-Athabaskan", "tokenizers": {}, "node_i": "3832", "native_tokenizers": [], "scripts": [] } ], + "family": "Eyak-Athabaskan", "tokenizers": {}, "node_i": "3830", "native_tokenizers": [], @@ -573,14 +683,17 @@ }, { "name": "Tututni-Chasta Costa-Coquille", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Coquille", + "depth": 5, "iso_1_code": null, "iso_3_code": "coq", "children": [], + "family": "Eyak-Athabaskan", "tokenizers": {}, "node_i": "3834", "native_tokenizers": [], @@ -588,33 +701,39 @@ }, { "name": "Tututni", + "depth": 5, "iso_1_code": null, "iso_3_code": "tuu", "children": [], + "family": "Eyak-Athabaskan", "tokenizers": {}, "node_i": "3835", "native_tokenizers": [], "scripts": [] } ], + "family": "Eyak-Athabaskan", "tokenizers": {}, "node_i": "3833", "native_tokenizers": [], "scripts": [] } ], + "family": "Eyak-Athabaskan", "tokenizers": {}, "node_i": "3827", "native_tokenizers": [], "scripts": [] } ], + "family": "Eyak-Athabaskan", "tokenizers": {}, "node_i": "3820", "native_tokenizers": [], "scripts": [] } ], + "family": "Eyak-Athabaskan", "tokenizers": {}, "node_i": "3778", "native_tokenizers": [], @@ -622,26 +741,31 @@ }, { "name": "Tlingit", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tlingit", + "depth": 2, "iso_1_code": null, "iso_3_code": "tli", "children": [], + "family": "Eyak-Athabaskan", "tokenizers": {}, "node_i": "3837", "native_tokenizers": [], "scripts": [] } ], + "family": "Eyak-Athabaskan", "tokenizers": {}, "node_i": "3836", "native_tokenizers": [], "scripts": [] } ], + "family": "Eyak-Athabaskan", "tokenizers": {}, "node_i": "3776", "native_tokenizers": [], diff --git a/data/Fas.json b/data/Fas.json index 39a3732a5caa6a7bb7b81adbb4d297f643068f02..4a5f5e105e3f5b8bb0bab5113b241b3ee1f0ee05 100644 --- a/data/Fas.json +++ b/data/Fas.json @@ -1,13 +1,16 @@ { "name": "Fas", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Baibai", + "depth": 1, "iso_1_code": null, "iso_3_code": "bbf", "children": [], + "family": "Fas", "tokenizers": {}, "node_i": "3839", "native_tokenizers": [], @@ -15,15 +18,18 @@ }, { "name": "Momu", + "depth": 1, "iso_1_code": null, "iso_3_code": "fqs", "children": [], + "family": "Fas", "tokenizers": {}, "node_i": "3840", "native_tokenizers": [], "scripts": [] } ], + "family": "Fas", "tokenizers": {}, "node_i": "3838", "native_tokenizers": [], diff --git a/data/Guajiboan.json b/data/Guajiboan.json index 8b80d8cffcdcb278fa690e5f8abe98856c25cfef..dcf218a94db2a6a341b8e2601a0a4e9411fa8976 100644 --- a/data/Guajiboan.json +++ b/data/Guajiboan.json @@ -1,13 +1,16 @@ { "name": "Guajiboan", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Cuiba", + "depth": 1, "iso_1_code": null, "iso_3_code": "cui", "children": [], + "family": "Guajiboan", "tokenizers": {}, "node_i": "3842", "native_tokenizers": [], @@ -17,9 +20,11 @@ }, { "name": "Guayabero", + "depth": 1, "iso_1_code": null, "iso_3_code": "guo", "children": [], + "family": "Guajiboan", "tokenizers": {}, "node_i": "3843", "native_tokenizers": [], @@ -29,14 +34,17 @@ }, { "name": "Guajibo", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Playero", + "depth": 2, "iso_1_code": null, "iso_3_code": "gob", "children": [], + "family": "Guajiboan", "tokenizers": {}, "node_i": "3845", "native_tokenizers": [], @@ -44,9 +52,11 @@ }, { "name": "Guahibo", + "depth": 2, "iso_1_code": null, "iso_3_code": "guh", "children": [], + "family": "Guajiboan", "tokenizers": {}, "node_i": "3846", "native_tokenizers": [], @@ -56,21 +66,25 @@ }, { "name": "Macagu\u00e1n", + "depth": 2, "iso_1_code": null, "iso_3_code": "mbn", "children": [], + "family": "Guajiboan", "tokenizers": {}, "node_i": "3847", "native_tokenizers": [], "scripts": [] } ], + "family": "Guajiboan", "tokenizers": {}, "node_i": "3844", "native_tokenizers": [], "scripts": [] } ], + "family": "Guajiboan", "tokenizers": {}, "node_i": "3841", "native_tokenizers": [], diff --git a/data/Guaykuruan.json b/data/Guaykuruan.json index c28cd75a192ee4c699bff7789d783721f410b765..548c08ab291c80ba99a356e1d7d6d670e5ba43e6 100644 --- a/data/Guaykuruan.json +++ b/data/Guaykuruan.json @@ -1,18 +1,22 @@ { "name": "Guaykuruan", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Guaykur\u00fa", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Abipon", + "depth": 2, "iso_1_code": null, "iso_3_code": "axb", "children": [], + "family": "Guaykuruan", "tokenizers": {}, "node_i": "3850", "native_tokenizers": [], @@ -20,9 +24,11 @@ }, { "name": "Kadiw\u00e9u", + "depth": 2, "iso_1_code": null, "iso_3_code": "kbc", "children": [], + "family": "Guaykuruan", "tokenizers": {}, "node_i": "3851", "native_tokenizers": [], @@ -31,6 +37,7 @@ ] } ], + "family": "Guaykuruan", "tokenizers": {}, "node_i": "3849", "native_tokenizers": [], @@ -38,14 +45,17 @@ }, { "name": "Southern", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mocov\u00ed", + "depth": 2, "iso_1_code": null, "iso_3_code": "moc", "children": [], + "family": "Guaykuruan", "tokenizers": {}, "node_i": "3853", "native_tokenizers": [], @@ -55,9 +65,11 @@ }, { "name": "Pilag\u00e1", + "depth": 2, "iso_1_code": null, "iso_3_code": "plg", "children": [], + "family": "Guaykuruan", "tokenizers": {}, "node_i": "3854", "native_tokenizers": [], @@ -67,9 +79,11 @@ }, { "name": "Toba", + "depth": 2, "iso_1_code": null, "iso_3_code": "tob", "children": [], + "family": "Guaykuruan", "tokenizers": {}, "node_i": "3855", "native_tokenizers": [], @@ -78,12 +92,14 @@ ] } ], + "family": "Guaykuruan", "tokenizers": {}, "node_i": "3852", "native_tokenizers": [], "scripts": [] } ], + "family": "Guaykuruan", "tokenizers": {}, "node_i": "3848", "native_tokenizers": [], diff --git a/data/Gum.json b/data/Gum.json index ffff97f25c21c9bd5c19b297571af9533556f184..18a23a98b3b4056554076eaa51636a62c895330f 100644 --- a/data/Gum.json +++ b/data/Gum.json @@ -1,8 +1,10 @@ { "name": "Gum", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [], + "family": "Gum", "tokenizers": {}, "node_i": "3856", "native_tokenizers": [], diff --git a/data/Haida.json b/data/Haida.json index 8fc9c8927b2dbbea17e605afa3aae512e6fc606a..69a9377ab20485d54cf1efa212f10cffdc2a3d43 100644 --- a/data/Haida.json +++ b/data/Haida.json @@ -1,13 +1,16 @@ { "name": "Haida", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Haida, Southern", + "depth": 1, "iso_1_code": null, "iso_3_code": "hax", "children": [], + "family": "Haida", "tokenizers": {}, "node_i": "3858", "native_tokenizers": [], @@ -15,15 +18,18 @@ }, { "name": "Haida, Northern", + "depth": 1, "iso_1_code": null, "iso_3_code": "hdn", "children": [], + "family": "Haida", "tokenizers": {}, "node_i": "3859", "native_tokenizers": [], "scripts": [] } ], + "family": "Haida", "tokenizers": {}, "node_i": "3857", "native_tokenizers": [], diff --git "a/data/Har\303\241kmbut.json" "b/data/Har\303\241kmbut.json" index c251545926c32a28faa3881b144d127cce281440..bc90276c9a0fd15faf69cec1db8ea287dc2a736e 100644 --- "a/data/Har\303\241kmbut.json" +++ "b/data/Har\303\241kmbut.json" @@ -1,13 +1,16 @@ { "name": "Har\u00e1kmbut", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Amarakaeri", + "depth": 1, "iso_1_code": null, "iso_3_code": "amr", "children": [], + "family": "Har\u00e1kmbut", "tokenizers": {}, "node_i": "3861", "native_tokenizers": [], @@ -17,15 +20,18 @@ }, { "name": "Huachipaeri", + "depth": 1, "iso_1_code": null, "iso_3_code": "hug", "children": [], + "family": "Har\u00e1kmbut", "tokenizers": {}, "node_i": "3862", "native_tokenizers": [], "scripts": [] } ], + "family": "Har\u00e1kmbut", "tokenizers": {}, "node_i": "3860", "native_tokenizers": [], diff --git a/data/Hmong-Mien.json b/data/Hmong-Mien.json index 28b10277b538f4dda0314dfc6e94230b08263a3b..63d24f20aa99ba3d3298e90fb339482fc6ad4d29 100644 --- a/data/Hmong-Mien.json +++ b/data/Hmong-Mien.json @@ -1,23 +1,28 @@ { "name": "Hmong-Mien", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Hmongic", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bunu", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bunu, Younuo", + "depth": 3, "iso_1_code": null, "iso_3_code": "buh", "children": [], + "family": "Hmong-Mien", "tokenizers": {}, "node_i": "3866", "native_tokenizers": [], @@ -25,9 +30,11 @@ }, { "name": "Bunu, Wunai", + "depth": 3, "iso_1_code": null, "iso_3_code": "bwn", "children": [], + "family": "Hmong-Mien", "tokenizers": {}, "node_i": "3867", "native_tokenizers": [], @@ -35,9 +42,11 @@ }, { "name": "Bunu, Bu-Nao", + "depth": 3, "iso_1_code": null, "iso_3_code": "bwx", "children": [], + "family": "Hmong-Mien", "tokenizers": {}, "node_i": "3868", "native_tokenizers": [], @@ -45,15 +54,18 @@ }, { "name": "Bunu, Jiongnai", + "depth": 3, "iso_1_code": null, "iso_3_code": "pnu", "children": [], + "family": "Hmong-Mien", "tokenizers": {}, "node_i": "3869", "native_tokenizers": [], "scripts": [] } ], + "family": "Hmong-Mien", "tokenizers": {}, "node_i": "3865", "native_tokenizers": [], @@ -61,14 +73,17 @@ }, { "name": "Chuanqiandian", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Miao, Chuanqiandian Cluster", + "depth": 3, "iso_1_code": null, "iso_3_code": "cqd", "children": [], + "family": "Hmong-Mien", "tokenizers": {}, "node_i": "3871", "native_tokenizers": [], @@ -76,9 +91,11 @@ }, { "name": "Miao, Southern Mashan", + "depth": 3, "iso_1_code": null, "iso_3_code": "hma", "children": [], + "family": "Hmong-Mien", "tokenizers": {}, "node_i": "3872", "native_tokenizers": [], @@ -86,9 +103,11 @@ }, { "name": "Miao, Central Huishui", + "depth": 3, "iso_1_code": null, "iso_3_code": "hmc", "children": [], + "family": "Hmong-Mien", "tokenizers": {}, "node_i": "3873", "native_tokenizers": [], @@ -96,9 +115,11 @@ }, { "name": "Miao, Large Flowery", + "depth": 3, "iso_1_code": null, "iso_3_code": "hmd", "children": [], + "family": "Hmong-Mien", "tokenizers": {}, "node_i": "3874", "native_tokenizers": [], @@ -106,9 +127,11 @@ }, { "name": "Miao, Eastern Huishui", + "depth": 3, "iso_1_code": null, "iso_3_code": "hme", "children": [], + "family": "Hmong-Mien", "tokenizers": {}, "node_i": "3875", "native_tokenizers": [], @@ -116,9 +139,11 @@ }, { "name": "Hmong Don", + "depth": 3, "iso_1_code": null, "iso_3_code": "hmf", "children": [], + "family": "Hmong-Mien", "tokenizers": {}, "node_i": "3876", "native_tokenizers": [], @@ -126,9 +151,11 @@ }, { "name": "Miao, Southwestern Guiyang", + "depth": 3, "iso_1_code": null, "iso_3_code": "hmg", "children": [], + "family": "Hmong-Mien", "tokenizers": {}, "node_i": "3877", "native_tokenizers": [], @@ -136,9 +163,11 @@ }, { "name": "Miao, Southwestern Huishui", + "depth": 3, "iso_1_code": null, "iso_3_code": "hmh", "children": [], + "family": "Hmong-Mien", "tokenizers": {}, "node_i": "3878", "native_tokenizers": [], @@ -146,9 +175,11 @@ }, { "name": "Miao, Northern Huishui", + "depth": 3, "iso_1_code": null, "iso_3_code": "hmi", "children": [], + "family": "Hmong-Mien", "tokenizers": {}, "node_i": "3879", "native_tokenizers": [], @@ -156,9 +187,11 @@ }, { "name": "Ge", + "depth": 3, "iso_1_code": null, "iso_3_code": "hmj", "children": [], + "family": "Hmong-Mien", "tokenizers": {}, "node_i": "3880", "native_tokenizers": [], @@ -166,9 +199,11 @@ }, { "name": "Miao, Luopohe", + "depth": 3, "iso_1_code": null, "iso_3_code": "hml", "children": [], + "family": "Hmong-Mien", "tokenizers": {}, "node_i": "3881", "native_tokenizers": [], @@ -176,9 +211,11 @@ }, { "name": "Miao, Central Mashan", + "depth": 3, "iso_1_code": null, "iso_3_code": "hmm", "children": [], + "family": "Hmong-Mien", "tokenizers": {}, "node_i": "3882", "native_tokenizers": [], @@ -186,9 +223,11 @@ }, { "name": "Miao, Northern Mashan", + "depth": 3, "iso_1_code": null, "iso_3_code": "hmp", "children": [], + "family": "Hmong-Mien", "tokenizers": {}, "node_i": "3883", "native_tokenizers": [], @@ -196,9 +235,11 @@ }, { "name": "Hmong D\u00f4", + "depth": 3, "iso_1_code": null, "iso_3_code": "hmv", "children": [], + "family": "Hmong-Mien", "tokenizers": {}, "node_i": "3884", "native_tokenizers": [], @@ -206,9 +247,11 @@ }, { "name": "Miao, Western Mashan", + "depth": 3, "iso_1_code": null, "iso_3_code": "hmw", "children": [], + "family": "Hmong-Mien", "tokenizers": {}, "node_i": "3885", "native_tokenizers": [], @@ -216,9 +259,11 @@ }, { "name": "Miao, Southern Guiyang", + "depth": 3, "iso_1_code": null, "iso_3_code": "hmy", "children": [], + "family": "Hmong-Mien", "tokenizers": {}, "node_i": "3886", "native_tokenizers": [], @@ -226,9 +271,11 @@ }, { "name": "Sinicized Miao", + "depth": 3, "iso_1_code": null, "iso_3_code": "hmz", "children": [], + "family": "Hmong-Mien", "tokenizers": {}, "node_i": "3887", "native_tokenizers": [], @@ -236,9 +283,11 @@ }, { "name": "Hmong Njua", + "depth": 3, "iso_1_code": null, "iso_3_code": "hnj", "children": [], + "family": "Hmong-Mien", "tokenizers": {}, "node_i": "3888", "native_tokenizers": [], @@ -248,9 +297,11 @@ }, { "name": "Miao, Horned", + "depth": 3, "iso_1_code": null, "iso_3_code": "hrm", "children": [], + "family": "Hmong-Mien", "tokenizers": {}, "node_i": "3889", "native_tokenizers": [], @@ -258,9 +309,11 @@ }, { "name": "Miao, Northern Guiyang", + "depth": 3, "iso_1_code": null, "iso_3_code": "huj", "children": [], + "family": "Hmong-Mien", "tokenizers": {}, "node_i": "3890", "native_tokenizers": [], @@ -268,9 +321,11 @@ }, { "name": "Hmong Daw", + "depth": 3, "iso_1_code": null, "iso_3_code": "mww", "children": [], + "family": "Hmong-Mien", "tokenizers": {}, "node_i": "3891", "native_tokenizers": [], @@ -280,15 +335,18 @@ }, { "name": "Miao, Small Flowery", + "depth": 3, "iso_1_code": null, "iso_3_code": "sfm", "children": [], + "family": "Hmong-Mien", "tokenizers": {}, "node_i": "3892", "native_tokenizers": [], "scripts": [] } ], + "family": "Hmong-Mien", "tokenizers": {}, "node_i": "3870", "native_tokenizers": [], @@ -296,20 +354,24 @@ }, { "name": "Pa-hng", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Pa-Hng", + "depth": 3, "iso_1_code": null, "iso_3_code": "pha", "children": [], + "family": "Hmong-Mien", "tokenizers": {}, "node_i": "3894", "native_tokenizers": [], "scripts": [] } ], + "family": "Hmong-Mien", "tokenizers": {}, "node_i": "3893", "native_tokenizers": [], @@ -317,14 +379,17 @@ }, { "name": "Qiandong", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Miao, Northern Qiandong", + "depth": 3, "iso_1_code": null, "iso_3_code": "hea", "children": [], + "family": "Hmong-Mien", "tokenizers": {}, "node_i": "3896", "native_tokenizers": [], @@ -332,9 +397,11 @@ }, { "name": "Miao, Eastern Qiandong", + "depth": 3, "iso_1_code": null, "iso_3_code": "hmq", "children": [], + "family": "Hmong-Mien", "tokenizers": {}, "node_i": "3897", "native_tokenizers": [], @@ -342,9 +409,11 @@ }, { "name": "Miao, Southern Qiandong", + "depth": 3, "iso_1_code": null, "iso_3_code": "hms", "children": [], + "family": "Hmong-Mien", "tokenizers": {}, "node_i": "3898", "native_tokenizers": [], @@ -352,15 +421,18 @@ }, { "name": "N\u00e1-Meo", + "depth": 3, "iso_1_code": null, "iso_3_code": "neo", "children": [], + "family": "Hmong-Mien", "tokenizers": {}, "node_i": "3899", "native_tokenizers": [], "scripts": [] } ], + "family": "Hmong-Mien", "tokenizers": {}, "node_i": "3895", "native_tokenizers": [], @@ -368,14 +440,17 @@ }, { "name": "Xiangxi", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Miao, Western Xiangxi", + "depth": 3, "iso_1_code": null, "iso_3_code": "mmr", "children": [], + "family": "Hmong-Mien", "tokenizers": {}, "node_i": "3901", "native_tokenizers": [], @@ -383,21 +458,25 @@ }, { "name": "Miao, Eastern Xiangxi", + "depth": 3, "iso_1_code": null, "iso_3_code": "muq", "children": [], + "family": "Hmong-Mien", "tokenizers": {}, "node_i": "3902", "native_tokenizers": [], "scripts": [] } ], + "family": "Hmong-Mien", "tokenizers": {}, "node_i": "3900", "native_tokenizers": [], "scripts": [] } ], + "family": "Hmong-Mien", "tokenizers": {}, "node_i": "3864", "native_tokenizers": [], @@ -405,20 +484,24 @@ }, { "name": "Ho Nte", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "She", + "depth": 2, "iso_1_code": null, "iso_3_code": "shx", "children": [], + "family": "Hmong-Mien", "tokenizers": {}, "node_i": "3904", "native_tokenizers": [], "scripts": [] } ], + "family": "Hmong-Mien", "tokenizers": {}, "node_i": "3903", "native_tokenizers": [], @@ -426,25 +509,30 @@ }, { "name": "Mienic", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Biao-Jiao", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Biao-Jiao Mien", + "depth": 3, "iso_1_code": null, "iso_3_code": "bje", "children": [], + "family": "Hmong-Mien", "tokenizers": {}, "node_i": "3907", "native_tokenizers": [], "scripts": [] } ], + "family": "Hmong-Mien", "tokenizers": {}, "node_i": "3906", "native_tokenizers": [], @@ -452,14 +540,17 @@ }, { "name": "Mian-Jin", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Biao Mon", + "depth": 3, "iso_1_code": null, "iso_3_code": "bmt", "children": [], + "family": "Hmong-Mien", "tokenizers": {}, "node_i": "3909", "native_tokenizers": [], @@ -467,9 +558,11 @@ }, { "name": "Iu Mien", + "depth": 3, "iso_1_code": null, "iso_3_code": "ium", "children": [], + "family": "Hmong-Mien", "tokenizers": {}, "node_i": "3910", "native_tokenizers": [], @@ -479,15 +572,18 @@ }, { "name": "Kim Mun", + "depth": 3, "iso_1_code": null, "iso_3_code": "mji", "children": [], + "family": "Hmong-Mien", "tokenizers": {}, "node_i": "3911", "native_tokenizers": [], "scripts": [] } ], + "family": "Hmong-Mien", "tokenizers": {}, "node_i": "3908", "native_tokenizers": [], @@ -495,32 +591,38 @@ }, { "name": "Zaomin", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dzao Min", + "depth": 3, "iso_1_code": null, "iso_3_code": "bpn", "children": [], + "family": "Hmong-Mien", "tokenizers": {}, "node_i": "3913", "native_tokenizers": [], "scripts": [] } ], + "family": "Hmong-Mien", "tokenizers": {}, "node_i": "3912", "native_tokenizers": [], "scripts": [] } ], + "family": "Hmong-Mien", "tokenizers": {}, "node_i": "3905", "native_tokenizers": [], "scripts": [] } ], + "family": "Hmong-Mien", "tokenizers": {}, "node_i": "3863", "native_tokenizers": [], diff --git a/data/Huavean.json b/data/Huavean.json index 092796bc88ab712db5e10d1f11671ebd146d8a3b..9a7494ac2c63a777246c77311bf992f9e755e117 100644 --- a/data/Huavean.json +++ b/data/Huavean.json @@ -1,13 +1,16 @@ { "name": "Huavean", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Huave, San Francisco del Mar", + "depth": 1, "iso_1_code": null, "iso_3_code": "hue", "children": [], + "family": "Huavean", "tokenizers": {}, "node_i": "3915", "native_tokenizers": [], @@ -15,9 +18,11 @@ }, { "name": "Huave, San Mateo del Mar", + "depth": 1, "iso_1_code": null, "iso_3_code": "huv", "children": [], + "family": "Huavean", "tokenizers": {}, "node_i": "3916", "native_tokenizers": [], @@ -27,9 +32,11 @@ }, { "name": "Huave, San Dionisio del Mar", + "depth": 1, "iso_1_code": null, "iso_3_code": "hve", "children": [], + "family": "Huavean", "tokenizers": {}, "node_i": "3917", "native_tokenizers": [], @@ -37,15 +44,18 @@ }, { "name": "Huave, Santa Mar\u00eda del Mar", + "depth": 1, "iso_1_code": null, "iso_3_code": "hvv", "children": [], + "family": "Huavean", "tokenizers": {}, "node_i": "3918", "native_tokenizers": [], "scripts": [] } ], + "family": "Huavean", "tokenizers": {}, "node_i": "3914", "native_tokenizers": [], diff --git a/data/Indo-European.json b/data/Indo-European.json index 2a7572755f588491018520562d2e9584b944c80b..2b06920d45371a58dddba4fa79dd364b43f3b107 100644 --- a/data/Indo-European.json +++ b/data/Indo-European.json @@ -1,23 +1,28 @@ { "name": "Indo-European", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Albanian", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Gheg", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Albanian, Gheg", + "depth": 3, "iso_1_code": "sq", "iso_3_code": "aln", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"sq\")", @@ -36,6 +41,7 @@ ] } ], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"sq\")", @@ -51,14 +57,17 @@ }, { "name": "Tosk", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Albanian, Arb\u00ebresh\u00eb", + "depth": 3, "iso_1_code": "sq", "iso_3_code": "aae", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "3924", "native_tokenizers": [], @@ -66,9 +75,11 @@ }, { "name": "Albanian, Arvanitika", + "depth": 3, "iso_1_code": "sq", "iso_3_code": "aat", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "3925", "native_tokenizers": [], @@ -76,9 +87,11 @@ }, { "name": "Albanian, Tosk", + "depth": 3, "iso_1_code": "sq", "iso_3_code": "als", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"sq\")", @@ -97,6 +110,7 @@ ] } ], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"sq\")", @@ -111,6 +125,7 @@ "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"sq\")", @@ -126,14 +141,17 @@ }, { "name": "Armenian", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Armenian", + "depth": 2, "iso_1_code": "hy", "iso_3_code": "hye", "children": [], + "family": "Indo-European", "tokenizers": { "Armn": { "full_object": "SpaCyTokenizer(\"hy\")", @@ -153,9 +171,11 @@ }, { "name": "Armenian, Western", + "depth": 2, "iso_1_code": null, "iso_3_code": "hyw", "children": [], + "family": "Indo-European", "tokenizers": { "Armn": { "full_object": "StanzaTokenizer(\"hyw\")", @@ -174,6 +194,7 @@ ] } ], + "family": "Indo-European", "tokenizers": { "Armn": { "full_object": "SpaCyTokenizer(\"hy\")", @@ -189,24 +210,29 @@ }, { "name": "Balto-Slavic", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Baltic", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Eastern", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Lithuanian", + "depth": 4, "iso_1_code": "lt", "iso_3_code": "lit", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"lt\")", @@ -226,9 +252,11 @@ }, { "name": "Latgalian", + "depth": 4, "iso_1_code": "lv", "iso_3_code": "ltg", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"lv\")", @@ -248,9 +276,11 @@ }, { "name": "Latvian, Standard", + "depth": 4, "iso_1_code": "lv", "iso_3_code": "lvs", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"lv\")", @@ -270,9 +300,11 @@ }, { "name": "Samogitian", + "depth": 4, "iso_1_code": null, "iso_3_code": "sgs", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"lv\")", @@ -290,15 +322,18 @@ }, { "name": "Zemgalian", + "depth": 4, "iso_1_code": null, "iso_3_code": "xzm", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "3937", "native_tokenizers": [], "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"lv\")", @@ -314,14 +349,17 @@ }, { "name": "Western", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Prussian", + "depth": 4, "iso_1_code": null, "iso_3_code": "prg", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"lv\")", @@ -339,15 +377,18 @@ }, { "name": "Sudovian", + "depth": 4, "iso_1_code": null, "iso_3_code": "xsv", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "3940", "native_tokenizers": [], "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"lv\")", @@ -362,6 +403,7 @@ "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"lv\")", @@ -377,19 +419,23 @@ }, { "name": "Slavic", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "East", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Belarusian", + "depth": 4, "iso_1_code": "be", "iso_3_code": "bel", "children": [], + "family": "Indo-European", "tokenizers": { "Cyrl": { "full_object": "StanzaTokenizer(\"be\")", @@ -409,9 +455,11 @@ }, { "name": "Ruthenian", + "depth": 4, "iso_1_code": null, "iso_3_code": "rsk", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "3944", "native_tokenizers": [], @@ -419,9 +467,11 @@ }, { "name": "Rusyn", + "depth": 4, "iso_1_code": null, "iso_3_code": "rue", "children": [], + "family": "Indo-European", "tokenizers": { "Cyrl": { "full_object": "SpaCyTokenizer(\"ru\")", @@ -439,9 +489,11 @@ }, { "name": "Russian", + "depth": 4, "iso_1_code": "ru", "iso_3_code": "rus", "children": [], + "family": "Indo-European", "tokenizers": { "Cyrl": { "full_object": "SpaCyTokenizer(\"ru\")", @@ -461,9 +513,11 @@ }, { "name": "Ukrainian", + "depth": 4, "iso_1_code": "uk", "iso_3_code": "ukr", "children": [], + "family": "Indo-European", "tokenizers": { "Cyrl": { "full_object": "SpaCyTokenizer(\"uk\")", @@ -482,6 +536,7 @@ ] } ], + "family": "Indo-European", "tokenizers": { "Cyrl": { "full_object": "SpaCyTokenizer(\"ru\")", @@ -497,19 +552,23 @@ }, { "name": "South", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Eastern", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bulgarian", + "depth": 5, "iso_1_code": "bg", "iso_3_code": "bul", "children": [], + "family": "Indo-European", "tokenizers": { "Cyrl": { "full_object": "SpaCyTokenizer(\"bg\")", @@ -529,9 +588,11 @@ }, { "name": "Slavonic, Church", + "depth": 5, "iso_1_code": "cu", "iso_3_code": "chu", "children": [], + "family": "Indo-European", "tokenizers": { "Cyrl": { "full_object": "StanzaTokenizer(\"cu\")", @@ -551,9 +612,11 @@ }, { "name": "Macedonian", + "depth": 5, "iso_1_code": "mk", "iso_3_code": "mkd", "children": [], + "family": "Indo-European", "tokenizers": { "Cyrl": { "full_object": "SpaCyTokenizer(\"mk\")", @@ -572,6 +635,7 @@ ] } ], + "family": "Indo-European", "tokenizers": { "Cyrl": { "full_object": "SpaCyTokenizer(\"bg\")", @@ -587,14 +651,17 @@ }, { "name": "Western", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bosnian", + "depth": 5, "iso_1_code": "bs", "iso_3_code": "bos", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"sr\")", @@ -614,9 +681,11 @@ }, { "name": "Chakavian", + "depth": 5, "iso_1_code": null, "iso_3_code": "ckm", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"sr\")", @@ -634,9 +703,11 @@ }, { "name": "Montenegrin", + "depth": 5, "iso_1_code": "sh", "iso_3_code": "cnr", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"sr\")", @@ -656,9 +727,11 @@ }, { "name": "Croatian", + "depth": 5, "iso_1_code": "hr", "iso_3_code": "hrv", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"hr\")", @@ -678,9 +751,11 @@ }, { "name": "Slovene", + "depth": 5, "iso_1_code": "sl", "iso_3_code": "slv", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"sl\")", @@ -700,9 +775,11 @@ }, { "name": "Serbian", + "depth": 5, "iso_1_code": "sr", "iso_3_code": "srp", "children": [], + "family": "Indo-European", "tokenizers": { "Cyrl": { "full_object": "SpaCyTokenizer(\"sr\")", @@ -731,15 +808,18 @@ }, { "name": "Slavomolisano", + "depth": 5, "iso_1_code": null, "iso_3_code": "svm", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "3960", "native_tokenizers": [], "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"sr\")", @@ -761,6 +841,7 @@ "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Cyrl": { "full_object": "SpaCyTokenizer(\"bg\")", @@ -783,19 +864,23 @@ }, { "name": "West", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Czech-Slovak", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Czech", + "depth": 5, "iso_1_code": "cs", "iso_3_code": "ces", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"cs\")", @@ -815,9 +900,11 @@ }, { "name": "Knaanic", + "depth": 5, "iso_1_code": null, "iso_3_code": "czk", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "3964", "native_tokenizers": [], @@ -825,9 +912,11 @@ }, { "name": "Slovak", + "depth": 5, "iso_1_code": "sk", "iso_3_code": "slk", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"sk\")", @@ -846,6 +935,7 @@ ] } ], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"cs\")", @@ -861,14 +951,17 @@ }, { "name": "Lechitic", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kashubian", + "depth": 5, "iso_1_code": null, "iso_3_code": "csb", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"pl\")", @@ -886,9 +979,11 @@ }, { "name": "Polish", + "depth": 5, "iso_1_code": "pl", "iso_3_code": "pol", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"pl\")", @@ -908,9 +1003,11 @@ }, { "name": "Polabian", + "depth": 5, "iso_1_code": null, "iso_3_code": "pox", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "3969", "native_tokenizers": [], @@ -918,9 +1015,11 @@ }, { "name": "Silesian", + "depth": 5, "iso_1_code": null, "iso_3_code": "szl", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"pl\")", @@ -937,6 +1036,7 @@ ] } ], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"pl\")", @@ -952,14 +1052,17 @@ }, { "name": "Sorbian", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Sorbian, Lower", + "depth": 5, "iso_1_code": null, "iso_3_code": "dsb", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"dsb\")", @@ -979,9 +1082,11 @@ }, { "name": "Sorbian, Upper", + "depth": 5, "iso_1_code": null, "iso_3_code": "hsb", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"hsb\")", @@ -1000,6 +1105,7 @@ ] } ], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"hsb\")", @@ -1014,6 +1120,7 @@ "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"pl\")", @@ -1028,6 +1135,7 @@ "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Cyrl": { "full_object": "SpaCyTokenizer(\"ru\")", @@ -1049,6 +1157,7 @@ "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"pl\")", @@ -1071,24 +1180,29 @@ }, { "name": "Celtic", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Insular", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Brythonic", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Breton", + "depth": 4, "iso_1_code": "br", "iso_3_code": "bre", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"cy\")", @@ -1106,9 +1220,11 @@ }, { "name": "Cornish", + "depth": 4, "iso_1_code": "kw", "iso_3_code": "cor", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"cy\")", @@ -1126,9 +1242,11 @@ }, { "name": "Welsh", + "depth": 4, "iso_1_code": "cy", "iso_3_code": "cym", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"cy\")", @@ -1147,6 +1265,7 @@ ] } ], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"cy\")", @@ -1162,14 +1281,17 @@ }, { "name": "Goidelic", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Scottish Gaelic", + "depth": 4, "iso_1_code": "gd", "iso_3_code": "gla", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"gd\")", @@ -1189,9 +1311,11 @@ }, { "name": "Irish", + "depth": 4, "iso_1_code": "ga", "iso_3_code": "gle", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ga\")", @@ -1211,9 +1335,11 @@ }, { "name": "Manx", + "depth": 4, "iso_1_code": "gv", "iso_3_code": "glv", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"gv\")", @@ -1232,6 +1358,7 @@ ] } ], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ga\")", @@ -1246,6 +1373,7 @@ "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"cy\")", @@ -1260,6 +1388,7 @@ "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"cy\")", @@ -1275,24 +1404,29 @@ }, { "name": "Germanic", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "North", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "East Scandinavian", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "\u00d6vdalian", + "depth": 4, "iso_1_code": null, "iso_3_code": "ovd", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "3987", "native_tokenizers": [], @@ -1300,25 +1434,30 @@ }, { "name": "Danish-Swedish", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Danish-Bokmal", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Norwegian", + "depth": 6, "iso_1_code": "no", "iso_3_code": "nor", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "3990", "native_tokenizers": [], "scripts": [] } ], + "family": "Indo-European", "tokenizers": {}, "node_i": "3989", "native_tokenizers": [], @@ -1326,19 +1465,23 @@ }, { "name": "Danish-Riksmal", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Danish", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Danish", + "depth": 7, "iso_1_code": "da", "iso_3_code": "dan", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"da\")", @@ -1357,6 +1500,7 @@ ] } ], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"da\")", @@ -1371,6 +1515,7 @@ "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"da\")", @@ -1386,14 +1531,17 @@ }, { "name": "Swedish", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Swedish", + "depth": 6, "iso_1_code": "sv", "iso_3_code": "swe", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"sv\")", @@ -1412,6 +1560,7 @@ ] } ], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"sv\")", @@ -1426,6 +1575,7 @@ "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"sv\")", @@ -1440,6 +1590,7 @@ "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"sv\")", @@ -1455,14 +1606,17 @@ }, { "name": "West Scandinavian", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Faroese", + "depth": 4, "iso_1_code": "fo", "iso_3_code": "fao", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"fo\")", @@ -1482,9 +1636,11 @@ }, { "name": "Icelandic", + "depth": 4, "iso_1_code": "is", "iso_3_code": "isl", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"is\")", @@ -1504,15 +1660,18 @@ }, { "name": "Norn", + "depth": 4, "iso_1_code": null, "iso_3_code": "nrn", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "3999", "native_tokenizers": [], "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"is\")", @@ -1527,6 +1686,7 @@ "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"sv\")", @@ -1542,19 +1702,23 @@ }, { "name": "West", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "English", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "English", + "depth": 4, "iso_1_code": "en", "iso_3_code": "eng", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"en\")", @@ -1574,9 +1738,11 @@ }, { "name": "Scots", + "depth": 4, "iso_1_code": null, "iso_3_code": "sco", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"en\")", @@ -1594,15 +1760,18 @@ }, { "name": "Yola", + "depth": 4, "iso_1_code": null, "iso_3_code": "yol", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4004", "native_tokenizers": [], "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"en\")", @@ -1618,14 +1787,17 @@ }, { "name": "Frisian", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Frisian, Northern", + "depth": 4, "iso_1_code": null, "iso_3_code": "frr", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"en\")", @@ -1643,9 +1815,11 @@ }, { "name": "Frisian", + "depth": 4, "iso_1_code": "fy", "iso_3_code": "fry", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"en\")", @@ -1663,9 +1837,11 @@ }, { "name": "Saterfriesisch", + "depth": 4, "iso_1_code": null, "iso_3_code": "stq", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"en\")", @@ -1682,6 +1858,7 @@ ] } ], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"en\")", @@ -1697,19 +1874,23 @@ }, { "name": "High German", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "German", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Hunsrik", + "depth": 5, "iso_1_code": null, "iso_3_code": "hrx", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"de\")", @@ -1727,19 +1908,23 @@ }, { "name": "Middle German", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "East Middle German", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "German, Standard", + "depth": 7, "iso_1_code": "de", "iso_3_code": "deu", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"de\")", @@ -1759,9 +1944,11 @@ }, { "name": "Silesian, Lower", + "depth": 7, "iso_1_code": null, "iso_3_code": "sli", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4015", "native_tokenizers": [], @@ -1769,9 +1956,11 @@ }, { "name": "Saxon, Upper", + "depth": 7, "iso_1_code": null, "iso_3_code": "sxu", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4016", "native_tokenizers": [], @@ -1779,15 +1968,18 @@ }, { "name": "Wymysorys", + "depth": 7, "iso_1_code": null, "iso_3_code": "wym", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4017", "native_tokenizers": [], "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"de\")", @@ -1803,14 +1995,17 @@ }, { "name": "West Middle German", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ripuarian", + "depth": 7, "iso_1_code": null, "iso_3_code": "ksh", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"lb\")", @@ -1828,9 +2023,11 @@ }, { "name": "German, Pennsylvania", + "depth": 7, "iso_1_code": null, "iso_3_code": "pdc", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"lb\")", @@ -1848,9 +2045,11 @@ }, { "name": "Palatinate Franconian", + "depth": 7, "iso_1_code": null, "iso_3_code": "pfl", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"lb\")", @@ -1868,14 +2067,17 @@ }, { "name": "Moselle Franconian", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Luxembourgish", + "depth": 8, "iso_1_code": "lb", "iso_3_code": "ltz", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"lb\")", @@ -1894,6 +2096,7 @@ ] } ], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"lb\")", @@ -1908,6 +2111,7 @@ "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"lb\")", @@ -1922,6 +2126,7 @@ "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"de\")", @@ -1937,14 +2142,17 @@ }, { "name": "Upper German", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Eastern Franconian", + "depth": 6, "iso_1_code": null, "iso_3_code": "vmf", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4025", "native_tokenizers": [], @@ -1952,14 +2160,17 @@ }, { "name": "Alemannic", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "German, Colonia Tovar", + "depth": 7, "iso_1_code": null, "iso_3_code": "gct", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4027", "native_tokenizers": [], @@ -1967,9 +2178,11 @@ }, { "name": "German, Swiss", + "depth": 7, "iso_1_code": null, "iso_3_code": "gsw", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"de\")", @@ -1987,9 +2200,11 @@ }, { "name": "Swabian", + "depth": 7, "iso_1_code": null, "iso_3_code": "swg", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"de\")", @@ -2007,15 +2222,18 @@ }, { "name": "Walser", + "depth": 7, "iso_1_code": null, "iso_3_code": "wae", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4030", "native_tokenizers": [], "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"de\")", @@ -2031,14 +2249,17 @@ }, { "name": "Bavarian-Austrian", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bavarian", + "depth": 7, "iso_1_code": null, "iso_3_code": "bar", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"de\")", @@ -2056,9 +2277,11 @@ }, { "name": "Cimbrian", + "depth": 7, "iso_1_code": null, "iso_3_code": "cim", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4033", "native_tokenizers": [], @@ -2066,9 +2289,11 @@ }, { "name": "Hutterisch", + "depth": 7, "iso_1_code": null, "iso_3_code": "geh", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4034", "native_tokenizers": [], @@ -2076,15 +2301,18 @@ }, { "name": "M\u00f2cheno", + "depth": 7, "iso_1_code": null, "iso_3_code": "mhn", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4035", "native_tokenizers": [], "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"de\")", @@ -2099,6 +2327,7 @@ "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"de\")", @@ -2113,6 +2342,7 @@ "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"de\")", @@ -2128,14 +2358,17 @@ }, { "name": "Yiddish", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Yiddish, Eastern", + "depth": 5, "iso_1_code": "yi", "iso_3_code": "ydd", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4037", "native_tokenizers": [], @@ -2145,21 +2378,25 @@ }, { "name": "Yiddish, Western", + "depth": 5, "iso_1_code": "yi", "iso_3_code": "yih", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4038", "native_tokenizers": [], "scripts": [] } ], + "family": "Indo-European", "tokenizers": {}, "node_i": "4036", "native_tokenizers": [], "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"de\")", @@ -2175,19 +2412,23 @@ }, { "name": "Low Saxon-Low Franconian", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Low Franconian", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Afrikaans", + "depth": 5, "iso_1_code": "af", "iso_3_code": "afr", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"af\")", @@ -2207,9 +2448,11 @@ }, { "name": "Limburgish", + "depth": 5, "iso_1_code": "li", "iso_3_code": "lim", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"nl\")", @@ -2227,9 +2470,11 @@ }, { "name": "Dutch", + "depth": 5, "iso_1_code": "nl", "iso_3_code": "nld", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"nl\")", @@ -2249,9 +2494,11 @@ }, { "name": "West Flemish", + "depth": 5, "iso_1_code": null, "iso_3_code": "vls", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"nl\")", @@ -2269,9 +2516,11 @@ }, { "name": "Zeeuws", + "depth": 5, "iso_1_code": null, "iso_3_code": "zea", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"nl\")", @@ -2288,6 +2537,7 @@ ] } ], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"nl\")", @@ -2303,14 +2553,17 @@ }, { "name": "Low Saxon", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Achterhoeks", + "depth": 5, "iso_1_code": null, "iso_3_code": "act", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4047", "native_tokenizers": [], @@ -2318,9 +2571,11 @@ }, { "name": "Drents", + "depth": 5, "iso_1_code": null, "iso_3_code": "drt", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4048", "native_tokenizers": [], @@ -2328,9 +2583,11 @@ }, { "name": "Saxon, East Frisian Low", + "depth": 5, "iso_1_code": null, "iso_3_code": "frs", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4049", "native_tokenizers": [], @@ -2338,9 +2595,11 @@ }, { "name": "Gronings", + "depth": 5, "iso_1_code": null, "iso_3_code": "gos", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"nl\")", @@ -2358,9 +2617,11 @@ }, { "name": "Saxon, Low", + "depth": 5, "iso_1_code": null, "iso_3_code": "nds", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"nl\")", @@ -2378,9 +2639,11 @@ }, { "name": "Plautdietsch", + "depth": 5, "iso_1_code": null, "iso_3_code": "pdt", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"nl\")", @@ -2398,9 +2661,11 @@ }, { "name": "Sallands", + "depth": 5, "iso_1_code": null, "iso_3_code": "sdz", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4053", "native_tokenizers": [], @@ -2408,9 +2673,11 @@ }, { "name": "Stellingwerfs", + "depth": 5, "iso_1_code": null, "iso_3_code": "stl", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4054", "native_tokenizers": [], @@ -2418,9 +2685,11 @@ }, { "name": "Twents", + "depth": 5, "iso_1_code": null, "iso_3_code": "twd", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4055", "native_tokenizers": [], @@ -2428,9 +2697,11 @@ }, { "name": "Veluws", + "depth": 5, "iso_1_code": null, "iso_3_code": "vel", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4056", "native_tokenizers": [], @@ -2438,15 +2709,18 @@ }, { "name": "Westphalien", + "depth": 5, "iso_1_code": null, "iso_3_code": "wep", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4057", "native_tokenizers": [], "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"nl\")", @@ -2461,6 +2735,7 @@ "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"nl\")", @@ -2475,6 +2750,7 @@ "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"en\")", @@ -2489,6 +2765,7 @@ "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"en\")", @@ -2504,19 +2781,23 @@ }, { "name": "Greek", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Attic", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Cappadocian Greek", + "depth": 3, "iso_1_code": null, "iso_3_code": "cpg", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4060", "native_tokenizers": [], @@ -2524,9 +2805,11 @@ }, { "name": "Greek", + "depth": 3, "iso_1_code": "el", "iso_3_code": "ell", "children": [], + "family": "Indo-European", "tokenizers": { "Grek": { "full_object": "SpaCyTokenizer(\"el\")", @@ -2546,9 +2829,11 @@ }, { "name": "Greek, Ancient", + "depth": 3, "iso_1_code": null, "iso_3_code": "grc", "children": [], + "family": "Indo-European", "tokenizers": { "Grek": { "full_object": "SpaCyTokenizer(\"grc\")", @@ -2568,9 +2853,11 @@ }, { "name": "Pontic", + "depth": 3, "iso_1_code": null, "iso_3_code": "pnt", "children": [], + "family": "Indo-European", "tokenizers": { "Grek": { "full_object": "SpaCyTokenizer(\"el\")", @@ -2588,15 +2875,18 @@ }, { "name": "Yevanic", + "depth": 3, "iso_1_code": null, "iso_3_code": "yej", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4064", "native_tokenizers": [], "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Grek": { "full_object": "SpaCyTokenizer(\"el\")", @@ -2612,26 +2902,31 @@ }, { "name": "Doric", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tsakonian", + "depth": 3, "iso_1_code": null, "iso_3_code": "tsd", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4066", "native_tokenizers": [], "scripts": [] } ], + "family": "Indo-European", "tokenizers": {}, "node_i": "4065", "native_tokenizers": [], "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Grek": { "full_object": "SpaCyTokenizer(\"el\")", @@ -2647,19 +2942,23 @@ }, { "name": "Indo-Iranian", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Indo-Aryan", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Sanskrit", + "depth": 3, "iso_1_code": "sa", "iso_3_code": "san", "children": [], + "family": "Indo-European", "tokenizers": { "Deva": { "full_object": "IndicNLPTokenizer(\"sa\")", @@ -2687,24 +2986,29 @@ }, { "name": "Intermediate Divisions", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Eastern", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "East Central", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Awadhi", + "depth": 6, "iso_1_code": null, "iso_3_code": "awa", "children": [], + "family": "Indo-European", "tokenizers": { "Deva": { "full_object": "IndicNLPTokenizer(\"ne\")", @@ -2722,9 +3026,11 @@ }, { "name": "Bagheli", + "depth": 6, "iso_1_code": null, "iso_3_code": "bfy", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4074", "native_tokenizers": [], @@ -2732,9 +3038,11 @@ }, { "name": "Fiji Hindi", + "depth": 6, "iso_1_code": null, "iso_3_code": "hif", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"kmr\")", @@ -2752,9 +3060,11 @@ }, { "name": "Chhattisgarhi", + "depth": 6, "iso_1_code": null, "iso_3_code": "hne", "children": [], + "family": "Indo-European", "tokenizers": { "Deva": { "full_object": "IndicNLPTokenizer(\"ne\")", @@ -2772,9 +3082,11 @@ }, { "name": "Kamar", + "depth": 6, "iso_1_code": null, "iso_3_code": "keq", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4077", "native_tokenizers": [], @@ -2782,15 +3094,18 @@ }, { "name": "Surgujia", + "depth": 6, "iso_1_code": null, "iso_3_code": "sgj", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4078", "native_tokenizers": [], "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Deva": { "full_object": "IndicNLPTokenizer(\"ne\")", @@ -2813,14 +3128,17 @@ }, { "name": "Eastern Pahari", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dotyali", + "depth": 6, "iso_1_code": "ne", "iso_3_code": "dty", "children": [], + "family": "Indo-European", "tokenizers": { "Deva": { "full_object": "IndicNLPTokenizer(\"ne\")", @@ -2840,9 +3158,11 @@ }, { "name": "Jumli", + "depth": 6, "iso_1_code": null, "iso_3_code": "jml", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4081", "native_tokenizers": [], @@ -2850,9 +3170,11 @@ }, { "name": "Nepali", + "depth": 6, "iso_1_code": "ne", "iso_3_code": "npi", "children": [], + "family": "Indo-European", "tokenizers": { "Deva": { "full_object": "IndicNLPTokenizer(\"ne\")", @@ -2879,6 +3201,7 @@ ] } ], + "family": "Indo-European", "tokenizers": { "Deva": { "full_object": "IndicNLPTokenizer(\"ne\")", @@ -2900,6 +3223,7 @@ "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Deva": { "full_object": "IndicNLPTokenizer(\"ne\")", @@ -2922,14 +3246,17 @@ }, { "name": "Western", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dawoodi", + "depth": 5, "iso_1_code": null, "iso_3_code": "dmk", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4084", "native_tokenizers": [], @@ -2937,9 +3264,11 @@ }, { "name": "Parya", + "depth": 5, "iso_1_code": null, "iso_3_code": "paq", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4085", "native_tokenizers": [], @@ -2947,9 +3276,11 @@ }, { "name": "Powari", + "depth": 5, "iso_1_code": null, "iso_3_code": "pwr", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4086", "native_tokenizers": [], @@ -2957,14 +3288,17 @@ }, { "name": "Bhil", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bareli, Pauri", + "depth": 6, "iso_1_code": null, "iso_3_code": "bfb", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4088", "native_tokenizers": [], @@ -2972,9 +3306,11 @@ }, { "name": "Bareli, Rathwi", + "depth": 6, "iso_1_code": null, "iso_3_code": "bgd", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4089", "native_tokenizers": [], @@ -2982,9 +3318,11 @@ }, { "name": "Bauria", + "depth": 6, "iso_1_code": null, "iso_3_code": "bge", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4090", "native_tokenizers": [], @@ -2992,9 +3330,11 @@ }, { "name": "Bhili", + "depth": 6, "iso_1_code": null, "iso_3_code": "bhb", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4091", "native_tokenizers": [], @@ -3002,9 +3342,11 @@ }, { "name": "Bhilali", + "depth": 6, "iso_1_code": null, "iso_3_code": "bhi", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4092", "native_tokenizers": [], @@ -3012,9 +3354,11 @@ }, { "name": "Bareli, Palya", + "depth": 6, "iso_1_code": null, "iso_3_code": "bpx", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4093", "native_tokenizers": [], @@ -3022,9 +3366,11 @@ }, { "name": "Chodri", + "depth": 6, "iso_1_code": null, "iso_3_code": "cdi", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4094", "native_tokenizers": [], @@ -3032,9 +3378,11 @@ }, { "name": "Dhodia", + "depth": 6, "iso_1_code": null, "iso_3_code": "dho", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4095", "native_tokenizers": [], @@ -3042,9 +3390,11 @@ }, { "name": "Dubli", + "depth": 6, "iso_1_code": null, "iso_3_code": "dub", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4096", "native_tokenizers": [], @@ -3052,9 +3402,11 @@ }, { "name": "Dungra Bhil", + "depth": 6, "iso_1_code": null, "iso_3_code": "duh", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4097", "native_tokenizers": [], @@ -3062,9 +3414,11 @@ }, { "name": "Garasia, Adiwasi", + "depth": 6, "iso_1_code": null, "iso_3_code": "gas", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4098", "native_tokenizers": [], @@ -3072,9 +3426,11 @@ }, { "name": "Gamit", + "depth": 6, "iso_1_code": null, "iso_3_code": "gbl", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4099", "native_tokenizers": [], @@ -3082,9 +3438,11 @@ }, { "name": "Garasia, Rajput", + "depth": 6, "iso_1_code": null, "iso_3_code": "gra", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4100", "native_tokenizers": [], @@ -3092,9 +3450,11 @@ }, { "name": "Mawchi", + "depth": 6, "iso_1_code": null, "iso_3_code": "mke", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4101", "native_tokenizers": [], @@ -3102,9 +3462,11 @@ }, { "name": "Nahali", + "depth": 6, "iso_1_code": null, "iso_3_code": "nlx", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4102", "native_tokenizers": [], @@ -3112,9 +3474,11 @@ }, { "name": "Noiri", + "depth": 6, "iso_1_code": null, "iso_3_code": "noi", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4103", "native_tokenizers": [], @@ -3122,9 +3486,11 @@ }, { "name": "Pardhi", + "depth": 6, "iso_1_code": null, "iso_3_code": "pcl", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4104", "native_tokenizers": [], @@ -3132,9 +3498,11 @@ }, { "name": "Rathawi", + "depth": 6, "iso_1_code": null, "iso_3_code": "rtw", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4105", "native_tokenizers": [], @@ -3142,15 +3510,18 @@ }, { "name": "Wagdi", + "depth": 6, "iso_1_code": null, "iso_3_code": "wbr", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4106", "native_tokenizers": [], "scripts": [] } ], + "family": "Indo-European", "tokenizers": {}, "node_i": "4087", "native_tokenizers": [], @@ -3158,20 +3529,24 @@ }, { "name": "Dom", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Domari", + "depth": 6, "iso_1_code": null, "iso_3_code": "rmt", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4108", "native_tokenizers": [], "scripts": [] } ], + "family": "Indo-European", "tokenizers": {}, "node_i": "4107", "native_tokenizers": [], @@ -3179,14 +3554,17 @@ }, { "name": "Gujarati", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Aer", + "depth": 6, "iso_1_code": null, "iso_3_code": "aeq", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4110", "native_tokenizers": [], @@ -3194,9 +3572,11 @@ }, { "name": "Koli, Kachi", + "depth": 6, "iso_1_code": null, "iso_3_code": "gjk", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4111", "native_tokenizers": [], @@ -3204,9 +3584,11 @@ }, { "name": "Gujarati", + "depth": 6, "iso_1_code": "gu", "iso_3_code": "guj", "children": [], + "family": "Indo-European", "tokenizers": { "Gujr": { "full_object": "IndicNLPTokenizer(\"gu\")", @@ -3234,9 +3616,11 @@ }, { "name": "Jandavra", + "depth": 6, "iso_1_code": null, "iso_3_code": "jnd", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4113", "native_tokenizers": [], @@ -3244,9 +3628,11 @@ }, { "name": "Koli, Parkari", + "depth": 6, "iso_1_code": null, "iso_3_code": "kvx", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4114", "native_tokenizers": [], @@ -3254,9 +3640,11 @@ }, { "name": "Koli, Wadiyari", + "depth": 6, "iso_1_code": null, "iso_3_code": "kxp", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4115", "native_tokenizers": [], @@ -3264,9 +3652,11 @@ }, { "name": "Sourashtra", + "depth": 6, "iso_1_code": null, "iso_3_code": "saz", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4116", "native_tokenizers": [], @@ -3274,9 +3664,11 @@ }, { "name": "Vasavi", + "depth": 6, "iso_1_code": null, "iso_3_code": "vas", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4117", "native_tokenizers": [], @@ -3284,15 +3676,18 @@ }, { "name": "Vaghri", + "depth": 6, "iso_1_code": null, "iso_3_code": "vgr", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4118", "native_tokenizers": [], "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Gujr": { "full_object": "IndicNLPTokenizer(\"gu\")", @@ -3315,14 +3710,17 @@ }, { "name": "Khandesi", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ahirani", + "depth": 6, "iso_1_code": null, "iso_3_code": "ahr", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4120", "native_tokenizers": [], @@ -3330,9 +3728,11 @@ }, { "name": "Dangi", + "depth": 6, "iso_1_code": null, "iso_3_code": "dhn", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4121", "native_tokenizers": [], @@ -3340,15 +3740,18 @@ }, { "name": "Khandesi", + "depth": 6, "iso_1_code": null, "iso_3_code": "khn", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4122", "native_tokenizers": [], "scripts": [] } ], + "family": "Indo-European", "tokenizers": {}, "node_i": "4119", "native_tokenizers": [], @@ -3356,25 +3759,30 @@ }, { "name": "Pahari", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Central Pahari", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kumaoni", + "depth": 7, "iso_1_code": null, "iso_3_code": "kfy", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4125", "native_tokenizers": [], "scripts": [] } ], + "family": "Indo-European", "tokenizers": {}, "node_i": "4124", "native_tokenizers": [], @@ -3382,20 +3790,24 @@ }, { "name": "Garhwali", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Garhwali", + "depth": 7, "iso_1_code": null, "iso_3_code": "gbm", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4127", "native_tokenizers": [], "scripts": [] } ], + "family": "Indo-European", "tokenizers": {}, "node_i": "4126", "native_tokenizers": [], @@ -3403,14 +3815,17 @@ }, { "name": "Western Pahari", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Pahari, Mahasu", + "depth": 7, "iso_1_code": null, "iso_3_code": "bfz", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4129", "native_tokenizers": [], @@ -3418,9 +3833,11 @@ }, { "name": "Bhadrawahi", + "depth": 7, "iso_1_code": null, "iso_3_code": "bhd", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4130", "native_tokenizers": [], @@ -3428,9 +3845,11 @@ }, { "name": "Bhattiyali", + "depth": 7, "iso_1_code": null, "iso_3_code": "bht", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4131", "native_tokenizers": [], @@ -3438,9 +3857,11 @@ }, { "name": "Chambeali", + "depth": 7, "iso_1_code": null, "iso_3_code": "cdh", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4132", "native_tokenizers": [], @@ -3448,9 +3869,11 @@ }, { "name": "Churahi", + "depth": 7, "iso_1_code": null, "iso_3_code": "cdj", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4133", "native_tokenizers": [], @@ -3458,9 +3881,11 @@ }, { "name": "Dogri", + "depth": 7, "iso_1_code": null, "iso_3_code": "dgo", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4134", "native_tokenizers": [], @@ -3468,9 +3893,11 @@ }, { "name": "Gaddi", + "depth": 7, "iso_1_code": null, "iso_3_code": "gbk", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4135", "native_tokenizers": [], @@ -3478,9 +3905,11 @@ }, { "name": "Hinduri", + "depth": 7, "iso_1_code": null, "iso_3_code": "hii", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4136", "native_tokenizers": [], @@ -3488,9 +3917,11 @@ }, { "name": "Khah", + "depth": 7, "iso_1_code": null, "iso_3_code": "hkh", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4137", "native_tokenizers": [], @@ -3498,9 +3929,11 @@ }, { "name": "Jaunsari", + "depth": 7, "iso_1_code": null, "iso_3_code": "jns", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4138", "native_tokenizers": [], @@ -3508,9 +3941,11 @@ }, { "name": "Bilaspuri", + "depth": 7, "iso_1_code": null, "iso_3_code": "kfs", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4139", "native_tokenizers": [], @@ -3518,9 +3953,11 @@ }, { "name": "Pahari, Kullu", + "depth": 7, "iso_1_code": null, "iso_3_code": "kfx", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4140", "native_tokenizers": [], @@ -3528,9 +3965,11 @@ }, { "name": "Kinnauri, Pahari", + "depth": 7, "iso_1_code": null, "iso_3_code": "kjo", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4141", "native_tokenizers": [], @@ -3538,9 +3977,11 @@ }, { "name": "Mandeali", + "depth": 7, "iso_1_code": null, "iso_3_code": "mjl", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4142", "native_tokenizers": [], @@ -3548,9 +3989,11 @@ }, { "name": "Pangwali", + "depth": 7, "iso_1_code": null, "iso_3_code": "pgg", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4143", "native_tokenizers": [], @@ -3558,9 +4001,11 @@ }, { "name": "Sirmauri", + "depth": 7, "iso_1_code": null, "iso_3_code": "srx", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4144", "native_tokenizers": [], @@ -3568,21 +4013,25 @@ }, { "name": "Kangri", + "depth": 7, "iso_1_code": null, "iso_3_code": "xnr", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4145", "native_tokenizers": [], "scripts": [] } ], + "family": "Indo-European", "tokenizers": {}, "node_i": "4128", "native_tokenizers": [], "scripts": [] } ], + "family": "Indo-European", "tokenizers": {}, "node_i": "4123", "native_tokenizers": [], @@ -3590,14 +4039,17 @@ }, { "name": "Panjabi", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Punjabi, Eastern", + "depth": 6, "iso_1_code": "pa", "iso_3_code": "pan", "children": [], + "family": "Indo-European", "tokenizers": { "Guru": { "full_object": "IndicNLPTokenizer(\"pa\")", @@ -3625,14 +4077,17 @@ }, { "name": "Western Panjabi", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Hindko, Southern", + "depth": 7, "iso_1_code": null, "iso_3_code": "hnd", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4149", "native_tokenizers": [], @@ -3640,9 +4095,11 @@ }, { "name": "Hindko, Northern", + "depth": 7, "iso_1_code": null, "iso_3_code": "hno", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4150", "native_tokenizers": [], @@ -3650,9 +4107,11 @@ }, { "name": "Inku", + "depth": 7, "iso_1_code": null, "iso_3_code": "jat", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4151", "native_tokenizers": [], @@ -3660,9 +4119,11 @@ }, { "name": "Pahari-Potwari", + "depth": 7, "iso_1_code": null, "iso_3_code": "phr", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4152", "native_tokenizers": [], @@ -3670,9 +4131,11 @@ }, { "name": "Punjabi, Western", + "depth": 7, "iso_1_code": null, "iso_3_code": "pnb", "children": [], + "family": "Indo-European", "tokenizers": { "Arab": { "full_object": "IndicNLPTokenizer(\"ur\")", @@ -3690,9 +4153,11 @@ }, { "name": "Saraiki", + "depth": 7, "iso_1_code": null, "iso_3_code": "skr", "children": [], + "family": "Indo-European", "tokenizers": { "Arab": { "full_object": "IndicNLPTokenizer(\"ur\")", @@ -3710,15 +4175,18 @@ }, { "name": "Khetrani", + "depth": 7, "iso_1_code": null, "iso_3_code": "xhe", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4155", "native_tokenizers": [], "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Arab": { "full_object": "IndicNLPTokenizer(\"ur\")", @@ -3733,6 +4201,7 @@ "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Guru": { "full_object": "IndicNLPTokenizer(\"pa\")", @@ -3762,14 +4231,17 @@ }, { "name": "Rajasthani", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Gujari", + "depth": 6, "iso_1_code": null, "iso_3_code": "gju", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4157", "native_tokenizers": [], @@ -3777,14 +4249,17 @@ }, { "name": "Marwari", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dhundari", + "depth": 7, "iso_1_code": null, "iso_3_code": "dhd", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4159", "native_tokenizers": [], @@ -3792,9 +4267,11 @@ }, { "name": "Godwari", + "depth": 7, "iso_1_code": null, "iso_3_code": "gdx", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4160", "native_tokenizers": [], @@ -3802,9 +4279,11 @@ }, { "name": "Goaria", + "depth": 7, "iso_1_code": null, "iso_3_code": "gig", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4161", "native_tokenizers": [], @@ -3812,9 +4291,11 @@ }, { "name": "Jogi", + "depth": 7, "iso_1_code": null, "iso_3_code": "jog", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4162", "native_tokenizers": [], @@ -3822,9 +4303,11 @@ }, { "name": "Loarki", + "depth": 7, "iso_1_code": null, "iso_3_code": "lrk", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4163", "native_tokenizers": [], @@ -3832,9 +4315,11 @@ }, { "name": "Dhatki", + "depth": 7, "iso_1_code": null, "iso_3_code": "mki", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4164", "native_tokenizers": [], @@ -3842,9 +4327,11 @@ }, { "name": "Mewari", + "depth": 7, "iso_1_code": null, "iso_3_code": "mtr", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4165", "native_tokenizers": [], @@ -3852,9 +4339,11 @@ }, { "name": "Marwari", + "depth": 7, "iso_1_code": null, "iso_3_code": "mve", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4166", "native_tokenizers": [], @@ -3862,9 +4351,11 @@ }, { "name": "Marwari", + "depth": 7, "iso_1_code": null, "iso_3_code": "rwr", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4167", "native_tokenizers": [], @@ -3872,9 +4363,11 @@ }, { "name": "Shekhawati", + "depth": 7, "iso_1_code": null, "iso_3_code": "swv", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4168", "native_tokenizers": [], @@ -3882,15 +4375,18 @@ }, { "name": "Merwari", + "depth": 7, "iso_1_code": null, "iso_3_code": "wry", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4169", "native_tokenizers": [], "scripts": [] } ], + "family": "Indo-European", "tokenizers": {}, "node_i": "4158", "native_tokenizers": [], @@ -3898,14 +4394,17 @@ }, { "name": "Unclassified", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bagri", + "depth": 7, "iso_1_code": null, "iso_3_code": "bgq", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4171", "native_tokenizers": [], @@ -3913,9 +4412,11 @@ }, { "name": "Lohar, Gade", + "depth": 7, "iso_1_code": null, "iso_3_code": "gda", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4172", "native_tokenizers": [], @@ -3923,9 +4424,11 @@ }, { "name": "Gurgula", + "depth": 7, "iso_1_code": null, "iso_3_code": "ggg", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4173", "native_tokenizers": [], @@ -3933,9 +4436,11 @@ }, { "name": "Haroti", + "depth": 7, "iso_1_code": null, "iso_3_code": "hoj", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4174", "native_tokenizers": [], @@ -3943,9 +4448,11 @@ }, { "name": "Lambadi", + "depth": 7, "iso_1_code": null, "iso_3_code": "lmn", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4175", "native_tokenizers": [], @@ -3953,9 +4460,11 @@ }, { "name": "Malvi", + "depth": 7, "iso_1_code": null, "iso_3_code": "mup", "children": [], + "family": "Indo-European", "tokenizers": { "Deva": { "full_object": "IndicNLPTokenizer(\"ne\")", @@ -3973,15 +4482,18 @@ }, { "name": "Nimadi", + "depth": 7, "iso_1_code": null, "iso_3_code": "noe", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4177", "native_tokenizers": [], "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Deva": { "full_object": "IndicNLPTokenizer(\"ne\")", @@ -3996,6 +4508,7 @@ "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Deva": { "full_object": "IndicNLPTokenizer(\"ne\")", @@ -4011,19 +4524,23 @@ }, { "name": "Romani", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Balkan", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Romani, Balkan", + "depth": 7, "iso_1_code": null, "iso_3_code": "rmn", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"kmr\")", @@ -4031,20 +4548,6 @@ "original_lang_code": "kmr", "script": "Latn", "class_name": "StanzaTokenizer" - }, - "Cyrl": { - "full_object": "SpaCyTokenizer(\"ru\")", - "original_lang_name": "russian", - "original_lang_code": "rus", - "script": "Cyrl", - "class_name": "SpaCyTokenizer" - }, - "Grek": { - "full_object": "SpaCyTokenizer(\"el\")", - "original_lang_name": "greek", - "original_lang_code": "ell", - "script": "Grek", - "class_name": "SpaCyTokenizer" } }, "node_i": "4180", @@ -4056,6 +4559,7 @@ ] } ], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"kmr\")", @@ -4063,20 +4567,6 @@ "original_lang_code": "kmr", "script": "Latn", "class_name": "StanzaTokenizer" - }, - "Cyrl": { - "full_object": "SpaCyTokenizer(\"ru\")", - "original_lang_name": "russian", - "original_lang_code": "rus", - "script": "Cyrl", - "class_name": "SpaCyTokenizer" - }, - "Grek": { - "full_object": "SpaCyTokenizer(\"el\")", - "original_lang_name": "greek", - "original_lang_code": "ell", - "script": "Grek", - "class_name": "SpaCyTokenizer" } }, "node_i": "4179", @@ -4085,14 +4575,17 @@ }, { "name": "Northern", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Romani, Carpathian", + "depth": 7, "iso_1_code": null, "iso_3_code": "rmc", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"kmr\")", @@ -4110,9 +4603,11 @@ }, { "name": "Romani, Kalo Finnish", + "depth": 7, "iso_1_code": null, "iso_3_code": "rmf", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4183", "native_tokenizers": [], @@ -4120,9 +4615,11 @@ }, { "name": "Romani, Baltic", + "depth": 7, "iso_1_code": null, "iso_3_code": "rml", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"kmr\")", @@ -4140,9 +4637,11 @@ }, { "name": "Romani, Sinte", + "depth": 7, "iso_1_code": null, "iso_3_code": "rmo", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"kmr\")", @@ -4160,15 +4659,18 @@ }, { "name": "Romani, Welsh", + "depth": 7, "iso_1_code": null, "iso_3_code": "rmw", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4186", "native_tokenizers": [], "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"kmr\")", @@ -4184,14 +4686,17 @@ }, { "name": "Vlax", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Romani, Vlax", + "depth": 7, "iso_1_code": null, "iso_3_code": "rmy", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"kmr\")", @@ -4199,13 +4704,6 @@ "original_lang_code": "kmr", "script": "Latn", "class_name": "StanzaTokenizer" - }, - "Cyrl": { - "full_object": "SpaCyTokenizer(\"ru\")", - "original_lang_name": "russian", - "original_lang_code": "rus", - "script": "Cyrl", - "class_name": "SpaCyTokenizer" } }, "node_i": "4188", @@ -4216,6 +4714,7 @@ ] } ], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"kmr\")", @@ -4223,13 +4722,6 @@ "original_lang_code": "kmr", "script": "Latn", "class_name": "StanzaTokenizer" - }, - "Cyrl": { - "full_object": "SpaCyTokenizer(\"ru\")", - "original_lang_name": "russian", - "original_lang_code": "rus", - "script": "Cyrl", - "class_name": "SpaCyTokenizer" } }, "node_i": "4187", @@ -4237,6 +4729,7 @@ "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"kmr\")", @@ -4244,20 +4737,6 @@ "original_lang_code": "kmr", "script": "Latn", "class_name": "StanzaTokenizer" - }, - "Cyrl": { - "full_object": "SpaCyTokenizer(\"ru\")", - "original_lang_name": "russian", - "original_lang_code": "rus", - "script": "Cyrl", - "class_name": "SpaCyTokenizer" - }, - "Grek": { - "full_object": "SpaCyTokenizer(\"el\")", - "original_lang_name": "greek", - "original_lang_code": "ell", - "script": "Grek", - "class_name": "SpaCyTokenizer" } }, "node_i": "4178", @@ -4266,14 +4745,17 @@ }, { "name": "Unclassified", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Sonha", + "depth": 6, "iso_1_code": null, "iso_3_code": "soi", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4190", "native_tokenizers": [], @@ -4281,21 +4763,25 @@ }, { "name": "Mewati", + "depth": 6, "iso_1_code": null, "iso_3_code": "wtm", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4191", "native_tokenizers": [], "scripts": [] } ], + "family": "Indo-European", "tokenizers": {}, "node_i": "4189", "native_tokenizers": [], "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Gujr": { "full_object": "IndicNLPTokenizer(\"gu\")", @@ -4331,20 +4817,6 @@ "original_lang_code": "kmr", "script": "Latn", "class_name": "StanzaTokenizer" - }, - "Cyrl": { - "full_object": "SpaCyTokenizer(\"ru\")", - "original_lang_name": "russian", - "original_lang_code": "rus", - "script": "Cyrl", - "class_name": "SpaCyTokenizer" - }, - "Grek": { - "full_object": "SpaCyTokenizer(\"el\")", - "original_lang_name": "greek", - "original_lang_code": "ell", - "script": "Grek", - "class_name": "SpaCyTokenizer" } }, "node_i": "4083", @@ -4352,6 +4824,7 @@ "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Deva": { "full_object": "IndicNLPTokenizer(\"ne\")", @@ -4387,20 +4860,6 @@ "original_lang_code": "kmr", "script": "Latn", "class_name": "StanzaTokenizer" - }, - "Cyrl": { - "full_object": "SpaCyTokenizer(\"ru\")", - "original_lang_name": "russian", - "original_lang_code": "rus", - "script": "Cyrl", - "class_name": "SpaCyTokenizer" - }, - "Grek": { - "full_object": "SpaCyTokenizer(\"el\")", - "original_lang_name": "greek", - "original_lang_code": "ell", - "script": "Grek", - "class_name": "SpaCyTokenizer" } }, "node_i": "4070", @@ -4409,24 +4868,29 @@ }, { "name": "Outer Languages", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Eastern", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bengali-Assamese", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Assamese", + "depth": 6, "iso_1_code": "as", "iso_3_code": "asm", "children": [], + "family": "Indo-European", "tokenizers": { "Beng": { "full_object": "IndicNLPTokenizer(\"as\")", @@ -4454,9 +4918,11 @@ }, { "name": "Bengali", + "depth": 6, "iso_1_code": "bn", "iso_3_code": "ben", "children": [], + "family": "Indo-European", "tokenizers": { "Beng": { "full_object": "IndicNLPTokenizer(\"bn\")", @@ -4484,9 +4950,11 @@ }, { "name": "Bishnupuriya", + "depth": 6, "iso_1_code": null, "iso_3_code": "bpy", "children": [], + "family": "Indo-European", "tokenizers": { "Beng": { "full_object": "IndicNLPTokenizer(\"bn\")", @@ -4504,9 +4972,11 @@ }, { "name": "Chakma", + "depth": 6, "iso_1_code": null, "iso_3_code": "ccp", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"kmr\")", @@ -4524,9 +4994,11 @@ }, { "name": "Chittagonian", + "depth": 6, "iso_1_code": null, "iso_3_code": "ctg", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4199", "native_tokenizers": [], @@ -4534,9 +5006,11 @@ }, { "name": "Hajong", + "depth": 6, "iso_1_code": null, "iso_3_code": "haj", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4200", "native_tokenizers": [], @@ -4544,9 +5018,11 @@ }, { "name": "Halbi", + "depth": 6, "iso_1_code": null, "iso_3_code": "hlb", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4201", "native_tokenizers": [], @@ -4554,9 +5030,11 @@ }, { "name": "Kurmukar", + "depth": 6, "iso_1_code": null, "iso_3_code": "kfv", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4202", "native_tokenizers": [], @@ -4564,9 +5042,11 @@ }, { "name": "Kharia Thar", + "depth": 6, "iso_1_code": null, "iso_3_code": "ksy", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4203", "native_tokenizers": [], @@ -4574,9 +5054,11 @@ }, { "name": "Kewat", + "depth": 6, "iso_1_code": null, "iso_3_code": "kyv", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4204", "native_tokenizers": [], @@ -4584,9 +5066,11 @@ }, { "name": "Lodhi", + "depth": 6, "iso_1_code": null, "iso_3_code": "lbm", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4205", "native_tokenizers": [], @@ -4594,9 +5078,11 @@ }, { "name": "Mal Paharia", + "depth": 6, "iso_1_code": null, "iso_3_code": "mkb", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4206", "native_tokenizers": [], @@ -4604,9 +5090,11 @@ }, { "name": "Nahari", + "depth": 6, "iso_1_code": null, "iso_3_code": "nhh", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4207", "native_tokenizers": [], @@ -4614,9 +5102,11 @@ }, { "name": "Rohingya", + "depth": 6, "iso_1_code": null, "iso_3_code": "rhg", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"kmr\")", @@ -4634,9 +5124,11 @@ }, { "name": "Rajbanshi", + "depth": 6, "iso_1_code": null, "iso_3_code": "rjs", "children": [], + "family": "Indo-European", "tokenizers": { "Deva": { "full_object": "IndicNLPTokenizer(\"hi\")", @@ -4654,9 +5146,11 @@ }, { "name": "Rangpuri", + "depth": 6, "iso_1_code": null, "iso_3_code": "rkt", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4210", "native_tokenizers": [], @@ -4664,9 +5158,11 @@ }, { "name": "Sylheti", + "depth": 6, "iso_1_code": null, "iso_3_code": "syl", "children": [], + "family": "Indo-European", "tokenizers": { "Beng": { "full_object": "IndicNLPTokenizer(\"bn\")", @@ -4692,9 +5188,11 @@ }, { "name": "Tangchangya", + "depth": 6, "iso_1_code": null, "iso_3_code": "tnv", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4212", "native_tokenizers": [], @@ -4702,15 +5200,18 @@ }, { "name": "Mirgan", + "depth": 6, "iso_1_code": null, "iso_3_code": "zrg", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4213", "native_tokenizers": [], "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Beng": { "full_object": "IndicNLPTokenizer(\"bn\")", @@ -4740,14 +5241,17 @@ }, { "name": "Bihari", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bhojpuri", + "depth": 6, "iso_1_code": null, "iso_3_code": "bho", "children": [], + "family": "Indo-European", "tokenizers": { "Deva": { "full_object": "IndicNLPTokenizer(\"hi\")", @@ -4765,9 +5269,11 @@ }, { "name": "Hindustani, Sarnami", + "depth": 6, "iso_1_code": null, "iso_3_code": "hns", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"kmr\")", @@ -4785,9 +5291,11 @@ }, { "name": "Kudmali", + "depth": 6, "iso_1_code": null, "iso_3_code": "kyw", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4217", "native_tokenizers": [], @@ -4795,9 +5303,11 @@ }, { "name": "Magahi", + "depth": 6, "iso_1_code": null, "iso_3_code": "mag", "children": [], + "family": "Indo-European", "tokenizers": { "Deva": { "full_object": "IndicNLPTokenizer(\"hi\")", @@ -4815,9 +5325,11 @@ }, { "name": "Maithili", + "depth": 6, "iso_1_code": null, "iso_3_code": "mai", "children": [], + "family": "Indo-European", "tokenizers": { "Deva": { "full_object": "IndicNLPTokenizer(\"hi\")", @@ -4837,9 +5349,11 @@ }, { "name": "Majhi", + "depth": 6, "iso_1_code": null, "iso_3_code": "mjz", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4220", "native_tokenizers": [], @@ -4847,9 +5361,11 @@ }, { "name": "Sadri", + "depth": 6, "iso_1_code": null, "iso_3_code": "sck", "children": [], + "family": "Indo-European", "tokenizers": { "Deva": { "full_object": "IndicNLPTokenizer(\"hi\")", @@ -4867,9 +5383,11 @@ }, { "name": "Sadri, Oraon", + "depth": 6, "iso_1_code": null, "iso_3_code": "sdr", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4222", "native_tokenizers": [], @@ -4877,9 +5395,11 @@ }, { "name": "Surjapuri", + "depth": 6, "iso_1_code": null, "iso_3_code": "sjp", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4223", "native_tokenizers": [], @@ -4887,9 +5407,11 @@ }, { "name": "Musasa", + "depth": 6, "iso_1_code": null, "iso_3_code": "smm", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4224", "native_tokenizers": [], @@ -4897,9 +5419,11 @@ }, { "name": "Panchpargania", + "depth": 6, "iso_1_code": null, "iso_3_code": "tdb", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4225", "native_tokenizers": [], @@ -4907,15 +5431,18 @@ }, { "name": "Bajjika", + "depth": 6, "iso_1_code": null, "iso_3_code": "vjk", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4226", "native_tokenizers": [], "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Deva": { "full_object": "IndicNLPTokenizer(\"hi\")", @@ -4938,14 +5465,17 @@ }, { "name": "Oriya", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bodo Parja", + "depth": 6, "iso_1_code": null, "iso_3_code": "bdv", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4228", "native_tokenizers": [], @@ -4953,9 +5483,11 @@ }, { "name": "Bhatri", + "depth": 6, "iso_1_code": null, "iso_3_code": "bgw", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4229", "native_tokenizers": [], @@ -4963,9 +5495,11 @@ }, { "name": "Bhunjia", + "depth": 6, "iso_1_code": null, "iso_3_code": "bhu", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4230", "native_tokenizers": [], @@ -4973,9 +5507,11 @@ }, { "name": "Desiya", + "depth": 6, "iso_1_code": null, "iso_3_code": "dso", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4231", "native_tokenizers": [], @@ -4983,9 +5519,11 @@ }, { "name": "Kupia", + "depth": 6, "iso_1_code": null, "iso_3_code": "key", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4232", "native_tokenizers": [], @@ -4993,9 +5531,11 @@ }, { "name": "Oriya, Adivasi", + "depth": 6, "iso_1_code": null, "iso_3_code": "ort", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4233", "native_tokenizers": [], @@ -5003,9 +5543,11 @@ }, { "name": "Odia", + "depth": 6, "iso_1_code": "or", "iso_3_code": "ory", "children": [], + "family": "Indo-European", "tokenizers": { "Orya": { "full_object": "IndicNLPTokenizer(\"or\")", @@ -5033,9 +5575,11 @@ }, { "name": "Reli", + "depth": 6, "iso_1_code": null, "iso_3_code": "rei", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4235", "native_tokenizers": [], @@ -5043,15 +5587,18 @@ }, { "name": "Sambalpuri", + "depth": 6, "iso_1_code": "or", "iso_3_code": "spv", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4236", "native_tokenizers": [], "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Orya": { "full_object": "IndicNLPTokenizer(\"or\")", @@ -5074,14 +5621,17 @@ }, { "name": "Unclassified", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Angika", + "depth": 6, "iso_1_code": null, "iso_3_code": "anp", "children": [], + "family": "Indo-European", "tokenizers": { "Deva": { "full_object": "IndicNLPTokenizer(\"hi\")", @@ -5099,9 +5649,11 @@ }, { "name": "Bote", + "depth": 6, "iso_1_code": null, "iso_3_code": "bmj", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4239", "native_tokenizers": [], @@ -5109,15 +5661,18 @@ }, { "name": "Buksa", + "depth": 6, "iso_1_code": null, "iso_3_code": "tkb", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4240", "native_tokenizers": [], "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Deva": { "full_object": "IndicNLPTokenizer(\"hi\")", @@ -5132,6 +5687,7 @@ "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Beng": { "full_object": "IndicNLPTokenizer(\"bn\")", @@ -5168,24 +5724,29 @@ }, { "name": "Northwestern", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dardic", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chitral", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Khowar", + "depth": 7, "iso_1_code": null, "iso_3_code": "khw", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4244", "native_tokenizers": [], @@ -5193,15 +5754,18 @@ }, { "name": "Kalasha", + "depth": 7, "iso_1_code": null, "iso_3_code": "kls", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4245", "native_tokenizers": [], "scripts": [] } ], + "family": "Indo-European", "tokenizers": {}, "node_i": "4243", "native_tokenizers": [], @@ -5209,14 +5773,17 @@ }, { "name": "Kashmiri", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kashmiri", + "depth": 7, "iso_1_code": "ks", "iso_3_code": "kas", "children": [], + "family": "Indo-European", "tokenizers": { "Arab": { "full_object": "IndicNLPTokenizer(\"ur\")", @@ -5251,6 +5818,7 @@ ] } ], + "family": "Indo-European", "tokenizers": { "Arab": { "full_object": "IndicNLPTokenizer(\"ur\")", @@ -5280,14 +5848,17 @@ }, { "name": "Kohistani", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bateri", + "depth": 7, "iso_1_code": null, "iso_3_code": "btv", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4249", "native_tokenizers": [], @@ -5295,9 +5866,11 @@ }, { "name": "Chilisso", + "depth": 7, "iso_1_code": null, "iso_3_code": "clh", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4250", "native_tokenizers": [], @@ -5305,9 +5878,11 @@ }, { "name": "Gawri", + "depth": 7, "iso_1_code": null, "iso_3_code": "gwc", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4251", "native_tokenizers": [], @@ -5315,9 +5890,11 @@ }, { "name": "Gowro", + "depth": 7, "iso_1_code": null, "iso_3_code": "gwf", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4252", "native_tokenizers": [], @@ -5325,9 +5902,11 @@ }, { "name": "Kohistani, Indus", + "depth": 7, "iso_1_code": null, "iso_3_code": "mvy", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4253", "native_tokenizers": [], @@ -5335,9 +5914,11 @@ }, { "name": "Mankiyali", + "depth": 7, "iso_1_code": null, "iso_3_code": "nlm", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4254", "native_tokenizers": [], @@ -5345,9 +5926,11 @@ }, { "name": "Tirahi", + "depth": 7, "iso_1_code": null, "iso_3_code": "tra", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4255", "native_tokenizers": [], @@ -5355,9 +5938,11 @@ }, { "name": "Torwali", + "depth": 7, "iso_1_code": null, "iso_3_code": "trw", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4256", "native_tokenizers": [], @@ -5365,15 +5950,18 @@ }, { "name": "Degano", + "depth": 7, "iso_1_code": null, "iso_3_code": "wsv", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4257", "native_tokenizers": [], "scripts": [] } ], + "family": "Indo-European", "tokenizers": {}, "node_i": "4248", "native_tokenizers": [], @@ -5381,14 +5969,17 @@ }, { "name": "Kunar", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dameli", + "depth": 7, "iso_1_code": null, "iso_3_code": "dml", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4259", "native_tokenizers": [], @@ -5396,9 +5987,11 @@ }, { "name": "Gawar-Bati", + "depth": 7, "iso_1_code": null, "iso_3_code": "gwt", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4260", "native_tokenizers": [], @@ -5406,9 +5999,11 @@ }, { "name": "Grangali", + "depth": 7, "iso_1_code": null, "iso_3_code": "nli", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4261", "native_tokenizers": [], @@ -5416,15 +6011,18 @@ }, { "name": "Shumashti", + "depth": 7, "iso_1_code": null, "iso_3_code": "sts", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4262", "native_tokenizers": [], "scripts": [] } ], + "family": "Indo-European", "tokenizers": {}, "node_i": "4258", "native_tokenizers": [], @@ -5432,14 +6030,17 @@ }, { "name": "Pashai", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Pashai, Northeast", + "depth": 7, "iso_1_code": null, "iso_3_code": "aee", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4264", "native_tokenizers": [], @@ -5447,9 +6048,11 @@ }, { "name": "Pashai, Northwest", + "depth": 7, "iso_1_code": null, "iso_3_code": "glh", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4265", "native_tokenizers": [], @@ -5457,9 +6060,11 @@ }, { "name": "Pashai, Southwest", + "depth": 7, "iso_1_code": null, "iso_3_code": "psh", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4266", "native_tokenizers": [], @@ -5467,15 +6072,18 @@ }, { "name": "Pashai, Southeast", + "depth": 7, "iso_1_code": null, "iso_3_code": "psi", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4267", "native_tokenizers": [], "scripts": [] } ], + "family": "Indo-European", "tokenizers": {}, "node_i": "4263", "native_tokenizers": [], @@ -5483,14 +6091,17 @@ }, { "name": "Shina", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Brokskat", + "depth": 7, "iso_1_code": null, "iso_3_code": "bkk", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4269", "native_tokenizers": [], @@ -5498,9 +6109,11 @@ }, { "name": "Palula", + "depth": 7, "iso_1_code": null, "iso_3_code": "phl", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4270", "native_tokenizers": [], @@ -5508,9 +6121,11 @@ }, { "name": "Shina, Kohistani", + "depth": 7, "iso_1_code": null, "iso_3_code": "plk", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4271", "native_tokenizers": [], @@ -5518,9 +6133,11 @@ }, { "name": "Shina", + "depth": 7, "iso_1_code": null, "iso_3_code": "scl", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4272", "native_tokenizers": [], @@ -5528,9 +6145,11 @@ }, { "name": "Savi", + "depth": 7, "iso_1_code": null, "iso_3_code": "sdg", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4273", "native_tokenizers": [], @@ -5538,9 +6157,11 @@ }, { "name": "Kundal Shahi", + "depth": 7, "iso_1_code": null, "iso_3_code": "shd", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4274", "native_tokenizers": [], @@ -5548,9 +6169,11 @@ }, { "name": "Ushojo", + "depth": 7, "iso_1_code": null, "iso_3_code": "ush", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4275", "native_tokenizers": [], @@ -5558,21 +6181,25 @@ }, { "name": "Kalkoti", + "depth": 7, "iso_1_code": null, "iso_3_code": "xka", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4276", "native_tokenizers": [], "scripts": [] } ], + "family": "Indo-European", "tokenizers": {}, "node_i": "4268", "native_tokenizers": [], "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Arab": { "full_object": "IndicNLPTokenizer(\"ur\")", @@ -5602,14 +6229,17 @@ }, { "name": "Sindhi", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Jadgali", + "depth": 6, "iso_1_code": null, "iso_3_code": "jdg", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4278", "native_tokenizers": [], @@ -5617,9 +6247,11 @@ }, { "name": "Kacchi", + "depth": 6, "iso_1_code": null, "iso_3_code": "kfr", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4279", "native_tokenizers": [], @@ -5627,9 +6259,11 @@ }, { "name": "Lasi", + "depth": 6, "iso_1_code": null, "iso_3_code": "lss", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4280", "native_tokenizers": [], @@ -5637,9 +6271,11 @@ }, { "name": "Luwati", + "depth": 6, "iso_1_code": null, "iso_3_code": "luv", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4281", "native_tokenizers": [], @@ -5647,9 +6283,11 @@ }, { "name": "Sindhi Bhil", + "depth": 6, "iso_1_code": null, "iso_3_code": "sbn", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4282", "native_tokenizers": [], @@ -5657,9 +6295,11 @@ }, { "name": "Sindhi", + "depth": 6, "iso_1_code": "sd", "iso_3_code": "snd", "children": [], + "family": "Indo-European", "tokenizers": { "Arab": { "full_object": "IndicNLPTokenizer(\"ur\")", @@ -5694,6 +6334,7 @@ ] } ], + "family": "Indo-European", "tokenizers": { "Arab": { "full_object": "IndicNLPTokenizer(\"ur\")", @@ -5722,6 +6363,7 @@ "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Arab": { "full_object": "IndicNLPTokenizer(\"ur\")", @@ -5751,14 +6393,17 @@ }, { "name": "Southern", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Marathi", + "depth": 5, "iso_1_code": "mr", "iso_3_code": "mar", "children": [], + "family": "Indo-European", "tokenizers": { "Deva": { "full_object": "IndicNLPTokenizer(\"mr\")", @@ -5786,14 +6431,17 @@ }, { "name": "Konkani", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Konkani, Goan", + "depth": 6, "iso_1_code": null, "iso_3_code": "gom", "children": [], + "family": "Indo-European", "tokenizers": { "Deva": { "full_object": "IndicNLPTokenizer(\"kK\")", @@ -5821,9 +6469,11 @@ }, { "name": "Kukna", + "depth": 6, "iso_1_code": null, "iso_3_code": "kex", "children": [], + "family": "Indo-European", "tokenizers": { "Deva": { "full_object": "IndicNLPTokenizer(\"kK\")", @@ -5841,9 +6491,11 @@ }, { "name": "Katkari", + "depth": 6, "iso_1_code": null, "iso_3_code": "kfu", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4289", "native_tokenizers": [], @@ -5851,9 +6503,11 @@ }, { "name": "Konkani", + "depth": 6, "iso_1_code": null, "iso_3_code": "knn", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4290", "native_tokenizers": [], @@ -5861,9 +6515,11 @@ }, { "name": "Phudagi", + "depth": 6, "iso_1_code": null, "iso_3_code": "phd", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4291", "native_tokenizers": [], @@ -5871,9 +6527,11 @@ }, { "name": "Samvedi", + "depth": 6, "iso_1_code": null, "iso_3_code": "smv", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4292", "native_tokenizers": [], @@ -5881,15 +6539,18 @@ }, { "name": "Varli", + "depth": 6, "iso_1_code": null, "iso_3_code": "vav", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4293", "native_tokenizers": [], "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Deva": { "full_object": "IndicNLPTokenizer(\"kK\")", @@ -5912,14 +6573,17 @@ }, { "name": "Sinhalese-Maldivian", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Maldivian", + "depth": 6, "iso_1_code": "dv", "iso_3_code": "div", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4295", "native_tokenizers": [], @@ -5929,9 +6593,11 @@ }, { "name": "Sinhala", + "depth": 6, "iso_1_code": "si", "iso_3_code": "sin", "children": [], + "family": "Indo-European", "tokenizers": { "Sinh": { "full_object": "IndicNLPTokenizer(\"si\")", @@ -5951,15 +6617,18 @@ }, { "name": "Veddah", + "depth": 6, "iso_1_code": null, "iso_3_code": "ved", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4297", "native_tokenizers": [], "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Sinh": { "full_object": "IndicNLPTokenizer(\"si\")", @@ -5975,14 +6644,17 @@ }, { "name": "Unclassified", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bhalay", + "depth": 6, "iso_1_code": null, "iso_3_code": "bhx", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4299", "native_tokenizers": [], @@ -5990,9 +6662,11 @@ }, { "name": "Deccan", + "depth": 6, "iso_1_code": null, "iso_3_code": "dcc", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4300", "native_tokenizers": [], @@ -6000,9 +6674,11 @@ }, { "name": "Gowlan", + "depth": 6, "iso_1_code": null, "iso_3_code": "goj", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4301", "native_tokenizers": [], @@ -6010,21 +6686,25 @@ }, { "name": "Varhadi-Nagpuri", + "depth": 6, "iso_1_code": null, "iso_3_code": "vah", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4302", "native_tokenizers": [], "scripts": [] } ], + "family": "Indo-European", "tokenizers": {}, "node_i": "4298", "native_tokenizers": [], "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Deva": { "full_object": "IndicNLPTokenizer(\"mr\")", @@ -6053,6 +6733,7 @@ "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Beng": { "full_object": "IndicNLPTokenizer(\"bn\")", @@ -6103,14 +6784,17 @@ }, { "name": "Tharu", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tharu, Rana", + "depth": 4, "iso_1_code": null, "iso_3_code": "thr", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4304", "native_tokenizers": [], @@ -6118,9 +6802,11 @@ }, { "name": "Tharu, Kathariya", + "depth": 4, "iso_1_code": null, "iso_3_code": "tkt", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4305", "native_tokenizers": [], @@ -6128,14 +6814,17 @@ }, { "name": "Eastern Tharu", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tharu, Central", + "depth": 5, "iso_1_code": null, "iso_3_code": "the", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4307", "native_tokenizers": [], @@ -6143,9 +6832,11 @@ }, { "name": "Tharu, Dangaura", + "depth": 5, "iso_1_code": null, "iso_3_code": "thl", "children": [], + "family": "Indo-European", "tokenizers": { "Deva": { "full_object": "IndicNLPTokenizer(\"hi\")", @@ -6163,15 +6854,18 @@ }, { "name": "Tharu, Mid-Eastern", + "depth": 5, "iso_1_code": null, "iso_3_code": "thq", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4309", "native_tokenizers": [], "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Deva": { "full_object": "IndicNLPTokenizer(\"hi\")", @@ -6186,6 +6880,7 @@ "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Deva": { "full_object": "IndicNLPTokenizer(\"hi\")", @@ -6201,14 +6896,17 @@ }, { "name": "Unclassified", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Andh", + "depth": 4, "iso_1_code": null, "iso_3_code": "anr", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4311", "native_tokenizers": [], @@ -6216,9 +6914,11 @@ }, { "name": "Bazigar", + "depth": 4, "iso_1_code": null, "iso_3_code": "bfr", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4312", "native_tokenizers": [], @@ -6226,9 +6926,11 @@ }, { "name": "Chinali", + "depth": 4, "iso_1_code": null, "iso_3_code": "cih", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4313", "native_tokenizers": [], @@ -6236,9 +6938,11 @@ }, { "name": "Danuwar", + "depth": 4, "iso_1_code": null, "iso_3_code": "dhw", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4314", "native_tokenizers": [], @@ -6246,9 +6950,11 @@ }, { "name": "Darai", + "depth": 4, "iso_1_code": null, "iso_3_code": "dry", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4315", "native_tokenizers": [], @@ -6256,9 +6962,11 @@ }, { "name": "Dewas Rai", + "depth": 4, "iso_1_code": null, "iso_3_code": "dwz", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4316", "native_tokenizers": [], @@ -6266,9 +6974,11 @@ }, { "name": "Kanjari", + "depth": 4, "iso_1_code": null, "iso_3_code": "kft", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4317", "native_tokenizers": [], @@ -6276,9 +6986,11 @@ }, { "name": "Kumal", + "depth": 4, "iso_1_code": null, "iso_3_code": "kra", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4318", "native_tokenizers": [], @@ -6286,9 +6998,11 @@ }, { "name": "Lohar, Lahul", + "depth": 4, "iso_1_code": null, "iso_3_code": "lhl", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4319", "native_tokenizers": [], @@ -6296,9 +7010,11 @@ }, { "name": "Memoni", + "depth": 4, "iso_1_code": null, "iso_3_code": "mby", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4320", "native_tokenizers": [], @@ -6306,9 +7022,11 @@ }, { "name": "Oadki", + "depth": 4, "iso_1_code": null, "iso_3_code": "odk", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4321", "native_tokenizers": [], @@ -6316,9 +7034,11 @@ }, { "name": "Pali", + "depth": 4, "iso_1_code": "pi", "iso_3_code": "pli", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4322", "native_tokenizers": [], @@ -6326,15 +7046,18 @@ }, { "name": "Vaagri Booli", + "depth": 4, "iso_1_code": null, "iso_3_code": "vaa", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4323", "native_tokenizers": [], "scripts": [] } ], + "family": "Indo-European", "tokenizers": {}, "node_i": "4310", "native_tokenizers": [], @@ -6342,25 +7065,30 @@ }, { "name": "Western Hindi", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bundeli", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bundeli", + "depth": 5, "iso_1_code": null, "iso_3_code": "bns", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4326", "native_tokenizers": [], "scripts": [] } ], + "family": "Indo-European", "tokenizers": {}, "node_i": "4325", "native_tokenizers": [], @@ -6368,14 +7096,17 @@ }, { "name": "Hindustani", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Hindi", + "depth": 5, "iso_1_code": "hi", "iso_3_code": "hin", "children": [], + "family": "Indo-European", "tokenizers": { "Deva": { "full_object": "IndicNLPTokenizer(\"hi\")", @@ -6403,9 +7134,11 @@ }, { "name": "Urdu", + "depth": 5, "iso_1_code": "ur", "iso_3_code": "urd", "children": [], + "family": "Indo-European", "tokenizers": { "Arab": { "full_object": "IndicNLPTokenizer(\"ur\")", @@ -6433,14 +7166,17 @@ }, { "name": "Sansi", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kabutra", + "depth": 6, "iso_1_code": null, "iso_3_code": "kbu", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4331", "native_tokenizers": [], @@ -6448,21 +7184,25 @@ }, { "name": "Sansi", + "depth": 6, "iso_1_code": null, "iso_3_code": "ssi", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4332", "native_tokenizers": [], "scripts": [] } ], + "family": "Indo-European", "tokenizers": {}, "node_i": "4330", "native_tokenizers": [], "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Deva": { "full_object": "IndicNLPTokenizer(\"hi\")", @@ -6492,14 +7232,17 @@ }, { "name": "Unclassified", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Haryanvi", + "depth": 5, "iso_1_code": null, "iso_3_code": "bgc", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4334", "native_tokenizers": [], @@ -6507,9 +7250,11 @@ }, { "name": "Bhaya", + "depth": 5, "iso_1_code": null, "iso_3_code": "bhe", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4335", "native_tokenizers": [], @@ -6517,9 +7262,11 @@ }, { "name": "Kanauji", + "depth": 5, "iso_1_code": null, "iso_3_code": "bjj", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4336", "native_tokenizers": [], @@ -6527,9 +7274,11 @@ }, { "name": "Braj Bhasha", + "depth": 5, "iso_1_code": null, "iso_3_code": "bra", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4337", "native_tokenizers": [], @@ -6537,9 +7286,11 @@ }, { "name": "Ghera", + "depth": 5, "iso_1_code": null, "iso_3_code": "ghr", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4338", "native_tokenizers": [], @@ -6547,21 +7298,25 @@ }, { "name": "Gowli", + "depth": 5, "iso_1_code": null, "iso_3_code": "gok", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4339", "native_tokenizers": [], "scripts": [] } ], + "family": "Indo-European", "tokenizers": {}, "node_i": "4333", "native_tokenizers": [], "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Deva": { "full_object": "IndicNLPTokenizer(\"hi\")", @@ -6590,6 +7345,7 @@ "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Deva": { "full_object": "IndicNLPTokenizer(\"hi\")", @@ -6646,20 +7402,6 @@ "original_lang_code": "kmr", "script": "Latn", "class_name": "StanzaTokenizer" - }, - "Cyrl": { - "full_object": "SpaCyTokenizer(\"ru\")", - "original_lang_name": "russian", - "original_lang_code": "rus", - "script": "Cyrl", - "class_name": "SpaCyTokenizer" - }, - "Grek": { - "full_object": "SpaCyTokenizer(\"el\")", - "original_lang_name": "greek", - "original_lang_code": "ell", - "script": "Grek", - "class_name": "SpaCyTokenizer" } }, "node_i": "4068", @@ -6668,14 +7410,17 @@ }, { "name": "Iranian", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Avestan", + "depth": 3, "iso_1_code": "ae", "iso_3_code": "ave", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4341", "native_tokenizers": [], @@ -6683,28 +7428,24 @@ }, { "name": "Eastern", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Northeastern", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ossetic", + "depth": 5, "iso_1_code": "os", "iso_3_code": "oss", "children": [], - "tokenizers": { - "Cyrl": { - "full_object": "SpaCyTokenizer(\"ru\")", - "original_lang_name": "russian", - "original_lang_code": "rus", - "script": "Cyrl", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Indo-European", + "tokenizers": {}, "node_i": "4344", "native_tokenizers": [], "scripts": [ @@ -6713,9 +7454,11 @@ }, { "name": "Yagnobi", + "depth": 5, "iso_1_code": null, "iso_3_code": "yai", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4345", "native_tokenizers": [], @@ -6723,43 +7466,42 @@ }, { "name": "Yassic", + "depth": 5, "iso_1_code": null, "iso_3_code": "ysc", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4346", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Cyrl": { - "full_object": "SpaCyTokenizer(\"ru\")", - "original_lang_name": "russian", - "original_lang_code": "rus", - "script": "Cyrl", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Indo-European", + "tokenizers": {}, "node_i": "4343", "native_tokenizers": [], "scripts": [] }, { "name": "Southeastern", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Pamir", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ishkashimi", + "depth": 6, "iso_1_code": null, "iso_3_code": "isk", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4349", "native_tokenizers": [], @@ -6767,9 +7509,11 @@ }, { "name": "Munji", + "depth": 6, "iso_1_code": null, "iso_3_code": "mnj", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4350", "native_tokenizers": [], @@ -6777,9 +7521,11 @@ }, { "name": "Sanglechi", + "depth": 6, "iso_1_code": null, "iso_3_code": "sgy", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4351", "native_tokenizers": [], @@ -6787,9 +7533,11 @@ }, { "name": "Wakhi", + "depth": 6, "iso_1_code": null, "iso_3_code": "wbl", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4352", "native_tokenizers": [], @@ -6797,9 +7545,11 @@ }, { "name": "Yadgha", + "depth": 6, "iso_1_code": null, "iso_3_code": "ydg", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4353", "native_tokenizers": [], @@ -6807,23 +7557,18 @@ }, { "name": "Shugni-Yazgulami", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Shughni", + "depth": 7, "iso_1_code": null, "iso_3_code": "sgh", "children": [], - "tokenizers": { - "Cyrl": { - "full_object": "SpaCyTokenizer(\"ru\")", - "original_lang_name": "russian", - "original_lang_code": "rus", - "script": "Cyrl", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Indo-European", + "tokenizers": {}, "node_i": "4355", "native_tokenizers": [], "scripts": [ @@ -6832,9 +7577,11 @@ }, { "name": "Sarikoli", + "depth": 7, "iso_1_code": null, "iso_3_code": "srh", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4356", "native_tokenizers": [], @@ -6842,52 +7589,43 @@ }, { "name": "Yazghulami", + "depth": 7, "iso_1_code": null, "iso_3_code": "yah", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4357", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Cyrl": { - "full_object": "SpaCyTokenizer(\"ru\")", - "original_lang_name": "russian", - "original_lang_code": "rus", - "script": "Cyrl", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Indo-European", + "tokenizers": {}, "node_i": "4354", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Cyrl": { - "full_object": "SpaCyTokenizer(\"ru\")", - "original_lang_name": "russian", - "original_lang_code": "rus", - "script": "Cyrl", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Indo-European", + "tokenizers": {}, "node_i": "4348", "native_tokenizers": [], "scripts": [] }, { "name": "Pashto", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Pashto, Southern", + "depth": 6, "iso_1_code": "ps", "iso_3_code": "pbt", "children": [], + "family": "Indo-European", "tokenizers": { "Arab": { "full_object": "IndicNLPTokenizer(\"ur\")", @@ -6905,9 +7643,11 @@ }, { "name": "Pashto, Northern", + "depth": 6, "iso_1_code": "ps", "iso_3_code": "pbu", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4360", "native_tokenizers": [], @@ -6915,9 +7655,11 @@ }, { "name": "Pashto, Central", + "depth": 6, "iso_1_code": "ps", "iso_3_code": "pst", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4361", "native_tokenizers": [], @@ -6925,15 +7667,18 @@ }, { "name": "Waneci", + "depth": 6, "iso_1_code": null, "iso_3_code": "wne", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4362", "native_tokenizers": [], "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Arab": { "full_object": "IndicNLPTokenizer(\"ur\")", @@ -6948,6 +7693,7 @@ "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Arab": { "full_object": "IndicNLPTokenizer(\"ur\")", @@ -6955,13 +7701,6 @@ "original_lang_code": "urd", "script": "Arab", "class_name": "IndicNLPTokenizer" - }, - "Cyrl": { - "full_object": "SpaCyTokenizer(\"ru\")", - "original_lang_name": "russian", - "original_lang_code": "rus", - "script": "Cyrl", - "class_name": "SpaCyTokenizer" } }, "node_i": "4347", @@ -6969,6 +7708,7 @@ "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Arab": { "full_object": "IndicNLPTokenizer(\"ur\")", @@ -6976,13 +7716,6 @@ "original_lang_code": "urd", "script": "Arab", "class_name": "IndicNLPTokenizer" - }, - "Cyrl": { - "full_object": "SpaCyTokenizer(\"ru\")", - "original_lang_name": "russian", - "original_lang_code": "rus", - "script": "Cyrl", - "class_name": "SpaCyTokenizer" } }, "node_i": "4342", @@ -6991,24 +7724,29 @@ }, { "name": "Western", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Northwestern", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Balochi", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Balochi, Southern", + "depth": 6, "iso_1_code": null, "iso_3_code": "bcc", "children": [], + "family": "Indo-European", "tokenizers": { "Arab": { "full_object": "IndicNLPTokenizer(\"ur\")", @@ -7026,9 +7764,11 @@ }, { "name": "Balochi, Western", + "depth": 6, "iso_1_code": null, "iso_3_code": "bgn", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4367", "native_tokenizers": [], @@ -7036,9 +7776,11 @@ }, { "name": "Balochi, Eastern", + "depth": 6, "iso_1_code": null, "iso_3_code": "bgp", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4368", "native_tokenizers": [], @@ -7046,9 +7788,11 @@ }, { "name": "Bashkardi", + "depth": 6, "iso_1_code": null, "iso_3_code": "bsg", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4369", "native_tokenizers": [], @@ -7056,15 +7800,18 @@ }, { "name": "Koroshi", + "depth": 6, "iso_1_code": null, "iso_3_code": "ktl", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4370", "native_tokenizers": [], "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Arab": { "full_object": "IndicNLPTokenizer(\"ur\")", @@ -7080,14 +7827,17 @@ }, { "name": "Caspian", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Gilaki", + "depth": 6, "iso_1_code": null, "iso_3_code": "glk", "children": [], + "family": "Indo-European", "tokenizers": { "Arab": { "full_object": "IndicNLPTokenizer(\"ur\")", @@ -7105,9 +7855,11 @@ }, { "name": "Mazandarani", + "depth": 6, "iso_1_code": null, "iso_3_code": "mzn", "children": [], + "family": "Indo-European", "tokenizers": { "Arab": { "full_object": "IndicNLPTokenizer(\"ur\")", @@ -7125,15 +7877,18 @@ }, { "name": "Shahmirzadi", + "depth": 6, "iso_1_code": null, "iso_3_code": "srz", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4374", "native_tokenizers": [], "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Arab": { "full_object": "IndicNLPTokenizer(\"ur\")", @@ -7149,14 +7904,17 @@ }, { "name": "Central Iran", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ashtiani", + "depth": 6, "iso_1_code": null, "iso_3_code": "atn", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4376", "native_tokenizers": [], @@ -7164,9 +7922,11 @@ }, { "name": "Dari, Zoroastrian", + "depth": 6, "iso_1_code": null, "iso_3_code": "gbz", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4377", "native_tokenizers": [], @@ -7174,9 +7934,11 @@ }, { "name": "Gazi", + "depth": 6, "iso_1_code": null, "iso_3_code": "gzi", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4378", "native_tokenizers": [], @@ -7184,9 +7946,11 @@ }, { "name": "Khunsari", + "depth": 6, "iso_1_code": null, "iso_3_code": "kfm", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4379", "native_tokenizers": [], @@ -7194,9 +7958,11 @@ }, { "name": "Natanzi", + "depth": 6, "iso_1_code": null, "iso_3_code": "ntz", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4380", "native_tokenizers": [], @@ -7204,9 +7970,11 @@ }, { "name": "Nayini", + "depth": 6, "iso_1_code": null, "iso_3_code": "nyq", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4381", "native_tokenizers": [], @@ -7214,9 +7982,11 @@ }, { "name": "Parsi-Dari", + "depth": 6, "iso_1_code": null, "iso_3_code": "prd", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4382", "native_tokenizers": [], @@ -7224,9 +7994,11 @@ }, { "name": "Sivandi", + "depth": 6, "iso_1_code": null, "iso_3_code": "siy", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4383", "native_tokenizers": [], @@ -7234,9 +8006,11 @@ }, { "name": "Soi", + "depth": 6, "iso_1_code": null, "iso_3_code": "soj", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4384", "native_tokenizers": [], @@ -7244,15 +8018,18 @@ }, { "name": "Vafsi", + "depth": 6, "iso_1_code": null, "iso_3_code": "vaf", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4385", "native_tokenizers": [], "scripts": [] } ], + "family": "Indo-European", "tokenizers": {}, "node_i": "4375", "native_tokenizers": [], @@ -7260,14 +8037,17 @@ }, { "name": "Kurdish", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kurdish, Central", + "depth": 6, "iso_1_code": "ku", "iso_3_code": "ckb", "children": [], + "family": "Indo-European", "tokenizers": { "Arab": { "full_object": "IndicNLPTokenizer(\"ur\")", @@ -7285,9 +8065,11 @@ }, { "name": "Kurdish, Northern", + "depth": 6, "iso_1_code": "ku", "iso_3_code": "kmr", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"kmr\")", @@ -7295,13 +8077,6 @@ "original_lang_code": "kmr", "script": "Latn", "class_name": "StanzaTokenizer" - }, - "Cyrl": { - "full_object": "SpaCyTokenizer(\"ru\")", - "original_lang_name": "russian", - "original_lang_code": "rus", - "script": "Cyrl", - "class_name": "SpaCyTokenizer" } }, "node_i": "4388", @@ -7315,9 +8090,11 @@ }, { "name": "Laki", + "depth": 6, "iso_1_code": null, "iso_3_code": "lki", "children": [], + "family": "Indo-European", "tokenizers": { "Arab": { "full_object": "IndicNLPTokenizer(\"ur\")", @@ -7335,9 +8112,11 @@ }, { "name": "Kurdish, Southern", + "depth": 6, "iso_1_code": "ku", "iso_3_code": "sdh", "children": [], + "family": "Indo-European", "tokenizers": { "Arab": { "full_object": "IndicNLPTokenizer(\"ur\")", @@ -7354,6 +8133,7 @@ ] } ], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"kmr\")", @@ -7368,13 +8148,6 @@ "original_lang_code": "urd", "script": "Arab", "class_name": "IndicNLPTokenizer" - }, - "Cyrl": { - "full_object": "SpaCyTokenizer(\"ru\")", - "original_lang_name": "russian", - "original_lang_code": "rus", - "script": "Cyrl", - "class_name": "SpaCyTokenizer" } }, "node_i": "4386", @@ -7383,14 +8156,17 @@ }, { "name": "Ormuri-Parachi", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ormuri", + "depth": 6, "iso_1_code": null, "iso_3_code": "oru", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4392", "native_tokenizers": [], @@ -7398,15 +8174,18 @@ }, { "name": "Parachi", + "depth": 6, "iso_1_code": null, "iso_3_code": "prc", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4393", "native_tokenizers": [], "scripts": [] } ], + "family": "Indo-European", "tokenizers": {}, "node_i": "4391", "native_tokenizers": [], @@ -7414,14 +8193,17 @@ }, { "name": "Semnani", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Lasgerdi", + "depth": 6, "iso_1_code": null, "iso_3_code": "lsa", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4395", "native_tokenizers": [], @@ -7429,9 +8211,11 @@ }, { "name": "Sangisari", + "depth": 6, "iso_1_code": null, "iso_3_code": "sgr", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4396", "native_tokenizers": [], @@ -7439,9 +8223,11 @@ }, { "name": "Semnani", + "depth": 6, "iso_1_code": null, "iso_3_code": "smy", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4397", "native_tokenizers": [], @@ -7449,15 +8235,18 @@ }, { "name": "Sorkhei", + "depth": 6, "iso_1_code": null, "iso_3_code": "sqo", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4398", "native_tokenizers": [], "scripts": [] } ], + "family": "Indo-European", "tokenizers": {}, "node_i": "4394", "native_tokenizers": [], @@ -7465,14 +8254,17 @@ }, { "name": "Talysh", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Alviri-Vidari", + "depth": 6, "iso_1_code": null, "iso_3_code": "avd", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4400", "native_tokenizers": [], @@ -7480,9 +8272,11 @@ }, { "name": "Eshtehardi", + "depth": 6, "iso_1_code": null, "iso_3_code": "esh", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4401", "native_tokenizers": [], @@ -7490,9 +8284,11 @@ }, { "name": "Gozarkhani", + "depth": 6, "iso_1_code": null, "iso_3_code": "goz", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4402", "native_tokenizers": [], @@ -7500,9 +8296,11 @@ }, { "name": "Harzani", + "depth": 6, "iso_1_code": null, "iso_3_code": "hrz", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4403", "native_tokenizers": [], @@ -7510,9 +8308,11 @@ }, { "name": "Karingani", + "depth": 6, "iso_1_code": null, "iso_3_code": "kgn", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4404", "native_tokenizers": [], @@ -7520,9 +8320,11 @@ }, { "name": "Koresh-e Rostam", + "depth": 6, "iso_1_code": null, "iso_3_code": "okh", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4405", "native_tokenizers": [], @@ -7530,9 +8332,11 @@ }, { "name": "Razajerdi", + "depth": 6, "iso_1_code": null, "iso_3_code": "rat", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4406", "native_tokenizers": [], @@ -7540,9 +8344,11 @@ }, { "name": "Rudbari", + "depth": 6, "iso_1_code": null, "iso_3_code": "rdb", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4407", "native_tokenizers": [], @@ -7550,9 +8356,11 @@ }, { "name": "Shahrudi", + "depth": 6, "iso_1_code": null, "iso_3_code": "shm", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4408", "native_tokenizers": [], @@ -7560,9 +8368,11 @@ }, { "name": "Takestani", + "depth": 6, "iso_1_code": null, "iso_3_code": "tks", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4409", "native_tokenizers": [], @@ -7570,9 +8380,11 @@ }, { "name": "Talysh", + "depth": 6, "iso_1_code": null, "iso_3_code": "tly", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"kmr\")", @@ -7590,9 +8402,11 @@ }, { "name": "Taromi, Upper", + "depth": 6, "iso_1_code": null, "iso_3_code": "tov", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4411", "native_tokenizers": [], @@ -7600,9 +8414,11 @@ }, { "name": "Maraghei", + "depth": 6, "iso_1_code": null, "iso_3_code": "vmh", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4412", "native_tokenizers": [], @@ -7610,9 +8426,11 @@ }, { "name": "Kho\u2019ini", + "depth": 6, "iso_1_code": null, "iso_3_code": "xkc", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4413", "native_tokenizers": [], @@ -7620,9 +8438,11 @@ }, { "name": "Kajali", + "depth": 6, "iso_1_code": null, "iso_3_code": "xkj", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4414", "native_tokenizers": [], @@ -7630,15 +8450,18 @@ }, { "name": "Kabatei", + "depth": 6, "iso_1_code": null, "iso_3_code": "xkp", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4415", "native_tokenizers": [], "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"kmr\")", @@ -7654,20 +8477,24 @@ }, { "name": "Unclassified", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dezfuli", + "depth": 6, "iso_1_code": null, "iso_3_code": "def", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4417", "native_tokenizers": [], "scripts": [] } ], + "family": "Indo-European", "tokenizers": {}, "node_i": "4416", "native_tokenizers": [], @@ -7675,14 +8502,17 @@ }, { "name": "Zaza-Gorani", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bajelani", + "depth": 6, "iso_1_code": null, "iso_3_code": "bjm", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4419", "native_tokenizers": [], @@ -7690,9 +8520,11 @@ }, { "name": "Zazaki, Southern", + "depth": 6, "iso_1_code": null, "iso_3_code": "diq", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"kmr\")", @@ -7710,9 +8542,11 @@ }, { "name": "Gurani", + "depth": 6, "iso_1_code": null, "iso_3_code": "hac", "children": [], + "family": "Indo-European", "tokenizers": { "Arab": { "full_object": "IndicNLPTokenizer(\"ur\")", @@ -7730,9 +8564,11 @@ }, { "name": "Zazaki, Northern", + "depth": 6, "iso_1_code": null, "iso_3_code": "kiu", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"kmr\")", @@ -7750,9 +8586,11 @@ }, { "name": "Shabak", + "depth": 6, "iso_1_code": null, "iso_3_code": "sdb", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4423", "native_tokenizers": [], @@ -7760,15 +8598,18 @@ }, { "name": "Sarli", + "depth": 6, "iso_1_code": null, "iso_3_code": "sdf", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4424", "native_tokenizers": [], "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"kmr\")", @@ -7790,6 +8631,7 @@ "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"kmr\")", @@ -7804,13 +8646,6 @@ "original_lang_code": "urd", "script": "Arab", "class_name": "IndicNLPTokenizer" - }, - "Cyrl": { - "full_object": "SpaCyTokenizer(\"ru\")", - "original_lang_name": "russian", - "original_lang_code": "rus", - "script": "Cyrl", - "class_name": "SpaCyTokenizer" } }, "node_i": "4364", @@ -7819,19 +8654,23 @@ }, { "name": "Southwestern", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Fars", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Fars, Southwestern", + "depth": 6, "iso_1_code": null, "iso_3_code": "fay", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4427", "native_tokenizers": [], @@ -7839,15 +8678,18 @@ }, { "name": "Lari", + "depth": 6, "iso_1_code": null, "iso_3_code": "lrl", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4428", "native_tokenizers": [], "scripts": [] } ], + "family": "Indo-European", "tokenizers": {}, "node_i": "4426", "native_tokenizers": [], @@ -7855,14 +8697,17 @@ }, { "name": "Luri", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bakhti\u00e2ri", + "depth": 6, "iso_1_code": null, "iso_3_code": "bqi", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4430", "native_tokenizers": [], @@ -7870,9 +8715,11 @@ }, { "name": "Luri, Northern", + "depth": 6, "iso_1_code": null, "iso_3_code": "lrc", "children": [], + "family": "Indo-European", "tokenizers": { "Arab": { "full_object": "IndicNLPTokenizer(\"ur\")", @@ -7890,9 +8737,11 @@ }, { "name": "Luri, Southern", + "depth": 6, "iso_1_code": null, "iso_3_code": "luz", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4432", "native_tokenizers": [], @@ -7900,15 +8749,18 @@ }, { "name": "Kumzari", + "depth": 6, "iso_1_code": null, "iso_3_code": "zum", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4433", "native_tokenizers": [], "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Arab": { "full_object": "IndicNLPTokenizer(\"ur\")", @@ -7924,14 +8776,17 @@ }, { "name": "Persian", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Aimaq", + "depth": 6, "iso_1_code": null, "iso_3_code": "aiq", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4435", "native_tokenizers": [], @@ -7939,9 +8794,11 @@ }, { "name": "Bukharic", + "depth": 6, "iso_1_code": null, "iso_3_code": "bhh", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4436", "native_tokenizers": [], @@ -7949,9 +8806,11 @@ }, { "name": "Dehwari", + "depth": 6, "iso_1_code": null, "iso_3_code": "deh", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4437", "native_tokenizers": [], @@ -7959,9 +8818,11 @@ }, { "name": "Hazaragi", + "depth": 6, "iso_1_code": null, "iso_3_code": "haz", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4438", "native_tokenizers": [], @@ -7969,9 +8830,11 @@ }, { "name": "Dzhidi", + "depth": 6, "iso_1_code": null, "iso_3_code": "jpr", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4439", "native_tokenizers": [], @@ -7979,9 +8842,11 @@ }, { "name": "Persian, Iranian", + "depth": 6, "iso_1_code": "fa", "iso_3_code": "pes", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4440", "native_tokenizers": [], @@ -7989,9 +8854,11 @@ }, { "name": "Pahlavani", + "depth": 6, "iso_1_code": null, "iso_3_code": "phv", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4441", "native_tokenizers": [], @@ -7999,9 +8866,11 @@ }, { "name": "Dari", + "depth": 6, "iso_1_code": "fa", "iso_3_code": "prs", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4442", "native_tokenizers": [], @@ -8009,18 +8878,12 @@ }, { "name": "Tajik", + "depth": 6, "iso_1_code": "tg", "iso_3_code": "tgk", "children": [], - "tokenizers": { - "Cyrl": { - "full_object": "SpaCyTokenizer(\"ru\")", - "original_lang_name": "russian", - "original_lang_code": "rus", - "script": "Cyrl", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Indo-European", + "tokenizers": {}, "node_i": "4443", "native_tokenizers": [], "scripts": [ @@ -8028,29 +8891,25 @@ ] } ], - "tokenizers": { - "Cyrl": { - "full_object": "SpaCyTokenizer(\"ru\")", - "original_lang_name": "russian", - "original_lang_code": "rus", - "script": "Cyrl", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Indo-European", + "tokenizers": {}, "node_i": "4434", "native_tokenizers": [], "scripts": [] }, { "name": "Tat", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Judeo-Tat", + "depth": 6, "iso_1_code": null, "iso_3_code": "jdt", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4445", "native_tokenizers": [], @@ -8058,21 +8917,25 @@ }, { "name": "Tat, Muslim", + "depth": 6, "iso_1_code": null, "iso_3_code": "ttt", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4446", "native_tokenizers": [], "scripts": [] } ], + "family": "Indo-European", "tokenizers": {}, "node_i": "4444", "native_tokenizers": [], "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Arab": { "full_object": "IndicNLPTokenizer(\"ur\")", @@ -8080,13 +8943,6 @@ "original_lang_code": "urd", "script": "Arab", "class_name": "IndicNLPTokenizer" - }, - "Cyrl": { - "full_object": "SpaCyTokenizer(\"ru\")", - "original_lang_name": "russian", - "original_lang_code": "rus", - "script": "Cyrl", - "class_name": "SpaCyTokenizer" } }, "node_i": "4425", @@ -8094,6 +8950,7 @@ "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"kmr\")", @@ -8108,13 +8965,6 @@ "original_lang_code": "urd", "script": "Arab", "class_name": "IndicNLPTokenizer" - }, - "Cyrl": { - "full_object": "SpaCyTokenizer(\"ru\")", - "original_lang_name": "russian", - "original_lang_code": "rus", - "script": "Cyrl", - "class_name": "SpaCyTokenizer" } }, "node_i": "4363", @@ -8122,6 +8972,7 @@ "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"kmr\")", @@ -8136,13 +8987,6 @@ "original_lang_code": "urd", "script": "Arab", "class_name": "IndicNLPTokenizer" - }, - "Cyrl": { - "full_object": "SpaCyTokenizer(\"ru\")", - "original_lang_name": "russian", - "original_lang_code": "rus", - "script": "Cyrl", - "class_name": "SpaCyTokenizer" } }, "node_i": "4340", @@ -8151,14 +8995,17 @@ }, { "name": "Nuristani", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ashkun", + "depth": 3, "iso_1_code": null, "iso_3_code": "ask", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4448", "native_tokenizers": [], @@ -8166,9 +9013,11 @@ }, { "name": "Kateviri", + "depth": 3, "iso_1_code": null, "iso_3_code": "bsh", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4449", "native_tokenizers": [], @@ -8176,9 +9025,11 @@ }, { "name": "Prasuni", + "depth": 3, "iso_1_code": null, "iso_3_code": "prn", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4450", "native_tokenizers": [], @@ -8186,9 +9037,11 @@ }, { "name": "Tregami", + "depth": 3, "iso_1_code": null, "iso_3_code": "trm", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4451", "native_tokenizers": [], @@ -8196,9 +9049,11 @@ }, { "name": "Waigali", + "depth": 3, "iso_1_code": null, "iso_3_code": "wbk", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4452", "native_tokenizers": [], @@ -8206,15 +9061,18 @@ }, { "name": "Komviri", + "depth": 3, "iso_1_code": null, "iso_3_code": "xvi", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4453", "native_tokenizers": [], "scripts": [] } ], + "family": "Indo-European", "tokenizers": {}, "node_i": "4447", "native_tokenizers": [], @@ -8222,26 +9080,31 @@ }, { "name": "Unclassified", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Badeshi", + "depth": 3, "iso_1_code": null, "iso_3_code": "bdz", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4455", "native_tokenizers": [], "scripts": [] } ], + "family": "Indo-European", "tokenizers": {}, "node_i": "4454", "native_tokenizers": [], "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Deva": { "full_object": "IndicNLPTokenizer(\"hi\")", @@ -8298,20 +9161,6 @@ "original_lang_code": "kmr", "script": "Latn", "class_name": "StanzaTokenizer" - }, - "Cyrl": { - "full_object": "SpaCyTokenizer(\"ru\")", - "original_lang_name": "russian", - "original_lang_code": "rus", - "script": "Cyrl", - "class_name": "SpaCyTokenizer" - }, - "Grek": { - "full_object": "SpaCyTokenizer(\"el\")", - "original_lang_name": "greek", - "original_lang_code": "ell", - "script": "Grek", - "class_name": "SpaCyTokenizer" } }, "node_i": "4067", @@ -8320,19 +9169,23 @@ }, { "name": "Italic", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Latino-Faliscan", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Latin", + "depth": 3, "iso_1_code": "la", "iso_3_code": "lat", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"la\")", @@ -8351,6 +9204,7 @@ ] } ], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"la\")", @@ -8366,19 +9220,23 @@ }, { "name": "Romance", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Eastern", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Romanian", + "depth": 4, "iso_1_code": "ro", "iso_3_code": "ron", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ro\")", @@ -8386,13 +9244,6 @@ "original_lang_code": "ron", "script": "Latn", "class_name": "SpaCyTokenizer" - }, - "Cyrl": { - "full_object": "SpaCyTokenizer(\"ru\")", - "original_lang_name": "russian", - "original_lang_code": "rus", - "script": "Cyrl", - "class_name": "SpaCyTokenizer" } }, "node_i": "4461", @@ -8406,9 +9257,11 @@ }, { "name": "Romanian, Istro", + "depth": 4, "iso_1_code": null, "iso_3_code": "ruo", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4462", "native_tokenizers": [], @@ -8416,9 +9269,11 @@ }, { "name": "Aromanian", + "depth": 4, "iso_1_code": null, "iso_3_code": "rup", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ro\")", @@ -8436,15 +9291,18 @@ }, { "name": "Romanian, Megleno", + "depth": 4, "iso_1_code": null, "iso_3_code": "ruq", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4464", "native_tokenizers": [], "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ro\")", @@ -8452,13 +9310,6 @@ "original_lang_code": "ron", "script": "Latn", "class_name": "SpaCyTokenizer" - }, - "Cyrl": { - "full_object": "SpaCyTokenizer(\"ru\")", - "original_lang_name": "russian", - "original_lang_code": "rus", - "script": "Cyrl", - "class_name": "SpaCyTokenizer" } }, "node_i": "4460", @@ -8467,19 +9318,23 @@ }, { "name": "Italo-Western", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Italo-Dalmatian", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dalmatian", + "depth": 5, "iso_1_code": null, "iso_3_code": "dlm", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4467", "native_tokenizers": [], @@ -8487,9 +9342,11 @@ }, { "name": "Istriot", + "depth": 5, "iso_1_code": null, "iso_3_code": "ist", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4468", "native_tokenizers": [], @@ -8497,9 +9354,11 @@ }, { "name": "Italian", + "depth": 5, "iso_1_code": "it", "iso_3_code": "ita", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"it\")", @@ -8519,9 +9378,11 @@ }, { "name": "Judeo-Italian", + "depth": 5, "iso_1_code": null, "iso_3_code": "itk", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4470", "native_tokenizers": [], @@ -8529,9 +9390,11 @@ }, { "name": "Napoletano", + "depth": 5, "iso_1_code": null, "iso_3_code": "nap", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"it\")", @@ -8549,9 +9412,11 @@ }, { "name": "Sicilian", + "depth": 5, "iso_1_code": null, "iso_3_code": "scn", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"it\")", @@ -8568,6 +9433,7 @@ ] } ], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"it\")", @@ -8583,29 +9449,35 @@ }, { "name": "Western", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Gallo-Iberian", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Gallo-Romance", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Gallo-Italian", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Emilian", + "depth": 8, "iso_1_code": null, "iso_3_code": "egl", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4477", "native_tokenizers": [], @@ -8613,9 +9485,11 @@ }, { "name": "Ligurian", + "depth": 8, "iso_1_code": null, "iso_3_code": "lij", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"lij\")", @@ -8635,9 +9509,11 @@ }, { "name": "Lombard", + "depth": 8, "iso_1_code": null, "iso_3_code": "lmo", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"lij\")", @@ -8655,9 +9531,11 @@ }, { "name": "Piedmontese", + "depth": 8, "iso_1_code": null, "iso_3_code": "pms", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"lij\")", @@ -8675,9 +9553,11 @@ }, { "name": "Romagnol", + "depth": 8, "iso_1_code": null, "iso_3_code": "rgn", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4481", "native_tokenizers": [], @@ -8685,9 +9565,11 @@ }, { "name": "Venetian", + "depth": 8, "iso_1_code": null, "iso_3_code": "vec", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"lij\")", @@ -8704,6 +9586,7 @@ ] } ], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"lij\")", @@ -8719,24 +9602,29 @@ }, { "name": "Gallo-Rhaetian", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "O\u00efl", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "French", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "French", + "depth": 10, "iso_1_code": "fr", "iso_3_code": "fra", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"fr\")", @@ -8756,9 +9644,11 @@ }, { "name": "French, Cajun", + "depth": 10, "iso_1_code": null, "iso_3_code": "frc", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4487", "native_tokenizers": [], @@ -8766,9 +9656,11 @@ }, { "name": "Guern\u00e9siais", + "depth": 10, "iso_1_code": null, "iso_3_code": "nrf", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"fr\")", @@ -8786,9 +9678,11 @@ }, { "name": "Picard", + "depth": 10, "iso_1_code": null, "iso_3_code": "pcd", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"fr\")", @@ -8806,9 +9700,11 @@ }, { "name": "Walloon", + "depth": 10, "iso_1_code": "wa", "iso_3_code": "wln", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"fr\")", @@ -8825,6 +9721,7 @@ ] } ], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"fr\")", @@ -8840,14 +9737,17 @@ }, { "name": "Southeastern", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Arpitan", + "depth": 10, "iso_1_code": null, "iso_3_code": "frp", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"fr\")", @@ -8864,6 +9764,7 @@ ] } ], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"fr\")", @@ -8878,6 +9779,7 @@ "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"fr\")", @@ -8893,14 +9795,17 @@ }, { "name": "Rhaetian", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Friulian", + "depth": 9, "iso_1_code": null, "iso_3_code": "fur", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"fr\")", @@ -8918,9 +9823,11 @@ }, { "name": "Ladin", + "depth": 9, "iso_1_code": null, "iso_3_code": "lld", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"fr\")", @@ -8938,9 +9845,11 @@ }, { "name": "Romansh", + "depth": 9, "iso_1_code": "rm", "iso_3_code": "roh", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"fr\")", @@ -8957,6 +9866,7 @@ ] } ], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"fr\")", @@ -8971,6 +9881,7 @@ "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"fr\")", @@ -8985,6 +9896,7 @@ "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"fr\")", @@ -9000,19 +9912,23 @@ }, { "name": "Ibero-Romance", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "East Iberian", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Catalan", + "depth": 8, "iso_1_code": "ca", "iso_3_code": "cat", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ca\")", @@ -9031,6 +9947,7 @@ ] } ], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"ca\")", @@ -9046,14 +9963,17 @@ }, { "name": "Oc", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Occitan", + "depth": 8, "iso_1_code": "oc", "iso_3_code": "oci", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"es\")", @@ -9071,15 +9991,18 @@ }, { "name": "Shuadit", + "depth": 8, "iso_1_code": null, "iso_3_code": "sdt", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4502", "native_tokenizers": [], "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"es\")", @@ -9095,19 +10018,23 @@ }, { "name": "West Iberian", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Asturo-Leonese", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Asturian", + "depth": 9, "iso_1_code": null, "iso_3_code": "ast", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"es\")", @@ -9125,9 +10052,11 @@ }, { "name": "Mirandese", + "depth": 9, "iso_1_code": null, "iso_3_code": "mwl", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"es\")", @@ -9144,6 +10073,7 @@ ] } ], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"es\")", @@ -9159,14 +10089,17 @@ }, { "name": "Castilian", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Extremaduran", + "depth": 9, "iso_1_code": null, "iso_3_code": "ext", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"es\")", @@ -9184,9 +10117,11 @@ }, { "name": "Ladino", + "depth": 9, "iso_1_code": null, "iso_3_code": "lad", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"es\")", @@ -9205,9 +10140,11 @@ }, { "name": "Spanish", + "depth": 9, "iso_1_code": "es", "iso_3_code": "spa", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"es\")", @@ -9227,15 +10164,18 @@ }, { "name": "Spanish, Charapa", + "depth": 9, "iso_1_code": null, "iso_3_code": "spq", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4511", "native_tokenizers": [], "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"es\")", @@ -9251,14 +10191,17 @@ }, { "name": "Portuguese-Galician", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Minderico", + "depth": 9, "iso_1_code": null, "iso_3_code": "drc", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4513", "native_tokenizers": [], @@ -9266,9 +10209,11 @@ }, { "name": "Fala", + "depth": 9, "iso_1_code": null, "iso_3_code": "fax", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4514", "native_tokenizers": [], @@ -9276,9 +10221,11 @@ }, { "name": "Galician", + "depth": 9, "iso_1_code": "gl", "iso_3_code": "glg", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"gl\")", @@ -9298,9 +10245,11 @@ }, { "name": "Portuguese", + "depth": 9, "iso_1_code": "pt", "iso_3_code": "por", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"pt\")", @@ -9319,6 +10268,7 @@ ] } ], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"pt\")", @@ -9333,6 +10283,7 @@ "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"es\")", @@ -9347,6 +10298,7 @@ "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"es\")", @@ -9361,6 +10313,7 @@ "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"es\")", @@ -9376,19 +10329,23 @@ }, { "name": "Pyrenean-Mozarabic", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Pyrenean", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Aragonese", + "depth": 7, "iso_1_code": "an", "iso_3_code": "arg", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"es\")", @@ -9405,6 +10362,7 @@ ] } ], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"es\")", @@ -9419,6 +10377,7 @@ "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"es\")", @@ -9433,6 +10392,7 @@ "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"es\")", @@ -9447,6 +10407,7 @@ "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"es\")", @@ -9462,19 +10423,23 @@ }, { "name": "Southern", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Corsican", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Corsican", + "depth": 5, "iso_1_code": "co", "iso_3_code": "cos", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"es\")", @@ -9491,6 +10456,7 @@ ] } ], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"es\")", @@ -9506,14 +10472,17 @@ }, { "name": "Sardinian", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Sardinian, Sassarese", + "depth": 5, "iso_1_code": "sc", "iso_3_code": "sdc", "children": [], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"es\")", @@ -9531,9 +10500,11 @@ }, { "name": "Sardinian, Gallurese", + "depth": 5, "iso_1_code": "sc", "iso_3_code": "sdn", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4525", "native_tokenizers": [], @@ -9541,9 +10512,11 @@ }, { "name": "Sardinian, Logudorese", + "depth": 5, "iso_1_code": "sc", "iso_3_code": "src", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4526", "native_tokenizers": [], @@ -9551,15 +10524,18 @@ }, { "name": "Sardinian, Campidanese", + "depth": 5, "iso_1_code": "sc", "iso_3_code": "sro", "children": [], + "family": "Indo-European", "tokenizers": {}, "node_i": "4527", "native_tokenizers": [], "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"es\")", @@ -9574,6 +10550,7 @@ "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"es\")", @@ -9588,6 +10565,7 @@ "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"es\")", @@ -9595,13 +10573,6 @@ "original_lang_code": "spa", "script": "Latn", "class_name": "SpaCyTokenizer" - }, - "Cyrl": { - "full_object": "SpaCyTokenizer(\"ru\")", - "original_lang_name": "russian", - "original_lang_code": "rus", - "script": "Cyrl", - "class_name": "SpaCyTokenizer" } }, "node_i": "4459", @@ -9609,6 +10580,7 @@ "scripts": [] } ], + "family": "Indo-European", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"es\")", @@ -9616,13 +10588,6 @@ "original_lang_code": "spa", "script": "Latn", "class_name": "SpaCyTokenizer" - }, - "Cyrl": { - "full_object": "SpaCyTokenizer(\"ru\")", - "original_lang_name": "russian", - "original_lang_code": "rus", - "script": "Cyrl", - "class_name": "SpaCyTokenizer" } }, "node_i": "4456", @@ -9630,85 +10595,8 @@ "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"en\")", - "original_lang_name": "english", - "original_lang_code": "eng", - "script": "Latn", - "class_name": "SpaCyTokenizer" - }, - "Armn": { - "full_object": "SpaCyTokenizer(\"hy\")", - "original_lang_name": "armenian", - "original_lang_code": "hye", - "script": "Armn", - "class_name": "SpaCyTokenizer" - }, - "Cyrl": { - "full_object": "SpaCyTokenizer(\"ru\")", - "original_lang_name": "russian", - "original_lang_code": "rus", - "script": "Cyrl", - "class_name": "SpaCyTokenizer" - }, - "Grek": { - "full_object": "SpaCyTokenizer(\"el\")", - "original_lang_name": "greek", - "original_lang_code": "ell", - "script": "Grek", - "class_name": "SpaCyTokenizer" - }, - "Deva": { - "full_object": "IndicNLPTokenizer(\"hi\")", - "original_lang_name": "hindi", - "original_lang_code": "hin", - "script": "Deva", - "class_name": "IndicNLPTokenizer" - }, - "Gujr": { - "full_object": "IndicNLPTokenizer(\"gu\")", - "original_lang_name": "gujarati", - "original_lang_code": "guj", - "script": "Gujr", - "class_name": "IndicNLPTokenizer" - }, - "Guru": { - "full_object": "IndicNLPTokenizer(\"pa\")", - "original_lang_name": "punjabi", - "original_lang_code": "pan", - "script": "Guru", - "class_name": "IndicNLPTokenizer" - }, - "Beng": { - "full_object": "IndicNLPTokenizer(\"bn\")", - "original_lang_name": "bengali", - "original_lang_code": "ben", - "script": "Beng", - "class_name": "IndicNLPTokenizer" - }, - "Orya": { - "full_object": "IndicNLPTokenizer(\"or\")", - "original_lang_name": "oriya", - "original_lang_code": "ori", - "script": "Orya", - "class_name": "IndicNLPTokenizer" - }, - "Arab": { - "full_object": "IndicNLPTokenizer(\"ur\")", - "original_lang_name": "urdu", - "original_lang_code": "urd", - "script": "Arab", - "class_name": "IndicNLPTokenizer" - }, - "Sinh": { - "full_object": "IndicNLPTokenizer(\"si\")", - "original_lang_name": "sinhala", - "original_lang_code": "sin", - "script": "Sinh", - "class_name": "IndicNLPTokenizer" - } - }, + "family": "Indo-European", + "tokenizers": {}, "node_i": "3919", "native_tokenizers": [], "scripts": [] diff --git a/data/Iroquoian.json b/data/Iroquoian.json index ff0d57debcabbe27936f8dd06f3f4ebe7fb4a15f..e4c6a08ea67fb33fc05f74ec63bfaa164b638301 100644 --- a/data/Iroquoian.json +++ b/data/Iroquoian.json @@ -1,13 +1,16 @@ { "name": "Iroquoian", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Cherokee", + "depth": 1, "iso_1_code": null, "iso_3_code": "chr", "children": [], + "family": "Iroquoian", "tokenizers": {}, "node_i": "4529", "native_tokenizers": [], @@ -18,19 +21,23 @@ }, { "name": "Northern Iroquoian", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Five Nations-Huronian-Susquehannock", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Susquehannock", + "depth": 3, "iso_1_code": null, "iso_3_code": "sqn", "children": [], + "family": "Iroquoian", "tokenizers": {}, "node_i": "4532", "native_tokenizers": [], @@ -38,14 +45,17 @@ }, { "name": "Five Nations-Susquehannock", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Cayuga", + "depth": 4, "iso_1_code": null, "iso_3_code": "cay", "children": [], + "family": "Iroquoian", "tokenizers": {}, "node_i": "4534", "native_tokenizers": [], @@ -53,9 +63,11 @@ }, { "name": "Onondaga", + "depth": 4, "iso_1_code": null, "iso_3_code": "ono", "children": [], + "family": "Iroquoian", "tokenizers": {}, "node_i": "4535", "native_tokenizers": [], @@ -63,9 +75,11 @@ }, { "name": "Seneca", + "depth": 4, "iso_1_code": null, "iso_3_code": "see", "children": [], + "family": "Iroquoian", "tokenizers": {}, "node_i": "4536", "native_tokenizers": [], @@ -73,14 +87,17 @@ }, { "name": "Mohawk-Oneida", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mohawk", + "depth": 5, "iso_1_code": null, "iso_3_code": "moh", "children": [], + "family": "Iroquoian", "tokenizers": {}, "node_i": "4538", "native_tokenizers": [], @@ -90,21 +107,25 @@ }, { "name": "Oneida", + "depth": 5, "iso_1_code": null, "iso_3_code": "one", "children": [], + "family": "Iroquoian", "tokenizers": {}, "node_i": "4539", "native_tokenizers": [], "scripts": [] } ], + "family": "Iroquoian", "tokenizers": {}, "node_i": "4537", "native_tokenizers": [], "scripts": [] } ], + "family": "Iroquoian", "tokenizers": {}, "node_i": "4533", "native_tokenizers": [], @@ -112,14 +133,17 @@ }, { "name": "Huronian", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Laurentian", + "depth": 4, "iso_1_code": null, "iso_3_code": "lre", "children": [], + "family": "Iroquoian", "tokenizers": {}, "node_i": "4541", "native_tokenizers": [], @@ -127,14 +151,17 @@ }, { "name": "Huron-Petun", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Wendat", + "depth": 5, "iso_1_code": null, "iso_3_code": "wdt", "children": [], + "family": "Iroquoian", "tokenizers": {}, "node_i": "4543", "native_tokenizers": [], @@ -142,27 +169,32 @@ }, { "name": "Wyandot", + "depth": 5, "iso_1_code": null, "iso_3_code": "wyn", "children": [], + "family": "Iroquoian", "tokenizers": {}, "node_i": "4544", "native_tokenizers": [], "scripts": [] } ], + "family": "Iroquoian", "tokenizers": {}, "node_i": "4542", "native_tokenizers": [], "scripts": [] } ], + "family": "Iroquoian", "tokenizers": {}, "node_i": "4540", "native_tokenizers": [], "scripts": [] } ], + "family": "Iroquoian", "tokenizers": {}, "node_i": "4531", "native_tokenizers": [], @@ -170,14 +202,17 @@ }, { "name": "Tuscarora-Nottoway", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nottoway", + "depth": 3, "iso_1_code": null, "iso_3_code": "ntw", "children": [], + "family": "Iroquoian", "tokenizers": {}, "node_i": "4546", "native_tokenizers": [], @@ -185,9 +220,11 @@ }, { "name": "Nottoway-Meherrin", + "depth": 3, "iso_1_code": null, "iso_3_code": "nwy", "children": [], + "family": "Iroquoian", "tokenizers": {}, "node_i": "4547", "native_tokenizers": [], @@ -195,27 +232,32 @@ }, { "name": "Tuscarora", + "depth": 3, "iso_1_code": null, "iso_3_code": "tus", "children": [], + "family": "Iroquoian", "tokenizers": {}, "node_i": "4548", "native_tokenizers": [], "scripts": [] } ], + "family": "Iroquoian", "tokenizers": {}, "node_i": "4545", "native_tokenizers": [], "scripts": [] } ], + "family": "Iroquoian", "tokenizers": {}, "node_i": "4530", "native_tokenizers": [], "scripts": [] } ], + "family": "Iroquoian", "tokenizers": {}, "node_i": "4528", "native_tokenizers": [], diff --git a/data/Jabutian.json b/data/Jabutian.json index 2ff85d3375147cf4befc43bcbca5e60b8363a302..432e18e15cfcd766c65cdbb8447f8128db7c15fe 100644 --- a/data/Jabutian.json +++ b/data/Jabutian.json @@ -1,13 +1,16 @@ { "name": "Jabutian", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Arikap\u00fa", + "depth": 1, "iso_1_code": null, "iso_3_code": "ark", "children": [], + "family": "Jabutian", "tokenizers": {}, "node_i": "4550", "native_tokenizers": [], @@ -15,15 +18,18 @@ }, { "name": "Jabut\u00ed", + "depth": 1, "iso_1_code": null, "iso_3_code": "jbt", "children": [], + "family": "Jabutian", "tokenizers": {}, "node_i": "4551", "native_tokenizers": [], "scripts": [] } ], + "family": "Jabutian", "tokenizers": {}, "node_i": "4549", "native_tokenizers": [], diff --git a/data/Japonic.json b/data/Japonic.json index af1bbd1f279a635432f28b89a89bdc0bb82d47db..f7d7b2a0cf36e9977de142ca68523a1ce3366495 100644 --- a/data/Japonic.json +++ b/data/Japonic.json @@ -1,13 +1,16 @@ { "name": "Japonic", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Japanese", + "depth": 1, "iso_1_code": "ja", "iso_3_code": "jpn", "children": [], + "family": "Japonic", "tokenizers": { "Jpan": { "full_object": "SpaCyTokenizer(\"ja\"),", @@ -27,24 +30,29 @@ }, { "name": "Ryukyuan", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Amami-Okinawan", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Northern Amami-Okinawan", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Amami-Oshima, Southern", + "depth": 4, "iso_1_code": null, "iso_3_code": "ams", "children": [], + "family": "Japonic", "tokenizers": {}, "node_i": "4557", "native_tokenizers": [], @@ -52,9 +60,11 @@ }, { "name": "Kikai", + "depth": 4, "iso_1_code": null, "iso_3_code": "kzg", "children": [], + "family": "Japonic", "tokenizers": {}, "node_i": "4558", "native_tokenizers": [], @@ -62,9 +72,11 @@ }, { "name": "Amami-Oshima, Northern", + "depth": 4, "iso_1_code": null, "iso_3_code": "ryn", "children": [], + "family": "Japonic", "tokenizers": {}, "node_i": "4559", "native_tokenizers": [], @@ -72,15 +84,18 @@ }, { "name": "Toku-No-Shima", + "depth": 4, "iso_1_code": null, "iso_3_code": "tkn", "children": [], + "family": "Japonic", "tokenizers": {}, "node_i": "4560", "native_tokenizers": [], "scripts": [] } ], + "family": "Japonic", "tokenizers": {}, "node_i": "4556", "native_tokenizers": [], @@ -88,14 +103,17 @@ }, { "name": "Southern Amami-Okinawan", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Oki-No-Erabu", + "depth": 4, "iso_1_code": null, "iso_3_code": "okn", "children": [], + "family": "Japonic", "tokenizers": {}, "node_i": "4562", "native_tokenizers": [], @@ -103,9 +121,11 @@ }, { "name": "Okinawan, Central", + "depth": 4, "iso_1_code": null, "iso_3_code": "ryu", "children": [], + "family": "Japonic", "tokenizers": {}, "node_i": "4563", "native_tokenizers": [], @@ -113,9 +133,11 @@ }, { "name": "Kunigami", + "depth": 4, "iso_1_code": null, "iso_3_code": "xug", "children": [], + "family": "Japonic", "tokenizers": {}, "node_i": "4564", "native_tokenizers": [], @@ -123,21 +145,25 @@ }, { "name": "Yoron", + "depth": 4, "iso_1_code": null, "iso_3_code": "yox", "children": [], + "family": "Japonic", "tokenizers": {}, "node_i": "4565", "native_tokenizers": [], "scripts": [] } ], + "family": "Japonic", "tokenizers": {}, "node_i": "4561", "native_tokenizers": [], "scripts": [] } ], + "family": "Japonic", "tokenizers": {}, "node_i": "4555", "native_tokenizers": [], @@ -145,14 +171,17 @@ }, { "name": "Sakishima", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Miyako", + "depth": 3, "iso_1_code": null, "iso_3_code": "mvi", "children": [], + "family": "Japonic", "tokenizers": {}, "node_i": "4567", "native_tokenizers": [], @@ -160,9 +189,11 @@ }, { "name": "Yaeyama", + "depth": 3, "iso_1_code": null, "iso_3_code": "rys", "children": [], + "family": "Japonic", "tokenizers": {}, "node_i": "4568", "native_tokenizers": [], @@ -170,36 +201,33 @@ }, { "name": "Yonaguni", + "depth": 3, "iso_1_code": null, "iso_3_code": "yoi", "children": [], + "family": "Japonic", "tokenizers": {}, "node_i": "4569", "native_tokenizers": [], "scripts": [] } ], + "family": "Japonic", "tokenizers": {}, "node_i": "4566", "native_tokenizers": [], "scripts": [] } ], + "family": "Japonic", "tokenizers": {}, "node_i": "4554", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Jpan": { - "full_object": "SpaCyTokenizer(\"ja\"),", - "original_lang_name": "japanese", - "original_lang_code": "jpn", - "script": "Jpan", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Japonic", + "tokenizers": {}, "node_i": "4552", "native_tokenizers": [], "scripts": [] diff --git a/data/Jean.json b/data/Jean.json index 31d9f933c983ab901ef5e25642b5e92a8638bdc1..f71f53a53c60fd863202b69b2a9bfe9e24281053 100644 --- a/data/Jean.json +++ b/data/Jean.json @@ -1,18 +1,22 @@ { "name": "Jean", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Central", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Acro\u00e1", + "depth": 2, "iso_1_code": null, "iso_3_code": "acs", "children": [], + "family": "Jean", "tokenizers": {}, "node_i": "4572", "native_tokenizers": [], @@ -20,9 +24,11 @@ }, { "name": "Xav\u00e1nte", + "depth": 2, "iso_1_code": null, "iso_3_code": "xav", "children": [], + "family": "Jean", "tokenizers": {}, "node_i": "4573", "native_tokenizers": [], @@ -32,9 +38,11 @@ }, { "name": "Xer\u00e9nte", + "depth": 2, "iso_1_code": null, "iso_3_code": "xer", "children": [], + "family": "Jean", "tokenizers": {}, "node_i": "4574", "native_tokenizers": [], @@ -42,15 +50,18 @@ }, { "name": "Xakriab\u00e1", + "depth": 2, "iso_1_code": null, "iso_3_code": "xkr", "children": [], + "family": "Jean", "tokenizers": {}, "node_i": "4575", "native_tokenizers": [], "scripts": [] } ], + "family": "Jean", "tokenizers": {}, "node_i": "4571", "native_tokenizers": [], @@ -58,14 +69,17 @@ }, { "name": "Northern", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Apinag\u00e9", + "depth": 2, "iso_1_code": null, "iso_3_code": "apn", "children": [], + "family": "Jean", "tokenizers": {}, "node_i": "4577", "native_tokenizers": [], @@ -75,9 +89,11 @@ }, { "name": "Panar\u00e1", + "depth": 2, "iso_1_code": null, "iso_3_code": "kre", "children": [], + "family": "Jean", "tokenizers": {}, "node_i": "4578", "native_tokenizers": [], @@ -85,9 +101,11 @@ }, { "name": "Suy\u00e1", + "depth": 2, "iso_1_code": null, "iso_3_code": "suy", "children": [], + "family": "Jean", "tokenizers": {}, "node_i": "4579", "native_tokenizers": [], @@ -95,9 +113,11 @@ }, { "name": "Kayap\u00f3", + "depth": 2, "iso_1_code": null, "iso_3_code": "txu", "children": [], + "family": "Jean", "tokenizers": {}, "node_i": "4580", "native_tokenizers": [], @@ -107,14 +127,17 @@ }, { "name": "Timbira", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Gavi\u00e3o, Par\u00e1", + "depth": 3, "iso_1_code": null, "iso_3_code": "gvp", "children": [], + "family": "Jean", "tokenizers": {}, "node_i": "4582", "native_tokenizers": [], @@ -122,9 +145,11 @@ }, { "name": "Canela", + "depth": 3, "iso_1_code": null, "iso_3_code": "ram", "children": [], + "family": "Jean", "tokenizers": {}, "node_i": "4583", "native_tokenizers": [], @@ -132,9 +157,11 @@ }, { "name": "Krah\u00f4", + "depth": 3, "iso_1_code": null, "iso_3_code": "xra", "children": [], + "family": "Jean", "tokenizers": {}, "node_i": "4584", "native_tokenizers": [], @@ -142,9 +169,11 @@ }, { "name": "Kreye", + "depth": 3, "iso_1_code": null, "iso_3_code": "xre", "children": [], + "family": "Jean", "tokenizers": {}, "node_i": "4585", "native_tokenizers": [], @@ -152,21 +181,25 @@ }, { "name": "Krikati-Timbira", + "depth": 3, "iso_1_code": null, "iso_3_code": "xri", "children": [], + "family": "Jean", "tokenizers": {}, "node_i": "4586", "native_tokenizers": [], "scripts": [] } ], + "family": "Jean", "tokenizers": {}, "node_i": "4581", "native_tokenizers": [], "scripts": [] } ], + "family": "Jean", "tokenizers": {}, "node_i": "4576", "native_tokenizers": [], @@ -174,14 +207,17 @@ }, { "name": "Southern", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Xokleng", + "depth": 2, "iso_1_code": null, "iso_3_code": "xok", "children": [], + "family": "Jean", "tokenizers": {}, "node_i": "4588", "native_tokenizers": [], @@ -189,14 +225,17 @@ }, { "name": "Kaingang", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kaingang", + "depth": 3, "iso_1_code": null, "iso_3_code": "kgp", "children": [], + "family": "Jean", "tokenizers": {}, "node_i": "4590", "native_tokenizers": [], @@ -206,27 +245,32 @@ }, { "name": "Kaing\u00e1ng, S\u00e3o Paulo", + "depth": 3, "iso_1_code": null, "iso_3_code": "zkp", "children": [], + "family": "Jean", "tokenizers": {}, "node_i": "4591", "native_tokenizers": [], "scripts": [] } ], + "family": "Jean", "tokenizers": {}, "node_i": "4589", "native_tokenizers": [], "scripts": [] } ], + "family": "Jean", "tokenizers": {}, "node_i": "4587", "native_tokenizers": [], "scripts": [] } ], + "family": "Jean", "tokenizers": {}, "node_i": "4570", "native_tokenizers": [], diff --git a/data/Jicaquean.json b/data/Jicaquean.json index c64407cfa77b9179f92bdf09e538aa71d1ec3a5a..3499a58dcc92753a0878a1735679472c44cd1803 100644 --- a/data/Jicaquean.json +++ b/data/Jicaquean.json @@ -1,13 +1,16 @@ { "name": "Jicaquean", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tol", + "depth": 1, "iso_1_code": null, "iso_3_code": "jic", "children": [], + "family": "Jicaquean", "tokenizers": {}, "node_i": "4593", "native_tokenizers": [], @@ -16,6 +19,7 @@ ] } ], + "family": "Jicaquean", "tokenizers": {}, "node_i": "4592", "native_tokenizers": [], diff --git a/data/Jivaroan.json b/data/Jivaroan.json index 21f4aeded7b4bc8ba2e771d18b32c5392b4aab9f..15b03d25b1eb78d73107b430554915c6e1550e20 100644 --- a/data/Jivaroan.json +++ b/data/Jivaroan.json @@ -1,13 +1,16 @@ { "name": "Jivaroan", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Awaj\u00fan", + "depth": 1, "iso_1_code": null, "iso_3_code": "agr", "children": [], + "family": "Jivaroan", "tokenizers": {}, "node_i": "4595", "native_tokenizers": [], @@ -17,14 +20,17 @@ }, { "name": "J\u00edvaro", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Achuar-Shiwiar", + "depth": 2, "iso_1_code": null, "iso_3_code": "acu", "children": [], + "family": "Jivaroan", "tokenizers": {}, "node_i": "4597", "native_tokenizers": [], @@ -34,9 +40,11 @@ }, { "name": "Wamp\u00eds", + "depth": 2, "iso_1_code": null, "iso_3_code": "hub", "children": [], + "family": "Jivaroan", "tokenizers": {}, "node_i": "4598", "native_tokenizers": [], @@ -46,9 +54,11 @@ }, { "name": "Shuar", + "depth": 2, "iso_1_code": null, "iso_3_code": "jiv", "children": [], + "family": "Jivaroan", "tokenizers": {}, "node_i": "4599", "native_tokenizers": [], @@ -57,12 +67,14 @@ ] } ], + "family": "Jivaroan", "tokenizers": {}, "node_i": "4596", "native_tokenizers": [], "scripts": [] } ], + "family": "Jivaroan", "tokenizers": {}, "node_i": "4594", "native_tokenizers": [], diff --git a/data/Kamakanan.json b/data/Kamakanan.json index 7f8efc5e6f0e9f4c0d167ef3b895b56a44a2b34c..b4f784ac9a0b09957feebba53928edae9aa05717 100644 --- a/data/Kamakanan.json +++ b/data/Kamakanan.json @@ -1,30 +1,36 @@ { "name": "Kamakanan", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kamak\u00e1n", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kamakan", + "depth": 2, "iso_1_code": null, "iso_3_code": "vkm", "children": [], + "family": "Kamakanan", "tokenizers": {}, "node_i": "4602", "native_tokenizers": [], "scripts": [] } ], + "family": "Kamakanan", "tokenizers": {}, "node_i": "4601", "native_tokenizers": [], "scripts": [] } ], + "family": "Kamakanan", "tokenizers": {}, "node_i": "4600", "native_tokenizers": [], diff --git "a/data/Karaj\303\241.json" "b/data/Karaj\303\241.json" index fbd785882c1dc480aabc97e9af39a805c1dcf864..252323b4530fceb235208d1cd8f33706841db1e9 100644 --- "a/data/Karaj\303\241.json" +++ "b/data/Karaj\303\241.json" @@ -1,13 +1,16 @@ { "name": "Karaj\u00e1", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Karaj\u00e1", + "depth": 1, "iso_1_code": null, "iso_3_code": "kpj", "children": [], + "family": "Karaj\u00e1", "tokenizers": {}, "node_i": "4604", "native_tokenizers": [], @@ -16,6 +19,7 @@ ] } ], + "family": "Karaj\u00e1", "tokenizers": {}, "node_i": "4603", "native_tokenizers": [], diff --git a/data/Kartvelian.json b/data/Kartvelian.json index cd69324b6e30df438c83ac476d3a89222fc62b19..e09220a3d449b8e0c9ec3f2591184ae5489acdf9 100644 --- a/data/Kartvelian.json +++ b/data/Kartvelian.json @@ -1,18 +1,22 @@ { "name": "Kartvelian", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Georgian", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Judeo-Georgian", + "depth": 2, "iso_1_code": null, "iso_3_code": "jge", "children": [], + "family": "Kartvelian", "tokenizers": {}, "node_i": "4607", "native_tokenizers": [], @@ -20,9 +24,11 @@ }, { "name": "Georgian", + "depth": 2, "iso_1_code": "ka", "iso_3_code": "kat", "children": [], + "family": "Kartvelian", "tokenizers": {}, "node_i": "4608", "native_tokenizers": [], @@ -31,6 +37,7 @@ ] } ], + "family": "Kartvelian", "tokenizers": {}, "node_i": "4606", "native_tokenizers": [], @@ -38,20 +45,24 @@ }, { "name": "Svan", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Svan", + "depth": 2, "iso_1_code": null, "iso_3_code": "sva", "children": [], + "family": "Kartvelian", "tokenizers": {}, "node_i": "4610", "native_tokenizers": [], "scripts": [] } ], + "family": "Kartvelian", "tokenizers": {}, "node_i": "4609", "native_tokenizers": [], @@ -59,14 +70,17 @@ }, { "name": "Zan", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Laz", + "depth": 2, "iso_1_code": null, "iso_3_code": "lzz", "children": [], + "family": "Kartvelian", "tokenizers": {}, "node_i": "4612", "native_tokenizers": [], @@ -74,9 +88,11 @@ }, { "name": "Mingrelian", + "depth": 2, "iso_1_code": null, "iso_3_code": "xmf", "children": [], + "family": "Kartvelian", "tokenizers": {}, "node_i": "4613", "native_tokenizers": [], @@ -85,12 +101,14 @@ ] } ], + "family": "Kartvelian", "tokenizers": {}, "node_i": "4611", "native_tokenizers": [], "scripts": [] } ], + "family": "Kartvelian", "tokenizers": {}, "node_i": "4605", "native_tokenizers": [], diff --git a/data/Katukinan.json b/data/Katukinan.json index 681e594749d8436c5d428602f5990f4cf7710c42..308ca316bb6b0beaf6bffb0c79dd27df10269ba1 100644 --- a/data/Katukinan.json +++ b/data/Katukinan.json @@ -1,13 +1,16 @@ { "name": "Katukinan", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Katuk\u00edna", + "depth": 1, "iso_1_code": null, "iso_3_code": "kav", "children": [], + "family": "Katukinan", "tokenizers": {}, "node_i": "4615", "native_tokenizers": [], @@ -15,9 +18,11 @@ }, { "name": "Kanamar\u00ed", + "depth": 1, "iso_1_code": null, "iso_3_code": "knm", "children": [], + "family": "Katukinan", "tokenizers": {}, "node_i": "4616", "native_tokenizers": [], @@ -25,15 +30,18 @@ }, { "name": "Katawixi", + "depth": 1, "iso_1_code": null, "iso_3_code": "xat", "children": [], + "family": "Katukinan", "tokenizers": {}, "node_i": "4617", "native_tokenizers": [], "scripts": [] } ], + "family": "Katukinan", "tokenizers": {}, "node_i": "4614", "native_tokenizers": [], diff --git a/data/Kaure.json b/data/Kaure.json index 2d279dbd623161284e7661de1d2f1a29a4f185fc..d1fc922e83dbe2b2c2b53ddabb8a6d62deef699d 100644 --- a/data/Kaure.json +++ b/data/Kaure.json @@ -1,24 +1,29 @@ { "name": "Kaure", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kapore", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kapauri", + "depth": 2, "iso_1_code": null, "iso_3_code": "khp", "children": [], + "family": "Kaure", "tokenizers": {}, "node_i": "4620", "native_tokenizers": [], "scripts": [] } ], + "family": "Kaure", "tokenizers": {}, "node_i": "4619", "native_tokenizers": [], @@ -26,14 +31,17 @@ }, { "name": "Kaure Proper", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kaure", + "depth": 2, "iso_1_code": null, "iso_3_code": "bpp", "children": [], + "family": "Kaure", "tokenizers": {}, "node_i": "4622", "native_tokenizers": [], @@ -41,21 +49,25 @@ }, { "name": "Kosare", + "depth": 2, "iso_1_code": null, "iso_3_code": "kiq", "children": [], + "family": "Kaure", "tokenizers": {}, "node_i": "4623", "native_tokenizers": [], "scripts": [] } ], + "family": "Kaure", "tokenizers": {}, "node_i": "4621", "native_tokenizers": [], "scripts": [] } ], + "family": "Kaure", "tokenizers": {}, "node_i": "4618", "native_tokenizers": [], diff --git a/data/Kaweskaran.json b/data/Kaweskaran.json index 2a043218581f387d6eaee3b49a0c20a5c2d13867..d3d737f00a22ab7e5129d4a4b35f40c1ffcedee8 100644 --- a/data/Kaweskaran.json +++ b/data/Kaweskaran.json @@ -1,19 +1,23 @@ { "name": "Kaweskaran", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Qawasqar", + "depth": 1, "iso_1_code": null, "iso_3_code": "alc", "children": [], + "family": "Kaweskaran", "tokenizers": {}, "node_i": "4625", "native_tokenizers": [], "scripts": [] } ], + "family": "Kaweskaran", "tokenizers": {}, "node_i": "4624", "native_tokenizers": [], diff --git a/data/Keresan.json b/data/Keresan.json index 8850316267f775ff7d1277179ae73617265abbd5..9879f8ba6ff147663f8b5ce9e9870abd138e5b20 100644 --- a/data/Keresan.json +++ b/data/Keresan.json @@ -1,13 +1,16 @@ { "name": "Keresan", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Keres, Eastern", + "depth": 1, "iso_1_code": null, "iso_3_code": "kee", "children": [], + "family": "Keresan", "tokenizers": {}, "node_i": "4627", "native_tokenizers": [], @@ -15,15 +18,18 @@ }, { "name": "Keres, Western", + "depth": 1, "iso_1_code": null, "iso_3_code": "kjq", "children": [], + "family": "Keresan", "tokenizers": {}, "node_i": "4628", "native_tokenizers": [], "scripts": [] } ], + "family": "Keresan", "tokenizers": {}, "node_i": "4626", "native_tokenizers": [], diff --git a/data/Khoe-Kwadi.json b/data/Khoe-Kwadi.json index 57163daee41163875131adf532f90d4b93a0b40e..fb1489cc30d944d4668ef09435a38636d7594104 100644 --- a/data/Khoe-Kwadi.json +++ b/data/Khoe-Kwadi.json @@ -1,34 +1,41 @@ { "name": "Khoe-Kwadi", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Khoe", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kalahari Khoe", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "North-Central", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Shua", + "depth": 4, "iso_1_code": null, "iso_3_code": "shg", "children": [], + "family": "Khoe-Kwadi", "tokenizers": {}, "node_i": "4633", "native_tokenizers": [], "scripts": [] } ], + "family": "Khoe-Kwadi", "tokenizers": {}, "node_i": "4632", "native_tokenizers": [], @@ -36,14 +43,17 @@ }, { "name": "Northeast", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tshuwau", + "depth": 4, "iso_1_code": null, "iso_3_code": "hio", "children": [], + "family": "Khoe-Kwadi", "tokenizers": {}, "node_i": "4635", "native_tokenizers": [], @@ -51,15 +61,18 @@ }, { "name": "Kua", + "depth": 4, "iso_1_code": null, "iso_3_code": "tyu", "children": [], + "family": "Khoe-Kwadi", "tokenizers": {}, "node_i": "4636", "native_tokenizers": [], "scripts": [] } ], + "family": "Khoe-Kwadi", "tokenizers": {}, "node_i": "4634", "native_tokenizers": [], @@ -67,14 +80,17 @@ }, { "name": "Northwest", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "\u01c1Ani", + "depth": 4, "iso_1_code": null, "iso_3_code": "hnh", "children": [], + "family": "Khoe-Kwadi", "tokenizers": {}, "node_i": "4638", "native_tokenizers": [], @@ -82,15 +98,18 @@ }, { "name": "Khwedam", + "depth": 4, "iso_1_code": null, "iso_3_code": "xuu", "children": [], + "family": "Khoe-Kwadi", "tokenizers": {}, "node_i": "4639", "native_tokenizers": [], "scripts": [] } ], + "family": "Khoe-Kwadi", "tokenizers": {}, "node_i": "4637", "native_tokenizers": [], @@ -98,14 +117,17 @@ }, { "name": "Southwest", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "\u01c1Gana", + "depth": 4, "iso_1_code": null, "iso_3_code": "gnk", "children": [], + "family": "Khoe-Kwadi", "tokenizers": {}, "node_i": "4641", "native_tokenizers": [], @@ -113,9 +135,11 @@ }, { "name": "\u01c0Gwi", + "depth": 4, "iso_1_code": null, "iso_3_code": "gwj", "children": [], + "family": "Khoe-Kwadi", "tokenizers": {}, "node_i": "4642", "native_tokenizers": [], @@ -123,9 +147,11 @@ }, { "name": "Naro", + "depth": 4, "iso_1_code": null, "iso_3_code": "nhr", "children": [], + "family": "Khoe-Kwadi", "tokenizers": {}, "node_i": "4643", "native_tokenizers": [], @@ -134,12 +160,14 @@ ] } ], + "family": "Khoe-Kwadi", "tokenizers": {}, "node_i": "4640", "native_tokenizers": [], "scripts": [] } ], + "family": "Khoe-Kwadi", "tokenizers": {}, "node_i": "4631", "native_tokenizers": [], @@ -147,25 +175,30 @@ }, { "name": "Khoekhoe", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Hainum", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Hai|\u01c1om", + "depth": 4, "iso_1_code": null, "iso_3_code": "hgm", "children": [], + "family": "Khoe-Kwadi", "tokenizers": {}, "node_i": "4646", "native_tokenizers": [], "scripts": [] } ], + "family": "Khoe-Kwadi", "tokenizers": {}, "node_i": "4645", "native_tokenizers": [], @@ -173,14 +206,17 @@ }, { "name": "Nama", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Korana", + "depth": 4, "iso_1_code": null, "iso_3_code": "kqz", "children": [], + "family": "Khoe-Kwadi", "tokenizers": {}, "node_i": "4648", "native_tokenizers": [], @@ -188,9 +224,11 @@ }, { "name": "Khoekhoe", + "depth": 4, "iso_1_code": null, "iso_3_code": "naq", "children": [], + "family": "Khoe-Kwadi", "tokenizers": {}, "node_i": "4649", "native_tokenizers": [], @@ -200,27 +238,32 @@ }, { "name": "Xiri", + "depth": 4, "iso_1_code": null, "iso_3_code": "xii", "children": [], + "family": "Khoe-Kwadi", "tokenizers": {}, "node_i": "4650", "native_tokenizers": [], "scripts": [] } ], + "family": "Khoe-Kwadi", "tokenizers": {}, "node_i": "4647", "native_tokenizers": [], "scripts": [] } ], + "family": "Khoe-Kwadi", "tokenizers": {}, "node_i": "4644", "native_tokenizers": [], "scripts": [] } ], + "family": "Khoe-Kwadi", "tokenizers": {}, "node_i": "4630", "native_tokenizers": [], @@ -228,26 +271,31 @@ }, { "name": "Kwadi", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kwadi", + "depth": 2, "iso_1_code": null, "iso_3_code": "kwz", "children": [], + "family": "Khoe-Kwadi", "tokenizers": {}, "node_i": "4652", "native_tokenizers": [], "scripts": [] } ], + "family": "Khoe-Kwadi", "tokenizers": {}, "node_i": "4651", "native_tokenizers": [], "scripts": [] } ], + "family": "Khoe-Kwadi", "tokenizers": {}, "node_i": "4629", "native_tokenizers": [], diff --git a/data/Kiowa-Tanoan.json b/data/Kiowa-Tanoan.json index 0fe160c31cac67ae171475dec0f127f36345f410..1f287866132523608a97b0105450d87bd276f4b8 100644 --- a/data/Kiowa-Tanoan.json +++ b/data/Kiowa-Tanoan.json @@ -1,13 +1,16 @@ { "name": "Kiowa-Tanoan", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kiowa", + "depth": 1, "iso_1_code": null, "iso_3_code": "kio", "children": [], + "family": "Kiowa-Tanoan", "tokenizers": {}, "node_i": "4654", "native_tokenizers": [], @@ -15,9 +18,11 @@ }, { "name": "Piro", + "depth": 1, "iso_1_code": null, "iso_3_code": "pie", "children": [], + "family": "Kiowa-Tanoan", "tokenizers": {}, "node_i": "4655", "native_tokenizers": [], @@ -25,9 +30,11 @@ }, { "name": "Tewa", + "depth": 1, "iso_1_code": null, "iso_3_code": "tew", "children": [], + "family": "Kiowa-Tanoan", "tokenizers": {}, "node_i": "4656", "native_tokenizers": [], @@ -37,9 +44,11 @@ }, { "name": "Jemez", + "depth": 1, "iso_1_code": null, "iso_3_code": "tow", "children": [], + "family": "Kiowa-Tanoan", "tokenizers": {}, "node_i": "4657", "native_tokenizers": [], @@ -47,14 +56,17 @@ }, { "name": "Tanoan", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tiwa, Southern", + "depth": 2, "iso_1_code": null, "iso_3_code": "tix", "children": [], + "family": "Kiowa-Tanoan", "tokenizers": {}, "node_i": "4659", "native_tokenizers": [], @@ -62,21 +74,25 @@ }, { "name": "Tiwa, Northern", + "depth": 2, "iso_1_code": null, "iso_3_code": "twf", "children": [], + "family": "Kiowa-Tanoan", "tokenizers": {}, "node_i": "4660", "native_tokenizers": [], "scripts": [] } ], + "family": "Kiowa-Tanoan", "tokenizers": {}, "node_i": "4658", "native_tokenizers": [], "scripts": [] } ], + "family": "Kiowa-Tanoan", "tokenizers": {}, "node_i": "4653", "native_tokenizers": [], diff --git a/data/Koreanic.json b/data/Koreanic.json index d3f01b285f0864f848ff1ad222b9ccb375bfe3a8..a52a429766c0efa0e8e4dc5305863efce45d0b41 100644 --- a/data/Koreanic.json +++ b/data/Koreanic.json @@ -1,13 +1,16 @@ { "name": "Koreanic", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Jejueo", + "depth": 1, "iso_1_code": null, "iso_3_code": "jje", "children": [], + "family": "Koreanic", "tokenizers": {}, "node_i": "4662", "native_tokenizers": [], @@ -15,9 +18,11 @@ }, { "name": "Korean", + "depth": 1, "iso_1_code": "ko", "iso_3_code": "kor", "children": [], + "family": "Koreanic", "tokenizers": { "Hang": { "full_object": "KiwiTokenizer()", @@ -36,15 +41,8 @@ ] } ], - "tokenizers": { - "Hang": { - "full_object": "KiwiTokenizer()", - "original_lang_name": "korean", - "original_lang_code": "kor", - "script": "Hang", - "class_name": "KiwiTokenizer" - } - }, + "family": "Koreanic", + "tokenizers": {}, "node_i": "4661", "native_tokenizers": [], "scripts": [] diff --git a/data/Kra-Dai.json b/data/Kra-Dai.json index 210d93a773f5ce3a3dfa3799ee99ca148d25bfeb..e25875756b5aa1b13f8e91bb35998a64236b1456 100644 --- a/data/Kra-Dai.json +++ b/data/Kra-Dai.json @@ -1,13 +1,16 @@ { "name": "Kra-Dai", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nora", + "depth": 1, "iso_1_code": null, "iso_3_code": "nrr", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4665", "native_tokenizers": [], @@ -15,14 +18,17 @@ }, { "name": "Hlai", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Jiamao", + "depth": 2, "iso_1_code": null, "iso_3_code": "jio", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4667", "native_tokenizers": [], @@ -30,15 +36,18 @@ }, { "name": "Hlai", + "depth": 2, "iso_1_code": null, "iso_3_code": "lic", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4668", "native_tokenizers": [], "scripts": [] } ], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4666", "native_tokenizers": [], @@ -46,19 +55,23 @@ }, { "name": "Kam-Tai", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kam-Sui", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ai-Cham", + "depth": 3, "iso_1_code": null, "iso_3_code": "aih", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4671", "native_tokenizers": [], @@ -66,9 +79,11 @@ }, { "name": "Biao", + "depth": 3, "iso_1_code": null, "iso_3_code": "byk", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4672", "native_tokenizers": [], @@ -76,9 +91,11 @@ }, { "name": "Chadong", + "depth": 3, "iso_1_code": null, "iso_3_code": "cdy", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4673", "native_tokenizers": [], @@ -86,9 +103,11 @@ }, { "name": "Cao Miao", + "depth": 3, "iso_1_code": null, "iso_3_code": "cov", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4674", "native_tokenizers": [], @@ -96,9 +115,11 @@ }, { "name": "Dong, Northern", + "depth": 3, "iso_1_code": null, "iso_3_code": "doc", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4675", "native_tokenizers": [], @@ -106,9 +127,11 @@ }, { "name": "Dong, Southern", + "depth": 3, "iso_1_code": null, "iso_3_code": "kmc", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4676", "native_tokenizers": [], @@ -116,9 +139,11 @@ }, { "name": "Kang", + "depth": 3, "iso_1_code": null, "iso_3_code": "kyp", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4677", "native_tokenizers": [], @@ -126,9 +151,11 @@ }, { "name": "Mak", + "depth": 3, "iso_1_code": null, "iso_3_code": "mkg", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4678", "native_tokenizers": [], @@ -136,9 +163,11 @@ }, { "name": "Mulam", + "depth": 3, "iso_1_code": null, "iso_3_code": "mlm", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4679", "native_tokenizers": [], @@ -146,9 +175,11 @@ }, { "name": "Maonan", + "depth": 3, "iso_1_code": null, "iso_3_code": "mmd", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4680", "native_tokenizers": [], @@ -156,9 +187,11 @@ }, { "name": "Sui", + "depth": 3, "iso_1_code": null, "iso_3_code": "swi", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4681", "native_tokenizers": [], @@ -166,15 +199,18 @@ }, { "name": "T\u2019en", + "depth": 3, "iso_1_code": null, "iso_3_code": "tct", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4682", "native_tokenizers": [], "scripts": [] } ], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4670", "native_tokenizers": [], @@ -182,14 +218,17 @@ }, { "name": "Lakkja", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Lakkia", + "depth": 3, "iso_1_code": null, "iso_3_code": "lbc", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4684", "native_tokenizers": [], @@ -197,15 +236,18 @@ }, { "name": "Lingao", + "depth": 3, "iso_1_code": null, "iso_3_code": "onb", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4685", "native_tokenizers": [], "scripts": [] } ], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4683", "native_tokenizers": [], @@ -213,14 +255,17 @@ }, { "name": "Tai", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tai Khang", + "depth": 3, "iso_1_code": null, "iso_3_code": "tnu", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4687", "native_tokenizers": [], @@ -228,9 +273,11 @@ }, { "name": "Tai Pao", + "depth": 3, "iso_1_code": null, "iso_3_code": "tpo", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4688", "native_tokenizers": [], @@ -238,9 +285,11 @@ }, { "name": "Tai Yo", + "depth": 3, "iso_1_code": null, "iso_3_code": "tyj", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4689", "native_tokenizers": [], @@ -248,9 +297,11 @@ }, { "name": "Kuan", + "depth": 3, "iso_1_code": null, "iso_3_code": "uan", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4690", "native_tokenizers": [], @@ -258,14 +309,17 @@ }, { "name": "Central", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Cao Lan", + "depth": 4, "iso_1_code": null, "iso_3_code": "mlc", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4692", "native_tokenizers": [], @@ -273,9 +327,11 @@ }, { "name": "Nung", + "depth": 4, "iso_1_code": null, "iso_3_code": "nut", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4693", "native_tokenizers": [], @@ -283,9 +339,11 @@ }, { "name": "Ts\u2019\u00fcn-Lao", + "depth": 4, "iso_1_code": null, "iso_3_code": "tsl", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4694", "native_tokenizers": [], @@ -293,9 +351,11 @@ }, { "name": "T\u00e0y", + "depth": 4, "iso_1_code": null, "iso_3_code": "tyz", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4695", "native_tokenizers": [], @@ -303,9 +363,11 @@ }, { "name": "Zhuang, Minz", + "depth": 4, "iso_1_code": "za", "iso_3_code": "zgm", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4696", "native_tokenizers": [], @@ -313,9 +375,11 @@ }, { "name": "Zhuang, Dai", + "depth": 4, "iso_1_code": "za", "iso_3_code": "zhd", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4697", "native_tokenizers": [], @@ -323,9 +387,11 @@ }, { "name": "Zhuang, Nong", + "depth": 4, "iso_1_code": "za", "iso_3_code": "zhn", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4698", "native_tokenizers": [], @@ -333,9 +399,11 @@ }, { "name": "Zhuang, Yang", + "depth": 4, "iso_1_code": "za", "iso_3_code": "zyg", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4699", "native_tokenizers": [], @@ -343,9 +411,11 @@ }, { "name": "Zhuang, Yongnan", + "depth": 4, "iso_1_code": "za", "iso_3_code": "zyn", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4700", "native_tokenizers": [], @@ -353,15 +423,18 @@ }, { "name": "Zhuang, Zuojiang", + "depth": 4, "iso_1_code": "za", "iso_3_code": "zzj", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4701", "native_tokenizers": [], "scripts": [] } ], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4691", "native_tokenizers": [], @@ -369,14 +442,17 @@ }, { "name": "Northern", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bouyei", + "depth": 4, "iso_1_code": null, "iso_3_code": "pcc", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4703", "native_tokenizers": [], @@ -384,9 +460,11 @@ }, { "name": "Saek", + "depth": 4, "iso_1_code": null, "iso_3_code": "skb", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4704", "native_tokenizers": [], @@ -394,9 +472,11 @@ }, { "name": "Yoy", + "depth": 4, "iso_1_code": null, "iso_3_code": "yoy", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4705", "native_tokenizers": [], @@ -404,9 +484,11 @@ }, { "name": "Zhuang, Central Hongshuihe", + "depth": 4, "iso_1_code": "za", "iso_3_code": "zch", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4706", "native_tokenizers": [], @@ -414,9 +496,11 @@ }, { "name": "Zhuang, Eastern Hongshuihe", + "depth": 4, "iso_1_code": "za", "iso_3_code": "zeh", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4707", "native_tokenizers": [], @@ -424,9 +508,11 @@ }, { "name": "Zhuang, Guibei", + "depth": 4, "iso_1_code": "za", "iso_3_code": "zgb", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4708", "native_tokenizers": [], @@ -434,9 +520,11 @@ }, { "name": "Zhuang, Guibian", + "depth": 4, "iso_1_code": "za", "iso_3_code": "zgn", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4709", "native_tokenizers": [], @@ -444,9 +532,11 @@ }, { "name": "Zhuang, Liujiang", + "depth": 4, "iso_1_code": "za", "iso_3_code": "zlj", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4710", "native_tokenizers": [], @@ -454,9 +544,11 @@ }, { "name": "Zhuang, Lianshan", + "depth": 4, "iso_1_code": "za", "iso_3_code": "zln", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4711", "native_tokenizers": [], @@ -464,9 +556,11 @@ }, { "name": "Zhuang, Liuqian", + "depth": 4, "iso_1_code": "za", "iso_3_code": "zlq", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4712", "native_tokenizers": [], @@ -474,9 +568,11 @@ }, { "name": "Zhuang, Qiubei", + "depth": 4, "iso_1_code": "za", "iso_3_code": "zqe", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4713", "native_tokenizers": [], @@ -484,9 +580,11 @@ }, { "name": "Zhuang, Yongbei", + "depth": 4, "iso_1_code": "za", "iso_3_code": "zyb", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4714", "native_tokenizers": [], @@ -496,15 +594,18 @@ }, { "name": "Zhuang, Youjiang", + "depth": 4, "iso_1_code": "za", "iso_3_code": "zyj", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4715", "native_tokenizers": [], "scripts": [] } ], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4702", "native_tokenizers": [], @@ -512,14 +613,17 @@ }, { "name": "Southwestern", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ahom", + "depth": 4, "iso_1_code": null, "iso_3_code": "aho", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4717", "native_tokenizers": [], @@ -527,9 +631,11 @@ }, { "name": "Aiton", + "depth": 4, "iso_1_code": null, "iso_3_code": "aio", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4718", "native_tokenizers": [], @@ -537,9 +643,11 @@ }, { "name": "Tai Dam", + "depth": 4, "iso_1_code": null, "iso_3_code": "blt", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4719", "native_tokenizers": [], @@ -549,9 +657,11 @@ }, { "name": "Tai Ya", + "depth": 4, "iso_1_code": null, "iso_3_code": "cuu", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4720", "native_tokenizers": [], @@ -559,9 +669,11 @@ }, { "name": "L\u00fc", + "depth": 4, "iso_1_code": null, "iso_3_code": "khb", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4721", "native_tokenizers": [], @@ -569,9 +681,11 @@ }, { "name": "Khamti", + "depth": 4, "iso_1_code": null, "iso_3_code": "kht", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4722", "native_tokenizers": [], @@ -579,9 +693,11 @@ }, { "name": "Kh\u00fcn", + "depth": 4, "iso_1_code": null, "iso_3_code": "kkh", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4723", "native_tokenizers": [], @@ -589,9 +705,11 @@ }, { "name": "Khamyang", + "depth": 4, "iso_1_code": null, "iso_3_code": "ksu", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4724", "native_tokenizers": [], @@ -599,9 +717,11 @@ }, { "name": "Lao", + "depth": 4, "iso_1_code": "lo", "iso_3_code": "lao", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4725", "native_tokenizers": [], @@ -611,9 +731,11 @@ }, { "name": "Thai, Northern", + "depth": 4, "iso_1_code": null, "iso_3_code": "nod", "children": [], + "family": "Kra-Dai", "tokenizers": { "Thai": { "full_object": "ThaiTokenizer()", @@ -631,9 +753,11 @@ }, { "name": "Nyaw", + "depth": 4, "iso_1_code": null, "iso_3_code": "nyw", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4727", "native_tokenizers": [], @@ -641,9 +765,11 @@ }, { "name": "Pa Di", + "depth": 4, "iso_1_code": null, "iso_3_code": "pdi", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4728", "native_tokenizers": [], @@ -651,9 +777,11 @@ }, { "name": "Phake", + "depth": 4, "iso_1_code": null, "iso_3_code": "phk", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4729", "native_tokenizers": [], @@ -661,9 +789,11 @@ }, { "name": "Phu Thai", + "depth": 4, "iso_1_code": null, "iso_3_code": "pht", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4730", "native_tokenizers": [], @@ -671,9 +801,11 @@ }, { "name": "Phuan", + "depth": 4, "iso_1_code": null, "iso_3_code": "phu", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4731", "native_tokenizers": [], @@ -681,9 +813,11 @@ }, { "name": "Shan", + "depth": 4, "iso_1_code": null, "iso_3_code": "shn", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4732", "native_tokenizers": [], @@ -693,9 +827,11 @@ }, { "name": "Thai Song", + "depth": 4, "iso_1_code": null, "iso_3_code": "soa", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4733", "native_tokenizers": [], @@ -703,9 +839,11 @@ }, { "name": "Thai, Southern", + "depth": 4, "iso_1_code": null, "iso_3_code": "sou", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4734", "native_tokenizers": [], @@ -713,9 +851,11 @@ }, { "name": "Tai N\u00fca", + "depth": 4, "iso_1_code": null, "iso_3_code": "tdd", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4735", "native_tokenizers": [], @@ -723,9 +863,11 @@ }, { "name": "Thai", + "depth": 4, "iso_1_code": "th", "iso_3_code": "tha", "children": [], + "family": "Kra-Dai", "tokenizers": { "Thai": { "full_object": "ThaiTokenizer()", @@ -745,9 +887,11 @@ }, { "name": "Tai Long", + "depth": 4, "iso_1_code": null, "iso_3_code": "thi", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4737", "native_tokenizers": [], @@ -755,9 +899,11 @@ }, { "name": "Tai Hongjin", + "depth": 4, "iso_1_code": null, "iso_3_code": "tiz", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4738", "native_tokenizers": [], @@ -765,9 +911,11 @@ }, { "name": "Tai Laing", + "depth": 4, "iso_1_code": null, "iso_3_code": "tjl", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4739", "native_tokenizers": [], @@ -775,9 +923,11 @@ }, { "name": "Tai Thanh", + "depth": 4, "iso_1_code": null, "iso_3_code": "tmm", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4740", "native_tokenizers": [], @@ -785,9 +935,11 @@ }, { "name": "Thai, Northeastern", + "depth": 4, "iso_1_code": null, "iso_3_code": "tts", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4741", "native_tokenizers": [], @@ -795,9 +947,11 @@ }, { "name": "Tai D\u00f3n", + "depth": 4, "iso_1_code": null, "iso_3_code": "twh", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4742", "native_tokenizers": [], @@ -805,9 +959,11 @@ }, { "name": "Thu Lao", + "depth": 4, "iso_1_code": null, "iso_3_code": "tyl", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4743", "native_tokenizers": [], @@ -815,9 +971,11 @@ }, { "name": "Tai Daeng", + "depth": 4, "iso_1_code": null, "iso_3_code": "tyr", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4744", "native_tokenizers": [], @@ -825,9 +983,11 @@ }, { "name": "T\u00e0y Sa Pa", + "depth": 4, "iso_1_code": null, "iso_3_code": "tys", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4745", "native_tokenizers": [], @@ -835,9 +995,11 @@ }, { "name": "T\u00e0y Tac", + "depth": 4, "iso_1_code": null, "iso_3_code": "tyt", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4746", "native_tokenizers": [], @@ -845,15 +1007,18 @@ }, { "name": "Yong", + "depth": 4, "iso_1_code": null, "iso_3_code": "yno", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4747", "native_tokenizers": [], "scripts": [] } ], + "family": "Kra-Dai", "tokenizers": { "Thai": { "full_object": "ThaiTokenizer()", @@ -868,6 +1033,7 @@ "scripts": [] } ], + "family": "Kra-Dai", "tokenizers": { "Thai": { "full_object": "ThaiTokenizer()", @@ -882,6 +1048,7 @@ "scripts": [] } ], + "family": "Kra-Dai", "tokenizers": { "Thai": { "full_object": "ThaiTokenizer()", @@ -897,25 +1064,30 @@ }, { "name": "Kra", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Central Kra", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Buyang, Baha", + "depth": 3, "iso_1_code": null, "iso_3_code": "yha", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4750", "native_tokenizers": [], "scripts": [] } ], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4749", "native_tokenizers": [], @@ -923,14 +1095,17 @@ }, { "name": "Eastern Kra", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Cun", + "depth": 3, "iso_1_code": null, "iso_3_code": "cuq", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4752", "native_tokenizers": [], @@ -938,9 +1113,11 @@ }, { "name": "En", + "depth": 3, "iso_1_code": null, "iso_3_code": "enc", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4753", "native_tokenizers": [], @@ -948,9 +1125,11 @@ }, { "name": "Qabiao", + "depth": 3, "iso_1_code": null, "iso_3_code": "laq", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4754", "native_tokenizers": [], @@ -958,9 +1137,11 @@ }, { "name": "Laha", + "depth": 3, "iso_1_code": null, "iso_3_code": "lha", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4755", "native_tokenizers": [], @@ -968,9 +1149,11 @@ }, { "name": "Buyang, Langnian", + "depth": 3, "iso_1_code": null, "iso_3_code": "yln", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4756", "native_tokenizers": [], @@ -978,9 +1161,11 @@ }, { "name": "Yerong", + "depth": 3, "iso_1_code": null, "iso_3_code": "yrn", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4757", "native_tokenizers": [], @@ -988,15 +1173,18 @@ }, { "name": "Buyang, E\u2019ma", + "depth": 3, "iso_1_code": null, "iso_3_code": "yzg", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4758", "native_tokenizers": [], "scripts": [] } ], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4751", "native_tokenizers": [], @@ -1004,14 +1192,17 @@ }, { "name": "Western Kra", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "A\u2019ou", + "depth": 3, "iso_1_code": null, "iso_3_code": "aou", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4760", "native_tokenizers": [], @@ -1019,9 +1210,11 @@ }, { "name": "Gelao, Green", + "depth": 3, "iso_1_code": null, "iso_3_code": "giq", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4761", "native_tokenizers": [], @@ -1029,9 +1222,11 @@ }, { "name": "Gelao, Red", + "depth": 3, "iso_1_code": null, "iso_3_code": "gir", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4762", "native_tokenizers": [], @@ -1039,9 +1234,11 @@ }, { "name": "Mulao", + "depth": 3, "iso_1_code": null, "iso_3_code": "giu", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4763", "native_tokenizers": [], @@ -1049,9 +1246,11 @@ }, { "name": "Duoluo", + "depth": 3, "iso_1_code": null, "iso_3_code": "giw", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4764", "native_tokenizers": [], @@ -1059,9 +1258,11 @@ }, { "name": "Qau", + "depth": 3, "iso_1_code": null, "iso_3_code": "gqu", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4765", "native_tokenizers": [], @@ -1069,9 +1270,11 @@ }, { "name": "Lachi", + "depth": 3, "iso_1_code": null, "iso_3_code": "lbt", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4766", "native_tokenizers": [], @@ -1079,36 +1282,33 @@ }, { "name": "Lachi, White", + "depth": 3, "iso_1_code": null, "iso_3_code": "lwh", "children": [], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4767", "native_tokenizers": [], "scripts": [] } ], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4759", "native_tokenizers": [], "scripts": [] } ], + "family": "Kra-Dai", "tokenizers": {}, "node_i": "4748", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Thai": { - "full_object": "ThaiTokenizer()", - "original_lang_name": "thai", - "original_lang_code": "tha", - "script": "Thai", - "class_name": "ThaiTokenizer" - } - }, + "family": "Kra-Dai", + "tokenizers": {}, "node_i": "4664", "native_tokenizers": [], "scripts": [] diff --git a/data/Kuki-Chin-Naga.json b/data/Kuki-Chin-Naga.json index 8fe2aeb299b7d4f6c923de566a9dee680c290e36..6d66a13f5e5aee9ddfaea79080a1dd7c09274f97 100644 --- a/data/Kuki-Chin-Naga.json +++ b/data/Kuki-Chin-Naga.json @@ -1,8 +1,10 @@ { "name": "Kuki-Chin-Naga", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [], + "family": "Kuki-Chin-Naga", "tokenizers": {}, "node_i": "4768", "native_tokenizers": [], diff --git a/data/Kwomtari.json b/data/Kwomtari.json index af21ec03ccd0e8268e949498fe2d6b4e4239b279..a5c00411617fccce7a50cb787052ddd9da8a57ae 100644 --- a/data/Kwomtari.json +++ b/data/Kwomtari.json @@ -1,24 +1,29 @@ { "name": "Kwomtari", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Guriaso", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Muno", + "depth": 2, "iso_1_code": null, "iso_3_code": "grx", "children": [], + "family": "Kwomtari", "tokenizers": {}, "node_i": "4771", "native_tokenizers": [], "scripts": [] } ], + "family": "Kwomtari", "tokenizers": {}, "node_i": "4770", "native_tokenizers": [], @@ -26,14 +31,17 @@ }, { "name": "Nuclear Kwomtari", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nai", + "depth": 2, "iso_1_code": null, "iso_3_code": "bio", "children": [], + "family": "Kwomtari", "tokenizers": {}, "node_i": "4773", "native_tokenizers": [], @@ -41,21 +49,25 @@ }, { "name": "Kwomtari", + "depth": 2, "iso_1_code": null, "iso_3_code": "kwo", "children": [], + "family": "Kwomtari", "tokenizers": {}, "node_i": "4774", "native_tokenizers": [], "scripts": [] } ], + "family": "Kwomtari", "tokenizers": {}, "node_i": "4772", "native_tokenizers": [], "scripts": [] } ], + "family": "Kwomtari", "tokenizers": {}, "node_i": "4769", "native_tokenizers": [], diff --git "a/data/Kx\342\200\231a.json" "b/data/Kx\342\200\231a.json" index 006e0191b992fffdf092b92997faf6cb60dec49c..f1488cc1d998c9ef9c563f72041dd313f286345c 100644 --- "a/data/Kx\342\200\231a.json" +++ "b/data/Kx\342\200\231a.json" @@ -1,13 +1,16 @@ { "name": "Kx\u2019a", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "\u01c2\u2019Amkhoe", + "depth": 1, "iso_1_code": null, "iso_3_code": "huc", "children": [], + "family": "Kx\u2019a", "tokenizers": {}, "node_i": "4776", "native_tokenizers": [], @@ -15,14 +18,17 @@ }, { "name": "!Kung", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kung-Ekoka", + "depth": 2, "iso_1_code": null, "iso_3_code": "knw", "children": [], + "family": "Kx\u2019a", "tokenizers": {}, "node_i": "4778", "native_tokenizers": [], @@ -30,9 +36,11 @@ }, { "name": "Ju\u01c0\u2019hoansi", + "depth": 2, "iso_1_code": null, "iso_3_code": "ktz", "children": [], + "family": "Kx\u2019a", "tokenizers": {}, "node_i": "4779", "native_tokenizers": [], @@ -42,21 +50,25 @@ }, { "name": "Northwestern !Kung", + "depth": 2, "iso_1_code": null, "iso_3_code": "vaj", "children": [], + "family": "Kx\u2019a", "tokenizers": {}, "node_i": "4780", "native_tokenizers": [], "scripts": [] } ], + "family": "Kx\u2019a", "tokenizers": {}, "node_i": "4777", "native_tokenizers": [], "scripts": [] } ], + "family": "Kx\u2019a", "tokenizers": {}, "node_i": "4775", "native_tokenizers": [], diff --git a/data/Lakes Plain.json b/data/Lakes Plain.json index 1329a0d8c7e97296351ea7cb2f5114beb1226e02..78b12fa1aa033e0f0b938fd019d6893d6326b967 100644 --- a/data/Lakes Plain.json +++ b/data/Lakes Plain.json @@ -1,24 +1,29 @@ { "name": "Lakes Plain", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Awera", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Awera", + "depth": 2, "iso_1_code": null, "iso_3_code": "awr", "children": [], + "family": "Lakes Plain", "tokenizers": {}, "node_i": "4783", "native_tokenizers": [], "scripts": [] } ], + "family": "Lakes Plain", "tokenizers": {}, "node_i": "4782", "native_tokenizers": [], @@ -26,14 +31,17 @@ }, { "name": "East", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Foau", + "depth": 2, "iso_1_code": null, "iso_3_code": "flh", "children": [], + "family": "Lakes Plain", "tokenizers": {}, "node_i": "4785", "native_tokenizers": [], @@ -41,15 +49,18 @@ }, { "name": "Taburta", + "depth": 2, "iso_1_code": null, "iso_3_code": "tbp", "children": [], + "family": "Lakes Plain", "tokenizers": {}, "node_i": "4786", "native_tokenizers": [], "scripts": [] } ], + "family": "Lakes Plain", "tokenizers": {}, "node_i": "4784", "native_tokenizers": [], @@ -57,14 +68,17 @@ }, { "name": "Rasawa-Saponi", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Rasawa", + "depth": 2, "iso_1_code": null, "iso_3_code": "rac", "children": [], + "family": "Lakes Plain", "tokenizers": {}, "node_i": "4788", "native_tokenizers": [], @@ -72,15 +86,18 @@ }, { "name": "Saponi", + "depth": 2, "iso_1_code": null, "iso_3_code": "spi", "children": [], + "family": "Lakes Plain", "tokenizers": {}, "node_i": "4789", "native_tokenizers": [], "scripts": [] } ], + "family": "Lakes Plain", "tokenizers": {}, "node_i": "4787", "native_tokenizers": [], @@ -88,19 +105,23 @@ }, { "name": "Tariku", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Central", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Edopi", + "depth": 3, "iso_1_code": null, "iso_3_code": "dbf", "children": [], + "family": "Lakes Plain", "tokenizers": {}, "node_i": "4792", "native_tokenizers": [], @@ -108,15 +129,18 @@ }, { "name": "Iau", + "depth": 3, "iso_1_code": null, "iso_3_code": "tmu", "children": [], + "family": "Lakes Plain", "tokenizers": {}, "node_i": "4793", "native_tokenizers": [], "scripts": [] } ], + "family": "Lakes Plain", "tokenizers": {}, "node_i": "4791", "native_tokenizers": [], @@ -124,20 +148,24 @@ }, { "name": "Duvle", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Duvle", + "depth": 3, "iso_1_code": null, "iso_3_code": "duv", "children": [], + "family": "Lakes Plain", "tokenizers": {}, "node_i": "4795", "native_tokenizers": [], "scripts": [] } ], + "family": "Lakes Plain", "tokenizers": {}, "node_i": "4794", "native_tokenizers": [], @@ -145,14 +173,17 @@ }, { "name": "East", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Obokuitai", + "depth": 3, "iso_1_code": null, "iso_3_code": "afz", "children": [], + "family": "Lakes Plain", "tokenizers": {}, "node_i": "4797", "native_tokenizers": [], @@ -160,9 +191,11 @@ }, { "name": "Biritai", + "depth": 3, "iso_1_code": null, "iso_3_code": "bqq", "children": [], + "family": "Lakes Plain", "tokenizers": {}, "node_i": "4798", "native_tokenizers": [], @@ -170,9 +203,11 @@ }, { "name": "Eritai", + "depth": 3, "iso_1_code": null, "iso_3_code": "ert", "children": [], + "family": "Lakes Plain", "tokenizers": {}, "node_i": "4799", "native_tokenizers": [], @@ -180,9 +215,11 @@ }, { "name": "Kwerisa", + "depth": 3, "iso_1_code": null, "iso_3_code": "kkb", "children": [], + "family": "Lakes Plain", "tokenizers": {}, "node_i": "4800", "native_tokenizers": [], @@ -190,9 +227,11 @@ }, { "name": "Papasena", + "depth": 3, "iso_1_code": null, "iso_3_code": "pas", "children": [], + "family": "Lakes Plain", "tokenizers": {}, "node_i": "4801", "native_tokenizers": [], @@ -200,9 +239,11 @@ }, { "name": "Kaiy", + "depth": 3, "iso_1_code": null, "iso_3_code": "tcq", "children": [], + "family": "Lakes Plain", "tokenizers": {}, "node_i": "4802", "native_tokenizers": [], @@ -210,9 +251,11 @@ }, { "name": "Doutai", + "depth": 3, "iso_1_code": null, "iso_3_code": "tds", "children": [], + "family": "Lakes Plain", "tokenizers": {}, "node_i": "4803", "native_tokenizers": [], @@ -220,9 +263,11 @@ }, { "name": "Sikaritai", + "depth": 3, "iso_1_code": null, "iso_3_code": "tty", "children": [], + "family": "Lakes Plain", "tokenizers": {}, "node_i": "4804", "native_tokenizers": [], @@ -230,15 +275,18 @@ }, { "name": "Waritai", + "depth": 3, "iso_1_code": null, "iso_3_code": "wbe", "children": [], + "family": "Lakes Plain", "tokenizers": {}, "node_i": "4805", "native_tokenizers": [], "scripts": [] } ], + "family": "Lakes Plain", "tokenizers": {}, "node_i": "4796", "native_tokenizers": [], @@ -246,14 +294,17 @@ }, { "name": "West", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Fayu", + "depth": 3, "iso_1_code": null, "iso_3_code": "fau", "children": [], + "family": "Lakes Plain", "tokenizers": {}, "node_i": "4807", "native_tokenizers": [], @@ -261,9 +312,11 @@ }, { "name": "Kirikiri", + "depth": 3, "iso_1_code": null, "iso_3_code": "kiy", "children": [], + "family": "Lakes Plain", "tokenizers": {}, "node_i": "4808", "native_tokenizers": [], @@ -271,27 +324,32 @@ }, { "name": "Tause", + "depth": 3, "iso_1_code": null, "iso_3_code": "tad", "children": [], + "family": "Lakes Plain", "tokenizers": {}, "node_i": "4809", "native_tokenizers": [], "scripts": [] } ], + "family": "Lakes Plain", "tokenizers": {}, "node_i": "4806", "native_tokenizers": [], "scripts": [] } ], + "family": "Lakes Plain", "tokenizers": {}, "node_i": "4790", "native_tokenizers": [], "scripts": [] } ], + "family": "Lakes Plain", "tokenizers": {}, "node_i": "4781", "native_tokenizers": [], diff --git a/data/Language isolate.json b/data/Language isolate.json index d670e2aebd3d1644fba8d140ebdc39efda9fceff..c4a92bb46b34dbe6add5b025c03302767c4cdfed 100644 --- a/data/Language isolate.json +++ b/data/Language isolate.json @@ -1,22 +1,17 @@ { "name": "Language isolate", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ainu", + "depth": 1, "iso_1_code": null, "iso_3_code": "ain", "children": [], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"eu\")", - "original_lang_name": "basque", - "original_lang_code": "eus", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Language isolate", + "tokenizers": {}, "node_i": "4811", "native_tokenizers": [], "scripts": [ @@ -25,9 +20,11 @@ }, { "name": "Mpur", + "depth": 1, "iso_1_code": null, "iso_3_code": "akc", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4812", "native_tokenizers": [], @@ -35,9 +32,11 @@ }, { "name": "Andoque", + "depth": 1, "iso_1_code": null, "iso_3_code": "ano", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4813", "native_tokenizers": [], @@ -45,9 +44,11 @@ }, { "name": "Atakapa", + "depth": 1, "iso_1_code": null, "iso_3_code": "aqp", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4814", "native_tokenizers": [], @@ -55,9 +56,11 @@ }, { "name": "Arutani", + "depth": 1, "iso_1_code": null, "iso_3_code": "atx", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4815", "native_tokenizers": [], @@ -65,18 +68,12 @@ }, { "name": "Waorani", + "depth": 1, "iso_1_code": null, "iso_3_code": "auc", "children": [], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"eu\")", - "original_lang_name": "basque", - "original_lang_code": "eus", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Language isolate", + "tokenizers": {}, "node_i": "4816", "native_tokenizers": [], "scripts": [ @@ -85,9 +82,11 @@ }, { "name": "Aushiri", + "depth": 1, "iso_1_code": null, "iso_3_code": "avs", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4817", "native_tokenizers": [], @@ -95,9 +94,11 @@ }, { "name": "Odiai", + "depth": 1, "iso_1_code": null, "iso_3_code": "bhf", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4818", "native_tokenizers": [], @@ -105,9 +106,11 @@ }, { "name": "Abinomn", + "depth": 1, "iso_1_code": null, "iso_3_code": "bsa", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4819", "native_tokenizers": [], @@ -115,9 +118,11 @@ }, { "name": "Burushaski", + "depth": 1, "iso_1_code": null, "iso_3_code": "bsk", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4820", "native_tokenizers": [], @@ -125,9 +130,11 @@ }, { "name": "Callawalla", + "depth": 1, "iso_1_code": null, "iso_3_code": "caw", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4821", "native_tokenizers": [], @@ -135,18 +142,12 @@ }, { "name": "Chiquitano", + "depth": 1, "iso_1_code": null, "iso_3_code": "cax", "children": [], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"eu\")", - "original_lang_name": "basque", - "original_lang_code": "eus", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Language isolate", + "tokenizers": {}, "node_i": "4822", "native_tokenizers": [], "scripts": [ @@ -155,9 +156,11 @@ }, { "name": "Canichana", + "depth": 1, "iso_1_code": null, "iso_3_code": "caz", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4823", "native_tokenizers": [], @@ -165,18 +168,12 @@ }, { "name": "Kandozi-Chapra", + "depth": 1, "iso_1_code": null, "iso_3_code": "cbu", "children": [], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"eu\")", - "original_lang_name": "basque", - "original_lang_code": "eus", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Language isolate", + "tokenizers": {}, "node_i": "4824", "native_tokenizers": [], "scripts": [ @@ -185,9 +182,11 @@ }, { "name": "Cent\u00fa\u00fam", + "depth": 1, "iso_1_code": null, "iso_3_code": "cet", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4825", "native_tokenizers": [], @@ -195,9 +194,11 @@ }, { "name": "Chimariko", + "depth": 1, "iso_1_code": null, "iso_3_code": "cid", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4826", "native_tokenizers": [], @@ -205,18 +206,12 @@ }, { "name": "Cof\u00e1n", + "depth": 1, "iso_1_code": null, "iso_3_code": "con", "children": [], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"eu\")", - "original_lang_name": "basque", - "original_lang_code": "eus", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Language isolate", + "tokenizers": {}, "node_i": "4827", "native_tokenizers": [], "scripts": [ @@ -225,9 +220,11 @@ }, { "name": "Chitimacha", + "depth": 1, "iso_1_code": null, "iso_3_code": "ctm", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4828", "native_tokenizers": [], @@ -235,9 +232,11 @@ }, { "name": "Cuitlatec", + "depth": 1, "iso_1_code": null, "iso_3_code": "cuy", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4829", "native_tokenizers": [], @@ -245,9 +244,11 @@ }, { "name": "Cayubaba", + "depth": 1, "iso_1_code": null, "iso_3_code": "cyb", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4830", "native_tokenizers": [], @@ -255,9 +256,11 @@ }, { "name": "Bangime", + "depth": 1, "iso_1_code": null, "iso_3_code": "dba", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4831", "native_tokenizers": [], @@ -265,9 +268,11 @@ }, { "name": "Esselen", + "depth": 1, "iso_1_code": null, "iso_3_code": "esq", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4832", "native_tokenizers": [], @@ -275,9 +280,11 @@ }, { "name": "Basque", + "depth": 1, "iso_1_code": "eu", "iso_3_code": "eus", "children": [], + "family": "Language isolate", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"eu\")", @@ -297,9 +304,11 @@ }, { "name": "Iat\u00ea", + "depth": 1, "iso_1_code": null, "iso_3_code": "fun", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4834", "native_tokenizers": [], @@ -307,9 +316,11 @@ }, { "name": "Laal", + "depth": 1, "iso_1_code": null, "iso_3_code": "gdm", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4835", "native_tokenizers": [], @@ -317,9 +328,11 @@ }, { "name": "Tayap", + "depth": 1, "iso_1_code": null, "iso_3_code": "gpn", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4836", "native_tokenizers": [], @@ -327,9 +340,11 @@ }, { "name": "Guat\u00f3", + "depth": 1, "iso_1_code": null, "iso_3_code": "gta", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4837", "native_tokenizers": [], @@ -337,9 +352,11 @@ }, { "name": "Hatam", + "depth": 1, "iso_1_code": null, "iso_3_code": "had", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4838", "native_tokenizers": [], @@ -347,9 +364,11 @@ }, { "name": "Hadza", + "depth": 1, "iso_1_code": null, "iso_3_code": "hts", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4839", "native_tokenizers": [], @@ -357,9 +376,11 @@ }, { "name": "Ir\u00e1ntxe", + "depth": 1, "iso_1_code": null, "iso_3_code": "irn", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4840", "native_tokenizers": [], @@ -367,9 +388,11 @@ }, { "name": "Itonama", + "depth": 1, "iso_1_code": null, "iso_3_code": "ito", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4841", "native_tokenizers": [], @@ -377,18 +400,12 @@ }, { "name": "Cams\u00e1", + "depth": 1, "iso_1_code": null, "iso_3_code": "kbh", "children": [], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"eu\")", - "original_lang_name": "basque", - "original_lang_code": "eus", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Language isolate", + "tokenizers": {}, "node_i": "4842", "native_tokenizers": [], "scripts": [ @@ -397,9 +414,11 @@ }, { "name": "Kusunda", + "depth": 1, "iso_1_code": null, "iso_3_code": "kgg", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4843", "native_tokenizers": [], @@ -407,18 +426,12 @@ }, { "name": "Abun", + "depth": 1, "iso_1_code": null, "iso_3_code": "kgr", "children": [], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"eu\")", - "original_lang_name": "basque", - "original_lang_code": "eus", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Language isolate", + "tokenizers": {}, "node_i": "4844", "native_tokenizers": [], "scripts": [ @@ -427,9 +440,11 @@ }, { "name": "Klamath-Modoc", + "depth": 1, "iso_1_code": null, "iso_3_code": "kla", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4845", "native_tokenizers": [], @@ -437,9 +452,11 @@ }, { "name": "Kol", + "depth": 1, "iso_1_code": null, "iso_3_code": "kol", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4846", "native_tokenizers": [], @@ -447,18 +464,12 @@ }, { "name": "Kuot", + "depth": 1, "iso_1_code": null, "iso_3_code": "kto", "children": [], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"eu\")", - "original_lang_name": "basque", - "original_lang_code": "eus", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Language isolate", + "tokenizers": {}, "node_i": "4847", "native_tokenizers": [], "scripts": [ @@ -467,9 +478,11 @@ }, { "name": "Kutenai", + "depth": 1, "iso_1_code": null, "iso_3_code": "kut", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4848", "native_tokenizers": [], @@ -477,9 +490,11 @@ }, { "name": "Kunza", + "depth": 1, "iso_1_code": null, "iso_3_code": "kuz", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4849", "native_tokenizers": [], @@ -487,9 +502,11 @@ }, { "name": "Kano\u00e9", + "depth": 1, "iso_1_code": null, "iso_3_code": "kxo", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4850", "native_tokenizers": [], @@ -497,9 +514,11 @@ }, { "name": "Karok", + "depth": 1, "iso_1_code": null, "iso_3_code": "kyh", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4851", "native_tokenizers": [], @@ -507,9 +526,11 @@ }, { "name": "Karir\u00ed-Xoc\u00f3", + "depth": 1, "iso_1_code": null, "iso_3_code": "kzw", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4852", "native_tokenizers": [], @@ -517,9 +538,11 @@ }, { "name": "Leco", + "depth": 1, "iso_1_code": null, "iso_3_code": "lec", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4853", "native_tokenizers": [], @@ -527,9 +550,11 @@ }, { "name": "Molale", + "depth": 1, "iso_1_code": null, "iso_3_code": "mbe", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4854", "native_tokenizers": [], @@ -537,9 +562,11 @@ }, { "name": "Mawes", + "depth": 1, "iso_1_code": null, "iso_3_code": "mgk", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4855", "native_tokenizers": [], @@ -547,9 +574,11 @@ }, { "name": "Elseng", + "depth": 1, "iso_1_code": null, "iso_3_code": "mrf", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4856", "native_tokenizers": [], @@ -557,9 +586,11 @@ }, { "name": "Massep", + "depth": 1, "iso_1_code": null, "iso_3_code": "mvs", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4857", "native_tokenizers": [], @@ -567,9 +598,11 @@ }, { "name": "Muniche", + "depth": 1, "iso_1_code": null, "iso_3_code": "myr", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4858", "native_tokenizers": [], @@ -577,9 +610,11 @@ }, { "name": "Movima", + "depth": 1, "iso_1_code": null, "iso_3_code": "mzp", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4859", "native_tokenizers": [], @@ -587,9 +622,11 @@ }, { "name": "Yale", + "depth": 1, "iso_1_code": null, "iso_3_code": "nce", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4860", "native_tokenizers": [], @@ -597,9 +634,11 @@ }, { "name": "Natchez", + "depth": 1, "iso_1_code": null, "iso_3_code": "ncz", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4861", "native_tokenizers": [], @@ -607,9 +646,11 @@ }, { "name": "Gilyak", + "depth": 1, "iso_1_code": null, "iso_3_code": "niv", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4862", "native_tokenizers": [], @@ -617,9 +658,11 @@ }, { "name": "Nihali", + "depth": 1, "iso_1_code": null, "iso_3_code": "nll", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4863", "native_tokenizers": [], @@ -627,9 +670,11 @@ }, { "name": "Mochica", + "depth": 1, "iso_1_code": null, "iso_3_code": "omc", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4864", "native_tokenizers": [], @@ -637,9 +682,11 @@ }, { "name": "Omurano", + "depth": 1, "iso_1_code": null, "iso_3_code": "omu", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4865", "native_tokenizers": [], @@ -647,9 +694,11 @@ }, { "name": "Ofay\u00e9", + "depth": 1, "iso_1_code": null, "iso_3_code": "opy", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4866", "native_tokenizers": [], @@ -657,9 +706,11 @@ }, { "name": "Oti", + "depth": 1, "iso_1_code": null, "iso_3_code": "oti", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4867", "native_tokenizers": [], @@ -667,9 +718,11 @@ }, { "name": "Pankarar\u00fa", + "depth": 1, "iso_1_code": null, "iso_3_code": "paz", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4868", "native_tokenizers": [], @@ -677,9 +730,11 @@ }, { "name": "Pyu", + "depth": 1, "iso_1_code": null, "iso_3_code": "pby", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4869", "native_tokenizers": [], @@ -687,9 +742,11 @@ }, { "name": "Puelche", + "depth": 1, "iso_1_code": null, "iso_3_code": "pue", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4870", "native_tokenizers": [], @@ -697,9 +754,11 @@ }, { "name": "Puquina", + "depth": 1, "iso_1_code": null, "iso_3_code": "puq", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4871", "native_tokenizers": [], @@ -707,18 +766,12 @@ }, { "name": "Rikbaktsa", + "depth": 1, "iso_1_code": null, "iso_3_code": "rkb", "children": [], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"eu\")", - "original_lang_name": "basque", - "original_lang_code": "eus", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Language isolate", + "tokenizers": {}, "node_i": "4872", "native_tokenizers": [], "scripts": [ @@ -727,9 +780,11 @@ }, { "name": "Sandawe", + "depth": 1, "iso_1_code": null, "iso_3_code": "sad", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4873", "native_tokenizers": [], @@ -737,9 +792,11 @@ }, { "name": "Seri", + "depth": 1, "iso_1_code": null, "iso_3_code": "sei", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4874", "native_tokenizers": [], @@ -747,9 +804,11 @@ }, { "name": "Shasta", + "depth": 1, "iso_1_code": null, "iso_3_code": "sht", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4875", "native_tokenizers": [], @@ -757,9 +816,11 @@ }, { "name": "Siuslaw", + "depth": 1, "iso_1_code": null, "iso_3_code": "sis", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4876", "native_tokenizers": [], @@ -767,9 +828,11 @@ }, { "name": "Salinan", + "depth": 1, "iso_1_code": null, "iso_3_code": "sln", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4877", "native_tokenizers": [], @@ -777,9 +840,11 @@ }, { "name": "Sap\u00e9", + "depth": 1, "iso_1_code": null, "iso_3_code": "spc", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4878", "native_tokenizers": [], @@ -787,18 +852,12 @@ }, { "name": "Sulka", + "depth": 1, "iso_1_code": null, "iso_3_code": "sua", "children": [], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"eu\")", - "original_lang_name": "basque", - "original_lang_code": "eus", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Language isolate", + "tokenizers": {}, "node_i": "4879", "native_tokenizers": [], "scripts": [ @@ -807,9 +866,11 @@ }, { "name": "Aikan\u00e3", + "depth": 1, "iso_1_code": null, "iso_3_code": "tba", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4880", "native_tokenizers": [], @@ -817,18 +878,12 @@ }, { "name": "Ticuna", + "depth": 1, "iso_1_code": null, "iso_3_code": "tca", "children": [], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"eu\")", - "original_lang_name": "basque", - "original_lang_code": "eus", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Language isolate", + "tokenizers": {}, "node_i": "4881", "native_tokenizers": [], "scripts": [ @@ -837,9 +892,11 @@ }, { "name": "Taruma", + "depth": 1, "iso_1_code": null, "iso_3_code": "tdm", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4882", "native_tokenizers": [], @@ -847,9 +904,11 @@ }, { "name": "Timucua", + "depth": 1, "iso_1_code": null, "iso_3_code": "tjm", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4883", "native_tokenizers": [], @@ -857,9 +916,11 @@ }, { "name": "Trumai", + "depth": 1, "iso_1_code": null, "iso_3_code": "tpy", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4884", "native_tokenizers": [], @@ -867,9 +928,11 @@ }, { "name": "Tonkawa", + "depth": 1, "iso_1_code": null, "iso_3_code": "tqw", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4885", "native_tokenizers": [], @@ -877,9 +940,11 @@ }, { "name": "Taushiro", + "depth": 1, "iso_1_code": null, "iso_3_code": "trr", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4886", "native_tokenizers": [], @@ -887,9 +952,11 @@ }, { "name": "Tux\u00e1", + "depth": 1, "iso_1_code": null, "iso_3_code": "tud", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4887", "native_tokenizers": [], @@ -897,9 +964,11 @@ }, { "name": "Tunica", + "depth": 1, "iso_1_code": null, "iso_3_code": "tun", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4888", "native_tokenizers": [], @@ -907,9 +976,11 @@ }, { "name": "Uamu\u00e9", + "depth": 1, "iso_1_code": null, "iso_3_code": "uam", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4889", "native_tokenizers": [], @@ -917,18 +988,12 @@ }, { "name": "Urarina", + "depth": 1, "iso_1_code": null, "iso_3_code": "ura", "children": [], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"eu\")", - "original_lang_name": "basque", - "original_lang_code": "eus", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Language isolate", + "tokenizers": {}, "node_i": "4890", "native_tokenizers": [], "scripts": [ @@ -937,9 +1002,11 @@ }, { "name": "Vilela", + "depth": 1, "iso_1_code": null, "iso_3_code": "vil", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4891", "native_tokenizers": [], @@ -947,9 +1014,11 @@ }, { "name": "Washo", + "depth": 1, "iso_1_code": null, "iso_3_code": "was", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4892", "native_tokenizers": [], @@ -957,18 +1026,12 @@ }, { "name": "Warao", + "depth": 1, "iso_1_code": null, "iso_3_code": "wba", "children": [], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"eu\")", - "original_lang_name": "basque", - "original_lang_code": "eus", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Language isolate", + "tokenizers": {}, "node_i": "4893", "native_tokenizers": [], "scripts": [ @@ -977,9 +1040,11 @@ }, { "name": "M\u00e1ku", + "depth": 1, "iso_1_code": null, "iso_3_code": "xak", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4894", "native_tokenizers": [], @@ -987,9 +1052,11 @@ }, { "name": "Cayuse", + "depth": 1, "iso_1_code": null, "iso_3_code": "xcy", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4895", "native_tokenizers": [], @@ -997,9 +1064,11 @@ }, { "name": "Xinca", + "depth": 1, "iso_1_code": null, "iso_3_code": "xin", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4896", "native_tokenizers": [], @@ -1007,9 +1076,11 @@ }, { "name": "Xukur\u00fa", + "depth": 1, "iso_1_code": null, "iso_3_code": "xoo", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4897", "native_tokenizers": [], @@ -1017,9 +1088,11 @@ }, { "name": "Tasmanian, Northeastern", + "depth": 1, "iso_1_code": null, "iso_3_code": "xpb", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4898", "native_tokenizers": [], @@ -1027,9 +1100,11 @@ }, { "name": "Tasmanian, Oyster Bay", + "depth": 1, "iso_1_code": null, "iso_3_code": "xpd", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4899", "native_tokenizers": [], @@ -1037,9 +1112,11 @@ }, { "name": "Tasmanian, Southeast", + "depth": 1, "iso_1_code": null, "iso_3_code": "xpf", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4900", "native_tokenizers": [], @@ -1047,9 +1124,11 @@ }, { "name": "Tasmanian, North Midlands", + "depth": 1, "iso_1_code": null, "iso_3_code": "xph", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4901", "native_tokenizers": [], @@ -1057,9 +1136,11 @@ }, { "name": "Tasmanian, Port Sorell", + "depth": 1, "iso_1_code": null, "iso_3_code": "xpl", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4902", "native_tokenizers": [], @@ -1067,9 +1148,11 @@ }, { "name": "Tasmanian, Northern", + "depth": 1, "iso_1_code": null, "iso_3_code": "xpv", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4903", "native_tokenizers": [], @@ -1077,9 +1160,11 @@ }, { "name": "Tasmanian, Northwestern", + "depth": 1, "iso_1_code": null, "iso_3_code": "xpw", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4904", "native_tokenizers": [], @@ -1087,9 +1172,11 @@ }, { "name": "Tasmanian, Southwestern", + "depth": 1, "iso_1_code": null, "iso_3_code": "xpx", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4905", "native_tokenizers": [], @@ -1097,9 +1184,11 @@ }, { "name": "Tasmanian, Bruny Island", + "depth": 1, "iso_1_code": null, "iso_3_code": "xpz", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4906", "native_tokenizers": [], @@ -1107,9 +1196,11 @@ }, { "name": "Kwaza", + "depth": 1, "iso_1_code": null, "iso_3_code": "xwa", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4907", "native_tokenizers": [], @@ -1117,9 +1208,11 @@ }, { "name": "Y\u00e1mana", + "depth": 1, "iso_1_code": null, "iso_3_code": "yag", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4908", "native_tokenizers": [], @@ -1127,9 +1220,11 @@ }, { "name": "Hod\u00ef", + "depth": 1, "iso_1_code": null, "iso_3_code": "yau", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4909", "native_tokenizers": [], @@ -1137,9 +1232,11 @@ }, { "name": "Yana", + "depth": 1, "iso_1_code": null, "iso_3_code": "ynn", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4910", "native_tokenizers": [], @@ -1147,9 +1244,11 @@ }, { "name": "Yuchi", + "depth": 1, "iso_1_code": null, "iso_3_code": "yuc", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4911", "native_tokenizers": [], @@ -1157,18 +1256,12 @@ }, { "name": "Yuracare", + "depth": 1, "iso_1_code": null, "iso_3_code": "yuz", "children": [], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"eu\")", - "original_lang_name": "basque", - "original_lang_code": "eus", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Language isolate", + "tokenizers": {}, "node_i": "4912", "native_tokenizers": [], "scripts": [ @@ -1177,9 +1270,11 @@ }, { "name": "Karankawa", + "depth": 1, "iso_1_code": null, "iso_3_code": "zkk", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4913", "native_tokenizers": [], @@ -1187,24 +1282,19 @@ }, { "name": "Zuni", + "depth": 1, "iso_1_code": null, "iso_3_code": "zun", "children": [], + "family": "Language isolate", "tokenizers": {}, "node_i": "4914", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"eu\")", - "original_lang_name": "basque", - "original_lang_code": "eus", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Language isolate", + "tokenizers": {}, "node_i": "4810", "native_tokenizers": [], "scripts": [] diff --git a/data/Lencan.json b/data/Lencan.json index 9f43dda358ff176ece7dc2148c41a0a3e85abbdb..46a0c38ba4d2bd9c5205c1a592adf26046d6629b 100644 --- a/data/Lencan.json +++ b/data/Lencan.json @@ -1,19 +1,23 @@ { "name": "Lencan", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Lenca", + "depth": 1, "iso_1_code": null, "iso_3_code": "len", "children": [], + "family": "Lencan", "tokenizers": {}, "node_i": "4916", "native_tokenizers": [], "scripts": [] } ], + "family": "Lencan", "tokenizers": {}, "node_i": "4915", "native_tokenizers": [], diff --git a/data/Lower Mamberamo.json b/data/Lower Mamberamo.json index ef3488ad22f56ea41eb57c2e7e67890bda4e8144..0c2eae711089fcc3131850397d1a723f875cd6e6 100644 --- a/data/Lower Mamberamo.json +++ b/data/Lower Mamberamo.json @@ -1,13 +1,16 @@ { "name": "Lower Mamberamo", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Warembori", + "depth": 1, "iso_1_code": null, "iso_3_code": "wsa", "children": [], + "family": "Lower Mamberamo", "tokenizers": {}, "node_i": "4918", "native_tokenizers": [], @@ -15,15 +18,18 @@ }, { "name": "Yoke", + "depth": 1, "iso_1_code": null, "iso_3_code": "yki", "children": [], + "family": "Lower Mamberamo", "tokenizers": {}, "node_i": "4919", "native_tokenizers": [], "scripts": [] } ], + "family": "Lower Mamberamo", "tokenizers": {}, "node_i": "4917", "native_tokenizers": [], diff --git a/data/Maiduan.json b/data/Maiduan.json index ef816215c01ece85cd6c03aef29fb9c10de2f736..9e3b5331f6d264d7d274b38fe2487104370026f7 100644 --- a/data/Maiduan.json +++ b/data/Maiduan.json @@ -1,13 +1,16 @@ { "name": "Maiduan", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Maidu, Northwest", + "depth": 1, "iso_1_code": null, "iso_3_code": "mjd", "children": [], + "family": "Maiduan", "tokenizers": {}, "node_i": "4921", "native_tokenizers": [], @@ -15,9 +18,11 @@ }, { "name": "Nisenan", + "depth": 1, "iso_1_code": null, "iso_3_code": "nsz", "children": [], + "family": "Maiduan", "tokenizers": {}, "node_i": "4922", "native_tokenizers": [], @@ -25,14 +30,17 @@ }, { "name": "Maidu", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Maidu, Northeast", + "depth": 2, "iso_1_code": null, "iso_3_code": "nmu", "children": [], + "family": "Maiduan", "tokenizers": {}, "node_i": "4924", "native_tokenizers": [], @@ -40,21 +48,25 @@ }, { "name": "Maidu, Valley", + "depth": 2, "iso_1_code": null, "iso_3_code": "vmv", "children": [], + "family": "Maiduan", "tokenizers": {}, "node_i": "4925", "native_tokenizers": [], "scripts": [] } ], + "family": "Maiduan", "tokenizers": {}, "node_i": "4923", "native_tokenizers": [], "scripts": [] } ], + "family": "Maiduan", "tokenizers": {}, "node_i": "4920", "native_tokenizers": [], diff --git a/data/Maipurean.json b/data/Maipurean.json index 2003a8eb48ffa9e56f499fa163dfae31a1afc4cb..c3d1d31c5fd7a8ebac4fd6c7ab1b0d569d26f9a7 100644 --- a/data/Maipurean.json +++ b/data/Maipurean.json @@ -1,28 +1,34 @@ { "name": "Maipurean", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Northern", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Eastern", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Palikur", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Palik\u00far", + "depth": 4, "iso_1_code": null, "iso_3_code": "plu", "children": [], + "family": "Maipurean", "tokenizers": {}, "node_i": "4930", "native_tokenizers": [], @@ -31,12 +37,14 @@ ] } ], + "family": "Maipurean", "tokenizers": {}, "node_i": "4929", "native_tokenizers": [], "scripts": [] } ], + "family": "Maipurean", "tokenizers": {}, "node_i": "4928", "native_tokenizers": [], @@ -44,19 +52,23 @@ }, { "name": "Maritime", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ta-Maipurean", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Arawak", + "depth": 4, "iso_1_code": null, "iso_3_code": "arw", "children": [], + "family": "Maipurean", "tokenizers": {}, "node_i": "4933", "native_tokenizers": [], @@ -64,9 +76,11 @@ }, { "name": "Wayuu", + "depth": 4, "iso_1_code": null, "iso_3_code": "guc", "children": [], + "family": "Maipurean", "tokenizers": {}, "node_i": "4934", "native_tokenizers": [], @@ -76,9 +90,11 @@ }, { "name": "Paraujano", + "depth": 4, "iso_1_code": null, "iso_3_code": "pbg", "children": [], + "family": "Maipurean", "tokenizers": {}, "node_i": "4935", "native_tokenizers": [], @@ -86,9 +102,11 @@ }, { "name": "Ta\u00edno", + "depth": 4, "iso_1_code": null, "iso_3_code": "tnq", "children": [], + "family": "Maipurean", "tokenizers": {}, "node_i": "4936", "native_tokenizers": [], @@ -96,14 +114,17 @@ }, { "name": "I\u00f1eri", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Garifuna", + "depth": 5, "iso_1_code": null, "iso_3_code": "cab", "children": [], + "family": "Maipurean", "tokenizers": {}, "node_i": "4938", "native_tokenizers": [], @@ -113,21 +134,25 @@ }, { "name": "Island Carib", + "depth": 5, "iso_1_code": null, "iso_3_code": "crb", "children": [], + "family": "Maipurean", "tokenizers": {}, "node_i": "4939", "native_tokenizers": [], "scripts": [] } ], + "family": "Maipurean", "tokenizers": {}, "node_i": "4937", "native_tokenizers": [], "scripts": [] } ], + "family": "Maipurean", "tokenizers": {}, "node_i": "4932", "native_tokenizers": [], @@ -135,14 +160,17 @@ }, { "name": "Wapixana", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Atorada", + "depth": 4, "iso_1_code": null, "iso_3_code": "aox", "children": [], + "family": "Maipurean", "tokenizers": {}, "node_i": "4941", "native_tokenizers": [], @@ -150,9 +178,11 @@ }, { "name": "Mapidian", + "depth": 4, "iso_1_code": null, "iso_3_code": "mpw", "children": [], + "family": "Maipurean", "tokenizers": {}, "node_i": "4942", "native_tokenizers": [], @@ -160,9 +190,11 @@ }, { "name": "Wapishana", + "depth": 4, "iso_1_code": null, "iso_3_code": "wap", "children": [], + "family": "Maipurean", "tokenizers": {}, "node_i": "4943", "native_tokenizers": [], @@ -171,12 +203,14 @@ ] } ], + "family": "Maipurean", "tokenizers": {}, "node_i": "4940", "native_tokenizers": [], "scripts": [] } ], + "family": "Maipurean", "tokenizers": {}, "node_i": "4931", "native_tokenizers": [], @@ -184,14 +218,17 @@ }, { "name": "Upper Amazon", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Res\u00edgaro", + "depth": 3, "iso_1_code": null, "iso_3_code": "rgr", "children": [], + "family": "Maipurean", "tokenizers": {}, "node_i": "4945", "native_tokenizers": [], @@ -199,25 +236,30 @@ }, { "name": "Central Upper Amazon", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bar\u00e9", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bar\u00e9", + "depth": 5, "iso_1_code": null, "iso_3_code": "bae", "children": [], + "family": "Maipurean", "tokenizers": {}, "node_i": "4948", "native_tokenizers": [], "scripts": [] } ], + "family": "Maipurean", "tokenizers": {}, "node_i": "4947", "native_tokenizers": [], @@ -225,14 +267,17 @@ }, { "name": "Yavitero", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Baniva", + "depth": 5, "iso_1_code": null, "iso_3_code": "bvv", "children": [], + "family": "Maipurean", "tokenizers": {}, "node_i": "4950", "native_tokenizers": [], @@ -240,21 +285,25 @@ }, { "name": "Yavitero", + "depth": 5, "iso_1_code": null, "iso_3_code": "yvt", "children": [], + "family": "Maipurean", "tokenizers": {}, "node_i": "4951", "native_tokenizers": [], "scripts": [] } ], + "family": "Maipurean", "tokenizers": {}, "node_i": "4949", "native_tokenizers": [], "scripts": [] } ], + "family": "Maipurean", "tokenizers": {}, "node_i": "4946", "native_tokenizers": [], @@ -262,14 +311,17 @@ }, { "name": "Eastern Nawiki", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tariana", + "depth": 4, "iso_1_code": null, "iso_3_code": "tae", "children": [], + "family": "Maipurean", "tokenizers": {}, "node_i": "4953", "native_tokenizers": [], @@ -277,14 +329,17 @@ }, { "name": "Karu", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Baniwa", + "depth": 5, "iso_1_code": null, "iso_3_code": "bwi", "children": [], + "family": "Maipurean", "tokenizers": {}, "node_i": "4955", "native_tokenizers": [], @@ -294,21 +349,25 @@ }, { "name": "Curripaco", + "depth": 5, "iso_1_code": null, "iso_3_code": "kpc", "children": [], + "family": "Maipurean", "tokenizers": {}, "node_i": "4956", "native_tokenizers": [], "scripts": [] } ], + "family": "Maipurean", "tokenizers": {}, "node_i": "4954", "native_tokenizers": [], "scripts": [] } ], + "family": "Maipurean", "tokenizers": {}, "node_i": "4952", "native_tokenizers": [], @@ -316,14 +375,17 @@ }, { "name": "Unclassified", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Xiri\u00e2na", + "depth": 4, "iso_1_code": null, "iso_3_code": "xir", "children": [], + "family": "Maipurean", "tokenizers": {}, "node_i": "4958", "native_tokenizers": [], @@ -331,15 +393,18 @@ }, { "name": "Yaba\u00e2na", + "depth": 4, "iso_1_code": null, "iso_3_code": "ybn", "children": [], + "family": "Maipurean", "tokenizers": {}, "node_i": "4959", "native_tokenizers": [], "scripts": [] } ], + "family": "Maipurean", "tokenizers": {}, "node_i": "4957", "native_tokenizers": [], @@ -347,14 +412,17 @@ }, { "name": "Western Nawiki", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Cabiyar\u00ed", + "depth": 4, "iso_1_code": null, "iso_3_code": "cbb", "children": [], + "family": "Maipurean", "tokenizers": {}, "node_i": "4961", "native_tokenizers": [], @@ -362,9 +430,11 @@ }, { "name": "Yucuna", + "depth": 4, "iso_1_code": null, "iso_3_code": "ycn", "children": [], + "family": "Maipurean", "tokenizers": {}, "node_i": "4962", "native_tokenizers": [], @@ -374,14 +444,17 @@ }, { "name": "Piapoco", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Achagua", + "depth": 5, "iso_1_code": null, "iso_3_code": "aca", "children": [], + "family": "Maipurean", "tokenizers": {}, "node_i": "4964", "native_tokenizers": [], @@ -391,9 +464,11 @@ }, { "name": "Piapoco", + "depth": 5, "iso_1_code": null, "iso_3_code": "pio", "children": [], + "family": "Maipurean", "tokenizers": {}, "node_i": "4965", "native_tokenizers": [], @@ -402,6 +477,7 @@ ] } ], + "family": "Maipurean", "tokenizers": {}, "node_i": "4963", "native_tokenizers": [], @@ -409,14 +485,17 @@ }, { "name": "Warekena", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Guarequena", + "depth": 5, "iso_1_code": null, "iso_3_code": "gae", "children": [], + "family": "Maipurean", "tokenizers": {}, "node_i": "4967", "native_tokenizers": [], @@ -424,33 +503,39 @@ }, { "name": "Mandahuaca", + "depth": 5, "iso_1_code": null, "iso_3_code": "mht", "children": [], + "family": "Maipurean", "tokenizers": {}, "node_i": "4968", "native_tokenizers": [], "scripts": [] } ], + "family": "Maipurean", "tokenizers": {}, "node_i": "4966", "native_tokenizers": [], "scripts": [] } ], + "family": "Maipurean", "tokenizers": {}, "node_i": "4960", "native_tokenizers": [], "scripts": [] } ], + "family": "Maipurean", "tokenizers": {}, "node_i": "4944", "native_tokenizers": [], "scripts": [] } ], + "family": "Maipurean", "tokenizers": {}, "node_i": "4927", "native_tokenizers": [], @@ -458,19 +543,23 @@ }, { "name": "Southern", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Campa", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ash\u00e1ninka", + "depth": 3, "iso_1_code": null, "iso_3_code": "cni", "children": [], + "family": "Maipurean", "tokenizers": {}, "node_i": "4971", "native_tokenizers": [], @@ -480,14 +569,17 @@ }, { "name": "Ash\u00e9ninga", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ash\u00e9ninka, Pajonal", + "depth": 4, "iso_1_code": null, "iso_3_code": "cjo", "children": [], + "family": "Maipurean", "tokenizers": {}, "node_i": "4973", "native_tokenizers": [], @@ -497,9 +589,11 @@ }, { "name": "Nanti", + "depth": 4, "iso_1_code": null, "iso_3_code": "cox", "children": [], + "family": "Maipurean", "tokenizers": {}, "node_i": "4974", "native_tokenizers": [], @@ -507,9 +601,11 @@ }, { "name": "Ash\u00e9ninka, Ucayali-Yur\u00faa", + "depth": 4, "iso_1_code": null, "iso_3_code": "cpb", "children": [], + "family": "Maipurean", "tokenizers": {}, "node_i": "4975", "native_tokenizers": [], @@ -519,9 +615,11 @@ }, { "name": "Ajy\u00edninka Apurucayali", + "depth": 4, "iso_1_code": null, "iso_3_code": "cpc", "children": [], + "family": "Maipurean", "tokenizers": {}, "node_i": "4976", "native_tokenizers": [], @@ -531,9 +629,11 @@ }, { "name": "Ash\u00e9ninka, Pichis", + "depth": 4, "iso_1_code": null, "iso_3_code": "cpu", "children": [], + "family": "Maipurean", "tokenizers": {}, "node_i": "4977", "native_tokenizers": [], @@ -543,9 +643,11 @@ }, { "name": "Ash\u00e9ninka, South Ucayali", + "depth": 4, "iso_1_code": null, "iso_3_code": "cpy", "children": [], + "family": "Maipurean", "tokenizers": {}, "node_i": "4978", "native_tokenizers": [], @@ -555,9 +657,11 @@ }, { "name": "Nomatsigenga", + "depth": 4, "iso_1_code": null, "iso_3_code": "not", "children": [], + "family": "Maipurean", "tokenizers": {}, "node_i": "4979", "native_tokenizers": [], @@ -567,9 +671,11 @@ }, { "name": "Ash\u00e9ninka, Peren\u00e9", + "depth": 4, "iso_1_code": null, "iso_3_code": "prq", "children": [], + "family": "Maipurean", "tokenizers": {}, "node_i": "4980", "native_tokenizers": [], @@ -578,6 +684,7 @@ ] } ], + "family": "Maipurean", "tokenizers": {}, "node_i": "4972", "native_tokenizers": [], @@ -585,14 +692,17 @@ }, { "name": "Machiguenga", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Caquinte", + "depth": 4, "iso_1_code": null, "iso_3_code": "cot", "children": [], + "family": "Maipurean", "tokenizers": {}, "node_i": "4982", "native_tokenizers": [], @@ -602,9 +712,11 @@ }, { "name": "Matsigenka", + "depth": 4, "iso_1_code": null, "iso_3_code": "mcb", "children": [], + "family": "Maipurean", "tokenizers": {}, "node_i": "4983", "native_tokenizers": [], @@ -613,12 +725,14 @@ ] } ], + "family": "Maipurean", "tokenizers": {}, "node_i": "4981", "native_tokenizers": [], "scripts": [] } ], + "family": "Maipurean", "tokenizers": {}, "node_i": "4970", "native_tokenizers": [], @@ -626,19 +740,23 @@ }, { "name": "Central", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Pares\u00ed", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Parec\u00eds", + "depth": 4, "iso_1_code": null, "iso_3_code": "pab", "children": [], + "family": "Maipurean", "tokenizers": {}, "node_i": "4986", "native_tokenizers": [], @@ -648,15 +766,18 @@ }, { "name": "Saraveca", + "depth": 4, "iso_1_code": null, "iso_3_code": "sar", "children": [], + "family": "Maipurean", "tokenizers": {}, "node_i": "4987", "native_tokenizers": [], "scripts": [] } ], + "family": "Maipurean", "tokenizers": {}, "node_i": "4985", "native_tokenizers": [], @@ -664,14 +785,17 @@ }, { "name": "Waur\u00e1", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mehin\u00e1ku", + "depth": 4, "iso_1_code": null, "iso_3_code": "mmh", "children": [], + "family": "Maipurean", "tokenizers": {}, "node_i": "4989", "native_tokenizers": [], @@ -679,14 +803,17 @@ }, { "name": "Waur\u00e1-Meinaku", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Waur\u00e1", + "depth": 5, "iso_1_code": null, "iso_3_code": "wau", "children": [], + "family": "Maipurean", "tokenizers": {}, "node_i": "4991", "native_tokenizers": [], @@ -694,27 +821,32 @@ }, { "name": "Yawalapit\u00ed", + "depth": 5, "iso_1_code": null, "iso_3_code": "yaw", "children": [], + "family": "Maipurean", "tokenizers": {}, "node_i": "4992", "native_tokenizers": [], "scripts": [] } ], + "family": "Maipurean", "tokenizers": {}, "node_i": "4990", "native_tokenizers": [], "scripts": [] } ], + "family": "Maipurean", "tokenizers": {}, "node_i": "4988", "native_tokenizers": [], "scripts": [] } ], + "family": "Maipurean", "tokenizers": {}, "node_i": "4984", "native_tokenizers": [], @@ -722,19 +854,23 @@ }, { "name": "Southern Outlier", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mojo", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Baure", + "depth": 4, "iso_1_code": null, "iso_3_code": "brg", "children": [], + "family": "Maipurean", "tokenizers": {}, "node_i": "4995", "native_tokenizers": [], @@ -742,9 +878,11 @@ }, { "name": "Paunaka", + "depth": 4, "iso_1_code": null, "iso_3_code": "pnk", "children": [], + "family": "Maipurean", "tokenizers": {}, "node_i": "4996", "native_tokenizers": [], @@ -752,14 +890,17 @@ }, { "name": "Mojo", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ignaciano", + "depth": 5, "iso_1_code": null, "iso_3_code": "ign", "children": [], + "family": "Maipurean", "tokenizers": {}, "node_i": "4998", "native_tokenizers": [], @@ -769,9 +910,11 @@ }, { "name": "Trinitario", + "depth": 5, "iso_1_code": null, "iso_3_code": "trn", "children": [], + "family": "Maipurean", "tokenizers": {}, "node_i": "4999", "native_tokenizers": [], @@ -780,12 +923,14 @@ ] } ], + "family": "Maipurean", "tokenizers": {}, "node_i": "4997", "native_tokenizers": [], "scripts": [] } ], + "family": "Maipurean", "tokenizers": {}, "node_i": "4994", "native_tokenizers": [], @@ -793,14 +938,17 @@ }, { "name": "Piro", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Apurin\u00e3", + "depth": 4, "iso_1_code": null, "iso_3_code": "apu", "children": [], + "family": "Maipurean", "tokenizers": {}, "node_i": "5001", "native_tokenizers": [], @@ -810,9 +958,11 @@ }, { "name": "I\u00f1apari", + "depth": 4, "iso_1_code": null, "iso_3_code": "inp", "children": [], + "family": "Maipurean", "tokenizers": {}, "node_i": "5002", "native_tokenizers": [], @@ -820,14 +970,17 @@ }, { "name": "Piro", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mashco Piro", + "depth": 5, "iso_1_code": null, "iso_3_code": "cuj", "children": [], + "family": "Maipurean", "tokenizers": {}, "node_i": "5004", "native_tokenizers": [], @@ -835,9 +988,11 @@ }, { "name": "Machinere", + "depth": 5, "iso_1_code": null, "iso_3_code": "mpd", "children": [], + "family": "Maipurean", "tokenizers": {}, "node_i": "5005", "native_tokenizers": [], @@ -845,9 +1000,11 @@ }, { "name": "Yine", + "depth": 5, "iso_1_code": null, "iso_3_code": "pib", "children": [], + "family": "Maipurean", "tokenizers": {}, "node_i": "5006", "native_tokenizers": [], @@ -856,12 +1013,14 @@ ] } ], + "family": "Maipurean", "tokenizers": {}, "node_i": "5003", "native_tokenizers": [], "scripts": [] } ], + "family": "Maipurean", "tokenizers": {}, "node_i": "5000", "native_tokenizers": [], @@ -869,14 +1028,17 @@ }, { "name": "Terena", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chan\u00e9", + "depth": 4, "iso_1_code": null, "iso_3_code": "caj", "children": [], + "family": "Maipurean", "tokenizers": {}, "node_i": "5008", "native_tokenizers": [], @@ -884,9 +1046,11 @@ }, { "name": "Guana", + "depth": 4, "iso_1_code": null, "iso_3_code": "gqn", "children": [], + "family": "Maipurean", "tokenizers": {}, "node_i": "5009", "native_tokenizers": [], @@ -894,9 +1058,11 @@ }, { "name": "Ter\u00eana", + "depth": 4, "iso_1_code": null, "iso_3_code": "ter", "children": [], + "family": "Maipurean", "tokenizers": {}, "node_i": "5010", "native_tokenizers": [], @@ -905,12 +1071,14 @@ ] } ], + "family": "Maipurean", "tokenizers": {}, "node_i": "5007", "native_tokenizers": [], "scripts": [] } ], + "family": "Maipurean", "tokenizers": {}, "node_i": "4993", "native_tokenizers": [], @@ -918,14 +1086,17 @@ }, { "name": "Western", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Yanesha\u2019", + "depth": 3, "iso_1_code": null, "iso_3_code": "ame", "children": [], + "family": "Maipurean", "tokenizers": {}, "node_i": "5012", "native_tokenizers": [], @@ -935,21 +1106,25 @@ }, { "name": "Chamicuro", + "depth": 3, "iso_1_code": null, "iso_3_code": "ccc", "children": [], + "family": "Maipurean", "tokenizers": {}, "node_i": "5013", "native_tokenizers": [], "scripts": [] } ], + "family": "Maipurean", "tokenizers": {}, "node_i": "5011", "native_tokenizers": [], "scripts": [] } ], + "family": "Maipurean", "tokenizers": {}, "node_i": "4969", "native_tokenizers": [], @@ -957,14 +1132,17 @@ }, { "name": "Unclassified", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mawayana", + "depth": 2, "iso_1_code": null, "iso_3_code": "mzx", "children": [], + "family": "Maipurean", "tokenizers": {}, "node_i": "5015", "native_tokenizers": [], @@ -972,21 +1150,25 @@ }, { "name": "Enawen\u00e9-Naw\u00e9", + "depth": 2, "iso_1_code": null, "iso_3_code": "unk", "children": [], + "family": "Maipurean", "tokenizers": {}, "node_i": "5016", "native_tokenizers": [], "scripts": [] } ], + "family": "Maipurean", "tokenizers": {}, "node_i": "5014", "native_tokenizers": [], "scripts": [] } ], + "family": "Maipurean", "tokenizers": {}, "node_i": "4926", "native_tokenizers": [], diff --git a/data/Mairasi.json b/data/Mairasi.json index 9e35457c6e0c328c533df475a5c44b60104dab62..56bbe1db6fc7d5da7356d6483c843f9f75592017 100644 --- a/data/Mairasi.json +++ b/data/Mairasi.json @@ -1,13 +1,16 @@ { "name": "Mairasi", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Semimi", + "depth": 1, "iso_1_code": null, "iso_3_code": "etz", "children": [], + "family": "Mairasi", "tokenizers": {}, "node_i": "5018", "native_tokenizers": [], @@ -15,9 +18,11 @@ }, { "name": "Mer", + "depth": 1, "iso_1_code": null, "iso_3_code": "mnu", "children": [], + "family": "Mairasi", "tokenizers": {}, "node_i": "5019", "native_tokenizers": [], @@ -25,15 +30,18 @@ }, { "name": "Mairasi", + "depth": 1, "iso_1_code": null, "iso_3_code": "zrs", "children": [], + "family": "Mairasi", "tokenizers": {}, "node_i": "5020", "native_tokenizers": [], "scripts": [] } ], + "family": "Mairasi", "tokenizers": {}, "node_i": "5017", "native_tokenizers": [], diff --git a/data/Mapudungu.json b/data/Mapudungu.json index 5458daf5abe81c369d794bfb6b36c587b5c92f17..ee314246955d84b75867d2558b1e9f329fe93c6d 100644 --- a/data/Mapudungu.json +++ b/data/Mapudungu.json @@ -1,13 +1,16 @@ { "name": "Mapudungu", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mapudungun", + "depth": 1, "iso_1_code": null, "iso_3_code": "arn", "children": [], + "family": "Mapudungu", "tokenizers": {}, "node_i": "5022", "native_tokenizers": [], @@ -17,15 +20,18 @@ }, { "name": "Huilliche", + "depth": 1, "iso_1_code": null, "iso_3_code": "huh", "children": [], + "family": "Mapudungu", "tokenizers": {}, "node_i": "5023", "native_tokenizers": [], "scripts": [] } ], + "family": "Mapudungu", "tokenizers": {}, "node_i": "5021", "native_tokenizers": [], diff --git a/data/Mascoyan.json b/data/Mascoyan.json index 617813cbc2a7964524b1694e4a84bb0fa000f501..5094eb8fc0f1a690b283a81853058862691627fa 100644 --- a/data/Mascoyan.json +++ b/data/Mascoyan.json @@ -1,13 +1,16 @@ { "name": "Mascoyan", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Angait\u00e9", + "depth": 1, "iso_1_code": null, "iso_3_code": "aqt", "children": [], + "family": "Mascoyan", "tokenizers": {}, "node_i": "5025", "native_tokenizers": [], @@ -15,9 +18,11 @@ }, { "name": "Enlhet", + "depth": 1, "iso_1_code": null, "iso_3_code": "enl", "children": [], + "family": "Mascoyan", "tokenizers": {}, "node_i": "5026", "native_tokenizers": [], @@ -27,9 +32,11 @@ }, { "name": "Enxet", + "depth": 1, "iso_1_code": null, "iso_3_code": "enx", "children": [], + "family": "Mascoyan", "tokenizers": {}, "node_i": "5027", "native_tokenizers": [], @@ -39,9 +46,11 @@ }, { "name": "Guana", + "depth": 1, "iso_1_code": null, "iso_3_code": "gva", "children": [], + "family": "Mascoyan", "tokenizers": {}, "node_i": "5028", "native_tokenizers": [], @@ -49,9 +58,11 @@ }, { "name": "Sanapan\u00e1", + "depth": 1, "iso_1_code": null, "iso_3_code": "spn", "children": [], + "family": "Mascoyan", "tokenizers": {}, "node_i": "5029", "native_tokenizers": [], @@ -59,26 +70,31 @@ }, { "name": "Mascoy", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Toba-Maskoy", + "depth": 2, "iso_1_code": null, "iso_3_code": "tmf", "children": [], + "family": "Mascoyan", "tokenizers": {}, "node_i": "5031", "native_tokenizers": [], "scripts": [] } ], + "family": "Mascoyan", "tokenizers": {}, "node_i": "5030", "native_tokenizers": [], "scripts": [] } ], + "family": "Mascoyan", "tokenizers": {}, "node_i": "5024", "native_tokenizers": [], diff --git a/data/Matacoan.json b/data/Matacoan.json index b234cb51c14d625c646a75fb75c7e192e73c8722..3c3c7aa0dcc89b60608630083737f9c5ed4d4834 100644 --- a/data/Matacoan.json +++ b/data/Matacoan.json @@ -1,13 +1,16 @@ { "name": "Matacoan", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nivacl\u00e9", + "depth": 1, "iso_1_code": null, "iso_3_code": "cag", "children": [], + "family": "Matacoan", "tokenizers": {}, "node_i": "5033", "native_tokenizers": [], @@ -17,9 +20,11 @@ }, { "name": "Maka", + "depth": 1, "iso_1_code": null, "iso_3_code": "mca", "children": [], + "family": "Matacoan", "tokenizers": {}, "node_i": "5034", "native_tokenizers": [], @@ -29,14 +34,17 @@ }, { "name": "Chorote", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chorote, Iyo\u2019wujwa", + "depth": 2, "iso_1_code": null, "iso_3_code": "crq", "children": [], + "family": "Matacoan", "tokenizers": {}, "node_i": "5036", "native_tokenizers": [], @@ -44,9 +52,11 @@ }, { "name": "Chorote, Iyojwa\u2019ja", + "depth": 2, "iso_1_code": null, "iso_3_code": "crt", "children": [], + "family": "Matacoan", "tokenizers": {}, "node_i": "5037", "native_tokenizers": [], @@ -55,6 +65,7 @@ ] } ], + "family": "Matacoan", "tokenizers": {}, "node_i": "5035", "native_tokenizers": [], @@ -62,14 +73,17 @@ }, { "name": "Mataco", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Weenhayek", + "depth": 2, "iso_1_code": null, "iso_3_code": "mtp", "children": [], + "family": "Matacoan", "tokenizers": {}, "node_i": "5039", "native_tokenizers": [], @@ -79,9 +93,11 @@ }, { "name": "Pilcomayo Wich\u00ed", + "depth": 2, "iso_1_code": null, "iso_3_code": "mzh", "children": [], + "family": "Matacoan", "tokenizers": {}, "node_i": "5040", "native_tokenizers": [], @@ -91,9 +107,11 @@ }, { "name": "Bermejo Wich\u00ed", + "depth": 2, "iso_1_code": null, "iso_3_code": "wlv", "children": [], + "family": "Matacoan", "tokenizers": {}, "node_i": "5041", "native_tokenizers": [], @@ -102,12 +120,14 @@ ] } ], + "family": "Matacoan", "tokenizers": {}, "node_i": "5038", "native_tokenizers": [], "scripts": [] } ], + "family": "Matacoan", "tokenizers": {}, "node_i": "5032", "native_tokenizers": [], diff --git a/data/Maxakalian.json b/data/Maxakalian.json index d2959a6097172802a6348c651c9f709d2f9ba6d0..1f6910ef5a19c759e84f98edec21ffbddf4fd4ef 100644 --- a/data/Maxakalian.json +++ b/data/Maxakalian.json @@ -1,13 +1,16 @@ { "name": "Maxakalian", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Maxakal\u00ed", + "depth": 1, "iso_1_code": null, "iso_3_code": "mbl", "children": [], + "family": "Maxakalian", "tokenizers": {}, "node_i": "5043", "native_tokenizers": [], @@ -17,15 +20,18 @@ }, { "name": "Patax\u00f3 H\u00e3-Ha-H\u00e3e", + "depth": 1, "iso_1_code": null, "iso_3_code": "pth", "children": [], + "family": "Maxakalian", "tokenizers": {}, "node_i": "5044", "native_tokenizers": [], "scripts": [] } ], + "family": "Maxakalian", "tokenizers": {}, "node_i": "5042", "native_tokenizers": [], diff --git a/data/Mayan.json b/data/Mayan.json index 78120e63120b7bea6aa919501d8f8b5b86c43050..88e157d4a705d3f08aad5abfaa81caa46d239465 100644 --- a/data/Mayan.json +++ b/data/Mayan.json @@ -1,18 +1,22 @@ { "name": "Mayan", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Huastecan", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chicomuceltec", + "depth": 2, "iso_1_code": null, "iso_3_code": "cob", "children": [], + "family": "Mayan", "tokenizers": {}, "node_i": "5047", "native_tokenizers": [], @@ -20,14 +24,17 @@ }, { "name": "Huastec", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Huastec", + "depth": 3, "iso_1_code": null, "iso_3_code": "hus", "children": [], + "family": "Mayan", "tokenizers": {}, "node_i": "5049", "native_tokenizers": [], @@ -36,12 +43,14 @@ ] } ], + "family": "Mayan", "tokenizers": {}, "node_i": "5048", "native_tokenizers": [], "scripts": [] } ], + "family": "Mayan", "tokenizers": {}, "node_i": "5046", "native_tokenizers": [], @@ -49,34 +58,41 @@ }, { "name": "Yucatecan-Core Mayan", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Core Mayan", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Cholan-Tzeltalan", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Cholan", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chol-Chontal", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chontal, Tabasco", + "depth": 6, "iso_1_code": null, "iso_3_code": "chf", "children": [], + "family": "Mayan", "tokenizers": {}, "node_i": "5055", "native_tokenizers": [], @@ -86,14 +102,17 @@ }, { "name": "Chol", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chol", + "depth": 7, "iso_1_code": null, "iso_3_code": "ctu", "children": [], + "family": "Mayan", "tokenizers": {}, "node_i": "5057", "native_tokenizers": [], @@ -102,12 +121,14 @@ ] } ], + "family": "Mayan", "tokenizers": {}, "node_i": "5056", "native_tokenizers": [], "scripts": [] } ], + "family": "Mayan", "tokenizers": {}, "node_i": "5054", "native_tokenizers": [], @@ -115,14 +136,17 @@ }, { "name": "Chorti-Cholti", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ch\u2019orti\u2019", + "depth": 6, "iso_1_code": null, "iso_3_code": "caa", "children": [], + "family": "Mayan", "tokenizers": {}, "node_i": "5059", "native_tokenizers": [], @@ -131,12 +155,14 @@ ] } ], + "family": "Mayan", "tokenizers": {}, "node_i": "5058", "native_tokenizers": [], "scripts": [] } ], + "family": "Mayan", "tokenizers": {}, "node_i": "5053", "native_tokenizers": [], @@ -144,19 +170,23 @@ }, { "name": "Tzeltalan", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tzeltal", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tzeltal", + "depth": 6, "iso_1_code": null, "iso_3_code": "tzh", "children": [], + "family": "Mayan", "tokenizers": {}, "node_i": "5062", "native_tokenizers": [], @@ -165,6 +195,7 @@ ] } ], + "family": "Mayan", "tokenizers": {}, "node_i": "5061", "native_tokenizers": [], @@ -172,14 +203,17 @@ }, { "name": "Tzotzil", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tzotzil", + "depth": 6, "iso_1_code": null, "iso_3_code": "tzo", "children": [], + "family": "Mayan", "tokenizers": {}, "node_i": "5064", "native_tokenizers": [], @@ -188,24 +222,28 @@ ] } ], + "family": "Mayan", "tokenizers": {}, "node_i": "5063", "native_tokenizers": [], "scripts": [] } ], + "family": "Mayan", "tokenizers": {}, "node_i": "5060", "native_tokenizers": [], "scripts": [] } ], + "family": "Mayan", "tokenizers": {}, "node_i": "5052", "native_tokenizers": [], "scripts": [] } ], + "family": "Mayan", "tokenizers": {}, "node_i": "5051", "native_tokenizers": [], @@ -213,19 +251,23 @@ }, { "name": "K\u2019ichean-Mamean", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "K\u2019ichean", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Q\ua78ceqchi\ua78c", + "depth": 4, "iso_1_code": null, "iso_3_code": "kek", "children": [], + "family": "Mayan", "tokenizers": {}, "node_i": "5067", "native_tokenizers": [], @@ -235,9 +277,11 @@ }, { "name": "Uspanteko", + "depth": 4, "iso_1_code": null, "iso_3_code": "usp", "children": [], + "family": "Mayan", "tokenizers": {}, "node_i": "5068", "native_tokenizers": [], @@ -247,19 +291,23 @@ }, { "name": "Poqom-K\u2019ichean", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Core K\u2019ichean", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Achi", + "depth": 6, "iso_1_code": null, "iso_3_code": "acr", "children": [], + "family": "Mayan", "tokenizers": {}, "node_i": "5071", "native_tokenizers": [], @@ -269,9 +317,11 @@ }, { "name": "K\u2019iche\u2019", + "depth": 6, "iso_1_code": null, "iso_3_code": "quc", "children": [], + "family": "Mayan", "tokenizers": {}, "node_i": "5072", "native_tokenizers": [], @@ -281,9 +331,11 @@ }, { "name": "Sipakapense", + "depth": 6, "iso_1_code": null, "iso_3_code": "qum", "children": [], + "family": "Mayan", "tokenizers": {}, "node_i": "5073", "native_tokenizers": [], @@ -291,9 +343,11 @@ }, { "name": "Sakapulteko", + "depth": 6, "iso_1_code": null, "iso_3_code": "quv", "children": [], + "family": "Mayan", "tokenizers": {}, "node_i": "5074", "native_tokenizers": [], @@ -301,14 +355,17 @@ }, { "name": "Kaqchikel-Tz\u2019utujil", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kaqchikel", + "depth": 7, "iso_1_code": null, "iso_3_code": "cak", "children": [], + "family": "Mayan", "tokenizers": {}, "node_i": "5076", "native_tokenizers": [], @@ -318,9 +375,11 @@ }, { "name": "Tz\u2019utujil", + "depth": 7, "iso_1_code": null, "iso_3_code": "tzj", "children": [], + "family": "Mayan", "tokenizers": {}, "node_i": "5077", "native_tokenizers": [], @@ -329,12 +388,14 @@ ] } ], + "family": "Mayan", "tokenizers": {}, "node_i": "5075", "native_tokenizers": [], "scripts": [] } ], + "family": "Mayan", "tokenizers": {}, "node_i": "5070", "native_tokenizers": [], @@ -342,25 +403,30 @@ }, { "name": "Poqom", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Poqomam", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Poqomam", + "depth": 7, "iso_1_code": null, "iso_3_code": "poc", "children": [], + "family": "Mayan", "tokenizers": {}, "node_i": "5080", "native_tokenizers": [], "scripts": [] } ], + "family": "Mayan", "tokenizers": {}, "node_i": "5079", "native_tokenizers": [], @@ -368,14 +434,17 @@ }, { "name": "Poqomchi\u2019", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Poqomchi\u2019", + "depth": 7, "iso_1_code": null, "iso_3_code": "poh", "children": [], + "family": "Mayan", "tokenizers": {}, "node_i": "5082", "native_tokenizers": [], @@ -384,24 +453,28 @@ ] } ], + "family": "Mayan", "tokenizers": {}, "node_i": "5081", "native_tokenizers": [], "scripts": [] } ], + "family": "Mayan", "tokenizers": {}, "node_i": "5078", "native_tokenizers": [], "scripts": [] } ], + "family": "Mayan", "tokenizers": {}, "node_i": "5069", "native_tokenizers": [], "scripts": [] } ], + "family": "Mayan", "tokenizers": {}, "node_i": "5066", "native_tokenizers": [], @@ -409,19 +482,23 @@ }, { "name": "Mamean", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Awakateko-Ixil", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Awakateko", + "depth": 5, "iso_1_code": null, "iso_3_code": "agu", "children": [], + "family": "Mayan", "tokenizers": {}, "node_i": "5085", "native_tokenizers": [], @@ -431,9 +508,11 @@ }, { "name": "Ixil", + "depth": 5, "iso_1_code": null, "iso_3_code": "ixl", "children": [], + "family": "Mayan", "tokenizers": {}, "node_i": "5086", "native_tokenizers": [], @@ -442,6 +521,7 @@ ] } ], + "family": "Mayan", "tokenizers": {}, "node_i": "5084", "native_tokenizers": [], @@ -449,14 +529,17 @@ }, { "name": "Teco-Mam", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mam", + "depth": 5, "iso_1_code": null, "iso_3_code": "mam", "children": [], + "family": "Mayan", "tokenizers": {}, "node_i": "5088", "native_tokenizers": [], @@ -466,9 +549,11 @@ }, { "name": "Tektiteko", + "depth": 5, "iso_1_code": null, "iso_3_code": "ttc", "children": [], + "family": "Mayan", "tokenizers": {}, "node_i": "5089", "native_tokenizers": [], @@ -477,18 +562,21 @@ ] } ], + "family": "Mayan", "tokenizers": {}, "node_i": "5087", "native_tokenizers": [], "scripts": [] } ], + "family": "Mayan", "tokenizers": {}, "node_i": "5083", "native_tokenizers": [], "scripts": [] } ], + "family": "Mayan", "tokenizers": {}, "node_i": "5065", "native_tokenizers": [], @@ -496,19 +584,23 @@ }, { "name": "Q\u2019anjob\u2019alan-Chujean", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chujean", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chuj", + "depth": 4, "iso_1_code": null, "iso_3_code": "cac", "children": [], + "family": "Mayan", "tokenizers": {}, "node_i": "5092", "native_tokenizers": [], @@ -518,9 +610,11 @@ }, { "name": "Tojolabal", + "depth": 4, "iso_1_code": null, "iso_3_code": "toj", "children": [], + "family": "Mayan", "tokenizers": {}, "node_i": "5093", "native_tokenizers": [], @@ -529,6 +623,7 @@ ] } ], + "family": "Mayan", "tokenizers": {}, "node_i": "5091", "native_tokenizers": [], @@ -536,14 +631,17 @@ }, { "name": "Q\u2019anjob\u2019alan", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mocho", + "depth": 4, "iso_1_code": null, "iso_3_code": "mhc", "children": [], + "family": "Mayan", "tokenizers": {}, "node_i": "5095", "native_tokenizers": [], @@ -551,14 +649,17 @@ }, { "name": "Q\u2019anjob\u2019al-Akateko-Jakalteko", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Jakalteko", + "depth": 5, "iso_1_code": null, "iso_3_code": "jac", "children": [], + "family": "Mayan", "tokenizers": {}, "node_i": "5097", "native_tokenizers": [], @@ -568,9 +669,11 @@ }, { "name": "Q\u2019anjob\u2019al", + "depth": 5, "iso_1_code": null, "iso_3_code": "kjb", "children": [], + "family": "Mayan", "tokenizers": {}, "node_i": "5098", "native_tokenizers": [], @@ -580,9 +683,11 @@ }, { "name": "Akateko", + "depth": 5, "iso_1_code": null, "iso_3_code": "knj", "children": [], + "family": "Mayan", "tokenizers": {}, "node_i": "5099", "native_tokenizers": [], @@ -591,18 +696,21 @@ ] } ], + "family": "Mayan", "tokenizers": {}, "node_i": "5096", "native_tokenizers": [], "scripts": [] } ], + "family": "Mayan", "tokenizers": {}, "node_i": "5094", "native_tokenizers": [], "scripts": [] } ], + "family": "Mayan", "tokenizers": {}, "node_i": "5090", "native_tokenizers": [], @@ -610,19 +718,23 @@ }, { "name": "Yucatecan", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mopan-Itz\u00e1", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Itza\u2019", + "depth": 4, "iso_1_code": null, "iso_3_code": "itz", "children": [], + "family": "Mayan", "tokenizers": {}, "node_i": "5102", "native_tokenizers": [], @@ -630,9 +742,11 @@ }, { "name": "Maya, Mop\u00e1n", + "depth": 4, "iso_1_code": null, "iso_3_code": "mop", "children": [], + "family": "Mayan", "tokenizers": {}, "node_i": "5103", "native_tokenizers": [], @@ -641,6 +755,7 @@ ] } ], + "family": "Mayan", "tokenizers": {}, "node_i": "5101", "native_tokenizers": [], @@ -648,14 +763,17 @@ }, { "name": "Yucatec-Lacandon", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Lacandon", + "depth": 4, "iso_1_code": null, "iso_3_code": "lac", "children": [], + "family": "Mayan", "tokenizers": {}, "node_i": "5105", "native_tokenizers": [], @@ -665,9 +783,11 @@ }, { "name": "Maya, Yucatec", + "depth": 4, "iso_1_code": null, "iso_3_code": "yua", "children": [], + "family": "Mayan", "tokenizers": {}, "node_i": "5106", "native_tokenizers": [], @@ -676,24 +796,28 @@ ] } ], + "family": "Mayan", "tokenizers": {}, "node_i": "5104", "native_tokenizers": [], "scripts": [] } ], + "family": "Mayan", "tokenizers": {}, "node_i": "5100", "native_tokenizers": [], "scripts": [] } ], + "family": "Mayan", "tokenizers": {}, "node_i": "5050", "native_tokenizers": [], "scripts": [] } ], + "family": "Mayan", "tokenizers": {}, "node_i": "5045", "native_tokenizers": [], diff --git a/data/Maybrat.json b/data/Maybrat.json index 3fe322a32addb88b81df89ce341d94a015e91d71..74668215da155717bdf0205730d49645b93d5ff6 100644 --- a/data/Maybrat.json +++ b/data/Maybrat.json @@ -1,13 +1,16 @@ { "name": "Maybrat", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mai Brat", + "depth": 1, "iso_1_code": null, "iso_3_code": "ayz", "children": [], + "family": "Maybrat", "tokenizers": {}, "node_i": "5108", "native_tokenizers": [], @@ -15,15 +18,18 @@ }, { "name": "Karon Dori", + "depth": 1, "iso_1_code": null, "iso_3_code": "kgw", "children": [], + "family": "Maybrat", "tokenizers": {}, "node_i": "5109", "native_tokenizers": [], "scripts": [] } ], + "family": "Maybrat", "tokenizers": {}, "node_i": "5107", "native_tokenizers": [], diff --git a/data/Misumalpan.json b/data/Misumalpan.json index 43b025c2d2b9c35a7bd74468d4ec5c226e31c4ef..b901f50b62718aa5a6a916a51c5d4581bef054f2 100644 --- a/data/Misumalpan.json +++ b/data/Misumalpan.json @@ -1,13 +1,16 @@ { "name": "Misumalpan", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "M\u00edskito", + "depth": 1, "iso_1_code": null, "iso_3_code": "miq", "children": [], + "family": "Misumalpan", "tokenizers": {}, "node_i": "5111", "native_tokenizers": [], @@ -17,9 +20,11 @@ }, { "name": "Ulwa", + "depth": 1, "iso_1_code": null, "iso_3_code": "ulw", "children": [], + "family": "Misumalpan", "tokenizers": {}, "node_i": "5112", "native_tokenizers": [], @@ -27,9 +32,11 @@ }, { "name": "Mayangna", + "depth": 1, "iso_1_code": null, "iso_3_code": "yan", "children": [], + "family": "Misumalpan", "tokenizers": {}, "node_i": "5113", "native_tokenizers": [], @@ -39,19 +46,23 @@ }, { "name": "Sumu-Cacaopera-Matagalpa", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Cacaopera-Matagalpa", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Cacaopera", + "depth": 3, "iso_1_code": null, "iso_3_code": "ccr", "children": [], + "family": "Misumalpan", "tokenizers": {}, "node_i": "5116", "native_tokenizers": [], @@ -59,27 +70,32 @@ }, { "name": "Matagalpa", + "depth": 3, "iso_1_code": null, "iso_3_code": "mtn", "children": [], + "family": "Misumalpan", "tokenizers": {}, "node_i": "5117", "native_tokenizers": [], "scripts": [] } ], + "family": "Misumalpan", "tokenizers": {}, "node_i": "5115", "native_tokenizers": [], "scripts": [] } ], + "family": "Misumalpan", "tokenizers": {}, "node_i": "5114", "native_tokenizers": [], "scripts": [] } ], + "family": "Misumalpan", "tokenizers": {}, "node_i": "5110", "native_tokenizers": [], diff --git a/data/Miwok-Costanoan.json b/data/Miwok-Costanoan.json index 11fbc2601c15a2ba6a5c3c4126403e5d70f9b78c..0ee06af5519ad0a4cc92208af6e55156e030c0e5 100644 --- a/data/Miwok-Costanoan.json +++ b/data/Miwok-Costanoan.json @@ -1,18 +1,22 @@ { "name": "Miwok-Costanoan", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Costanoan", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ohlone, Southern", + "depth": 2, "iso_1_code": null, "iso_3_code": "css", "children": [], + "family": "Miwok-Costanoan", "tokenizers": {}, "node_i": "5120", "native_tokenizers": [], @@ -20,9 +24,11 @@ }, { "name": "Ohlone, Northern", + "depth": 2, "iso_1_code": null, "iso_3_code": "cst", "children": [], + "family": "Miwok-Costanoan", "tokenizers": {}, "node_i": "5121", "native_tokenizers": [], @@ -30,15 +36,18 @@ }, { "name": "Karkin", + "depth": 2, "iso_1_code": null, "iso_3_code": "krb", "children": [], + "family": "Miwok-Costanoan", "tokenizers": {}, "node_i": "5122", "native_tokenizers": [], "scripts": [] } ], + "family": "Miwok-Costanoan", "tokenizers": {}, "node_i": "5119", "native_tokenizers": [], @@ -46,19 +55,23 @@ }, { "name": "Miwokan", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Eastern Miwokan", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bay Miwok", + "depth": 3, "iso_1_code": null, "iso_3_code": "mkq", "children": [], + "family": "Miwok-Costanoan", "tokenizers": {}, "node_i": "5125", "native_tokenizers": [], @@ -66,9 +79,11 @@ }, { "name": "Miwok, Plains", + "depth": 3, "iso_1_code": null, "iso_3_code": "pmw", "children": [], + "family": "Miwok-Costanoan", "tokenizers": {}, "node_i": "5126", "native_tokenizers": [], @@ -76,14 +91,17 @@ }, { "name": "Sierra Miwok", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Miwok, Central Sierra", + "depth": 4, "iso_1_code": null, "iso_3_code": "csm", "children": [], + "family": "Miwok-Costanoan", "tokenizers": {}, "node_i": "5128", "native_tokenizers": [], @@ -91,9 +109,11 @@ }, { "name": "Miwok, Northern Sierra", + "depth": 4, "iso_1_code": null, "iso_3_code": "nsq", "children": [], + "family": "Miwok-Costanoan", "tokenizers": {}, "node_i": "5129", "native_tokenizers": [], @@ -101,21 +121,25 @@ }, { "name": "Miwok, Southern Sierra", + "depth": 4, "iso_1_code": null, "iso_3_code": "skd", "children": [], + "family": "Miwok-Costanoan", "tokenizers": {}, "node_i": "5130", "native_tokenizers": [], "scripts": [] } ], + "family": "Miwok-Costanoan", "tokenizers": {}, "node_i": "5127", "native_tokenizers": [], "scripts": [] } ], + "family": "Miwok-Costanoan", "tokenizers": {}, "node_i": "5124", "native_tokenizers": [], @@ -123,14 +147,17 @@ }, { "name": "Western Miwokan", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Miwok, Coast", + "depth": 3, "iso_1_code": null, "iso_3_code": "csi", "children": [], + "family": "Miwok-Costanoan", "tokenizers": {}, "node_i": "5132", "native_tokenizers": [], @@ -138,27 +165,32 @@ }, { "name": "Miwok, Lake", + "depth": 3, "iso_1_code": null, "iso_3_code": "lmw", "children": [], + "family": "Miwok-Costanoan", "tokenizers": {}, "node_i": "5133", "native_tokenizers": [], "scripts": [] } ], + "family": "Miwok-Costanoan", "tokenizers": {}, "node_i": "5131", "native_tokenizers": [], "scripts": [] } ], + "family": "Miwok-Costanoan", "tokenizers": {}, "node_i": "5123", "native_tokenizers": [], "scripts": [] } ], + "family": "Miwok-Costanoan", "tokenizers": {}, "node_i": "5118", "native_tokenizers": [], diff --git a/data/Mixe-Zoquean.json b/data/Mixe-Zoquean.json index 7c10f957c717de13b124b34fa5649c28673e88c1..3946e81033ef07211ffe705f7f165e676ec5a439 100644 --- a/data/Mixe-Zoquean.json +++ b/data/Mixe-Zoquean.json @@ -1,18 +1,22 @@ { "name": "Mixe-Zoquean", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mixean", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Popoluca, Oluta", + "depth": 2, "iso_1_code": null, "iso_3_code": "plo", "children": [], + "family": "Mixe-Zoquean", "tokenizers": {}, "node_i": "5136", "native_tokenizers": [], @@ -20,9 +24,11 @@ }, { "name": "Popoluca, Sayula", + "depth": 2, "iso_1_code": null, "iso_3_code": "pos", "children": [], + "family": "Mixe-Zoquean", "tokenizers": {}, "node_i": "5137", "native_tokenizers": [], @@ -32,14 +38,17 @@ }, { "name": "Oaxaca Mixean", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mixe, Totontepec", + "depth": 3, "iso_1_code": null, "iso_3_code": "mto", "children": [], + "family": "Mixe-Zoquean", "tokenizers": {}, "node_i": "5139", "native_tokenizers": [], @@ -49,9 +58,11 @@ }, { "name": "Mixe, North Central", + "depth": 3, "iso_1_code": null, "iso_3_code": "neq", "children": [], + "family": "Mixe-Zoquean", "tokenizers": {}, "node_i": "5140", "native_tokenizers": [], @@ -59,9 +70,11 @@ }, { "name": "Mixe, Quetzaltepec", + "depth": 3, "iso_1_code": null, "iso_3_code": "pxm", "children": [], + "family": "Mixe-Zoquean", "tokenizers": {}, "node_i": "5141", "native_tokenizers": [], @@ -71,14 +84,17 @@ }, { "name": "Lowland Mixe", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mixe, Coatl\u00e1n", + "depth": 4, "iso_1_code": null, "iso_3_code": "mco", "children": [], + "family": "Mixe-Zoquean", "tokenizers": {}, "node_i": "5143", "native_tokenizers": [], @@ -88,9 +104,11 @@ }, { "name": "Mixe, Isthmus", + "depth": 4, "iso_1_code": null, "iso_3_code": "mir", "children": [], + "family": "Mixe-Zoquean", "tokenizers": {}, "node_i": "5144", "native_tokenizers": [], @@ -100,9 +118,11 @@ }, { "name": "Mixe, Mazatl\u00e1n", + "depth": 4, "iso_1_code": null, "iso_3_code": "mzl", "children": [], + "family": "Mixe-Zoquean", "tokenizers": {}, "node_i": "5145", "native_tokenizers": [], @@ -111,6 +131,7 @@ ] } ], + "family": "Mixe-Zoquean", "tokenizers": {}, "node_i": "5142", "native_tokenizers": [], @@ -118,14 +139,17 @@ }, { "name": "Midland Mixe", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mixe, Juquila", + "depth": 4, "iso_1_code": null, "iso_3_code": "mxq", "children": [], + "family": "Mixe-Zoquean", "tokenizers": {}, "node_i": "5147", "native_tokenizers": [], @@ -134,6 +158,7 @@ ] } ], + "family": "Mixe-Zoquean", "tokenizers": {}, "node_i": "5146", "native_tokenizers": [], @@ -141,14 +166,17 @@ }, { "name": "South Highland Mixe", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mixe, Tlahuitoltepec", + "depth": 4, "iso_1_code": null, "iso_3_code": "mxp", "children": [], + "family": "Mixe-Zoquean", "tokenizers": {}, "node_i": "5149", "native_tokenizers": [], @@ -157,18 +185,21 @@ ] } ], + "family": "Mixe-Zoquean", "tokenizers": {}, "node_i": "5148", "native_tokenizers": [], "scripts": [] } ], + "family": "Mixe-Zoquean", "tokenizers": {}, "node_i": "5138", "native_tokenizers": [], "scripts": [] } ], + "family": "Mixe-Zoquean", "tokenizers": {}, "node_i": "5135", "native_tokenizers": [], @@ -176,14 +207,17 @@ }, { "name": "Zoquean", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Zoque, Chimalapa", + "depth": 2, "iso_1_code": null, "iso_3_code": "zoh", "children": [], + "family": "Mixe-Zoquean", "tokenizers": {}, "node_i": "5151", "native_tokenizers": [], @@ -191,14 +225,17 @@ }, { "name": "Chiapas Zoquean", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Zoque, Copainal\u00e1", + "depth": 3, "iso_1_code": null, "iso_3_code": "zoc", "children": [], + "family": "Mixe-Zoquean", "tokenizers": {}, "node_i": "5153", "native_tokenizers": [], @@ -208,9 +245,11 @@ }, { "name": "Zoque, Francisco Le\u00f3n", + "depth": 3, "iso_1_code": null, "iso_3_code": "zos", "children": [], + "family": "Mixe-Zoquean", "tokenizers": {}, "node_i": "5154", "native_tokenizers": [], @@ -220,26 +259,31 @@ }, { "name": "Northeast Zoque", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Zoque, Ray\u00f3n", + "depth": 4, "iso_1_code": null, "iso_3_code": "zor", "children": [], + "family": "Mixe-Zoquean", "tokenizers": {}, "node_i": "5156", "native_tokenizers": [], "scripts": [] } ], + "family": "Mixe-Zoquean", "tokenizers": {}, "node_i": "5155", "native_tokenizers": [], "scripts": [] } ], + "family": "Mixe-Zoquean", "tokenizers": {}, "node_i": "5152", "native_tokenizers": [], @@ -247,14 +291,17 @@ }, { "name": "Gulf Zoquean", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Popoluca, Highland", + "depth": 3, "iso_1_code": null, "iso_3_code": "poi", "children": [], + "family": "Mixe-Zoquean", "tokenizers": {}, "node_i": "5158", "native_tokenizers": [], @@ -264,9 +311,11 @@ }, { "name": "Popoluca, Texistepec", + "depth": 3, "iso_1_code": null, "iso_3_code": "poq", "children": [], + "family": "Mixe-Zoquean", "tokenizers": {}, "node_i": "5159", "native_tokenizers": [], @@ -274,27 +323,32 @@ }, { "name": "Zoque, Tabasco", + "depth": 3, "iso_1_code": null, "iso_3_code": "zoq", "children": [], + "family": "Mixe-Zoquean", "tokenizers": {}, "node_i": "5160", "native_tokenizers": [], "scripts": [] } ], + "family": "Mixe-Zoquean", "tokenizers": {}, "node_i": "5157", "native_tokenizers": [], "scripts": [] } ], + "family": "Mixe-Zoquean", "tokenizers": {}, "node_i": "5150", "native_tokenizers": [], "scripts": [] } ], + "family": "Mixe-Zoquean", "tokenizers": {}, "node_i": "5134", "native_tokenizers": [], diff --git a/data/Mixed language.json b/data/Mixed language.json index 5a8b542084d432ef8f721294d0cfdeba298d5d27..e71c73a4891b1830ac6b64a4bb49ae5bd4a96a1e 100644 --- a/data/Mixed language.json +++ b/data/Mixed language.json @@ -1,13 +1,16 @@ { "name": "Mixed language", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "E", + "depth": 1, "iso_1_code": null, "iso_3_code": "eee", "children": [], + "family": "Mixed language", "tokenizers": {}, "node_i": "5162", "native_tokenizers": [], @@ -15,9 +18,11 @@ }, { "name": "N\u2019Ko", + "depth": 1, "iso_1_code": null, "iso_3_code": "nqo", "children": [], + "family": "Mixed language", "tokenizers": {}, "node_i": "5163", "native_tokenizers": [], @@ -27,20 +32,24 @@ }, { "name": "Armenian-Romani", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Lomavren", + "depth": 2, "iso_1_code": null, "iso_3_code": "rmi", "children": [], + "family": "Mixed language", "tokenizers": {}, "node_i": "5165", "native_tokenizers": [], "scripts": [] } ], + "family": "Mixed language", "tokenizers": {}, "node_i": "5164", "native_tokenizers": [], @@ -48,20 +57,24 @@ }, { "name": "Bantu-Cushitic", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mbugu", + "depth": 2, "iso_1_code": null, "iso_3_code": "mhd", "children": [], + "family": "Mixed language", "tokenizers": {}, "node_i": "5167", "native_tokenizers": [], "scripts": [] } ], + "family": "Mixed language", "tokenizers": {}, "node_i": "5166", "native_tokenizers": [], @@ -69,20 +82,24 @@ }, { "name": "Basque-Romani", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Erromintxela", + "depth": 2, "iso_1_code": null, "iso_3_code": "emx", "children": [], + "family": "Mixed language", "tokenizers": {}, "node_i": "5169", "native_tokenizers": [], "scripts": [] } ], + "family": "Mixed language", "tokenizers": {}, "node_i": "5168", "native_tokenizers": [], @@ -90,20 +107,24 @@ }, { "name": "Cakchiquel-Quich\u00e9", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kaqchikel-K\u2019iche\u2019 Mixed Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "ckz", "children": [], + "family": "Mixed language", "tokenizers": {}, "node_i": "5171", "native_tokenizers": [], "scripts": [] } ], + "family": "Mixed language", "tokenizers": {}, "node_i": "5170", "native_tokenizers": [], @@ -111,20 +132,24 @@ }, { "name": "Cebuano-Spanish-English", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Eskayan", + "depth": 2, "iso_1_code": null, "iso_3_code": "esy", "children": [], + "family": "Mixed language", "tokenizers": {}, "node_i": "5173", "native_tokenizers": [], "scripts": [] } ], + "family": "Mixed language", "tokenizers": {}, "node_i": "5172", "native_tokenizers": [], @@ -132,20 +157,24 @@ }, { "name": "Chinese-Tibetan-Bonan Mongour", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Wutunhua", + "depth": 2, "iso_1_code": null, "iso_3_code": "wuh", "children": [], + "family": "Mixed language", "tokenizers": {}, "node_i": "5175", "native_tokenizers": [], "scripts": [] } ], + "family": "Mixed language", "tokenizers": {}, "node_i": "5174", "native_tokenizers": [], @@ -153,20 +182,24 @@ }, { "name": "Danish-Romani", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Traveller Danish", + "depth": 2, "iso_1_code": null, "iso_3_code": "rmd", "children": [], + "family": "Mixed language", "tokenizers": {}, "node_i": "5177", "native_tokenizers": [], "scripts": [] } ], + "family": "Mixed language", "tokenizers": {}, "node_i": "5176", "native_tokenizers": [], @@ -174,14 +207,17 @@ }, { "name": "English-Romani", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Angloromani", + "depth": 2, "iso_1_code": null, "iso_3_code": "rme", "children": [], + "family": "Mixed language", "tokenizers": {}, "node_i": "5179", "native_tokenizers": [], @@ -190,6 +226,7 @@ ] } ], + "family": "Mixed language", "tokenizers": {}, "node_i": "5178", "native_tokenizers": [], @@ -197,20 +234,24 @@ }, { "name": "French-Cree", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Michif", + "depth": 2, "iso_1_code": null, "iso_3_code": "crg", "children": [], + "family": "Mixed language", "tokenizers": {}, "node_i": "5181", "native_tokenizers": [], "scripts": [] } ], + "family": "Mixed language", "tokenizers": {}, "node_i": "5180", "native_tokenizers": [], @@ -218,20 +259,24 @@ }, { "name": "German-Yiddish-Romani-Rotwelsch", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Yeniche", + "depth": 2, "iso_1_code": null, "iso_3_code": "yec", "children": [], + "family": "Mixed language", "tokenizers": {}, "node_i": "5183", "native_tokenizers": [], "scripts": [] } ], + "family": "Mixed language", "tokenizers": {}, "node_i": "5182", "native_tokenizers": [], @@ -239,20 +284,24 @@ }, { "name": "Greek-Romani", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Romano-Greek", + "depth": 2, "iso_1_code": null, "iso_3_code": "rge", "children": [], + "family": "Mixed language", "tokenizers": {}, "node_i": "5185", "native_tokenizers": [], "scripts": [] } ], + "family": "Mixed language", "tokenizers": {}, "node_i": "5184", "native_tokenizers": [], @@ -260,20 +309,24 @@ }, { "name": "Gurindji-Kriol", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Gurindji Kriol", + "depth": 2, "iso_1_code": null, "iso_3_code": "gjr", "children": [], + "family": "Mixed language", "tokenizers": {}, "node_i": "5187", "native_tokenizers": [], "scripts": [] } ], + "family": "Mixed language", "tokenizers": {}, "node_i": "5186", "native_tokenizers": [], @@ -281,14 +334,17 @@ }, { "name": "Iberian-Romani", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Cal\u00f3", + "depth": 2, "iso_1_code": null, "iso_3_code": "rmq", "children": [], + "family": "Mixed language", "tokenizers": {}, "node_i": "5189", "native_tokenizers": [], @@ -297,6 +353,7 @@ ] } ], + "family": "Mixed language", "tokenizers": {}, "node_i": "5188", "native_tokenizers": [], @@ -304,20 +361,24 @@ }, { "name": "Irish-undocumented", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Shelta", + "depth": 2, "iso_1_code": null, "iso_3_code": "sth", "children": [], + "family": "Mixed language", "tokenizers": {}, "node_i": "5191", "native_tokenizers": [], "scripts": [] } ], + "family": "Mixed language", "tokenizers": {}, "node_i": "5190", "native_tokenizers": [], @@ -325,20 +386,24 @@ }, { "name": "Kannada-Malayalam-Tamil", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chetti, Moundadan", + "depth": 2, "iso_1_code": null, "iso_3_code": "cty", "children": [], + "family": "Mixed language", "tokenizers": {}, "node_i": "5193", "native_tokenizers": [], "scripts": [] } ], + "family": "Mixed language", "tokenizers": {}, "node_i": "5192", "native_tokenizers": [], @@ -346,20 +411,24 @@ }, { "name": "Norwegian-Romani", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Norwegian, Traveller", + "depth": 2, "iso_1_code": null, "iso_3_code": "rmg", "children": [], + "family": "Mixed language", "tokenizers": {}, "node_i": "5195", "native_tokenizers": [], "scripts": [] } ], + "family": "Mixed language", "tokenizers": {}, "node_i": "5194", "native_tokenizers": [], @@ -367,20 +436,24 @@ }, { "name": "Russian-Aleut", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Aleut, Mednyj", + "depth": 2, "iso_1_code": null, "iso_3_code": "mud", "children": [], + "family": "Mixed language", "tokenizers": {}, "node_i": "5197", "native_tokenizers": [], "scripts": [] } ], + "family": "Mixed language", "tokenizers": {}, "node_i": "5196", "native_tokenizers": [], @@ -388,20 +461,24 @@ }, { "name": "Serbian-Romani", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Romano-Serbian", + "depth": 2, "iso_1_code": null, "iso_3_code": "rsb", "children": [], + "family": "Mixed language", "tokenizers": {}, "node_i": "5199", "native_tokenizers": [], "scripts": [] } ], + "family": "Mixed language", "tokenizers": {}, "node_i": "5198", "native_tokenizers": [], @@ -409,20 +486,24 @@ }, { "name": "Songhay-Berber", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tagdal", + "depth": 2, "iso_1_code": null, "iso_3_code": "tda", "children": [], + "family": "Mixed language", "tokenizers": {}, "node_i": "5201", "native_tokenizers": [], "scripts": [] } ], + "family": "Mixed language", "tokenizers": {}, "node_i": "5200", "native_tokenizers": [], @@ -430,20 +511,24 @@ }, { "name": "Spanish-Quichua", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Media Lengua", + "depth": 2, "iso_1_code": null, "iso_3_code": "mue", "children": [], + "family": "Mixed language", "tokenizers": {}, "node_i": "5203", "native_tokenizers": [], "scripts": [] } ], + "family": "Mixed language", "tokenizers": {}, "node_i": "5202", "native_tokenizers": [], @@ -451,20 +536,24 @@ }, { "name": "Swedish-Romani", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Romani, Tavringer", + "depth": 2, "iso_1_code": null, "iso_3_code": "rmu", "children": [], + "family": "Mixed language", "tokenizers": {}, "node_i": "5205", "native_tokenizers": [], "scripts": [] } ], + "family": "Mixed language", "tokenizers": {}, "node_i": "5204", "native_tokenizers": [], @@ -472,20 +561,24 @@ }, { "name": "Yapese-Ulithi", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nguluwan", + "depth": 2, "iso_1_code": null, "iso_3_code": "nuw", "children": [], + "family": "Mixed language", "tokenizers": {}, "node_i": "5207", "native_tokenizers": [], "scripts": [] } ], + "family": "Mixed language", "tokenizers": {}, "node_i": "5206", "native_tokenizers": [], @@ -493,26 +586,31 @@ }, { "name": "Zulu-Bantu", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Camtho", + "depth": 2, "iso_1_code": null, "iso_3_code": "cmt", "children": [], + "family": "Mixed language", "tokenizers": {}, "node_i": "5209", "native_tokenizers": [], "scripts": [] } ], + "family": "Mixed language", "tokenizers": {}, "node_i": "5208", "native_tokenizers": [], "scripts": [] } ], + "family": "Mixed language", "tokenizers": {}, "node_i": "5161", "native_tokenizers": [], diff --git a/data/Mongol-Langam.json b/data/Mongol-Langam.json index 133f30198cb7614653071d9e07afdfc2156fd4fa..89c8f82a0b8ab4784d5739bee7a903ba5d606bcc 100644 --- a/data/Mongol-Langam.json +++ b/data/Mongol-Langam.json @@ -1,13 +1,16 @@ { "name": "Mongol-Langam", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Pondi", + "depth": 1, "iso_1_code": null, "iso_3_code": "lnm", "children": [], + "family": "Mongol-Langam", "tokenizers": {}, "node_i": "5211", "native_tokenizers": [], @@ -15,9 +18,11 @@ }, { "name": "Mwakai", + "depth": 1, "iso_1_code": null, "iso_3_code": "mgt", "children": [], + "family": "Mongol-Langam", "tokenizers": {}, "node_i": "5212", "native_tokenizers": [], @@ -25,15 +30,18 @@ }, { "name": "Ulwa", + "depth": 1, "iso_1_code": null, "iso_3_code": "yla", "children": [], + "family": "Mongol-Langam", "tokenizers": {}, "node_i": "5213", "native_tokenizers": [], "scripts": [] } ], + "family": "Mongol-Langam", "tokenizers": {}, "node_i": "5210", "native_tokenizers": [], diff --git a/data/Mongolic.json b/data/Mongolic.json index 8bc79158dac17c4cf2650f2842f449723207ebe6..d3a32e67aeb5d8dbae61cefdfd2973f4d6a29637 100644 --- a/data/Mongolic.json +++ b/data/Mongolic.json @@ -1,29 +1,35 @@ { "name": "Mongolic", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Eastern", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dagur", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Daur", + "depth": 3, "iso_1_code": null, "iso_3_code": "dta", "children": [], + "family": "Mongolic", "tokenizers": {}, "node_i": "5217", "native_tokenizers": [], "scripts": [] } ], + "family": "Mongolic", "tokenizers": {}, "node_i": "5216", "native_tokenizers": [], @@ -31,14 +37,17 @@ }, { "name": "Mongour", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kangjia", + "depth": 3, "iso_1_code": null, "iso_3_code": "kxs", "children": [], + "family": "Mongolic", "tokenizers": {}, "node_i": "5219", "native_tokenizers": [], @@ -46,9 +55,11 @@ }, { "name": "Tu", + "depth": 3, "iso_1_code": null, "iso_3_code": "mjg", "children": [], + "family": "Mongolic", "tokenizers": {}, "node_i": "5220", "native_tokenizers": [], @@ -56,9 +67,11 @@ }, { "name": "Bonan", + "depth": 3, "iso_1_code": null, "iso_3_code": "peh", "children": [], + "family": "Mongolic", "tokenizers": {}, "node_i": "5221", "native_tokenizers": [], @@ -66,9 +79,11 @@ }, { "name": "Dongxiang", + "depth": 3, "iso_1_code": null, "iso_3_code": "sce", "children": [], + "family": "Mongolic", "tokenizers": {}, "node_i": "5222", "native_tokenizers": [], @@ -76,15 +91,18 @@ }, { "name": "Yugur, East", + "depth": 3, "iso_1_code": null, "iso_3_code": "yuy", "children": [], + "family": "Mongolic", "tokenizers": {}, "node_i": "5223", "native_tokenizers": [], "scripts": [] } ], + "family": "Mongolic", "tokenizers": {}, "node_i": "5218", "native_tokenizers": [], @@ -92,14 +110,17 @@ }, { "name": "Oirat-Khalkha", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Khamnigan Mongol", + "depth": 3, "iso_1_code": null, "iso_3_code": "ykh", "children": [], + "family": "Mongolic", "tokenizers": {}, "node_i": "5225", "native_tokenizers": [], @@ -107,19 +128,23 @@ }, { "name": "Khalkha-Buriat", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Buriat", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Buriat, Mongolia", + "depth": 5, "iso_1_code": null, "iso_3_code": "bxm", "children": [], + "family": "Mongolic", "tokenizers": {}, "node_i": "5228", "native_tokenizers": [], @@ -127,9 +152,11 @@ }, { "name": "Buriat, Russia", + "depth": 5, "iso_1_code": null, "iso_3_code": "bxr", "children": [], + "family": "Mongolic", "tokenizers": { "Cyrl": { "full_object": "StanzaTokenizer(\"bxr\")", @@ -149,15 +176,18 @@ }, { "name": "Buriat, China", + "depth": 5, "iso_1_code": null, "iso_3_code": "bxu", "children": [], + "family": "Mongolic", "tokenizers": {}, "node_i": "5230", "native_tokenizers": [], "scripts": [] } ], + "family": "Mongolic", "tokenizers": { "Cyrl": { "full_object": "StanzaTokenizer(\"bxr\")", @@ -173,14 +203,17 @@ }, { "name": "Mongolian Proper", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mongolian, Halh", + "depth": 5, "iso_1_code": "mn", "iso_3_code": "khk", "children": [], + "family": "Mongolic", "tokenizers": { "Cyrl": { "full_object": "StanzaTokenizer(\"bxr\")", @@ -198,15 +231,18 @@ }, { "name": "Mongolian, Peripheral", + "depth": 5, "iso_1_code": "mn", "iso_3_code": "mvf", "children": [], + "family": "Mongolic", "tokenizers": {}, "node_i": "5233", "native_tokenizers": [], "scripts": [] } ], + "family": "Mongolic", "tokenizers": { "Cyrl": { "full_object": "StanzaTokenizer(\"bxr\")", @@ -221,6 +257,7 @@ "scripts": [] } ], + "family": "Mongolic", "tokenizers": { "Cyrl": { "full_object": "StanzaTokenizer(\"bxr\")", @@ -236,14 +273,17 @@ }, { "name": "Oirat-Kalmyk-Darkhat", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kalmyk-Oirat", + "depth": 4, "iso_1_code": null, "iso_3_code": "xal", "children": [], + "family": "Mongolic", "tokenizers": { "Cyrl": { "full_object": "StanzaTokenizer(\"bxr\")", @@ -260,6 +300,7 @@ ] } ], + "family": "Mongolic", "tokenizers": { "Cyrl": { "full_object": "StanzaTokenizer(\"bxr\")", @@ -274,6 +315,7 @@ "scripts": [] } ], + "family": "Mongolic", "tokenizers": { "Cyrl": { "full_object": "StanzaTokenizer(\"bxr\")", @@ -288,6 +330,7 @@ "scripts": [] } ], + "family": "Mongolic", "tokenizers": { "Cyrl": { "full_object": "StanzaTokenizer(\"bxr\")", @@ -303,35 +346,32 @@ }, { "name": "Western", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mogholi", + "depth": 2, "iso_1_code": null, "iso_3_code": "mhj", "children": [], + "family": "Mongolic", "tokenizers": {}, "node_i": "5237", "native_tokenizers": [], "scripts": [] } ], + "family": "Mongolic", "tokenizers": {}, "node_i": "5236", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Cyrl": { - "full_object": "StanzaTokenizer(\"bxr\")", - "original_lang_name": "russia_buriat", - "original_lang_code": "bxr", - "script": "Cyrl", - "class_name": "StanzaTokenizer" - } - }, + "family": "Mongolic", + "tokenizers": {}, "node_i": "5214", "native_tokenizers": [], "scripts": [] diff --git a/data/Mosetenan.json b/data/Mosetenan.json index 15f6a27708eed9c6f54bc84f49ac0fdcb7b1a989..c315b746fac094c83b3614fad220ae916916c366 100644 --- a/data/Mosetenan.json +++ b/data/Mosetenan.json @@ -1,13 +1,16 @@ { "name": "Mosetenan", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tsiman\u00e9", + "depth": 1, "iso_1_code": null, "iso_3_code": "cas", "children": [], + "family": "Mosetenan", "tokenizers": {}, "node_i": "5239", "native_tokenizers": [], @@ -16,6 +19,7 @@ ] } ], + "family": "Mosetenan", "tokenizers": {}, "node_i": "5238", "native_tokenizers": [], diff --git a/data/Muran.json b/data/Muran.json index 0927ed79a1f8722bf776f9a46e6097984bd535bc..93b3844f0829b400976a9fab149c22f7a6624d2b 100644 --- a/data/Muran.json +++ b/data/Muran.json @@ -1,19 +1,23 @@ { "name": "Muran", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Pirah\u00e3", + "depth": 1, "iso_1_code": null, "iso_3_code": "myp", "children": [], + "family": "Muran", "tokenizers": {}, "node_i": "5241", "native_tokenizers": [], "scripts": [] } ], + "family": "Muran", "tokenizers": {}, "node_i": "5240", "native_tokenizers": [], diff --git a/data/Muskogean.json b/data/Muskogean.json index 8a52c4896e8d672a62f9a884b807e7ddb23a0c76..94b9482885a33e6f219a82584762c0d5982314dd 100644 --- a/data/Muskogean.json +++ b/data/Muskogean.json @@ -1,28 +1,34 @@ { "name": "Muskogean", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Eastern Muskogean", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Central Muskogean", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Apalachee-Alabama-Koasati", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Apalachee", + "depth": 4, "iso_1_code": null, "iso_3_code": "xap", "children": [], + "family": "Muskogean", "tokenizers": {}, "node_i": "5246", "native_tokenizers": [], @@ -30,14 +36,17 @@ }, { "name": "Alabama-Koasati", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Alabama", + "depth": 5, "iso_1_code": null, "iso_3_code": "akz", "children": [], + "family": "Muskogean", "tokenizers": {}, "node_i": "5248", "native_tokenizers": [], @@ -45,21 +54,25 @@ }, { "name": "Koasati", + "depth": 5, "iso_1_code": null, "iso_3_code": "cku", "children": [], + "family": "Muskogean", "tokenizers": {}, "node_i": "5249", "native_tokenizers": [], "scripts": [] } ], + "family": "Muskogean", "tokenizers": {}, "node_i": "5247", "native_tokenizers": [], "scripts": [] } ], + "family": "Muskogean", "tokenizers": {}, "node_i": "5245", "native_tokenizers": [], @@ -67,26 +80,31 @@ }, { "name": "Hitchiti-Mikasuki", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mikasuki", + "depth": 4, "iso_1_code": null, "iso_3_code": "mik", "children": [], + "family": "Muskogean", "tokenizers": {}, "node_i": "5251", "native_tokenizers": [], "scripts": [] } ], + "family": "Muskogean", "tokenizers": {}, "node_i": "5250", "native_tokenizers": [], "scripts": [] } ], + "family": "Muskogean", "tokenizers": {}, "node_i": "5244", "native_tokenizers": [], @@ -94,14 +112,17 @@ }, { "name": "Creek-Seminole", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Muskogee", + "depth": 3, "iso_1_code": null, "iso_3_code": "mus", "children": [], + "family": "Muskogean", "tokenizers": {}, "node_i": "5253", "native_tokenizers": [], @@ -110,12 +131,14 @@ ] } ], + "family": "Muskogean", "tokenizers": {}, "node_i": "5252", "native_tokenizers": [], "scripts": [] } ], + "family": "Muskogean", "tokenizers": {}, "node_i": "5243", "native_tokenizers": [], @@ -123,14 +146,17 @@ }, { "name": "Western Muskogean", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Choctaw", + "depth": 2, "iso_1_code": null, "iso_3_code": "cho", "children": [], + "family": "Muskogean", "tokenizers": {}, "node_i": "5255", "native_tokenizers": [], @@ -140,21 +166,25 @@ }, { "name": "Chickasaw", + "depth": 2, "iso_1_code": null, "iso_3_code": "cic", "children": [], + "family": "Muskogean", "tokenizers": {}, "node_i": "5256", "native_tokenizers": [], "scripts": [] } ], + "family": "Muskogean", "tokenizers": {}, "node_i": "5254", "native_tokenizers": [], "scripts": [] } ], + "family": "Muskogean", "tokenizers": {}, "node_i": "5242", "native_tokenizers": [], diff --git a/data/Nakh-Daghestanian.json b/data/Nakh-Daghestanian.json index 151859b52a589d853b0fe89da5ee2d9b400e9103..bb4182955410320b5b3145ac8117f726952a8e7e 100644 --- a/data/Nakh-Daghestanian.json +++ b/data/Nakh-Daghestanian.json @@ -1,23 +1,28 @@ { "name": "Nakh-Daghestanian", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Avar-Andic", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Andic", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Akhvakh", + "depth": 3, "iso_1_code": null, "iso_3_code": "akv", "children": [], + "family": "Nakh-Daghestanian", "tokenizers": {}, "node_i": "5260", "native_tokenizers": [], @@ -25,9 +30,11 @@ }, { "name": "Andi", + "depth": 3, "iso_1_code": null, "iso_3_code": "ani", "children": [], + "family": "Nakh-Daghestanian", "tokenizers": {}, "node_i": "5261", "native_tokenizers": [], @@ -35,9 +42,11 @@ }, { "name": "Botlikh", + "depth": 3, "iso_1_code": null, "iso_3_code": "bph", "children": [], + "family": "Nakh-Daghestanian", "tokenizers": {}, "node_i": "5262", "native_tokenizers": [], @@ -45,9 +54,11 @@ }, { "name": "Chamalal", + "depth": 3, "iso_1_code": null, "iso_3_code": "cji", "children": [], + "family": "Nakh-Daghestanian", "tokenizers": {}, "node_i": "5263", "native_tokenizers": [], @@ -55,9 +66,11 @@ }, { "name": "Ghodoberi", + "depth": 3, "iso_1_code": null, "iso_3_code": "gdo", "children": [], + "family": "Nakh-Daghestanian", "tokenizers": {}, "node_i": "5264", "native_tokenizers": [], @@ -65,9 +78,11 @@ }, { "name": "Karata", + "depth": 3, "iso_1_code": null, "iso_3_code": "kpt", "children": [], + "family": "Nakh-Daghestanian", "tokenizers": {}, "node_i": "5265", "native_tokenizers": [], @@ -75,9 +90,11 @@ }, { "name": "Bagvalal", + "depth": 3, "iso_1_code": null, "iso_3_code": "kva", "children": [], + "family": "Nakh-Daghestanian", "tokenizers": {}, "node_i": "5266", "native_tokenizers": [], @@ -85,15 +102,18 @@ }, { "name": "Tindi", + "depth": 3, "iso_1_code": null, "iso_3_code": "tin", "children": [], + "family": "Nakh-Daghestanian", "tokenizers": {}, "node_i": "5267", "native_tokenizers": [], "scripts": [] } ], + "family": "Nakh-Daghestanian", "tokenizers": {}, "node_i": "5259", "native_tokenizers": [], @@ -101,14 +121,17 @@ }, { "name": "Avar", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Avar", + "depth": 3, "iso_1_code": "av", "iso_3_code": "ava", "children": [], + "family": "Nakh-Daghestanian", "tokenizers": {}, "node_i": "5269", "native_tokenizers": [], @@ -117,12 +140,14 @@ ] } ], + "family": "Nakh-Daghestanian", "tokenizers": {}, "node_i": "5268", "native_tokenizers": [], "scripts": [] } ], + "family": "Nakh-Daghestanian", "tokenizers": {}, "node_i": "5258", "native_tokenizers": [], @@ -130,14 +155,17 @@ }, { "name": "Dargi", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dargwa", + "depth": 2, "iso_1_code": null, "iso_3_code": "dar", "children": [], + "family": "Nakh-Daghestanian", "tokenizers": {}, "node_i": "5271", "native_tokenizers": [], @@ -147,9 +175,11 @@ }, { "name": "Kubachi", + "depth": 2, "iso_1_code": null, "iso_3_code": "ugh", "children": [], + "family": "Nakh-Daghestanian", "tokenizers": {}, "node_i": "5272", "native_tokenizers": [], @@ -157,15 +187,18 @@ }, { "name": "Kaitag", + "depth": 2, "iso_1_code": null, "iso_3_code": "xdq", "children": [], + "family": "Nakh-Daghestanian", "tokenizers": {}, "node_i": "5273", "native_tokenizers": [], "scripts": [] } ], + "family": "Nakh-Daghestanian", "tokenizers": {}, "node_i": "5270", "native_tokenizers": [], @@ -173,20 +206,24 @@ }, { "name": "Khinalugh", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Khinalugh", + "depth": 2, "iso_1_code": null, "iso_3_code": "kjj", "children": [], + "family": "Nakh-Daghestanian", "tokenizers": {}, "node_i": "5275", "native_tokenizers": [], "scripts": [] } ], + "family": "Nakh-Daghestanian", "tokenizers": {}, "node_i": "5274", "native_tokenizers": [], @@ -194,14 +231,17 @@ }, { "name": "Lak", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Lak", + "depth": 2, "iso_1_code": null, "iso_3_code": "lbe", "children": [], + "family": "Nakh-Daghestanian", "tokenizers": {}, "node_i": "5277", "native_tokenizers": [], @@ -210,6 +250,7 @@ ] } ], + "family": "Nakh-Daghestanian", "tokenizers": {}, "node_i": "5276", "native_tokenizers": [], @@ -217,25 +258,30 @@ }, { "name": "Lezgic", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Archi", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Archi", + "depth": 3, "iso_1_code": null, "iso_3_code": "aqc", "children": [], + "family": "Nakh-Daghestanian", "tokenizers": {}, "node_i": "5280", "native_tokenizers": [], "scripts": [] } ], + "family": "Nakh-Daghestanian", "tokenizers": {}, "node_i": "5279", "native_tokenizers": [], @@ -243,19 +289,23 @@ }, { "name": "Nuclear Lezgic", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "East Lezgic", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Aghul", + "depth": 4, "iso_1_code": null, "iso_3_code": "agx", "children": [], + "family": "Nakh-Daghestanian", "tokenizers": {}, "node_i": "5283", "native_tokenizers": [], @@ -265,9 +315,11 @@ }, { "name": "Lezgi", + "depth": 4, "iso_1_code": null, "iso_3_code": "lez", "children": [], + "family": "Nakh-Daghestanian", "tokenizers": {}, "node_i": "5284", "native_tokenizers": [], @@ -277,9 +329,11 @@ }, { "name": "Tabasaran", + "depth": 4, "iso_1_code": null, "iso_3_code": "tab", "children": [], + "family": "Nakh-Daghestanian", "tokenizers": {}, "node_i": "5285", "native_tokenizers": [], @@ -288,6 +342,7 @@ ] } ], + "family": "Nakh-Daghestanian", "tokenizers": {}, "node_i": "5282", "native_tokenizers": [], @@ -295,14 +350,17 @@ }, { "name": "South Lezgic", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Budukh", + "depth": 4, "iso_1_code": null, "iso_3_code": "bdk", "children": [], + "family": "Nakh-Daghestanian", "tokenizers": {}, "node_i": "5287", "native_tokenizers": [], @@ -310,15 +368,18 @@ }, { "name": "Kryts", + "depth": 4, "iso_1_code": null, "iso_3_code": "kry", "children": [], + "family": "Nakh-Daghestanian", "tokenizers": {}, "node_i": "5288", "native_tokenizers": [], "scripts": [] } ], + "family": "Nakh-Daghestanian", "tokenizers": {}, "node_i": "5286", "native_tokenizers": [], @@ -326,14 +387,17 @@ }, { "name": "West Lezgic", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Rutul", + "depth": 4, "iso_1_code": null, "iso_3_code": "rut", "children": [], + "family": "Nakh-Daghestanian", "tokenizers": {}, "node_i": "5290", "native_tokenizers": [], @@ -341,9 +405,11 @@ }, { "name": "Tsakhur", + "depth": 4, "iso_1_code": null, "iso_3_code": "tkr", "children": [], + "family": "Nakh-Daghestanian", "tokenizers": {}, "node_i": "5291", "native_tokenizers": [], @@ -352,12 +418,14 @@ ] } ], + "family": "Nakh-Daghestanian", "tokenizers": {}, "node_i": "5289", "native_tokenizers": [], "scripts": [] } ], + "family": "Nakh-Daghestanian", "tokenizers": {}, "node_i": "5281", "native_tokenizers": [], @@ -365,26 +433,31 @@ }, { "name": "Udi", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Udi", + "depth": 3, "iso_1_code": null, "iso_3_code": "udi", "children": [], + "family": "Nakh-Daghestanian", "tokenizers": {}, "node_i": "5293", "native_tokenizers": [], "scripts": [] } ], + "family": "Nakh-Daghestanian", "tokenizers": {}, "node_i": "5292", "native_tokenizers": [], "scripts": [] } ], + "family": "Nakh-Daghestanian", "tokenizers": {}, "node_i": "5278", "native_tokenizers": [], @@ -392,25 +465,30 @@ }, { "name": "Nakh", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Batsi", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bats", + "depth": 3, "iso_1_code": null, "iso_3_code": "bbl", "children": [], + "family": "Nakh-Daghestanian", "tokenizers": {}, "node_i": "5296", "native_tokenizers": [], "scripts": [] } ], + "family": "Nakh-Daghestanian", "tokenizers": {}, "node_i": "5295", "native_tokenizers": [], @@ -418,14 +496,17 @@ }, { "name": "Chechen-Ingush", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chechen", + "depth": 3, "iso_1_code": "ce", "iso_3_code": "che", "children": [], + "family": "Nakh-Daghestanian", "tokenizers": {}, "node_i": "5298", "native_tokenizers": [], @@ -435,9 +516,11 @@ }, { "name": "Ingush", + "depth": 3, "iso_1_code": null, "iso_3_code": "inh", "children": [], + "family": "Nakh-Daghestanian", "tokenizers": {}, "node_i": "5299", "native_tokenizers": [], @@ -446,12 +529,14 @@ ] } ], + "family": "Nakh-Daghestanian", "tokenizers": {}, "node_i": "5297", "native_tokenizers": [], "scripts": [] } ], + "family": "Nakh-Daghestanian", "tokenizers": {}, "node_i": "5294", "native_tokenizers": [], @@ -459,19 +544,23 @@ }, { "name": "Tsezic", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "East Tsezic", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Hunzib", + "depth": 3, "iso_1_code": null, "iso_3_code": "huz", "children": [], + "family": "Nakh-Daghestanian", "tokenizers": {}, "node_i": "5302", "native_tokenizers": [], @@ -479,9 +568,11 @@ }, { "name": "Bezhta", + "depth": 3, "iso_1_code": null, "iso_3_code": "kap", "children": [], + "family": "Nakh-Daghestanian", "tokenizers": {}, "node_i": "5303", "native_tokenizers": [], @@ -490,6 +581,7 @@ ] } ], + "family": "Nakh-Daghestanian", "tokenizers": {}, "node_i": "5301", "native_tokenizers": [], @@ -497,14 +589,17 @@ }, { "name": "West Tsezic", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dido", + "depth": 3, "iso_1_code": null, "iso_3_code": "ddo", "children": [], + "family": "Nakh-Daghestanian", "tokenizers": {}, "node_i": "5305", "native_tokenizers": [], @@ -512,9 +607,11 @@ }, { "name": "Hinukh", + "depth": 3, "iso_1_code": null, "iso_3_code": "gin", "children": [], + "family": "Nakh-Daghestanian", "tokenizers": {}, "node_i": "5306", "native_tokenizers": [], @@ -522,27 +619,32 @@ }, { "name": "Khvarshi", + "depth": 3, "iso_1_code": null, "iso_3_code": "khv", "children": [], + "family": "Nakh-Daghestanian", "tokenizers": {}, "node_i": "5307", "native_tokenizers": [], "scripts": [] } ], + "family": "Nakh-Daghestanian", "tokenizers": {}, "node_i": "5304", "native_tokenizers": [], "scripts": [] } ], + "family": "Nakh-Daghestanian", "tokenizers": {}, "node_i": "5300", "native_tokenizers": [], "scripts": [] } ], + "family": "Nakh-Daghestanian", "tokenizers": {}, "node_i": "5257", "native_tokenizers": [], diff --git a/data/Nambikwara.json b/data/Nambikwara.json index 51b7a709d40d2aa7b7f2239c64f362303f23df65..57b4291ac9424fc6c1d3d96e509a3ffc10d894a6 100644 --- a/data/Nambikwara.json +++ b/data/Nambikwara.json @@ -1,13 +1,16 @@ { "name": "Nambikwara", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Saban\u00ea", + "depth": 1, "iso_1_code": null, "iso_3_code": "sae", "children": [], + "family": "Nambikwara", "tokenizers": {}, "node_i": "5309", "native_tokenizers": [], @@ -15,14 +18,17 @@ }, { "name": "Nambikwara Complex", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nambiku\u00e1ra, Southern", + "depth": 2, "iso_1_code": null, "iso_3_code": "nab", "children": [], + "family": "Nambikwara", "tokenizers": {}, "node_i": "5311", "native_tokenizers": [], @@ -32,14 +38,17 @@ }, { "name": "Northern", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Alapmunte", + "depth": 3, "iso_1_code": null, "iso_3_code": "apv", "children": [], + "family": "Nambikwara", "tokenizers": {}, "node_i": "5313", "native_tokenizers": [], @@ -47,9 +56,11 @@ }, { "name": "Mamaind\u00ea", + "depth": 3, "iso_1_code": null, "iso_3_code": "wmd", "children": [], + "family": "Nambikwara", "tokenizers": {}, "node_i": "5314", "native_tokenizers": [], @@ -57,9 +68,11 @@ }, { "name": "Yalakalore", + "depth": 3, "iso_1_code": null, "iso_3_code": "xyl", "children": [], + "family": "Nambikwara", "tokenizers": {}, "node_i": "5315", "native_tokenizers": [], @@ -67,14 +80,17 @@ }, { "name": "Roosevelt Cluster", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Lakond\u00ea", + "depth": 4, "iso_1_code": null, "iso_3_code": "lkd", "children": [], + "family": "Nambikwara", "tokenizers": {}, "node_i": "5317", "native_tokenizers": [], @@ -82,9 +98,11 @@ }, { "name": "Latund\u00ea", + "depth": 4, "iso_1_code": null, "iso_3_code": "ltn", "children": [], + "family": "Nambikwara", "tokenizers": {}, "node_i": "5318", "native_tokenizers": [], @@ -92,33 +110,39 @@ }, { "name": "Tawand\u00ea", + "depth": 4, "iso_1_code": null, "iso_3_code": "xtw", "children": [], + "family": "Nambikwara", "tokenizers": {}, "node_i": "5319", "native_tokenizers": [], "scripts": [] } ], + "family": "Nambikwara", "tokenizers": {}, "node_i": "5316", "native_tokenizers": [], "scripts": [] } ], + "family": "Nambikwara", "tokenizers": {}, "node_i": "5312", "native_tokenizers": [], "scripts": [] } ], + "family": "Nambikwara", "tokenizers": {}, "node_i": "5310", "native_tokenizers": [], "scripts": [] } ], + "family": "Nambikwara", "tokenizers": {}, "node_i": "5308", "native_tokenizers": [], diff --git a/data/Niger-Congo.json b/data/Niger-Congo.json index 3acd3160af9fd2465f05c6373fd86a45fd287cfe..7a321020d8f2b972069d40338a8fdea4a19eba15 100644 --- a/data/Niger-Congo.json +++ b/data/Niger-Congo.json @@ -1,34 +1,41 @@ { "name": "Niger-Congo", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Atlantic-Congo", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Atlantic", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bijago", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bijag\u00f3", + "depth": 4, "iso_1_code": null, "iso_3_code": "bjg", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5324", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5323", "native_tokenizers": [], @@ -36,24 +43,29 @@ }, { "name": "Northern", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bak", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Balant-Ganja", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Balanta-Ganja", + "depth": 6, "iso_1_code": null, "iso_3_code": "bjt", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5328", "native_tokenizers": [], @@ -61,15 +73,18 @@ }, { "name": "Balanta", + "depth": 6, "iso_1_code": null, "iso_3_code": "ble", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5329", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5327", "native_tokenizers": [], @@ -77,25 +92,30 @@ }, { "name": "Jola", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bayot", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bayot", + "depth": 7, "iso_1_code": null, "iso_3_code": "bda", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5332", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5331", "native_tokenizers": [], @@ -103,24 +123,29 @@ }, { "name": "Jola Proper", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Jola Central", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Gusilay", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bandial", + "depth": 9, "iso_1_code": null, "iso_3_code": "bqj", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"wo\")", @@ -138,15 +163,18 @@ }, { "name": "Gusilay", + "depth": 9, "iso_1_code": null, "iso_3_code": "gsl", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5337", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"wo\")", @@ -162,14 +190,17 @@ }, { "name": "Her-Ejamat", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Jola-Felupe", + "depth": 9, "iso_1_code": null, "iso_3_code": "eja", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5339", "native_tokenizers": [], @@ -177,15 +208,18 @@ }, { "name": "Kerak", + "depth": 9, "iso_1_code": null, "iso_3_code": "hhr", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5340", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5338", "native_tokenizers": [], @@ -193,14 +227,17 @@ }, { "name": "Jola-Fonyi", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Jola-Fonyi", + "depth": 9, "iso_1_code": null, "iso_3_code": "dyo", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"wo\")", @@ -217,6 +254,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"wo\")", @@ -232,14 +270,17 @@ }, { "name": "Jola-Kasa", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Jola-Kasa", + "depth": 9, "iso_1_code": null, "iso_3_code": "csk", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"wo\")", @@ -256,6 +297,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"wo\")", @@ -270,6 +312,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"wo\")", @@ -285,14 +328,17 @@ }, { "name": "Karon-Mlomp", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Karon", + "depth": 8, "iso_1_code": null, "iso_3_code": "krx", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"wo\")", @@ -310,15 +356,18 @@ }, { "name": "Mlomp", + "depth": 8, "iso_1_code": null, "iso_3_code": "mlo", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5347", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"wo\")", @@ -334,14 +383,17 @@ }, { "name": "Kwatay", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kuwaataay", + "depth": 8, "iso_1_code": null, "iso_3_code": "cwt", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"wo\")", @@ -358,6 +410,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"wo\")", @@ -372,6 +425,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"wo\")", @@ -386,6 +440,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"wo\")", @@ -401,14 +456,17 @@ }, { "name": "Manjaku-Papel", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mankanya", + "depth": 6, "iso_1_code": null, "iso_3_code": "knf", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"wo\")", @@ -426,9 +484,11 @@ }, { "name": "Mandjak", + "depth": 6, "iso_1_code": null, "iso_3_code": "mfv", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5352", "native_tokenizers": [], @@ -436,15 +496,18 @@ }, { "name": "Papel", + "depth": 6, "iso_1_code": null, "iso_3_code": "pbo", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5353", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"wo\")", @@ -459,6 +522,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"wo\")", @@ -474,14 +538,17 @@ }, { "name": "Cangin", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Laalaa", + "depth": 5, "iso_1_code": null, "iso_3_code": "cae", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5355", "native_tokenizers": [], @@ -489,9 +556,11 @@ }, { "name": "Paloor", + "depth": 5, "iso_1_code": null, "iso_3_code": "fap", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5356", "native_tokenizers": [], @@ -499,9 +568,11 @@ }, { "name": "Ndut", + "depth": 5, "iso_1_code": null, "iso_3_code": "ndv", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5357", "native_tokenizers": [], @@ -509,9 +580,11 @@ }, { "name": "Saafi-Saafi", + "depth": 5, "iso_1_code": null, "iso_3_code": "sav", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5358", "native_tokenizers": [], @@ -519,9 +592,11 @@ }, { "name": "Noon", + "depth": 5, "iso_1_code": null, "iso_3_code": "snf", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"wo\")", @@ -538,6 +613,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"wo\")", @@ -553,19 +629,23 @@ }, { "name": "Eastern Senegal-Guinea", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Banyun", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bainouk-Gunyu\u00f1o", + "depth": 6, "iso_1_code": null, "iso_3_code": "bab", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5362", "native_tokenizers": [], @@ -573,9 +653,11 @@ }, { "name": "Bainouk-Samik", + "depth": 6, "iso_1_code": null, "iso_3_code": "bcb", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5363", "native_tokenizers": [], @@ -583,15 +665,18 @@ }, { "name": "Bainouk-Gunyaamolo", + "depth": 6, "iso_1_code": null, "iso_3_code": "bcz", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5364", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5361", "native_tokenizers": [], @@ -599,14 +684,17 @@ }, { "name": "Nun", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kasanga", + "depth": 6, "iso_1_code": null, "iso_3_code": "ccj", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5366", "native_tokenizers": [], @@ -614,15 +702,18 @@ }, { "name": "Kobiana", + "depth": 6, "iso_1_code": null, "iso_3_code": "kcj", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5367", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5365", "native_tokenizers": [], @@ -630,14 +721,17 @@ }, { "name": "Tenda", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Biafada", + "depth": 6, "iso_1_code": null, "iso_3_code": "bif", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5369", "native_tokenizers": [], @@ -645,9 +739,11 @@ }, { "name": "Oniyan", + "depth": 6, "iso_1_code": null, "iso_3_code": "bsc", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"wo\")", @@ -665,9 +761,11 @@ }, { "name": "Wamey", + "depth": 6, "iso_1_code": null, "iso_3_code": "cou", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"wo\")", @@ -685,9 +783,11 @@ }, { "name": "Badyara", + "depth": 6, "iso_1_code": null, "iso_3_code": "pbp", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5372", "native_tokenizers": [], @@ -695,9 +795,11 @@ }, { "name": "M\u00e9nik", + "depth": 6, "iso_1_code": null, "iso_3_code": "tnr", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"wo\")", @@ -714,6 +816,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"wo\")", @@ -728,6 +831,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"wo\")", @@ -743,14 +847,17 @@ }, { "name": "Mbulungish-Nalu", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mbulungish", + "depth": 5, "iso_1_code": null, "iso_3_code": "mbv", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5375", "native_tokenizers": [], @@ -758,15 +865,18 @@ }, { "name": "Nalu", + "depth": 5, "iso_1_code": null, "iso_3_code": "naj", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5376", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5374", "native_tokenizers": [], @@ -774,29 +884,35 @@ }, { "name": "Senegambian", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Fula-Wolof", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Fula", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "East Central", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Fulfulde, Western Niger", + "depth": 8, "iso_1_code": "ff", "iso_3_code": "fuh", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"wo\")", @@ -814,9 +930,11 @@ }, { "name": "Fulfulde, Central-Eastern Niger", + "depth": 8, "iso_1_code": "ff", "iso_3_code": "fuq", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"wo\")", @@ -834,9 +952,11 @@ }, { "name": "Fulfulde, Nigerian", + "depth": 8, "iso_1_code": "ff", "iso_3_code": "fuv", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"wo\")", @@ -854,6 +974,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"wo\")", @@ -869,14 +990,17 @@ }, { "name": "Eastern", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Fulfulde, Adamawa", + "depth": 8, "iso_1_code": "ff", "iso_3_code": "fub", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"wo\")", @@ -894,15 +1018,18 @@ }, { "name": "Fulfulde, Bagirmi", + "depth": 8, "iso_1_code": "ff", "iso_3_code": "fui", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5386", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"wo\")", @@ -918,14 +1045,17 @@ }, { "name": "West Central", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Fulfulde, Maasina", + "depth": 8, "iso_1_code": "ff", "iso_3_code": "ffm", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"wo\")", @@ -943,9 +1073,11 @@ }, { "name": "Fulfulde, Borgu", + "depth": 8, "iso_1_code": "ff", "iso_3_code": "fue", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"wo\")", @@ -963,9 +1095,11 @@ }, { "name": "Pular", + "depth": 8, "iso_1_code": "ff", "iso_3_code": "fuf", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"wo\")", @@ -982,6 +1116,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"wo\")", @@ -997,26 +1132,31 @@ }, { "name": "Western", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Pulaar", + "depth": 8, "iso_1_code": "ff", "iso_3_code": "fuc", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5392", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5391", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"wo\")", @@ -1032,14 +1172,17 @@ }, { "name": "Wolof", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Wolof, Gambian", + "depth": 7, "iso_1_code": null, "iso_3_code": "wof", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5394", "native_tokenizers": [], @@ -1047,9 +1190,11 @@ }, { "name": "Wolof", + "depth": 7, "iso_1_code": "wo", "iso_3_code": "wol", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"wo\")", @@ -1068,6 +1213,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"wo\")", @@ -1082,6 +1228,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"wo\")", @@ -1097,14 +1244,17 @@ }, { "name": "Serer", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Serer-Sine", + "depth": 6, "iso_1_code": null, "iso_3_code": "srr", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"wo\")", @@ -1121,6 +1271,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"wo\")", @@ -1135,6 +1286,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"wo\")", @@ -1149,6 +1301,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"wo\")", @@ -1164,19 +1317,23 @@ }, { "name": "Southern", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Limba", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Limba, West-Central", + "depth": 5, "iso_1_code": null, "iso_3_code": "lia", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"wo\")", @@ -1194,15 +1351,18 @@ }, { "name": "Limba, East", + "depth": 5, "iso_1_code": null, "iso_3_code": "lma", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5401", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"wo\")", @@ -1218,29 +1378,35 @@ }, { "name": "Mel", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bullom-Kissi", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bullom", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Northern", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bom-Kim", + "depth": 8, "iso_1_code": null, "iso_3_code": "bmf", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5406", "native_tokenizers": [], @@ -1248,15 +1414,18 @@ }, { "name": "Bullom So", + "depth": 8, "iso_1_code": null, "iso_3_code": "buy", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5407", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5405", "native_tokenizers": [], @@ -1264,26 +1433,31 @@ }, { "name": "Southern", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Sherbro", + "depth": 8, "iso_1_code": null, "iso_3_code": "bun", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5409", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5408", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5404", "native_tokenizers": [], @@ -1291,14 +1465,17 @@ }, { "name": "Kissi", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kissi, Northern", + "depth": 7, "iso_1_code": null, "iso_3_code": "kqs", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"wo\")", @@ -1316,9 +1493,11 @@ }, { "name": "Kisi, Southern", + "depth": 7, "iso_1_code": null, "iso_3_code": "kss", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"wo\")", @@ -1335,6 +1514,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"wo\")", @@ -1349,6 +1529,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"wo\")", @@ -1364,20 +1545,24 @@ }, { "name": "Gola", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Gola", + "depth": 6, "iso_1_code": null, "iso_3_code": "gol", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5414", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5413", "native_tokenizers": [], @@ -1385,19 +1570,23 @@ }, { "name": "Temne", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Baga", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Baga Pokur", + "depth": 7, "iso_1_code": null, "iso_3_code": "bcg", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5417", "native_tokenizers": [], @@ -1405,9 +1594,11 @@ }, { "name": "Baga Koga", + "depth": 7, "iso_1_code": null, "iso_3_code": "bgo", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5418", "native_tokenizers": [], @@ -1415,9 +1606,11 @@ }, { "name": "Baga Manduri", + "depth": 7, "iso_1_code": null, "iso_3_code": "bmd", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5419", "native_tokenizers": [], @@ -1425,9 +1618,11 @@ }, { "name": "Baga Kaloum", + "depth": 7, "iso_1_code": null, "iso_3_code": "bqf", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5420", "native_tokenizers": [], @@ -1435,9 +1630,11 @@ }, { "name": "Baga Sitemu", + "depth": 7, "iso_1_code": null, "iso_3_code": "bsp", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"wo\")", @@ -1455,9 +1652,11 @@ }, { "name": "Baga Soban\u00e9", + "depth": 7, "iso_1_code": null, "iso_3_code": "bsv", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5422", "native_tokenizers": [], @@ -1465,15 +1664,18 @@ }, { "name": "Landoma", + "depth": 7, "iso_1_code": null, "iso_3_code": "ldm", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5423", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"wo\")", @@ -1489,14 +1691,17 @@ }, { "name": "Temne-Banta", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Themne", + "depth": 7, "iso_1_code": null, "iso_3_code": "tem", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"wo\")", @@ -1513,6 +1718,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"wo\")", @@ -1527,6 +1733,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"wo\")", @@ -1541,6 +1748,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"wo\")", @@ -1556,26 +1764,31 @@ }, { "name": "Sua", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mansoanka", + "depth": 5, "iso_1_code": null, "iso_3_code": "msw", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5427", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5426", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"wo\")", @@ -1590,6 +1803,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"wo\")", @@ -1605,25 +1819,30 @@ }, { "name": "Ijoid", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Defaka", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Defaka", + "depth": 4, "iso_1_code": null, "iso_3_code": "afn", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5430", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5429", "native_tokenizers": [], @@ -1631,25 +1850,30 @@ }, { "name": "Ijo", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "East", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ijo, Southeast", + "depth": 5, "iso_1_code": null, "iso_3_code": "ijs", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5433", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5432", "native_tokenizers": [], @@ -1657,19 +1881,23 @@ }, { "name": "Eastern", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Northeastern", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nkoroo", + "depth": 6, "iso_1_code": null, "iso_3_code": "nkx", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5436", "native_tokenizers": [], @@ -1677,14 +1905,17 @@ }, { "name": "Eastern", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ibani", + "depth": 7, "iso_1_code": null, "iso_3_code": "iby", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5438", "native_tokenizers": [], @@ -1692,9 +1923,11 @@ }, { "name": "Kalabari", + "depth": 7, "iso_1_code": null, "iso_3_code": "ijn", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5439", "native_tokenizers": [], @@ -1702,27 +1935,32 @@ }, { "name": "Kirike", + "depth": 7, "iso_1_code": null, "iso_3_code": "okr", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5440", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5437", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5435", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5434", "native_tokenizers": [], @@ -1730,19 +1968,23 @@ }, { "name": "West", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Inland Ijo", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Biseni", + "depth": 6, "iso_1_code": null, "iso_3_code": "ije", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5443", "native_tokenizers": [], @@ -1750,9 +1992,11 @@ }, { "name": "Okodia", + "depth": 6, "iso_1_code": null, "iso_3_code": "okd", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5444", "native_tokenizers": [], @@ -1760,21 +2004,25 @@ }, { "name": "Oruma", + "depth": 6, "iso_1_code": null, "iso_3_code": "orr", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5445", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5442", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5441", "native_tokenizers": [], @@ -1782,32 +2030,38 @@ }, { "name": "West Ijo", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Izon", + "depth": 5, "iso_1_code": null, "iso_3_code": "ijc", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5447", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5446", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5431", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5428", "native_tokenizers": [], @@ -1815,30 +2069,36 @@ }, { "name": "Volta-Congo", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Benue-Congo", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Akpes", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Akpes", + "depth": 5, "iso_1_code": null, "iso_3_code": "ibe", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5451", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5450", "native_tokenizers": [], @@ -1846,24 +2106,29 @@ }, { "name": "Bantoid", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Northern", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dakoid", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Samba Daka", + "depth": 7, "iso_1_code": null, "iso_3_code": "ccg", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5455", "native_tokenizers": [], @@ -1871,9 +2136,11 @@ }, { "name": "Dirim", + "depth": 7, "iso_1_code": null, "iso_3_code": "dir", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5456", "native_tokenizers": [], @@ -1881,9 +2148,11 @@ }, { "name": "Dong", + "depth": 7, "iso_1_code": null, "iso_3_code": "doh", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5457", "native_tokenizers": [], @@ -1891,9 +2160,11 @@ }, { "name": "Lamja-Dengsa-Tola", + "depth": 7, "iso_1_code": null, "iso_3_code": "ldh", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5458", "native_tokenizers": [], @@ -1901,15 +2172,18 @@ }, { "name": "Gaa", + "depth": 7, "iso_1_code": null, "iso_3_code": "ttb", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5459", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5454", "native_tokenizers": [], @@ -1917,20 +2191,24 @@ }, { "name": "Fam", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Fam", + "depth": 7, "iso_1_code": null, "iso_3_code": "fam", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5461", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5460", "native_tokenizers": [], @@ -1938,24 +2216,29 @@ }, { "name": "Mambiloid", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mambila-Konja", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Konja", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kwanja", + "depth": 9, "iso_1_code": null, "iso_3_code": "knp", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5465", "native_tokenizers": [], @@ -1963,15 +2246,18 @@ }, { "name": "Twendi", + "depth": 9, "iso_1_code": null, "iso_3_code": "twn", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5466", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5464", "native_tokenizers": [], @@ -1979,14 +2265,17 @@ }, { "name": "Magu-Kamkam-Kila", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mbongno", + "depth": 9, "iso_1_code": null, "iso_3_code": "bgu", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5468", "native_tokenizers": [], @@ -1994,9 +2283,11 @@ }, { "name": "Somyev", + "depth": 9, "iso_1_code": null, "iso_3_code": "kgt", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5469", "native_tokenizers": [], @@ -2004,9 +2295,11 @@ }, { "name": "Mvanip", + "depth": 9, "iso_1_code": null, "iso_3_code": "mcj", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5470", "native_tokenizers": [], @@ -2014,15 +2307,18 @@ }, { "name": "Ndunda", + "depth": 9, "iso_1_code": null, "iso_3_code": "nuh", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5471", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5467", "native_tokenizers": [], @@ -2030,14 +2326,17 @@ }, { "name": "Mambila", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mambila, Cameroon", + "depth": 9, "iso_1_code": null, "iso_3_code": "mcu", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -2055,9 +2354,11 @@ }, { "name": "Mambila, Nigeria", + "depth": 9, "iso_1_code": null, "iso_3_code": "mzk", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -2074,6 +2375,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -2089,26 +2391,31 @@ }, { "name": "Njerup", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Njerep", + "depth": 9, "iso_1_code": null, "iso_3_code": "njr", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5476", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5475", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -2124,20 +2431,24 @@ }, { "name": "Ndoro", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ndoola", + "depth": 8, "iso_1_code": null, "iso_3_code": "ndr", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5478", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5477", "native_tokenizers": [], @@ -2145,25 +2456,30 @@ }, { "name": "Suga-Vute", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Suga", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nizaa", + "depth": 9, "iso_1_code": null, "iso_3_code": "sgi", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5481", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5480", "native_tokenizers": [], @@ -2171,14 +2487,17 @@ }, { "name": "Vute", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Vute", + "depth": 9, "iso_1_code": null, "iso_3_code": "vut", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -2196,15 +2515,18 @@ }, { "name": "Wawa", + "depth": 9, "iso_1_code": null, "iso_3_code": "www", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5484", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -2219,6 +2541,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -2233,6 +2556,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -2247,6 +2571,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -2262,19 +2587,23 @@ }, { "name": "Southern", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Beboid", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Sari", + "depth": 7, "iso_1_code": null, "iso_3_code": "asj", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5487", "native_tokenizers": [], @@ -2282,9 +2611,11 @@ }, { "name": "Mbuk", + "depth": 7, "iso_1_code": null, "iso_3_code": "bpc", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5488", "native_tokenizers": [], @@ -2292,9 +2623,11 @@ }, { "name": "Bukwen", + "depth": 7, "iso_1_code": null, "iso_3_code": "buz", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5489", "native_tokenizers": [], @@ -2302,9 +2635,11 @@ }, { "name": "Naami", + "depth": 7, "iso_1_code": null, "iso_3_code": "bzv", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5490", "native_tokenizers": [], @@ -2312,9 +2647,11 @@ }, { "name": "Chung", + "depth": 7, "iso_1_code": null, "iso_3_code": "cnq", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5491", "native_tokenizers": [], @@ -2322,9 +2659,11 @@ }, { "name": "Kemedzung", + "depth": 7, "iso_1_code": null, "iso_3_code": "dmo", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5492", "native_tokenizers": [], @@ -2332,9 +2671,11 @@ }, { "name": "Mashi", + "depth": 7, "iso_1_code": null, "iso_3_code": "jms", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5493", "native_tokenizers": [], @@ -2342,9 +2683,11 @@ }, { "name": "Naki", + "depth": 7, "iso_1_code": null, "iso_3_code": "mff", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5494", "native_tokenizers": [], @@ -2352,9 +2695,11 @@ }, { "name": "Nchane", + "depth": 7, "iso_1_code": null, "iso_3_code": "ncr", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5495", "native_tokenizers": [], @@ -2362,9 +2707,11 @@ }, { "name": "Noone", + "depth": 7, "iso_1_code": null, "iso_3_code": "nhu", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -2381,6 +2728,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -2396,14 +2744,17 @@ }, { "name": "Ekoid", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ejagham", + "depth": 7, "iso_1_code": null, "iso_3_code": "etu", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -2421,9 +2772,11 @@ }, { "name": "Ndoe", + "depth": 7, "iso_1_code": null, "iso_3_code": "nbb", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5499", "native_tokenizers": [], @@ -2431,14 +2784,17 @@ }, { "name": "Bakor", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Abanyom", + "depth": 8, "iso_1_code": null, "iso_3_code": "abm", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5501", "native_tokenizers": [], @@ -2446,9 +2802,11 @@ }, { "name": "Ekajuk", + "depth": 8, "iso_1_code": null, "iso_3_code": "eka", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -2466,9 +2824,11 @@ }, { "name": "Nkem-Nkum", + "depth": 8, "iso_1_code": null, "iso_3_code": "isi", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5503", "native_tokenizers": [], @@ -2476,9 +2836,11 @@ }, { "name": "Nnam", + "depth": 8, "iso_1_code": null, "iso_3_code": "nbp", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5504", "native_tokenizers": [], @@ -2486,9 +2848,11 @@ }, { "name": "Nde-Nsele-Nta", + "depth": 8, "iso_1_code": null, "iso_3_code": "ndd", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5505", "native_tokenizers": [], @@ -2496,15 +2860,18 @@ }, { "name": "Efutop", + "depth": 8, "iso_1_code": null, "iso_3_code": "ofu", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5506", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -2519,6 +2886,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -2534,19 +2902,23 @@ }, { "name": "Jarawan", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Cameroon", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nagumi", + "depth": 8, "iso_1_code": null, "iso_3_code": "ngv", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5509", "native_tokenizers": [], @@ -2554,15 +2926,18 @@ }, { "name": "Mbonga", + "depth": 8, "iso_1_code": null, "iso_3_code": "xmb", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5510", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5508", "native_tokenizers": [], @@ -2570,14 +2945,17 @@ }, { "name": "Nigerian", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mbat", + "depth": 8, "iso_1_code": null, "iso_3_code": "bau", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5512", "native_tokenizers": [], @@ -2585,9 +2963,11 @@ }, { "name": "Kulung", + "depth": 8, "iso_1_code": null, "iso_3_code": "bbu", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5513", "native_tokenizers": [], @@ -2595,9 +2975,11 @@ }, { "name": "Bille", + "depth": 8, "iso_1_code": null, "iso_3_code": "bil", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5514", "native_tokenizers": [], @@ -2605,9 +2987,11 @@ }, { "name": "Lame", + "depth": 8, "iso_1_code": null, "iso_3_code": "bma", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5515", "native_tokenizers": [], @@ -2615,9 +2999,11 @@ }, { "name": "Duguri", + "depth": 8, "iso_1_code": null, "iso_3_code": "dbm", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5516", "native_tokenizers": [], @@ -2625,9 +3011,11 @@ }, { "name": "Dulubu", + "depth": 8, "iso_1_code": null, "iso_3_code": "dbo", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5517", "native_tokenizers": [], @@ -2635,9 +3023,11 @@ }, { "name": "Shiki", + "depth": 8, "iso_1_code": null, "iso_3_code": "gua", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5518", "native_tokenizers": [], @@ -2645,9 +3035,11 @@ }, { "name": "Gwa", + "depth": 8, "iso_1_code": null, "iso_3_code": "gwb", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5519", "native_tokenizers": [], @@ -2655,9 +3047,11 @@ }, { "name": "Gwak", + "depth": 8, "iso_1_code": null, "iso_3_code": "jgk", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5520", "native_tokenizers": [], @@ -2665,9 +3059,11 @@ }, { "name": "Bankal", + "depth": 8, "iso_1_code": null, "iso_3_code": "jjr", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5521", "native_tokenizers": [], @@ -2675,9 +3071,11 @@ }, { "name": "Labir", + "depth": 8, "iso_1_code": null, "iso_3_code": "jku", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5522", "native_tokenizers": [], @@ -2685,9 +3083,11 @@ }, { "name": "Mbula-Bwazza", + "depth": 8, "iso_1_code": null, "iso_3_code": "mbu", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5523", "native_tokenizers": [], @@ -2695,21 +3095,25 @@ }, { "name": "Mama", + "depth": 8, "iso_1_code": null, "iso_3_code": "mma", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5524", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5511", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5507", "native_tokenizers": [], @@ -2717,14 +3121,17 @@ }, { "name": "Mamfe", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Denya", + "depth": 7, "iso_1_code": null, "iso_3_code": "anv", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -2742,9 +3149,11 @@ }, { "name": "Kenyang", + "depth": 7, "iso_1_code": null, "iso_3_code": "ken", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -2762,15 +3171,18 @@ }, { "name": "Kendem", + "depth": 7, "iso_1_code": null, "iso_3_code": "kvm", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5528", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -2786,20 +3198,24 @@ }, { "name": "Mbe", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mbe", + "depth": 7, "iso_1_code": null, "iso_3_code": "mfo", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5530", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5529", "native_tokenizers": [], @@ -2807,35 +3223,42 @@ }, { "name": "Narrow Bantu", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Central", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "D", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bembe-Buyi (D.54)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bembe", + "depth": 10, "iso_1_code": null, "iso_3_code": "bmb", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5535", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5534", "native_tokenizers": [], @@ -2843,20 +3266,24 @@ }, { "name": "Bembe-Buyi (D.55)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Buyu", + "depth": 10, "iso_1_code": null, "iso_3_code": "byi", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5537", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5536", "native_tokenizers": [], @@ -2864,20 +3291,24 @@ }, { "name": "Bira-Nyali (D.301)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kari", + "depth": 10, "iso_1_code": null, "iso_3_code": "kbj", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5539", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5538", "native_tokenizers": [], @@ -2885,20 +3316,24 @@ }, { "name": "Bira-Nyali (D.302)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Boguru", + "depth": 10, "iso_1_code": null, "iso_3_code": "bqu", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5541", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5540", "native_tokenizers": [], @@ -2906,20 +3341,24 @@ }, { "name": "Bira-Nyali (D.303)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ngbinda", + "depth": 10, "iso_1_code": null, "iso_3_code": "nbd", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5543", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5542", "native_tokenizers": [], @@ -2927,20 +3366,24 @@ }, { "name": "Bira-Nyali (D.304)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Homa", + "depth": 10, "iso_1_code": null, "iso_3_code": "hom", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5545", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5544", "native_tokenizers": [], @@ -2948,20 +3391,24 @@ }, { "name": "Bira-Nyali (D.305)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nyanga-li", + "depth": 10, "iso_1_code": null, "iso_3_code": "nyc", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5547", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5546", "native_tokenizers": [], @@ -2969,20 +3416,24 @@ }, { "name": "Bira-Nyali (D.307)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mayeka", + "depth": 10, "iso_1_code": null, "iso_3_code": "myc", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5549", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5548", "native_tokenizers": [], @@ -2990,20 +3441,24 @@ }, { "name": "Bira-Nyali (D.308)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bodo", + "depth": 10, "iso_1_code": null, "iso_3_code": "boy", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5551", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5550", "native_tokenizers": [], @@ -3011,20 +3466,24 @@ }, { "name": "Bira-Nyali (D.31)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bhele", + "depth": 10, "iso_1_code": null, "iso_3_code": "bhy", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5553", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5552", "native_tokenizers": [], @@ -3032,20 +3491,24 @@ }, { "name": "Bira-Nyali (D.311)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bila", + "depth": 10, "iso_1_code": null, "iso_3_code": "bip", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5555", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5554", "native_tokenizers": [], @@ -3053,20 +3516,24 @@ }, { "name": "Bira-Nyali (D.312)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kaiku", + "depth": 10, "iso_1_code": null, "iso_3_code": "kkq", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5557", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5556", "native_tokenizers": [], @@ -3074,20 +3541,24 @@ }, { "name": "Bira-Nyali (D.32)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bira", + "depth": 10, "iso_1_code": null, "iso_3_code": "brf", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5559", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5558", "native_tokenizers": [], @@ -3095,20 +3566,24 @@ }, { "name": "Bira-Nyali (D.33)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nyali", + "depth": 10, "iso_1_code": null, "iso_3_code": "nlj", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5561", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5560", "native_tokenizers": [], @@ -3116,20 +3591,24 @@ }, { "name": "Bira-Nyali (D.331)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Vanuma", + "depth": 10, "iso_1_code": null, "iso_3_code": "vau", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5563", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5562", "native_tokenizers": [], @@ -3137,20 +3616,24 @@ }, { "name": "Bira-Nyali (D.332)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Budu", + "depth": 10, "iso_1_code": null, "iso_3_code": "buu", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5565", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5564", "native_tokenizers": [], @@ -3158,20 +3641,24 @@ }, { "name": "Bira-Nyali (D.333)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ndaka", + "depth": 10, "iso_1_code": null, "iso_3_code": "ndk", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5567", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5566", "native_tokenizers": [], @@ -3179,20 +3666,24 @@ }, { "name": "Bira-Nyali (D.334)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mbo", + "depth": 10, "iso_1_code": null, "iso_3_code": "zmw", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5569", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5568", "native_tokenizers": [], @@ -3200,20 +3691,24 @@ }, { "name": "Bira-Nyali (D.335)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Beeke", + "depth": 10, "iso_1_code": null, "iso_3_code": "bkf", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5571", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5570", "native_tokenizers": [], @@ -3221,20 +3716,24 @@ }, { "name": "Bira-Nyali (D.336)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ngbee", + "depth": 10, "iso_1_code": null, "iso_3_code": "jgb", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5573", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5572", "native_tokenizers": [], @@ -3242,20 +3741,24 @@ }, { "name": "Lega-Holoholo (D.201)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Lika", + "depth": 10, "iso_1_code": null, "iso_3_code": "lik", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5575", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5574", "native_tokenizers": [], @@ -3263,20 +3766,24 @@ }, { "name": "Lega-Holoholo (D.21)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bali", + "depth": 10, "iso_1_code": null, "iso_3_code": "bcp", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5577", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5576", "native_tokenizers": [], @@ -3284,20 +3791,24 @@ }, { "name": "Lega-Holoholo (D.211)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kango", + "depth": 10, "iso_1_code": null, "iso_3_code": "kzy", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5579", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5578", "native_tokenizers": [], @@ -3305,20 +3816,24 @@ }, { "name": "Lega-Holoholo (D.22)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Amba", + "depth": 10, "iso_1_code": null, "iso_3_code": "rwm", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5581", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5580", "native_tokenizers": [], @@ -3326,20 +3841,24 @@ }, { "name": "Lega-Holoholo (D.23)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Komo", + "depth": 10, "iso_1_code": null, "iso_3_code": "kmw", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5583", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5582", "native_tokenizers": [], @@ -3347,20 +3866,24 @@ }, { "name": "Lega-Holoholo (D.24)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Songoora", + "depth": 10, "iso_1_code": null, "iso_3_code": "sod", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5585", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5584", "native_tokenizers": [], @@ -3368,14 +3891,17 @@ }, { "name": "Lega-Holoholo (D.25)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Lega-Mwenga", + "depth": 10, "iso_1_code": null, "iso_3_code": "lgm", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -3392,6 +3918,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -3407,14 +3934,17 @@ }, { "name": "Lega-Holoholo (D.251)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Lega-Shabunda", + "depth": 10, "iso_1_code": null, "iso_3_code": "lea", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -3431,6 +3961,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -3446,14 +3977,17 @@ }, { "name": "Lega-Holoholo (D.251)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kanu", + "depth": 10, "iso_1_code": null, "iso_3_code": "khx", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5591", "native_tokenizers": [], @@ -3461,15 +3995,18 @@ }, { "name": "Kwami", + "depth": 10, "iso_1_code": null, "iso_3_code": "ktf", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5592", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5590", "native_tokenizers": [], @@ -3477,20 +4014,24 @@ }, { "name": "Lega-Holoholo (D.26)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Zimba", + "depth": 10, "iso_1_code": null, "iso_3_code": "zmb", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5594", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5593", "native_tokenizers": [], @@ -3498,20 +4039,24 @@ }, { "name": "Lega-Holoholo (D.27)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bangubangu", + "depth": 10, "iso_1_code": null, "iso_3_code": "bnx", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5596", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5595", "native_tokenizers": [], @@ -3519,20 +4064,24 @@ }, { "name": "Lega-Holoholo (D.28)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Holoholo", + "depth": 10, "iso_1_code": null, "iso_3_code": "hoo", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5598", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5597", "native_tokenizers": [], @@ -3540,20 +4089,24 @@ }, { "name": "Mbole-Enya (D.11)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mbole", + "depth": 10, "iso_1_code": null, "iso_3_code": "mdq", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5600", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5599", "native_tokenizers": [], @@ -3561,20 +4114,24 @@ }, { "name": "Mbole-Enya (D.12)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Lengola", + "depth": 10, "iso_1_code": null, "iso_3_code": "lej", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5602", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5601", "native_tokenizers": [], @@ -3582,20 +4139,24 @@ }, { "name": "Mbole-Enya (D.13)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mituku", + "depth": 10, "iso_1_code": null, "iso_3_code": "zmq", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5604", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5603", "native_tokenizers": [], @@ -3603,20 +4164,24 @@ }, { "name": "Mbole-Enya (D.14)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Enya", + "depth": 10, "iso_1_code": null, "iso_3_code": "gey", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5606", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5605", "native_tokenizers": [], @@ -3624,20 +4189,24 @@ }, { "name": "Mbolle-Enya (D.141)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Zula", + "depth": 10, "iso_1_code": null, "iso_3_code": "zla", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5608", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5607", "native_tokenizers": [], @@ -3645,26 +4214,31 @@ }, { "name": "Nyanga (D.43)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nyanga", + "depth": 10, "iso_1_code": null, "iso_3_code": "nyj", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5610", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5609", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -3680,19 +4254,23 @@ }, { "name": "E", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chaga (E.621)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Machame", + "depth": 10, "iso_1_code": null, "iso_3_code": "jmc", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -3710,15 +4288,18 @@ }, { "name": "Rwa", + "depth": 10, "iso_1_code": null, "iso_3_code": "rwk", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5614", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -3734,14 +4315,17 @@ }, { "name": "Chaga (E.622)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mochi", + "depth": 10, "iso_1_code": null, "iso_3_code": "old", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -3759,9 +4343,11 @@ }, { "name": "Vunjo", + "depth": 10, "iso_1_code": null, "iso_3_code": "vun", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -3778,6 +4364,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -3793,20 +4380,24 @@ }, { "name": "Chaga (E.623)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Rombo", + "depth": 10, "iso_1_code": null, "iso_3_code": "rof", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5619", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5618", "native_tokenizers": [], @@ -3814,20 +4405,24 @@ }, { "name": "Chaga (E.64)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kahe", + "depth": 10, "iso_1_code": null, "iso_3_code": "hka", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5621", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5620", "native_tokenizers": [], @@ -3835,20 +4430,24 @@ }, { "name": "Chaga (E.65)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Gweno", + "depth": 10, "iso_1_code": null, "iso_3_code": "gwe", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5623", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5622", "native_tokenizers": [], @@ -3856,14 +4455,17 @@ }, { "name": "Kikuyu-Kamba (E.51)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Gikuyu", + "depth": 10, "iso_1_code": "ki", "iso_3_code": "kik", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -3880,6 +4482,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -3895,20 +4498,24 @@ }, { "name": "Kikuyu-Kamba (E.52)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kiembu", + "depth": 10, "iso_1_code": null, "iso_3_code": "ebu", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5627", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5626", "native_tokenizers": [], @@ -3916,14 +4523,17 @@ }, { "name": "Kikuyu-Kamba (E.53)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kim\u00ee\u00eeru", + "depth": 10, "iso_1_code": null, "iso_3_code": "mer", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -3940,6 +4550,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -3955,20 +4566,24 @@ }, { "name": "Kikuyu-Kamba (E.531)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mwimbi-Muthambi", + "depth": 10, "iso_1_code": null, "iso_3_code": "mws", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5631", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5630", "native_tokenizers": [], @@ -3976,14 +4591,17 @@ }, { "name": "Kikuyu-Kamba (E.54)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kitharaka", + "depth": 10, "iso_1_code": null, "iso_3_code": "thk", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -4000,6 +4618,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -4015,20 +4634,24 @@ }, { "name": "Kikuyu-Kamba (E.541)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Gichuka", + "depth": 10, "iso_1_code": null, "iso_3_code": "cuh", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5635", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5634", "native_tokenizers": [], @@ -4036,14 +4659,17 @@ }, { "name": "Kikuyu-Kamba (E.55)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kamba", + "depth": 10, "iso_1_code": null, "iso_3_code": "kam", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -4060,6 +4686,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -4075,20 +4702,24 @@ }, { "name": "Kikuyu-Kamba (E.56)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dhaiso", + "depth": 10, "iso_1_code": null, "iso_3_code": "dhs", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5639", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5638", "native_tokenizers": [], @@ -4096,20 +4727,24 @@ }, { "name": "Nyika-Taita (E.701)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kiwilwana", + "depth": 10, "iso_1_code": null, "iso_3_code": "mlk", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5641", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5640", "native_tokenizers": [], @@ -4117,14 +4752,17 @@ }, { "name": "Nyika-Taita (E.71)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kipfokomu", + "depth": 10, "iso_1_code": null, "iso_3_code": "pkb", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -4141,6 +4779,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -4156,14 +4795,17 @@ }, { "name": "Nyika-Taita (E.72)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chichonyi-Chidzihana-Chikauma", + "depth": 10, "iso_1_code": null, "iso_3_code": "coh", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5645", "native_tokenizers": [], @@ -4171,9 +4813,11 @@ }, { "name": "Chiduruma", + "depth": 10, "iso_1_code": null, "iso_3_code": "dug", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -4191,9 +4835,11 @@ }, { "name": "Kigiryama", + "depth": 10, "iso_1_code": null, "iso_3_code": "nyf", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -4210,6 +4856,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -4225,14 +4872,17 @@ }, { "name": "Nyika-Taita (E.73)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chidigo", + "depth": 10, "iso_1_code": null, "iso_3_code": "dig", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -4249,6 +4899,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -4264,20 +4915,24 @@ }, { "name": "Nyika-Taita (E.731)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Segeju", + "depth": 10, "iso_1_code": null, "iso_3_code": "seg", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5651", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5650", "native_tokenizers": [], @@ -4285,14 +4940,17 @@ }, { "name": "Nyika-Taita (E.74)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dawida", + "depth": 10, "iso_1_code": null, "iso_3_code": "dav", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5653", "native_tokenizers": [], @@ -4300,15 +4958,18 @@ }, { "name": "Taveta", + "depth": 10, "iso_1_code": null, "iso_3_code": "tvs", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5654", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5652", "native_tokenizers": [], @@ -4316,20 +4977,24 @@ }, { "name": "Nyika-Taita (E.741)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Sagalla", + "depth": 10, "iso_1_code": null, "iso_3_code": "tga", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5656", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5655", "native_tokenizers": [], @@ -4337,26 +5002,31 @@ }, { "name": "Temi (E.46)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Temi", + "depth": 10, "iso_1_code": null, "iso_3_code": "soz", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5658", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5657", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -4372,14 +5042,17 @@ }, { "name": "F", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ruwila", + "depth": 9, "iso_1_code": null, "iso_3_code": "rwl", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5660", "native_tokenizers": [], @@ -4387,14 +5060,17 @@ }, { "name": "Nilamba-Rangi (F.31)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Isanzu", + "depth": 10, "iso_1_code": null, "iso_3_code": "isn", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5662", "native_tokenizers": [], @@ -4402,9 +5078,11 @@ }, { "name": "Nilamba", + "depth": 10, "iso_1_code": null, "iso_3_code": "nim", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -4421,6 +5099,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -4436,14 +5115,17 @@ }, { "name": "Nilamba-Rangi (F.32)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nyaturu", + "depth": 10, "iso_1_code": null, "iso_3_code": "rim", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -4460,6 +5142,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -4475,20 +5158,24 @@ }, { "name": "Nilamba-Rangi (F.33)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Rangi", + "depth": 10, "iso_1_code": null, "iso_3_code": "lag", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5667", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5666", "native_tokenizers": [], @@ -4496,20 +5183,24 @@ }, { "name": "Nilamba-Rangi (F.34)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mbugwe", + "depth": 10, "iso_1_code": null, "iso_3_code": "mgz", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5669", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5668", "native_tokenizers": [], @@ -4517,14 +5208,17 @@ }, { "name": "Sukuma-Nyamwezi (F.21)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Sukuma", + "depth": 10, "iso_1_code": null, "iso_3_code": "suk", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -4541,6 +5235,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -4556,14 +5251,17 @@ }, { "name": "Sukuma-Nyamwezi (F.22)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Konongo", + "depth": 10, "iso_1_code": null, "iso_3_code": "kcz", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5673", "native_tokenizers": [], @@ -4571,15 +5269,18 @@ }, { "name": "Nyamwezi", + "depth": 10, "iso_1_code": null, "iso_3_code": "nym", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5674", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5672", "native_tokenizers": [], @@ -4587,20 +5288,24 @@ }, { "name": "Sukuma-Nyamwezi (F.23)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Sumbwa", + "depth": 10, "iso_1_code": null, "iso_3_code": "suw", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5676", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5675", "native_tokenizers": [], @@ -4608,20 +5313,24 @@ }, { "name": "Sukuma-Nyamwezi (F.24)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kimbu", + "depth": 10, "iso_1_code": null, "iso_3_code": "kiv", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5678", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5677", "native_tokenizers": [], @@ -4629,20 +5338,24 @@ }, { "name": "Sukuma-Nyamwezi (F.25)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bungu", + "depth": 10, "iso_1_code": null, "iso_3_code": "wun", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5680", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5679", "native_tokenizers": [], @@ -4650,20 +5363,24 @@ }, { "name": "Tongwe-Bende (F.11)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tongwe", + "depth": 10, "iso_1_code": null, "iso_3_code": "tny", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5682", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5681", "native_tokenizers": [], @@ -4671,26 +5388,31 @@ }, { "name": "Tongwe-Bende (F.12)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bende", + "depth": 10, "iso_1_code": null, "iso_3_code": "bdp", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5684", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5683", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -4706,25 +5428,30 @@ }, { "name": "G", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bena-Kinga (G.61)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Sangu", + "depth": 10, "iso_1_code": null, "iso_3_code": "sbp", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5687", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5686", "native_tokenizers": [], @@ -4732,14 +5459,17 @@ }, { "name": "Bena-Kinga (G.62)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Hehe", + "depth": 10, "iso_1_code": null, "iso_3_code": "heh", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -4756,6 +5486,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -4771,14 +5502,17 @@ }, { "name": "Bena-Kinga (G.63)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bena", + "depth": 10, "iso_1_code": null, "iso_3_code": "bez", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5691", "native_tokenizers": [], @@ -4786,15 +5520,18 @@ }, { "name": "Benamanga", + "depth": 10, "iso_1_code": null, "iso_3_code": "egm", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5692", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5690", "native_tokenizers": [], @@ -4802,20 +5539,24 @@ }, { "name": "Bena-Kinga (G.64)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Pangwa", + "depth": 10, "iso_1_code": null, "iso_3_code": "pbr", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5694", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5693", "native_tokenizers": [], @@ -4823,20 +5564,24 @@ }, { "name": "Bena-Kinga (G.65)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kinga", + "depth": 10, "iso_1_code": null, "iso_3_code": "zga", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5696", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5695", "native_tokenizers": [], @@ -4844,20 +5589,24 @@ }, { "name": "Bena-Kinga (G.651)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Magoma", + "depth": 10, "iso_1_code": null, "iso_3_code": "gmx", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5698", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5697", "native_tokenizers": [], @@ -4865,20 +5614,24 @@ }, { "name": "Bena-Kinga (G.66)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Vwanji", + "depth": 10, "iso_1_code": null, "iso_3_code": "wbi", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5700", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5699", "native_tokenizers": [], @@ -4886,20 +5639,24 @@ }, { "name": "Bena-Kinga (G.67)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kisi", + "depth": 10, "iso_1_code": null, "iso_3_code": "kiz", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5702", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5701", "native_tokenizers": [], @@ -4907,14 +5664,17 @@ }, { "name": "Gogo-Kagulu (G.11)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Gogo", + "depth": 10, "iso_1_code": null, "iso_3_code": "gog", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -4931,6 +5691,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -4946,14 +5707,17 @@ }, { "name": "Gogo-Kagulu (G.12)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kagulu", + "depth": 10, "iso_1_code": null, "iso_3_code": "kki", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -4970,6 +5734,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -4985,14 +5750,17 @@ }, { "name": "Pogolo-Ndamba (G.51)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Pogolo", + "depth": 10, "iso_1_code": null, "iso_3_code": "poy", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -5009,6 +5777,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -5024,14 +5793,17 @@ }, { "name": "Pogolo-Ndamba (G.52)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ndamba", + "depth": 10, "iso_1_code": null, "iso_3_code": "ndj", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -5048,6 +5820,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -5063,20 +5836,24 @@ }, { "name": "Shambala (G.22)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Asu", + "depth": 10, "iso_1_code": null, "iso_3_code": "asa", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5712", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5711", "native_tokenizers": [], @@ -5084,14 +5861,17 @@ }, { "name": "Shambala (G.23)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Shambala", + "depth": 10, "iso_1_code": null, "iso_3_code": "ksb", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -5108,6 +5888,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -5123,20 +5904,24 @@ }, { "name": "Shambala (G.24)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bondei", + "depth": 10, "iso_1_code": null, "iso_3_code": "bou", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5716", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5715", "native_tokenizers": [], @@ -5144,14 +5929,17 @@ }, { "name": "Swahili (G.40)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Swahili, Congo", + "depth": 10, "iso_1_code": "sw", "iso_3_code": "swc", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -5168,6 +5956,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -5183,20 +5972,24 @@ }, { "name": "Swahili (G.402)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Makwe", + "depth": 10, "iso_1_code": null, "iso_3_code": "ymk", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5720", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5719", "native_tokenizers": [], @@ -5204,14 +5997,17 @@ }, { "name": "Swahili (G.403)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mwani", + "depth": 10, "iso_1_code": null, "iso_3_code": "wmw", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -5228,6 +6024,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -5243,14 +6040,17 @@ }, { "name": "Swahili (G.42)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Swahili", + "depth": 10, "iso_1_code": "sw", "iso_3_code": "swh", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -5267,6 +6067,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -5282,14 +6083,17 @@ }, { "name": "Swahili (G.44)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Comorian, Maore", + "depth": 10, "iso_1_code": null, "iso_3_code": "swb", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -5307,9 +6111,11 @@ }, { "name": "Comorian, Mwali", + "depth": 10, "iso_1_code": null, "iso_3_code": "wlc", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5727", "native_tokenizers": [], @@ -5317,9 +6123,11 @@ }, { "name": "Comorian, Ndzwani", + "depth": 10, "iso_1_code": null, "iso_3_code": "wni", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5728", "native_tokenizers": [], @@ -5327,9 +6135,11 @@ }, { "name": "Comorian, Ngazidja", + "depth": 10, "iso_1_code": null, "iso_3_code": "zdj", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -5346,6 +6156,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -5361,20 +6172,24 @@ }, { "name": "Zigula-Zaramo (G.301)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Doe", + "depth": 10, "iso_1_code": null, "iso_3_code": "doe", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5731", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5730", "native_tokenizers": [], @@ -5382,14 +6197,17 @@ }, { "name": "Zigula-Zaramo (G.31)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Zigula", + "depth": 10, "iso_1_code": null, "iso_3_code": "ziw", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -5406,6 +6224,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -5421,20 +6240,24 @@ }, { "name": "Zigula-Zaramo (G.311)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mushungulu", + "depth": 10, "iso_1_code": null, "iso_3_code": "xma", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5735", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5734", "native_tokenizers": [], @@ -5442,14 +6265,17 @@ }, { "name": "Zigula-Zaramo (G.32)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kwere", + "depth": 10, "iso_1_code": null, "iso_3_code": "cwe", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -5466,6 +6292,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -5481,20 +6308,24 @@ }, { "name": "Zigula-Zaramo (G.33)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Zaramo", + "depth": 10, "iso_1_code": null, "iso_3_code": "zaj", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5739", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5738", "native_tokenizers": [], @@ -5502,14 +6333,17 @@ }, { "name": "Zigula-Zaramo (G.34)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ngulu", + "depth": 10, "iso_1_code": null, "iso_3_code": "ngp", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -5526,6 +6360,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -5541,14 +6376,17 @@ }, { "name": "Zigula-Zaramo (G.35)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Luguru", + "depth": 10, "iso_1_code": null, "iso_3_code": "ruf", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -5565,6 +6403,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -5580,20 +6419,24 @@ }, { "name": "Zigula-Zaramo (G.36)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kami", + "depth": 10, "iso_1_code": null, "iso_3_code": "kcu", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5745", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5744", "native_tokenizers": [], @@ -5601,14 +6444,17 @@ }, { "name": "Zigula-Zaramo (G.37)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kutu", + "depth": 10, "iso_1_code": null, "iso_3_code": "kdc", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -5625,6 +6471,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -5640,14 +6487,17 @@ }, { "name": "Zigula-Zaramo (G.38)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Vidunda", + "depth": 10, "iso_1_code": null, "iso_3_code": "vid", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -5664,6 +6514,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -5679,26 +6530,31 @@ }, { "name": "Zigula-Zaramo (G.39)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Sagala", + "depth": 10, "iso_1_code": null, "iso_3_code": "sbm", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5751", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5750", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -5714,19 +6570,23 @@ }, { "name": "H", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kikongo (H.11)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Beembe", + "depth": 10, "iso_1_code": null, "iso_3_code": "beq", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -5743,6 +6603,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -5758,14 +6619,17 @@ }, { "name": "Kikongo (H.112)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Doondo", + "depth": 10, "iso_1_code": null, "iso_3_code": "dde", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5756", "native_tokenizers": [], @@ -5773,15 +6637,18 @@ }, { "name": "Kaamba", + "depth": 10, "iso_1_code": null, "iso_3_code": "xku", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5757", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5755", "native_tokenizers": [], @@ -5789,20 +6656,24 @@ }, { "name": "Kikongo (H.12)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Vili", + "depth": 10, "iso_1_code": null, "iso_3_code": "vif", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5759", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5758", "native_tokenizers": [], @@ -5810,20 +6681,24 @@ }, { "name": "Kikongo (H.13)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kunyi", + "depth": 10, "iso_1_code": null, "iso_3_code": "njx", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5761", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5760", "native_tokenizers": [], @@ -5831,20 +6706,24 @@ }, { "name": "Kikongo (H.131)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Suundi", + "depth": 10, "iso_1_code": null, "iso_3_code": "sdj", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5763", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5762", "native_tokenizers": [], @@ -5852,14 +6731,17 @@ }, { "name": "Kikongo (H.16)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Koongo", + "depth": 10, "iso_1_code": "kg", "iso_3_code": "kng", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -5877,9 +6759,11 @@ }, { "name": "Kikongo", + "depth": 10, "iso_1_code": "kg", "iso_3_code": "kwy", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -5897,9 +6781,11 @@ }, { "name": "Laari", + "depth": 10, "iso_1_code": "kg", "iso_3_code": "ldi", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -5917,9 +6803,11 @@ }, { "name": "Kiyombe", + "depth": 10, "iso_1_code": null, "iso_3_code": "yom", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -5936,6 +6824,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -5951,14 +6840,17 @@ }, { "name": "Kimbundu (H.21)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kimbundu", + "depth": 10, "iso_1_code": null, "iso_3_code": "kmb", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -5976,15 +6868,18 @@ }, { "name": "Mpinda", + "depth": 10, "iso_1_code": null, "iso_3_code": "pnd", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5771", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -6000,20 +6895,24 @@ }, { "name": "Kimbundu (H.23)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kibala", + "depth": 10, "iso_1_code": null, "iso_3_code": "blv", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5773", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5772", "native_tokenizers": [], @@ -6021,20 +6920,24 @@ }, { "name": "Kimbundu (H.24)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Songo", + "depth": 10, "iso_1_code": null, "iso_3_code": "nsx", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5775", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5774", "native_tokenizers": [], @@ -6042,20 +6945,24 @@ }, { "name": "Mbala-Hunganna (H.41)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mbala", + "depth": 10, "iso_1_code": null, "iso_3_code": "mdp", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5777", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5776", "native_tokenizers": [], @@ -6063,20 +6970,24 @@ }, { "name": "Mbala-Hunganna (H.42)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Hungana", + "depth": 10, "iso_1_code": null, "iso_3_code": "hum", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5779", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5778", "native_tokenizers": [], @@ -6084,14 +6995,17 @@ }, { "name": "Yaka (H.31)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Lonzo", + "depth": 10, "iso_1_code": null, "iso_3_code": "lnz", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5781", "native_tokenizers": [], @@ -6099,9 +7013,11 @@ }, { "name": "Pelende", + "depth": 10, "iso_1_code": null, "iso_3_code": "ppp", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5782", "native_tokenizers": [], @@ -6109,15 +7025,18 @@ }, { "name": "Yaka", + "depth": 10, "iso_1_code": null, "iso_3_code": "yaf", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5783", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5780", "native_tokenizers": [], @@ -6125,14 +7044,17 @@ }, { "name": "Yaka (H.32)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Hungu", + "depth": 10, "iso_1_code": null, "iso_3_code": "hng", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5785", "native_tokenizers": [], @@ -6140,15 +7062,18 @@ }, { "name": "Suku", + "depth": 10, "iso_1_code": null, "iso_3_code": "sub", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5786", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5784", "native_tokenizers": [], @@ -6156,20 +7081,24 @@ }, { "name": "Yaka (H.321)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Sonde", + "depth": 10, "iso_1_code": null, "iso_3_code": "shc", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5788", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5787", "native_tokenizers": [], @@ -6177,26 +7106,31 @@ }, { "name": "Yaka (H.34)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mbangala", + "depth": 10, "iso_1_code": null, "iso_3_code": "mxg", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5790", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5789", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -6212,25 +7146,30 @@ }, { "name": "J", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Haya-Jita (E.20)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Subi", + "depth": 10, "iso_1_code": null, "iso_3_code": "xsj", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5793", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5792", "native_tokenizers": [], @@ -6238,20 +7177,24 @@ }, { "name": "Haya-Jita (E.21)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nyambo", + "depth": 10, "iso_1_code": null, "iso_3_code": "now", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5795", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5794", "native_tokenizers": [], @@ -6259,14 +7202,17 @@ }, { "name": "Haya-Jita (E.22)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Haya", + "depth": 10, "iso_1_code": null, "iso_3_code": "hay", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"lg\")", @@ -6283,6 +7229,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"lg\")", @@ -6298,20 +7245,24 @@ }, { "name": "Haya-Jita (E.23)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Zinza", + "depth": 10, "iso_1_code": null, "iso_3_code": "zin", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5799", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5798", "native_tokenizers": [], @@ -6319,20 +7270,24 @@ }, { "name": "Haya-Jita (E.24)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kerewe", + "depth": 10, "iso_1_code": null, "iso_3_code": "ked", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5801", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5800", "native_tokenizers": [], @@ -6340,20 +7295,24 @@ }, { "name": "Haya-Jita (E.25)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Jita", + "depth": 10, "iso_1_code": null, "iso_3_code": "jit", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5803", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5802", "native_tokenizers": [], @@ -6361,20 +7320,24 @@ }, { "name": "Haya-Jita (E.251)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kwaya", + "depth": 10, "iso_1_code": null, "iso_3_code": "kya", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5805", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5804", "native_tokenizers": [], @@ -6382,20 +7345,24 @@ }, { "name": "Haya-Jita (E.252)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kara", + "depth": 10, "iso_1_code": null, "iso_3_code": "reg", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5807", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5806", "native_tokenizers": [], @@ -6403,20 +7370,24 @@ }, { "name": "Konzo-Ndandi (D.40)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kobo", + "depth": 10, "iso_1_code": null, "iso_3_code": "okc", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5809", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5808", "native_tokenizers": [], @@ -6424,14 +7395,17 @@ }, { "name": "Konzo-Ndandi (D.41)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Konzo", + "depth": 10, "iso_1_code": null, "iso_3_code": "koo", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"lg\")", @@ -6448,6 +7422,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"lg\")", @@ -6463,14 +7438,17 @@ }, { "name": "Konzo-Ndandi (D.42)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nande", + "depth": 10, "iso_1_code": null, "iso_3_code": "nnb", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"lg\")", @@ -6487,6 +7465,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"lg\")", @@ -6502,20 +7481,24 @@ }, { "name": "Logooli-Kuria (E.401)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ngoreme", + "depth": 10, "iso_1_code": null, "iso_3_code": "ngq", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5815", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5814", "native_tokenizers": [], @@ -6523,20 +7506,24 @@ }, { "name": "Logooli-Kuria (E.402)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ikizu", + "depth": 10, "iso_1_code": null, "iso_3_code": "ikz", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5817", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5816", "native_tokenizers": [], @@ -6544,14 +7531,17 @@ }, { "name": "Logooli-Kuria (E.403)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Suba", + "depth": 10, "iso_1_code": null, "iso_3_code": "sxb", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"lg\")", @@ -6568,6 +7558,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"lg\")", @@ -6583,20 +7574,24 @@ }, { "name": "Logooli-Kuria (E.405)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kabwa", + "depth": 10, "iso_1_code": null, "iso_3_code": "cwa", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5821", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5820", "native_tokenizers": [], @@ -6604,20 +7599,24 @@ }, { "name": "Logooli-Kuria (E.406)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Singa", + "depth": 10, "iso_1_code": null, "iso_3_code": "sgm", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5823", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5822", "native_tokenizers": [], @@ -6625,20 +7624,24 @@ }, { "name": "Logooli-Kuria (E.41)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Lulogooli", + "depth": 10, "iso_1_code": null, "iso_3_code": "rag", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5825", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5824", "native_tokenizers": [], @@ -6646,20 +7649,24 @@ }, { "name": "Logooli-Kuria (E.411)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Luidakho-Luisukha-Lutirichi", + "depth": 10, "iso_1_code": null, "iso_3_code": "ida", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5827", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5826", "native_tokenizers": [], @@ -6667,14 +7674,17 @@ }, { "name": "Logooli-Kuria (E.42)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ekegusii", + "depth": 10, "iso_1_code": null, "iso_3_code": "guz", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"lg\")", @@ -6691,6 +7701,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"lg\")", @@ -6706,14 +7717,17 @@ }, { "name": "Logooli-Kuria (E.43)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kuria", + "depth": 10, "iso_1_code": null, "iso_3_code": "kuj", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"lg\")", @@ -6730,6 +7744,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"lg\")", @@ -6745,20 +7760,24 @@ }, { "name": "Logooli-Kuria (E.431)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Suba-Simbiti", + "depth": 10, "iso_1_code": null, "iso_3_code": "ssc", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5833", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5832", "native_tokenizers": [], @@ -6766,20 +7785,24 @@ }, { "name": "Logooli-Kuria (E.44)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Zanaki", + "depth": 10, "iso_1_code": null, "iso_3_code": "zak", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5835", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5834", "native_tokenizers": [], @@ -6787,20 +7810,24 @@ }, { "name": "Logooli-Kuria (E.45)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ikoma-Nata-Isenye", + "depth": 10, "iso_1_code": null, "iso_3_code": "ntk", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5837", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5836", "native_tokenizers": [], @@ -6808,14 +7835,17 @@ }, { "name": "Masaba-Luhya (E.31)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bukusu", + "depth": 10, "iso_1_code": null, "iso_3_code": "bxk", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5839", "native_tokenizers": [], @@ -6823,9 +7853,11 @@ }, { "name": "Lutachoni", + "depth": 10, "iso_1_code": null, "iso_3_code": "lts", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5840", "native_tokenizers": [], @@ -6833,9 +7865,11 @@ }, { "name": "Masaaba", + "depth": 10, "iso_1_code": null, "iso_3_code": "myx", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"lg\")", @@ -6852,6 +7886,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"lg\")", @@ -6867,14 +7902,17 @@ }, { "name": "Masaba-Luhya (E.32)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Lukabaras", + "depth": 10, "iso_1_code": null, "iso_3_code": "lkb", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5843", "native_tokenizers": [], @@ -6882,9 +7920,11 @@ }, { "name": "Olushisa", + "depth": 10, "iso_1_code": null, "iso_3_code": "lks", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5844", "native_tokenizers": [], @@ -6892,9 +7932,11 @@ }, { "name": "Olumarama", + "depth": 10, "iso_1_code": null, "iso_3_code": "lrm", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5845", "native_tokenizers": [], @@ -6902,9 +7944,11 @@ }, { "name": "Olutsotso", + "depth": 10, "iso_1_code": null, "iso_3_code": "lto", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5846", "native_tokenizers": [], @@ -6912,9 +7956,11 @@ }, { "name": "Oluwanga", + "depth": 10, "iso_1_code": null, "iso_3_code": "lwg", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"lg\")", @@ -6932,15 +7978,18 @@ }, { "name": "Nyala", + "depth": 10, "iso_1_code": null, "iso_3_code": "nle", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5848", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"lg\")", @@ -6956,20 +8005,24 @@ }, { "name": "Masaba-Luhya (E.33)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Olunyole", + "depth": 10, "iso_1_code": null, "iso_3_code": "nyd", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5850", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5849", "native_tokenizers": [], @@ -6977,14 +8030,17 @@ }, { "name": "Masaba-Luhya (E.34)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Saamya-Gwe", + "depth": 10, "iso_1_code": null, "iso_3_code": "lsm", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"lg\")", @@ -7001,6 +8057,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"lg\")", @@ -7016,20 +8073,24 @@ }, { "name": "Masaba-Luhya (E.341)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Olukhayo", + "depth": 10, "iso_1_code": null, "iso_3_code": "lko", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5854", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5853", "native_tokenizers": [], @@ -7037,20 +8098,24 @@ }, { "name": "Masaba-Luhya (E.342)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Olumarachi", + "depth": 10, "iso_1_code": null, "iso_3_code": "lri", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5856", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5855", "native_tokenizers": [], @@ -7058,14 +8123,17 @@ }, { "name": "Masaba-Luhya (E.35)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nyole", + "depth": 10, "iso_1_code": null, "iso_3_code": "nuj", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"lg\")", @@ -7082,6 +8150,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"lg\")", @@ -7097,14 +8166,17 @@ }, { "name": "Nyoro-Ganda (E.101)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Gungu", + "depth": 10, "iso_1_code": null, "iso_3_code": "rub", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"lg\")", @@ -7121,6 +8193,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"lg\")", @@ -7136,14 +8209,17 @@ }, { "name": "Nyoro-Ganda (E.102)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Talinga-Bwisi", + "depth": 10, "iso_1_code": null, "iso_3_code": "tlj", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"lg\")", @@ -7160,6 +8236,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"lg\")", @@ -7175,20 +8252,24 @@ }, { "name": "Nyoro-Ganda (E.103)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ruruuli-Runyala", + "depth": 10, "iso_1_code": null, "iso_3_code": "ruc", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5864", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5863", "native_tokenizers": [], @@ -7196,14 +8277,17 @@ }, { "name": "Nyoro-Ganda (E.11)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nyoro", + "depth": 10, "iso_1_code": null, "iso_3_code": "nyo", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"lg\")", @@ -7220,6 +8304,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"lg\")", @@ -7235,14 +8320,17 @@ }, { "name": "Nyoro-Ganda (E.12)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tooro", + "depth": 10, "iso_1_code": null, "iso_3_code": "ttj", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"lg\")", @@ -7259,6 +8347,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"lg\")", @@ -7274,20 +8363,24 @@ }, { "name": "Nyoro-Ganda (E.121)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Hema", + "depth": 10, "iso_1_code": null, "iso_3_code": "nix", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5870", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5869", "native_tokenizers": [], @@ -7295,14 +8388,17 @@ }, { "name": "Nyoro-Ganda (E.13)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nyankore", + "depth": 10, "iso_1_code": null, "iso_3_code": "nyn", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"lg\")", @@ -7319,6 +8415,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"lg\")", @@ -7334,14 +8431,17 @@ }, { "name": "Nyoro-Ganda (E.14)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chiga", + "depth": 10, "iso_1_code": null, "iso_3_code": "cgg", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"lg\")", @@ -7358,6 +8458,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"lg\")", @@ -7373,14 +8474,17 @@ }, { "name": "Nyoro-Ganda (E.15)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ganda", + "depth": 10, "iso_1_code": "lg", "iso_3_code": "lug", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"lg\")", @@ -7399,6 +8503,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"lg\")", @@ -7414,14 +8519,17 @@ }, { "name": "Nyoro-Ganda (E.16)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kenye", + "depth": 10, "iso_1_code": null, "iso_3_code": "lke", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5878", "native_tokenizers": [], @@ -7429,9 +8537,11 @@ }, { "name": "Soga", + "depth": 10, "iso_1_code": null, "iso_3_code": "xog", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"lg\")", @@ -7448,6 +8558,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"lg\")", @@ -7463,14 +8574,17 @@ }, { "name": "Nyoro-Ganda (E.17)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Gwere", + "depth": 10, "iso_1_code": null, "iso_3_code": "gwr", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"lg\")", @@ -7487,6 +8601,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"lg\")", @@ -7502,14 +8617,17 @@ }, { "name": "Ruanda-Rundi (D.61)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kinyarwanda", + "depth": 10, "iso_1_code": "rw", "iso_3_code": "kin", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"lg\")", @@ -7526,6 +8644,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"lg\")", @@ -7541,14 +8660,17 @@ }, { "name": "Ruanda-Rundi (D.62)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Rundi", + "depth": 10, "iso_1_code": "rn", "iso_3_code": "run", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"lg\")", @@ -7565,6 +8687,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"lg\")", @@ -7580,20 +8703,24 @@ }, { "name": "Ruanda-Rundi (D.63)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Fuliiru", + "depth": 10, "iso_1_code": null, "iso_3_code": "flr", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5887", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5886", "native_tokenizers": [], @@ -7601,20 +8728,24 @@ }, { "name": "Ruanda-Rundi (D.631)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kiviila", + "depth": 10, "iso_1_code": null, "iso_3_code": "job", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5889", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5888", "native_tokenizers": [], @@ -7622,20 +8753,24 @@ }, { "name": "Ruanda-Rundi (D.64)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Shubi", + "depth": 10, "iso_1_code": null, "iso_3_code": "suj", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5891", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5890", "native_tokenizers": [], @@ -7643,20 +8778,24 @@ }, { "name": "Ruanda-Rundi (D.65)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Hangaza", + "depth": 10, "iso_1_code": null, "iso_3_code": "han", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5893", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5892", "native_tokenizers": [], @@ -7664,20 +8803,24 @@ }, { "name": "Ruanda-Rundi (D.66)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ha", + "depth": 10, "iso_1_code": null, "iso_3_code": "haq", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5895", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5894", "native_tokenizers": [], @@ -7685,9 +8828,11 @@ }, { "name": "Ruanda-Rundi (D.67)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"lg\")", @@ -7703,20 +8848,24 @@ }, { "name": "Shi-Hunde (D.501)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nyindu", + "depth": 10, "iso_1_code": null, "iso_3_code": "nyg", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5898", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5897", "native_tokenizers": [], @@ -7724,20 +8873,24 @@ }, { "name": "Shi-Hunde (D.51)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Hunde", + "depth": 10, "iso_1_code": null, "iso_3_code": "hke", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5900", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5899", "native_tokenizers": [], @@ -7745,14 +8898,17 @@ }, { "name": "Shi-Hunde (D.52)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Havu", + "depth": 10, "iso_1_code": null, "iso_3_code": "hav", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"lg\")", @@ -7769,6 +8925,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"lg\")", @@ -7784,14 +8941,17 @@ }, { "name": "Shi-Hunde (D.53)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Shi", + "depth": 10, "iso_1_code": null, "iso_3_code": "shr", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"lg\")", @@ -7808,6 +8968,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"lg\")", @@ -7823,20 +8984,24 @@ }, { "name": "Shi-Hunde (D.531)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tembo", + "depth": 10, "iso_1_code": null, "iso_3_code": "tbt", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5906", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5905", "native_tokenizers": [], @@ -7844,26 +9009,31 @@ }, { "name": "Shi-Hunde (D.56)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kabwari", + "depth": 10, "iso_1_code": null, "iso_3_code": "kcw", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5908", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5907", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"lg\")", @@ -7879,19 +9049,23 @@ }, { "name": "K", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ciokwe-Luchazi (K.11)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chokwe", + "depth": 10, "iso_1_code": null, "iso_3_code": "cjk", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -7908,6 +9082,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -7923,14 +9098,17 @@ }, { "name": "Ciokwe-Luchazi (K.12)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Luimbi", + "depth": 10, "iso_1_code": null, "iso_3_code": "lum", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5913", "native_tokenizers": [], @@ -7938,9 +9116,11 @@ }, { "name": "Nyemba", + "depth": 10, "iso_1_code": null, "iso_3_code": "nba", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -7957,6 +9137,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -7972,20 +9153,24 @@ }, { "name": "Ciokwe-Luchazi (K.13)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Luchazi", + "depth": 10, "iso_1_code": null, "iso_3_code": "lch", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5916", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5915", "native_tokenizers": [], @@ -7993,14 +9178,17 @@ }, { "name": "Ciokwe-Luchazi (K.14)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Luvale", + "depth": 10, "iso_1_code": null, "iso_3_code": "lue", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -8017,6 +9205,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -8032,14 +9221,17 @@ }, { "name": "Ciokwe-Luchazi (K.15)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mbunda", + "depth": 10, "iso_1_code": null, "iso_3_code": "mck", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -8056,6 +9248,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -8071,14 +9264,17 @@ }, { "name": "Ciokwe-Luchazi (K.16)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nyengo", + "depth": 10, "iso_1_code": null, "iso_3_code": "nye", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5922", "native_tokenizers": [], @@ -8086,15 +9282,18 @@ }, { "name": "Yauma", + "depth": 10, "iso_1_code": null, "iso_3_code": "yax", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5923", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5921", "native_tokenizers": [], @@ -8102,20 +9301,24 @@ }, { "name": "Ciokwe-Luchazi (K.17)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mbwela", + "depth": 10, "iso_1_code": null, "iso_3_code": "mfu", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5925", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5924", "native_tokenizers": [], @@ -8123,20 +9326,24 @@ }, { "name": "Ciokwe-Luchazi (K.18)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nkangala", + "depth": 10, "iso_1_code": null, "iso_3_code": "nkn", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5927", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5926", "native_tokenizers": [], @@ -8144,14 +9351,17 @@ }, { "name": "Lozi (K.21)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Lozi", + "depth": 10, "iso_1_code": null, "iso_3_code": "loz", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -8168,6 +9378,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -8183,20 +9394,24 @@ }, { "name": "Luyana (K.31)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Luyana", + "depth": 10, "iso_1_code": null, "iso_3_code": "lyn", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5931", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5930", "native_tokenizers": [], @@ -8204,20 +9419,24 @@ }, { "name": "Luyana (K.32)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mbowe", + "depth": 10, "iso_1_code": null, "iso_3_code": "mxo", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5933", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5932", "native_tokenizers": [], @@ -8225,14 +9444,17 @@ }, { "name": "Luyana (K.33)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kwangali", + "depth": 10, "iso_1_code": null, "iso_3_code": "kwn", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -8249,6 +9471,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -8264,14 +9487,17 @@ }, { "name": "Luyana (K.332)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Gciriku", + "depth": 10, "iso_1_code": null, "iso_3_code": "diu", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -8288,6 +9514,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -8303,14 +9530,17 @@ }, { "name": "Luyana (K.333)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mbukushu", + "depth": 10, "iso_1_code": null, "iso_3_code": "mhw", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -8327,6 +9557,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -8342,20 +9573,24 @@ }, { "name": "Luyana (K.34)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mashi", + "depth": 10, "iso_1_code": null, "iso_3_code": "mho", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5941", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5940", "native_tokenizers": [], @@ -8363,20 +9598,24 @@ }, { "name": "Luyana (K.35)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Simaa", + "depth": 10, "iso_1_code": null, "iso_3_code": "sie", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5943", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5942", "native_tokenizers": [], @@ -8384,20 +9623,24 @@ }, { "name": "Subiya-Totela (K.402)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Fwe", + "depth": 10, "iso_1_code": null, "iso_3_code": "fwe", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5945", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5944", "native_tokenizers": [], @@ -8405,20 +9648,24 @@ }, { "name": "Subiya-Totela (K.41)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Totela", + "depth": 10, "iso_1_code": null, "iso_3_code": "ttl", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5947", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5946", "native_tokenizers": [], @@ -8426,14 +9673,17 @@ }, { "name": "Subiya-Totela (K.42)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kuhane", + "depth": 10, "iso_1_code": null, "iso_3_code": "sbs", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -8450,6 +9700,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -8464,6 +9715,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -8479,19 +9731,23 @@ }, { "name": "L", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kaonde (L.41)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kaonde", + "depth": 10, "iso_1_code": null, "iso_3_code": "kqn", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -8508,6 +9764,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -8523,14 +9780,17 @@ }, { "name": "Luba (L.31)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Luba-Kasai", + "depth": 10, "iso_1_code": null, "iso_3_code": "lua", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -8547,6 +9807,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -8562,14 +9823,17 @@ }, { "name": "Luba (L.32)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kanyok", + "depth": 10, "iso_1_code": null, "iso_3_code": "kny", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -8586,6 +9850,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -8601,14 +9866,17 @@ }, { "name": "Luba (L.33)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Luba-Katanga", + "depth": 10, "iso_1_code": "lu", "iso_3_code": "lub", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -8625,6 +9893,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -8640,20 +9909,24 @@ }, { "name": "Luba (L.34)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Hemba", + "depth": 10, "iso_1_code": null, "iso_3_code": "hem", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5960", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5959", "native_tokenizers": [], @@ -8661,20 +9934,24 @@ }, { "name": "Luba (L.35)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Sanga", + "depth": 10, "iso_1_code": null, "iso_3_code": "sng", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5962", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5961", "native_tokenizers": [], @@ -8682,20 +9959,24 @@ }, { "name": "Lunda (L.51)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Salampasu", + "depth": 10, "iso_1_code": null, "iso_3_code": "slx", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5964", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5963", "native_tokenizers": [], @@ -8703,14 +9984,17 @@ }, { "name": "Lunda (L.52)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Lunda", + "depth": 10, "iso_1_code": null, "iso_3_code": "lun", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -8727,6 +10011,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -8742,14 +10027,17 @@ }, { "name": "Lunda (L.53)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ruund", + "depth": 10, "iso_1_code": null, "iso_3_code": "rnd", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -8766,6 +10054,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -8781,20 +10070,24 @@ }, { "name": "Nkoya (L.60)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nkoya", + "depth": 10, "iso_1_code": null, "iso_3_code": "nka", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5970", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5969", "native_tokenizers": [], @@ -8802,14 +10095,17 @@ }, { "name": "Pende (L.11)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Phende", + "depth": 10, "iso_1_code": null, "iso_3_code": "pem", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -8826,6 +10122,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -8841,14 +10138,17 @@ }, { "name": "Pende (L.12)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Holu", + "depth": 10, "iso_1_code": null, "iso_3_code": "hol", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5974", "native_tokenizers": [], @@ -8856,15 +10156,18 @@ }, { "name": "Samba", + "depth": 10, "iso_1_code": null, "iso_3_code": "smx", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5975", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5973", "native_tokenizers": [], @@ -8872,20 +10175,24 @@ }, { "name": "Pende (L.13)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kwese", + "depth": 10, "iso_1_code": null, "iso_3_code": "kws", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5977", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5976", "native_tokenizers": [], @@ -8893,20 +10200,24 @@ }, { "name": "Songe (L.21)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kete", + "depth": 10, "iso_1_code": null, "iso_3_code": "kcv", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5979", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5978", "native_tokenizers": [], @@ -8914,20 +10225,24 @@ }, { "name": "Songe (L.221)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Lwalu", + "depth": 10, "iso_1_code": null, "iso_3_code": "lwa", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5981", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5980", "native_tokenizers": [], @@ -8935,14 +10250,17 @@ }, { "name": "Songe (L.23)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Songe", + "depth": 10, "iso_1_code": null, "iso_3_code": "sop", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -8959,6 +10277,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -8974,20 +10293,24 @@ }, { "name": "Songe (L.231)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bindji", + "depth": 10, "iso_1_code": null, "iso_3_code": "bpj", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5985", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5984", "native_tokenizers": [], @@ -8995,26 +10318,31 @@ }, { "name": "Songe (L.24)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Luna", + "depth": 10, "iso_1_code": null, "iso_3_code": "luj", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5987", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5986", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -9030,25 +10358,30 @@ }, { "name": "M", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bemba (M.401)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bwile", + "depth": 10, "iso_1_code": null, "iso_3_code": "bwc", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5990", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5989", "native_tokenizers": [], @@ -9056,20 +10389,24 @@ }, { "name": "Bemba (M.402)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Aushi", + "depth": 10, "iso_1_code": null, "iso_3_code": "auh", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5992", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5991", "native_tokenizers": [], @@ -9077,14 +10414,17 @@ }, { "name": "Bemba (M.41)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Taabwa", + "depth": 10, "iso_1_code": null, "iso_3_code": "tap", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -9101,6 +10441,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -9116,14 +10457,17 @@ }, { "name": "Bemba (M.42)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bemba", + "depth": 10, "iso_1_code": null, "iso_3_code": "bem", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -9140,6 +10484,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -9155,20 +10500,24 @@ }, { "name": "Fipa-Mambwe (M.11)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Pimbwe", + "depth": 10, "iso_1_code": null, "iso_3_code": "piw", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5998", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5997", "native_tokenizers": [], @@ -9176,20 +10525,24 @@ }, { "name": "Fipa-Mambwe (M.12)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Rungwa", + "depth": 10, "iso_1_code": null, "iso_3_code": "rnw", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6000", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "5999", "native_tokenizers": [], @@ -9197,20 +10550,24 @@ }, { "name": "Fipa-Mambwe (M.13)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Fipa", + "depth": 10, "iso_1_code": null, "iso_3_code": "fip", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6002", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6001", "native_tokenizers": [], @@ -9218,14 +10575,17 @@ }, { "name": "Fipa-Mambwe (M.14)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mambwe-Lungu", + "depth": 10, "iso_1_code": null, "iso_3_code": "mgr", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -9242,6 +10602,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -9257,20 +10618,24 @@ }, { "name": "Lala-Bisa-Lamba (M.51)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Lala-Bisa", + "depth": 10, "iso_1_code": null, "iso_3_code": "leb", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6006", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6005", "native_tokenizers": [], @@ -9278,14 +10643,17 @@ }, { "name": "Lala-Bisa-Lamba (M.54)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Lamba", + "depth": 10, "iso_1_code": null, "iso_3_code": "lam", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -9302,6 +10670,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -9317,20 +10686,24 @@ }, { "name": "Lala-Bisa-Lamba (M.55)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Seba", + "depth": 10, "iso_1_code": null, "iso_3_code": "kdg", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6010", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6009", "native_tokenizers": [], @@ -9338,14 +10711,17 @@ }, { "name": "Lenje-Tonga (M.61)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Lenje", + "depth": 10, "iso_1_code": null, "iso_3_code": "leh", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -9362,6 +10738,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -9377,14 +10754,17 @@ }, { "name": "Lenje-Tonga (M.62)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Soli", + "depth": 10, "iso_1_code": null, "iso_3_code": "sby", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -9401,6 +10781,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -9416,14 +10797,17 @@ }, { "name": "Lenje-Tonga (M.63)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ila", + "depth": 10, "iso_1_code": null, "iso_3_code": "ilb", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -9440,6 +10824,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -9455,20 +10840,24 @@ }, { "name": "Lenje-Tonga (M.631)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Sala", + "depth": 10, "iso_1_code": null, "iso_3_code": "shq", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6018", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6017", "native_tokenizers": [], @@ -9476,14 +10865,17 @@ }, { "name": "Lenje-Tonga (M.64)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dombe", + "depth": 10, "iso_1_code": null, "iso_3_code": "dov", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6020", "native_tokenizers": [], @@ -9491,9 +10883,11 @@ }, { "name": "Tonga", + "depth": 10, "iso_1_code": null, "iso_3_code": "toi", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -9510,6 +10904,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -9525,14 +10920,17 @@ }, { "name": "Nyakyusa-Ngonde (M.301)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ndali", + "depth": 10, "iso_1_code": null, "iso_3_code": "ndh", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -9549,6 +10947,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -9564,14 +10963,17 @@ }, { "name": "Nyakyusa-Ngonde (M.31)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nyakyusa-Ngonde", + "depth": 10, "iso_1_code": null, "iso_3_code": "nyy", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -9588,6 +10990,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -9603,14 +11006,17 @@ }, { "name": "Nyiha-Safwa (M.201)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Lambya", + "depth": 10, "iso_1_code": null, "iso_3_code": "lai", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -9627,6 +11033,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -9642,20 +11049,24 @@ }, { "name": "Nyiha-Safwa (M.21)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Wanda", + "depth": 10, "iso_1_code": null, "iso_3_code": "wbh", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6029", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6028", "native_tokenizers": [], @@ -9663,14 +11074,17 @@ }, { "name": "Nyiha-Safwa (M.22)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nyamwanga", + "depth": 10, "iso_1_code": null, "iso_3_code": "mwn", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -9687,6 +11101,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -9702,14 +11117,17 @@ }, { "name": "Nyiha-Safwa (M.23)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nyiha, Tanzania", + "depth": 10, "iso_1_code": null, "iso_3_code": "nih", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6033", "native_tokenizers": [], @@ -9717,9 +11135,11 @@ }, { "name": "Nyika, Tanzania", + "depth": 10, "iso_1_code": null, "iso_3_code": "nkt", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6034", "native_tokenizers": [], @@ -9727,9 +11147,11 @@ }, { "name": "Nyika", + "depth": 10, "iso_1_code": null, "iso_3_code": "nkv", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6035", "native_tokenizers": [], @@ -9737,15 +11159,18 @@ }, { "name": "Nyiha, Malawi", + "depth": 10, "iso_1_code": null, "iso_3_code": "nyr", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6036", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6032", "native_tokenizers": [], @@ -9753,20 +11178,24 @@ }, { "name": "Nyiha-Safwa (M.24)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Malila", + "depth": 10, "iso_1_code": null, "iso_3_code": "mgq", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6038", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6037", "native_tokenizers": [], @@ -9774,26 +11203,31 @@ }, { "name": "Nyiha-Safwa (M.25)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Safwa", + "depth": 10, "iso_1_code": null, "iso_3_code": "sbk", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6040", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6039", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -9809,19 +11243,23 @@ }, { "name": "N", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chewa-Nyanja (N.31)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chichewa", + "depth": 10, "iso_1_code": "ny", "iso_3_code": "nya", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -9838,6 +11276,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -9853,14 +11292,17 @@ }, { "name": "Manda (N.101)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ndendeule", + "depth": 10, "iso_1_code": null, "iso_3_code": "dne", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6045", "native_tokenizers": [], @@ -9868,15 +11310,18 @@ }, { "name": "Ndwewe", + "depth": 10, "iso_1_code": null, "iso_3_code": "nww", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6046", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6044", "native_tokenizers": [], @@ -9884,20 +11329,24 @@ }, { "name": "Manda (N.102)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nindi", + "depth": 10, "iso_1_code": null, "iso_3_code": "nxi", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6048", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6047", "native_tokenizers": [], @@ -9905,20 +11354,24 @@ }, { "name": "Manda (N.11)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Manda", + "depth": 10, "iso_1_code": null, "iso_3_code": "mgs", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6050", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6049", "native_tokenizers": [], @@ -9926,14 +11379,17 @@ }, { "name": "Manda (N.12)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chingoni", + "depth": 10, "iso_1_code": null, "iso_3_code": "xnj", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6052", "native_tokenizers": [], @@ -9941,15 +11397,18 @@ }, { "name": "Xingoni", + "depth": 10, "iso_1_code": null, "iso_3_code": "xnq", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6053", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6051", "native_tokenizers": [], @@ -9957,20 +11416,24 @@ }, { "name": "Manda (N.13)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Matengo", + "depth": 10, "iso_1_code": null, "iso_3_code": "mgv", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6055", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6054", "native_tokenizers": [], @@ -9978,20 +11441,24 @@ }, { "name": "Manda (N.14)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mpoto", + "depth": 10, "iso_1_code": null, "iso_3_code": "mpa", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6057", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6056", "native_tokenizers": [], @@ -9999,14 +11466,17 @@ }, { "name": "Manda (N.15)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tonga", + "depth": 10, "iso_1_code": null, "iso_3_code": "tog", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -10023,6 +11493,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -10038,14 +11509,17 @@ }, { "name": "Senga-Sena (N.41)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nsenga", + "depth": 10, "iso_1_code": null, "iso_3_code": "nse", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -10063,9 +11537,11 @@ }, { "name": "Phimbi", + "depth": 10, "iso_1_code": null, "iso_3_code": "phm", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -10082,6 +11558,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -10097,20 +11574,24 @@ }, { "name": "Senga-Sena (N.42)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kunda", + "depth": 10, "iso_1_code": null, "iso_3_code": "kdn", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6064", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6063", "native_tokenizers": [], @@ -10118,14 +11599,17 @@ }, { "name": "Senga-Sena (N.43)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nyungwe", + "depth": 10, "iso_1_code": null, "iso_3_code": "nyu", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -10142,6 +11626,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -10157,14 +11642,17 @@ }, { "name": "Senga-Sena (N.44)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Barwe", + "depth": 10, "iso_1_code": null, "iso_3_code": "bwg", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6068", "native_tokenizers": [], @@ -10172,9 +11660,11 @@ }, { "name": "Sena", + "depth": 10, "iso_1_code": null, "iso_3_code": "seh", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -10191,6 +11681,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -10206,14 +11697,17 @@ }, { "name": "Senga-Sena (N.441)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Sena, Malawi", + "depth": 10, "iso_1_code": null, "iso_3_code": "swk", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -10230,6 +11724,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -10245,20 +11740,24 @@ }, { "name": "Tumbuka (N.201)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mwera", + "depth": 10, "iso_1_code": null, "iso_3_code": "mjh", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6073", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6072", "native_tokenizers": [], @@ -10266,14 +11765,17 @@ }, { "name": "Tumbuka (N.21)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tumbuka", + "depth": 10, "iso_1_code": null, "iso_3_code": "tum", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -10290,6 +11792,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -10304,6 +11807,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -10319,19 +11823,23 @@ }, { "name": "P", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Makhuwa (P.31)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kokola", + "depth": 10, "iso_1_code": null, "iso_3_code": "kzn", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -10349,9 +11857,11 @@ }, { "name": "Lolo", + "depth": 10, "iso_1_code": null, "iso_3_code": "llb", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -10369,9 +11879,11 @@ }, { "name": "Makhuwa-Meetto", + "depth": 10, "iso_1_code": null, "iso_3_code": "mgh", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -10389,9 +11901,11 @@ }, { "name": "Manyawa", + "depth": 10, "iso_1_code": null, "iso_3_code": "mny", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -10409,9 +11923,11 @@ }, { "name": "Takwane", + "depth": 10, "iso_1_code": null, "iso_3_code": "tke", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -10429,9 +11945,11 @@ }, { "name": "Makhuwa-Shirima", + "depth": 10, "iso_1_code": null, "iso_3_code": "vmk", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -10449,9 +11967,11 @@ }, { "name": "Marenje", + "depth": 10, "iso_1_code": null, "iso_3_code": "vmr", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6084", "native_tokenizers": [], @@ -10459,9 +11979,11 @@ }, { "name": "Makhuwa", + "depth": 10, "iso_1_code": null, "iso_3_code": "vmw", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -10479,9 +12001,11 @@ }, { "name": "Makhuwa-Marrevone", + "depth": 10, "iso_1_code": null, "iso_3_code": "xmc", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6086", "native_tokenizers": [], @@ -10489,15 +12013,18 @@ }, { "name": "Makhuwa-Saka", + "depth": 10, "iso_1_code": null, "iso_3_code": "xsq", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6087", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -10513,14 +12040,17 @@ }, { "name": "Makhuwa (P.311)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Koti", + "depth": 10, "iso_1_code": null, "iso_3_code": "eko", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -10537,6 +12067,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -10552,20 +12083,24 @@ }, { "name": "Makhuwa (P.312)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nathembo", + "depth": 10, "iso_1_code": null, "iso_3_code": "nte", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6091", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6090", "native_tokenizers": [], @@ -10573,14 +12108,17 @@ }, { "name": "Makhuwa (P.32)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Lomwe", + "depth": 10, "iso_1_code": null, "iso_3_code": "ngl", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -10597,6 +12135,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -10612,20 +12151,24 @@ }, { "name": "Makhuwa (P.331)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Lomwe, Malawi", + "depth": 10, "iso_1_code": null, "iso_3_code": "lon", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6095", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6094", "native_tokenizers": [], @@ -10633,14 +12176,17 @@ }, { "name": "Makhuwa (P.34)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chuwabu", + "depth": 10, "iso_1_code": null, "iso_3_code": "chw", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -10658,15 +12204,18 @@ }, { "name": "Maindo", + "depth": 10, "iso_1_code": null, "iso_3_code": "cwb", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6098", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -10682,20 +12231,24 @@ }, { "name": "Makhuwa (P.341)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Makhuwa-Moniga", + "depth": 10, "iso_1_code": null, "iso_3_code": "mhm", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6100", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6099", "native_tokenizers": [], @@ -10703,20 +12256,24 @@ }, { "name": "Matuumbi (P.11)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ndengereko", + "depth": 10, "iso_1_code": null, "iso_3_code": "ndg", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6102", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6101", "native_tokenizers": [], @@ -10724,20 +12281,24 @@ }, { "name": "Matuumbi (P.12)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Rufiji", + "depth": 10, "iso_1_code": null, "iso_3_code": "rui", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6104", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6103", "native_tokenizers": [], @@ -10745,20 +12306,24 @@ }, { "name": "Matuumbi (P.13)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Matumbi", + "depth": 10, "iso_1_code": null, "iso_3_code": "mgw", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6106", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6105", "native_tokenizers": [], @@ -10766,14 +12331,17 @@ }, { "name": "Matuumbi (P.14)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ngindo", + "depth": 10, "iso_1_code": null, "iso_3_code": "nnq", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -10790,6 +12358,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -10805,20 +12374,24 @@ }, { "name": "Matuumbi (P.15)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mbunga", + "depth": 10, "iso_1_code": null, "iso_3_code": "mgy", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6110", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6109", "native_tokenizers": [], @@ -10826,14 +12399,17 @@ }, { "name": "Yao (P.21)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Yao", + "depth": 10, "iso_1_code": null, "iso_3_code": "yao", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -10850,6 +12426,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -10865,20 +12442,24 @@ }, { "name": "Yao (P.22)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mwera", + "depth": 10, "iso_1_code": null, "iso_3_code": "mwe", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6114", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6113", "native_tokenizers": [], @@ -10886,14 +12467,17 @@ }, { "name": "Yao (P.23)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Makonde", + "depth": 10, "iso_1_code": null, "iso_3_code": "kde", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -10911,9 +12495,11 @@ }, { "name": "Machinga", + "depth": 10, "iso_1_code": null, "iso_3_code": "mvw", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6117", "native_tokenizers": [], @@ -10921,15 +12507,18 @@ }, { "name": "Matambwe", + "depth": 10, "iso_1_code": null, "iso_3_code": "wtb", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6118", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -10945,26 +12534,31 @@ }, { "name": "Yao (P.24)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ndonde Hamba", + "depth": 10, "iso_1_code": null, "iso_3_code": "njd", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6120", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6119", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -10980,19 +12574,23 @@ }, { "name": "R", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Herero (R.30)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Herero", + "depth": 10, "iso_1_code": "hz", "iso_3_code": "her", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -11009,6 +12607,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -11024,14 +12623,17 @@ }, { "name": "Herero (R.311)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dhimba", + "depth": 10, "iso_1_code": null, "iso_3_code": "dhm", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -11048,6 +12650,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -11063,14 +12666,17 @@ }, { "name": "Umbundu (R.101)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ngendelengo", + "depth": 10, "iso_1_code": null, "iso_3_code": "nql", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6127", "native_tokenizers": [], @@ -11078,15 +12684,18 @@ }, { "name": "Kuvale", + "depth": 10, "iso_1_code": null, "iso_3_code": "olu", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6128", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6126", "native_tokenizers": [], @@ -11094,14 +12703,17 @@ }, { "name": "Umbundu (R.11)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Umbundu", + "depth": 10, "iso_1_code": null, "iso_3_code": "umb", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -11118,6 +12730,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -11133,20 +12746,24 @@ }, { "name": "Umbundu (R.12)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ndombe", + "depth": 10, "iso_1_code": null, "iso_3_code": "ndq", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6132", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6131", "native_tokenizers": [], @@ -11154,14 +12771,17 @@ }, { "name": "Umbundu (R.13)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nyaneka", + "depth": 10, "iso_1_code": null, "iso_3_code": "nyk", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -11179,15 +12799,18 @@ }, { "name": "Kwandu", + "depth": 10, "iso_1_code": null, "iso_3_code": "xdo", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6135", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -11203,20 +12826,24 @@ }, { "name": "Umbundu (R.14)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nkumbi", + "depth": 10, "iso_1_code": null, "iso_3_code": "khu", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6137", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6136", "native_tokenizers": [], @@ -11224,14 +12851,17 @@ }, { "name": "Wambo (R.21)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Oshiwambo", + "depth": 10, "iso_1_code": "kj", "iso_3_code": "kua", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -11248,6 +12878,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -11263,20 +12894,24 @@ }, { "name": "Wambo (R.214)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mbalanhu", + "depth": 10, "iso_1_code": null, "iso_3_code": "lnb", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6141", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6140", "native_tokenizers": [], @@ -11284,14 +12919,17 @@ }, { "name": "Wambo (R.22)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ndonga", + "depth": 10, "iso_1_code": "ng", "iso_3_code": "ndo", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -11308,6 +12946,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -11323,20 +12962,24 @@ }, { "name": "Wambo (R.23)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kwambi", + "depth": 10, "iso_1_code": null, "iso_3_code": "kwm", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6145", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6144", "native_tokenizers": [], @@ -11344,20 +12987,24 @@ }, { "name": "Wambo (R.24)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ngandjera", + "depth": 10, "iso_1_code": null, "iso_3_code": "nne", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6147", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6146", "native_tokenizers": [], @@ -11365,26 +13012,31 @@ }, { "name": "Yeyi (R.41)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Yeyi", + "depth": 10, "iso_1_code": null, "iso_3_code": "yey", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6149", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6148", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -11400,19 +13052,23 @@ }, { "name": "S", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Copi (S.61)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chopi", + "depth": 10, "iso_1_code": null, "iso_3_code": "cce", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -11429,6 +13085,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -11444,14 +13101,17 @@ }, { "name": "Copi (S.62)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tonga", + "depth": 10, "iso_1_code": null, "iso_3_code": "toh", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -11468,6 +13128,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -11483,14 +13144,17 @@ }, { "name": "Nguni (S.407)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ndebele", + "depth": 10, "iso_1_code": "nr", "iso_3_code": "nbl", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -11507,6 +13171,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -11522,14 +13187,17 @@ }, { "name": "Nguni (S.41)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Xhosa", + "depth": 10, "iso_1_code": "xh", "iso_3_code": "xho", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -11546,6 +13214,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -11561,14 +13230,17 @@ }, { "name": "Nguni (S.42)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Zulu", + "depth": 10, "iso_1_code": "zu", "iso_3_code": "zul", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -11585,6 +13257,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -11600,14 +13273,17 @@ }, { "name": "Nguni (S.43)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Swati", + "depth": 10, "iso_1_code": "ss", "iso_3_code": "ssw", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -11624,6 +13300,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -11639,14 +13316,17 @@ }, { "name": "Nguni (S.44)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ndebele", + "depth": 10, "iso_1_code": "nd", "iso_3_code": "nde", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -11663,6 +13343,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -11678,14 +13359,17 @@ }, { "name": "Shona (S.10)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dema", + "depth": 10, "iso_1_code": null, "iso_3_code": "dmx", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6166", "native_tokenizers": [], @@ -11693,9 +13377,11 @@ }, { "name": "Shona", + "depth": 10, "iso_1_code": "sn", "iso_3_code": "sna", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -11712,6 +13398,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -11727,20 +13414,24 @@ }, { "name": "Shona (S.11)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tawara", + "depth": 10, "iso_1_code": null, "iso_3_code": "twl", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6169", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6168", "native_tokenizers": [], @@ -11748,14 +13439,17 @@ }, { "name": "Shona (S.13)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Manyika", + "depth": 10, "iso_1_code": null, "iso_3_code": "mxc", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6171", "native_tokenizers": [], @@ -11763,9 +13457,11 @@ }, { "name": "Tewe", + "depth": 10, "iso_1_code": null, "iso_3_code": "twx", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -11782,6 +13478,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -11797,14 +13494,17 @@ }, { "name": "Shona (S.15)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ndau", + "depth": 10, "iso_1_code": null, "iso_3_code": "ndc", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -11821,6 +13521,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -11836,14 +13537,17 @@ }, { "name": "Shona (S.16)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kalanga", + "depth": 10, "iso_1_code": null, "iso_3_code": "kck", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -11861,15 +13565,18 @@ }, { "name": "Nambya", + "depth": 10, "iso_1_code": null, "iso_3_code": "nmq", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6177", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -11885,14 +13592,17 @@ }, { "name": "Sotho-Tswana (S.31)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Setswana", + "depth": 10, "iso_1_code": "tn", "iso_3_code": "tsn", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -11911,6 +13621,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -11926,20 +13637,24 @@ }, { "name": "Sotho-Tswana (S.311)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kgalagadi", + "depth": 10, "iso_1_code": null, "iso_3_code": "xkv", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6181", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6180", "native_tokenizers": [], @@ -11947,14 +13662,17 @@ }, { "name": "Sotho-Tswana (S.32)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Birwa", + "depth": 10, "iso_1_code": null, "iso_3_code": "brl", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6183", "native_tokenizers": [], @@ -11962,9 +13680,11 @@ }, { "name": "Sotho, Northern", + "depth": 10, "iso_1_code": null, "iso_3_code": "nso", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -11982,15 +13702,18 @@ }, { "name": "Tswapong", + "depth": 10, "iso_1_code": null, "iso_3_code": "two", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6185", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -12006,14 +13729,17 @@ }, { "name": "Sotho-Tswana (S.33)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Sotho, Southern", + "depth": 10, "iso_1_code": "st", "iso_3_code": "sot", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -12030,6 +13756,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -12045,14 +13772,17 @@ }, { "name": "Tswa-Rhonga (S.51)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tswa", + "depth": 10, "iso_1_code": null, "iso_3_code": "tsc", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -12069,6 +13799,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -12084,14 +13815,17 @@ }, { "name": "Tswa-Rhonga (S.53)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tsonga", + "depth": 10, "iso_1_code": "ts", "iso_3_code": "tso", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -12108,6 +13842,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -12123,14 +13858,17 @@ }, { "name": "Tswa-Rhonga (S.54)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ronga", + "depth": 10, "iso_1_code": null, "iso_3_code": "rng", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -12147,6 +13885,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -12162,14 +13901,17 @@ }, { "name": "Venda (S.21)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Venda", + "depth": 10, "iso_1_code": "ve", "iso_3_code": "ven", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -12186,6 +13928,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -12200,6 +13943,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -12214,6 +13958,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -12229,30 +13974,36 @@ }, { "name": "Northwest", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "A", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bafia (A.501)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Hijuk", + "depth": 10, "iso_1_code": null, "iso_3_code": "hij", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6199", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6198", "native_tokenizers": [], @@ -12260,20 +14011,24 @@ }, { "name": "Bafia (A.51)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Lefa", + "depth": 10, "iso_1_code": null, "iso_3_code": "lfa", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6201", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6200", "native_tokenizers": [], @@ -12281,20 +14036,24 @@ }, { "name": "Bafia (A.52)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dimbong", + "depth": 10, "iso_1_code": null, "iso_3_code": "dii", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6203", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6202", "native_tokenizers": [], @@ -12302,14 +14061,17 @@ }, { "name": "Bafia (A.53)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bafia", + "depth": 10, "iso_1_code": null, "iso_3_code": "ksf", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -12326,6 +14088,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -12341,20 +14104,24 @@ }, { "name": "Bafia (A.54)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tibea", + "depth": 10, "iso_1_code": null, "iso_3_code": "ngy", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6207", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6206", "native_tokenizers": [], @@ -12362,20 +14129,24 @@ }, { "name": "Basaa (A.41)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Barombi", + "depth": 10, "iso_1_code": null, "iso_3_code": "bbi", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6209", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6208", "native_tokenizers": [], @@ -12383,20 +14154,24 @@ }, { "name": "Basaa (A.42)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bankon", + "depth": 10, "iso_1_code": null, "iso_3_code": "abb", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6211", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6210", "native_tokenizers": [], @@ -12404,14 +14179,17 @@ }, { "name": "Basaa (A.43)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Basaa", + "depth": 10, "iso_1_code": null, "iso_3_code": "bas", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -12429,15 +14207,18 @@ }, { "name": "Bakoko", + "depth": 10, "iso_1_code": null, "iso_3_code": "bkh", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6214", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -12453,20 +14234,24 @@ }, { "name": "Basaa (A.44)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tunen", + "depth": 10, "iso_1_code": null, "iso_3_code": "tvu", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6216", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6215", "native_tokenizers": [], @@ -12474,20 +14259,24 @@ }, { "name": "Basaa (A.45)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nyokon", + "depth": 10, "iso_1_code": null, "iso_3_code": "nvo", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6218", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6217", "native_tokenizers": [], @@ -12495,14 +14284,17 @@ }, { "name": "Basaa (A.46)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nomaande", + "depth": 10, "iso_1_code": null, "iso_3_code": "lem", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -12519,6 +14311,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -12534,20 +14327,24 @@ }, { "name": "Basaa (A.461)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tuotomb", + "depth": 10, "iso_1_code": null, "iso_3_code": "ttf", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6222", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6221", "native_tokenizers": [], @@ -12555,14 +14352,17 @@ }, { "name": "Basaa (A.462)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Yambeta", + "depth": 10, "iso_1_code": null, "iso_3_code": "yat", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -12579,6 +14379,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -12594,14 +14395,17 @@ }, { "name": "Bubi-Benga (A.31)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bubia", + "depth": 10, "iso_1_code": null, "iso_3_code": "bbx", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6226", "native_tokenizers": [], @@ -12609,15 +14413,18 @@ }, { "name": "Bube", + "depth": 10, "iso_1_code": null, "iso_3_code": "bvb", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6227", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6225", "native_tokenizers": [], @@ -12625,20 +14432,24 @@ }, { "name": "Bubi-Benga (A.32)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Batanga", + "depth": 10, "iso_1_code": null, "iso_3_code": "bnm", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6229", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6228", "native_tokenizers": [], @@ -12646,14 +14457,17 @@ }, { "name": "Bubi-Benga (A.33)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kombe", + "depth": 10, "iso_1_code": null, "iso_3_code": "nui", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6231", "native_tokenizers": [], @@ -12661,15 +14475,18 @@ }, { "name": "Iyasa", + "depth": 10, "iso_1_code": null, "iso_3_code": "yko", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6232", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6230", "native_tokenizers": [], @@ -12677,20 +14494,24 @@ }, { "name": "Bubi-Benga (A.34)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Benga", + "depth": 10, "iso_1_code": null, "iso_3_code": "bng", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6234", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6233", "native_tokenizers": [], @@ -12698,20 +14519,24 @@ }, { "name": "Duala (A.21)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Wumboko", + "depth": 10, "iso_1_code": null, "iso_3_code": "bqm", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6236", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6235", "native_tokenizers": [], @@ -12719,20 +14544,24 @@ }, { "name": "Duala (A.22)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mokpwe", + "depth": 10, "iso_1_code": null, "iso_3_code": "bri", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6238", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6237", "native_tokenizers": [], @@ -12740,20 +14569,24 @@ }, { "name": "Duala (A.23)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Isubu", + "depth": 10, "iso_1_code": null, "iso_3_code": "szv", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6240", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6239", "native_tokenizers": [], @@ -12761,20 +14594,24 @@ }, { "name": "Duala (A.231)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bakole", + "depth": 10, "iso_1_code": null, "iso_3_code": "kme", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6242", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6241", "native_tokenizers": [], @@ -12782,14 +14619,17 @@ }, { "name": "Duala (A.24)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Duala", + "depth": 10, "iso_1_code": null, "iso_3_code": "dua", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -12806,6 +14646,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -12821,20 +14662,24 @@ }, { "name": "Duala (A.27)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mulimba", + "depth": 10, "iso_1_code": null, "iso_3_code": "mzd", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6246", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6245", "native_tokenizers": [], @@ -12842,14 +14687,17 @@ }, { "name": "Ewondo-Fang (A.71)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Eton", + "depth": 10, "iso_1_code": null, "iso_3_code": "eto", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -12867,15 +14715,18 @@ }, { "name": "Mengisa", + "depth": 10, "iso_1_code": null, "iso_3_code": "mct", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6249", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -12891,14 +14742,17 @@ }, { "name": "Ewondo-Fang (A.72)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ewondo", + "depth": 10, "iso_1_code": null, "iso_3_code": "ewo", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -12915,6 +14769,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -12930,14 +14785,17 @@ }, { "name": "Ewondo-Fang (A.73)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bebele", + "depth": 10, "iso_1_code": null, "iso_3_code": "beb", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6253", "native_tokenizers": [], @@ -12945,15 +14803,18 @@ }, { "name": "Bebil", + "depth": 10, "iso_1_code": null, "iso_3_code": "bxp", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6254", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6252", "native_tokenizers": [], @@ -12961,14 +14822,17 @@ }, { "name": "Ewondo-Fang (A.74)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bulu", + "depth": 10, "iso_1_code": null, "iso_3_code": "bum", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -12985,6 +14849,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -13000,14 +14865,17 @@ }, { "name": "Ewondo-Fang (A.75)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Fang", + "depth": 10, "iso_1_code": null, "iso_3_code": "fan", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -13024,6 +14892,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -13039,20 +14908,24 @@ }, { "name": "Kaka (A.91)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kwakum", + "depth": 10, "iso_1_code": null, "iso_3_code": "kwu", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6260", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6259", "native_tokenizers": [], @@ -13060,20 +14933,24 @@ }, { "name": "Kaka (A.92)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Pol", + "depth": 10, "iso_1_code": null, "iso_3_code": "pmm", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6262", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6261", "native_tokenizers": [], @@ -13081,14 +14958,17 @@ }, { "name": "Kaka (A.93)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kako", + "depth": 10, "iso_1_code": null, "iso_3_code": "kkj", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -13105,6 +14985,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -13120,20 +15001,24 @@ }, { "name": "Lundu-Balong (A.11)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Oroko", + "depth": 10, "iso_1_code": null, "iso_3_code": "bdu", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6266", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6265", "native_tokenizers": [], @@ -13141,20 +15026,24 @@ }, { "name": "Lundu-Balong (A.13)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bafaw-Balong", + "depth": 10, "iso_1_code": null, "iso_3_code": "bwt", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6268", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6267", "native_tokenizers": [], @@ -13162,20 +15051,24 @@ }, { "name": "Lundu-Balong (A.14)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bonkeng", + "depth": 10, "iso_1_code": null, "iso_3_code": "bvg", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6270", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6269", "native_tokenizers": [], @@ -13183,20 +15076,24 @@ }, { "name": "Lundu-Balong (A.15)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mbo", + "depth": 10, "iso_1_code": null, "iso_3_code": "mbo", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6272", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6271", "native_tokenizers": [], @@ -13204,20 +15101,24 @@ }, { "name": "Lundu-Balong (A.151)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nkongho", + "depth": 10, "iso_1_code": null, "iso_3_code": "nkc", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6274", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6273", "native_tokenizers": [], @@ -13225,20 +15126,24 @@ }, { "name": "Lundu-Balong (A.15B)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bassossi", + "depth": 10, "iso_1_code": null, "iso_3_code": "bsi", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6276", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6275", "native_tokenizers": [], @@ -13246,14 +15151,17 @@ }, { "name": "Lundu-Balong (A.15C)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bakaka", + "depth": 10, "iso_1_code": null, "iso_3_code": "bqz", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6278", "native_tokenizers": [], @@ -13261,9 +15169,11 @@ }, { "name": "Akoose", + "depth": 10, "iso_1_code": null, "iso_3_code": "bss", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -13280,6 +15190,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -13295,20 +15206,24 @@ }, { "name": "Makaa-Njem (A.801)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Gyele", + "depth": 10, "iso_1_code": null, "iso_3_code": "gyi", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6281", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6280", "native_tokenizers": [], @@ -13316,20 +15231,24 @@ }, { "name": "Makaa-Njem (A.802)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ukhwejo", + "depth": 10, "iso_1_code": null, "iso_3_code": "ukh", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6283", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6282", "native_tokenizers": [], @@ -13337,20 +15256,24 @@ }, { "name": "Makaa-Njem (A.81)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kwasio", + "depth": 10, "iso_1_code": null, "iso_3_code": "nmg", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6285", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6284", "native_tokenizers": [], @@ -13358,20 +15281,24 @@ }, { "name": "Makaa-Njem (A.82)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Swo", + "depth": 10, "iso_1_code": null, "iso_3_code": "sox", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6287", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6286", "native_tokenizers": [], @@ -13379,14 +15306,17 @@ }, { "name": "Makaa-Njem (A.83)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Makaa", + "depth": 10, "iso_1_code": null, "iso_3_code": "mcp", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -13403,6 +15333,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -13418,20 +15349,24 @@ }, { "name": "Makaa-Njem (A.831)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Byep", + "depth": 10, "iso_1_code": null, "iso_3_code": "mkk", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6291", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6290", "native_tokenizers": [], @@ -13439,20 +15374,24 @@ }, { "name": "Makaa-Njem (A.832)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kol", + "depth": 10, "iso_1_code": null, "iso_3_code": "biw", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6293", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6292", "native_tokenizers": [], @@ -13460,20 +15399,24 @@ }, { "name": "Makaa-Njem (A.84)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Njyem", + "depth": 10, "iso_1_code": null, "iso_3_code": "njy", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6295", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6294", "native_tokenizers": [], @@ -13481,14 +15424,17 @@ }, { "name": "Makaa-Njem (A.842)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Koonzime", + "depth": 10, "iso_1_code": null, "iso_3_code": "ozm", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -13505,6 +15451,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -13520,20 +15467,24 @@ }, { "name": "Makaa-Njem (A.85)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bekwel", + "depth": 10, "iso_1_code": null, "iso_3_code": "bkw", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6299", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6298", "native_tokenizers": [], @@ -13541,14 +15492,17 @@ }, { "name": "Makaa-Njem (A.86)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mpiemo", + "depth": 10, "iso_1_code": null, "iso_3_code": "mcx", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6301", "native_tokenizers": [], @@ -13556,15 +15510,18 @@ }, { "name": "Mpumpong", + "depth": 10, "iso_1_code": null, "iso_3_code": "mgg", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6302", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6300", "native_tokenizers": [], @@ -13572,20 +15529,24 @@ }, { "name": "Makaa-Njem (A.87)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bomwali", + "depth": 10, "iso_1_code": null, "iso_3_code": "bmw", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6304", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6303", "native_tokenizers": [], @@ -13593,14 +15554,17 @@ }, { "name": "Sanaga (A.601)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tuki", + "depth": 10, "iso_1_code": null, "iso_3_code": "bag", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6306", "native_tokenizers": [], @@ -13608,15 +15572,18 @@ }, { "name": "Leti", + "depth": 10, "iso_1_code": null, "iso_3_code": "leo", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6307", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6305", "native_tokenizers": [], @@ -13624,14 +15591,17 @@ }, { "name": "Sanaga (A.62)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nulibie", + "depth": 10, "iso_1_code": null, "iso_3_code": "ekm", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6309", "native_tokenizers": [], @@ -13639,9 +15609,11 @@ }, { "name": "Numala", + "depth": 10, "iso_1_code": null, "iso_3_code": "mmu", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6310", "native_tokenizers": [], @@ -13649,15 +15621,18 @@ }, { "name": "Yangben", + "depth": 10, "iso_1_code": null, "iso_3_code": "yav", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6311", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6308", "native_tokenizers": [], @@ -13665,20 +15640,24 @@ }, { "name": "Sanaga (A.621)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nubaca", + "depth": 10, "iso_1_code": null, "iso_3_code": "baf", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6313", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6312", "native_tokenizers": [], @@ -13686,14 +15665,17 @@ }, { "name": "Sanaga (A.622)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nugunu", + "depth": 10, "iso_1_code": null, "iso_3_code": "yas", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -13710,6 +15692,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -13725,20 +15708,24 @@ }, { "name": "Sanaga (A.623)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mbule", + "depth": 10, "iso_1_code": null, "iso_3_code": "mlb", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6317", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6316", "native_tokenizers": [], @@ -13746,26 +15733,31 @@ }, { "name": "Sanaga (A.65)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bati", + "depth": 10, "iso_1_code": null, "iso_3_code": "btc", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6319", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6318", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -13781,25 +15773,30 @@ }, { "name": "B", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kele (B.201)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ndasa", + "depth": 10, "iso_1_code": null, "iso_3_code": "nda", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6322", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6321", "native_tokenizers": [], @@ -13807,20 +15804,24 @@ }, { "name": "Kele (B.202)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Sighu", + "depth": 10, "iso_1_code": null, "iso_3_code": "sxe", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6324", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6323", "native_tokenizers": [], @@ -13828,20 +15829,24 @@ }, { "name": "Kele (B.203)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Samay", + "depth": 10, "iso_1_code": null, "iso_3_code": "syx", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6326", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6325", "native_tokenizers": [], @@ -13849,20 +15854,24 @@ }, { "name": "Kele (B.204)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ndambomo", + "depth": 10, "iso_1_code": null, "iso_3_code": "nxo", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6328", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6327", "native_tokenizers": [], @@ -13870,20 +15879,24 @@ }, { "name": "Kele (B.21)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Seki", + "depth": 10, "iso_1_code": null, "iso_3_code": "syi", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6330", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6329", "native_tokenizers": [], @@ -13891,20 +15904,24 @@ }, { "name": "Kele (B.211)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Molengue", + "depth": 10, "iso_1_code": null, "iso_3_code": "bxc", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6332", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6331", "native_tokenizers": [], @@ -13912,14 +15929,17 @@ }, { "name": "Kele (B.22)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "K\u00e9l\u00e9", + "depth": 10, "iso_1_code": null, "iso_3_code": "keb", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6334", "native_tokenizers": [], @@ -13927,15 +15947,18 @@ }, { "name": "Ngom", + "depth": 10, "iso_1_code": null, "iso_3_code": "nra", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6335", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6333", "native_tokenizers": [], @@ -13943,20 +15966,24 @@ }, { "name": "Kele (B.23)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mbangwe", + "depth": 10, "iso_1_code": null, "iso_3_code": "zmn", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6337", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6336", "native_tokenizers": [], @@ -13964,20 +15991,24 @@ }, { "name": "Kele (B.24)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Wumbvu", + "depth": 10, "iso_1_code": null, "iso_3_code": "wum", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6339", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6338", "native_tokenizers": [], @@ -13985,20 +16016,24 @@ }, { "name": "Kele (B.25)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kota", + "depth": 10, "iso_1_code": null, "iso_3_code": "koq", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6341", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6340", "native_tokenizers": [], @@ -14006,20 +16041,24 @@ }, { "name": "Kele (B.251)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Sake", + "depth": 10, "iso_1_code": null, "iso_3_code": "sak", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6343", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6342", "native_tokenizers": [], @@ -14027,20 +16066,24 @@ }, { "name": "Kele (B.252)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mahongwe", + "depth": 10, "iso_1_code": null, "iso_3_code": "mhb", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6345", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6344", "native_tokenizers": [], @@ -14048,20 +16091,24 @@ }, { "name": "Mbete (B.602)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kaningi", + "depth": 10, "iso_1_code": null, "iso_3_code": "kzo", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6347", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6346", "native_tokenizers": [], @@ -14069,20 +16116,24 @@ }, { "name": "Mbete (B.61)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mbere", + "depth": 10, "iso_1_code": null, "iso_3_code": "mdt", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6349", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6348", "native_tokenizers": [], @@ -14090,20 +16141,24 @@ }, { "name": "Mbete (B.62)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ombamba", + "depth": 10, "iso_1_code": null, "iso_3_code": "mbm", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6351", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6350", "native_tokenizers": [], @@ -14111,20 +16166,24 @@ }, { "name": "Mbete (B.63)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ndumu", + "depth": 10, "iso_1_code": null, "iso_3_code": "nmd", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6353", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6352", "native_tokenizers": [], @@ -14132,20 +16191,24 @@ }, { "name": "Myene (B.11)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Myene", + "depth": 10, "iso_1_code": null, "iso_3_code": "mye", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6355", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6354", "native_tokenizers": [], @@ -14153,20 +16216,24 @@ }, { "name": "Nzebi (B.501)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Wandji", + "depth": 10, "iso_1_code": null, "iso_3_code": "wdd", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6357", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6356", "native_tokenizers": [], @@ -14174,20 +16241,24 @@ }, { "name": "Nzebi (B.51)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Duma", + "depth": 10, "iso_1_code": null, "iso_3_code": "dma", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6359", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6358", "native_tokenizers": [], @@ -14195,20 +16266,24 @@ }, { "name": "Nzebi (B.52)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Njebi", + "depth": 10, "iso_1_code": null, "iso_3_code": "nzb", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6361", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6360", "native_tokenizers": [], @@ -14216,20 +16291,24 @@ }, { "name": "Nzebi (B.53)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tsaangi", + "depth": 10, "iso_1_code": null, "iso_3_code": "tsa", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6363", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6362", "native_tokenizers": [], @@ -14237,20 +16316,24 @@ }, { "name": "Shira-Punu (B.401)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bwisi", + "depth": 10, "iso_1_code": null, "iso_3_code": "bwz", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6365", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6364", "native_tokenizers": [], @@ -14258,20 +16341,24 @@ }, { "name": "Shira-Punu (B.402)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Barama", + "depth": 10, "iso_1_code": null, "iso_3_code": "bbg", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6367", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6366", "native_tokenizers": [], @@ -14279,20 +16366,24 @@ }, { "name": "Shira-Punu (B.403)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Vumbu", + "depth": 10, "iso_1_code": null, "iso_3_code": "vum", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6369", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6368", "native_tokenizers": [], @@ -14300,20 +16391,24 @@ }, { "name": "Shira-Punu (B.41)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Sira", + "depth": 10, "iso_1_code": null, "iso_3_code": "swj", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6371", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6370", "native_tokenizers": [], @@ -14321,20 +16416,24 @@ }, { "name": "Shira-Punu (B.42)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Sangu", + "depth": 10, "iso_1_code": null, "iso_3_code": "snq", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6373", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6372", "native_tokenizers": [], @@ -14342,20 +16441,24 @@ }, { "name": "Shira-Punu (B.43)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Punu", + "depth": 10, "iso_1_code": null, "iso_3_code": "puu", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6375", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6374", "native_tokenizers": [], @@ -14363,20 +16466,24 @@ }, { "name": "Shira-Punu (B.44)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Lumbu", + "depth": 10, "iso_1_code": null, "iso_3_code": "lup", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6377", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6376", "native_tokenizers": [], @@ -14384,20 +16491,24 @@ }, { "name": "Teke (B.701)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tchitchege", + "depth": 10, "iso_1_code": null, "iso_3_code": "tck", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6379", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6378", "native_tokenizers": [], @@ -14405,20 +16516,24 @@ }, { "name": "Teke (B.71)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Teke-Tege", + "depth": 10, "iso_1_code": null, "iso_3_code": "teg", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6381", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6380", "native_tokenizers": [], @@ -14426,20 +16541,24 @@ }, { "name": "Teke (B.72)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ngungwel", + "depth": 10, "iso_1_code": null, "iso_3_code": "ngz", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6383", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6382", "native_tokenizers": [], @@ -14447,14 +16566,17 @@ }, { "name": "Teke (B.73)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Yaka", + "depth": 10, "iso_1_code": null, "iso_3_code": "iyx", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6385", "native_tokenizers": [], @@ -14462,9 +16584,11 @@ }, { "name": "Teke-Laali", + "depth": 10, "iso_1_code": null, "iso_3_code": "lli", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6386", "native_tokenizers": [], @@ -14472,9 +16596,11 @@ }, { "name": "Teke-Tsaayi", + "depth": 10, "iso_1_code": null, "iso_3_code": "tyi", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6387", "native_tokenizers": [], @@ -14482,15 +16608,18 @@ }, { "name": "Teke-Tyee", + "depth": 10, "iso_1_code": null, "iso_3_code": "tyx", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6388", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6384", "native_tokenizers": [], @@ -14498,14 +16627,17 @@ }, { "name": "Teke (B.74)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Teke-Eboo", + "depth": 10, "iso_1_code": null, "iso_3_code": "ebo", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6390", "native_tokenizers": [], @@ -14513,15 +16645,18 @@ }, { "name": "Teke-Nzikou", + "depth": 10, "iso_1_code": null, "iso_3_code": "nzu", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6391", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6389", "native_tokenizers": [], @@ -14529,20 +16664,24 @@ }, { "name": "Teke (B.75)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Teke, Ibali", + "depth": 10, "iso_1_code": null, "iso_3_code": "tek", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6393", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6392", "native_tokenizers": [], @@ -14550,14 +16689,17 @@ }, { "name": "Teke (B.77)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Teke-Wuumu", + "depth": 10, "iso_1_code": null, "iso_3_code": "ifm", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6395", "native_tokenizers": [], @@ -14565,15 +16707,18 @@ }, { "name": "Teke-Kukuya", + "depth": 10, "iso_1_code": null, "iso_3_code": "kkw", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6396", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6394", "native_tokenizers": [], @@ -14581,20 +16726,24 @@ }, { "name": "Tiene-Yanzi (B.81)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tiene", + "depth": 10, "iso_1_code": null, "iso_3_code": "tii", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6398", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6397", "native_tokenizers": [], @@ -14602,20 +16751,24 @@ }, { "name": "Tiene-Yanzi (B.82)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Boma", + "depth": 10, "iso_1_code": null, "iso_3_code": "boh", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6400", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6399", "native_tokenizers": [], @@ -14623,20 +16776,24 @@ }, { "name": "Tiene-Yanzi (B.83)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mfinu", + "depth": 10, "iso_1_code": null, "iso_3_code": "zmf", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6402", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6401", "native_tokenizers": [], @@ -14644,20 +16801,24 @@ }, { "name": "Tiene-Yanzi (B.84)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mbuun", + "depth": 10, "iso_1_code": null, "iso_3_code": "zmp", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6404", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6403", "native_tokenizers": [], @@ -14665,14 +16826,17 @@ }, { "name": "Tiene-Yanzi (B.85)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Songo", + "depth": 10, "iso_1_code": null, "iso_3_code": "soo", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6406", "native_tokenizers": [], @@ -14680,15 +16844,18 @@ }, { "name": "Iyansi", + "depth": 10, "iso_1_code": null, "iso_3_code": "yns", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6407", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6405", "native_tokenizers": [], @@ -14696,20 +16863,24 @@ }, { "name": "Tiene-Yanzi (B.86)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ding", + "depth": 10, "iso_1_code": null, "iso_3_code": "diz", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6409", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6408", "native_tokenizers": [], @@ -14717,20 +16888,24 @@ }, { "name": "Tiene-Yanzi (B.861)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ngwii", + "depth": 10, "iso_1_code": null, "iso_3_code": "nlo", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6411", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6410", "native_tokenizers": [], @@ -14738,20 +16913,24 @@ }, { "name": "Tiene-Yanzi (B.862)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Lwel", + "depth": 10, "iso_1_code": null, "iso_3_code": "lvl", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6413", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6412", "native_tokenizers": [], @@ -14759,20 +16938,24 @@ }, { "name": "Tiene-Yanzi (B.864)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ngongo", + "depth": 10, "iso_1_code": null, "iso_3_code": "noq", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6415", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6414", "native_tokenizers": [], @@ -14780,20 +16963,24 @@ }, { "name": "Tiene-Yanzi (B.865)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nzadi", + "depth": 10, "iso_1_code": null, "iso_3_code": "nzd", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6417", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6416", "native_tokenizers": [], @@ -14801,20 +16988,24 @@ }, { "name": "Tsogo (B.301)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Eviya", + "depth": 10, "iso_1_code": null, "iso_3_code": "gev", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6419", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6418", "native_tokenizers": [], @@ -14822,20 +17013,24 @@ }, { "name": "Tsogo (B.302)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Simba", + "depth": 10, "iso_1_code": null, "iso_3_code": "sbw", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6421", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6420", "native_tokenizers": [], @@ -14843,20 +17038,24 @@ }, { "name": "Tsogo (B.304)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Pinji", + "depth": 10, "iso_1_code": null, "iso_3_code": "pic", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6423", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6422", "native_tokenizers": [], @@ -14864,20 +17063,24 @@ }, { "name": "Tsogo (B.305)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bubi", + "depth": 10, "iso_1_code": null, "iso_3_code": "buw", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6425", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6424", "native_tokenizers": [], @@ -14885,20 +17088,24 @@ }, { "name": "Tsogo (B.31)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tsogo", + "depth": 10, "iso_1_code": null, "iso_3_code": "tsv", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6427", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6426", "native_tokenizers": [], @@ -14906,26 +17113,31 @@ }, { "name": "Tsogo (B.32)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kande", + "depth": 10, "iso_1_code": null, "iso_3_code": "kbs", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6429", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6428", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6320", "native_tokenizers": [], @@ -14933,19 +17145,23 @@ }, { "name": "C", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bangi-Ntomba (C.30)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bangala", + "depth": 10, "iso_1_code": null, "iso_3_code": "bxg", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6432", "native_tokenizers": [], @@ -14953,9 +17169,11 @@ }, { "name": "Lingala", + "depth": 10, "iso_1_code": "ln", "iso_3_code": "lin", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -14972,6 +17190,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -14987,20 +17206,24 @@ }, { "name": "Bangi-Ntomba (C.302)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bolondo", + "depth": 10, "iso_1_code": null, "iso_3_code": "bzm", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6435", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6434", "native_tokenizers": [], @@ -15008,14 +17231,17 @@ }, { "name": "Bangi-Ntomba (C.31)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Baloi", + "depth": 10, "iso_1_code": null, "iso_3_code": "biz", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6437", "native_tokenizers": [], @@ -15023,15 +17249,18 @@ }, { "name": "Likila", + "depth": 10, "iso_1_code": null, "iso_3_code": "lie", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6438", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6436", "native_tokenizers": [], @@ -15039,20 +17268,24 @@ }, { "name": "Bangi-Ntomba (C.311)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mabaale", + "depth": 10, "iso_1_code": null, "iso_3_code": "mmz", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6440", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6439", "native_tokenizers": [], @@ -15060,20 +17293,24 @@ }, { "name": "Bangi-Ntomba (C.312)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ndobo", + "depth": 10, "iso_1_code": null, "iso_3_code": "ndw", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6442", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6441", "native_tokenizers": [], @@ -15081,14 +17318,17 @@ }, { "name": "Bangi-Ntomba (C.32)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bangi", + "depth": 10, "iso_1_code": null, "iso_3_code": "bni", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6444", "native_tokenizers": [], @@ -15096,15 +17336,18 @@ }, { "name": "Moi", + "depth": 10, "iso_1_code": null, "iso_3_code": "mow", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6445", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6443", "native_tokenizers": [], @@ -15112,20 +17355,24 @@ }, { "name": "Bangi-Ntomba (C.321)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Libinza", + "depth": 10, "iso_1_code": null, "iso_3_code": "liz", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6447", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6446", "native_tokenizers": [], @@ -15133,20 +17380,24 @@ }, { "name": "Bangi-Ntomba (C.33)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Sengele", + "depth": 10, "iso_1_code": null, "iso_3_code": "szg", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6449", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6448", "native_tokenizers": [], @@ -15154,20 +17405,24 @@ }, { "name": "Bangi-Ntomba (C.34)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Sakata", + "depth": 10, "iso_1_code": null, "iso_3_code": "skt", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6451", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6450", "native_tokenizers": [], @@ -15175,14 +17430,17 @@ }, { "name": "Bangi-Ntomba (C.35)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bolia", + "depth": 10, "iso_1_code": null, "iso_3_code": "bli", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6453", "native_tokenizers": [], @@ -15190,15 +17448,18 @@ }, { "name": "Ntomba", + "depth": 10, "iso_1_code": null, "iso_3_code": "nto", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6454", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6452", "native_tokenizers": [], @@ -15206,14 +17467,17 @@ }, { "name": "Bangi-Ntomba (C.36)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Boloki", + "depth": 10, "iso_1_code": null, "iso_3_code": "bkt", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6456", "native_tokenizers": [], @@ -15221,9 +17485,11 @@ }, { "name": "Lusengo", + "depth": 10, "iso_1_code": null, "iso_3_code": "lse", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6457", "native_tokenizers": [], @@ -15231,9 +17497,11 @@ }, { "name": "Ndolo", + "depth": 10, "iso_1_code": null, "iso_3_code": "ndl", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6458", "native_tokenizers": [], @@ -15241,15 +17509,18 @@ }, { "name": "Yamongeri", + "depth": 10, "iso_1_code": null, "iso_3_code": "ymg", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6459", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6455", "native_tokenizers": [], @@ -15257,20 +17528,24 @@ }, { "name": "Bangi-Ntomba (C.37)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Budja", + "depth": 10, "iso_1_code": null, "iso_3_code": "bja", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6461", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6460", "native_tokenizers": [], @@ -15278,20 +17553,24 @@ }, { "name": "Bangi-Ntomba (C.371)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tembo", + "depth": 10, "iso_1_code": null, "iso_3_code": "tmv", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6463", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6462", "native_tokenizers": [], @@ -15299,20 +17578,24 @@ }, { "name": "Bushoong (C.81)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dengese", + "depth": 10, "iso_1_code": null, "iso_3_code": "dez", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6465", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6464", "native_tokenizers": [], @@ -15320,14 +17603,17 @@ }, { "name": "Bushoong (C.82)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ohendo", + "depth": 10, "iso_1_code": null, "iso_3_code": "soe", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -15344,6 +17630,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -15359,20 +17646,24 @@ }, { "name": "Bushoong (C.83)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bushoong", + "depth": 10, "iso_1_code": null, "iso_3_code": "buf", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6469", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6468", "native_tokenizers": [], @@ -15380,20 +17671,24 @@ }, { "name": "Bushoong (C.84)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Lele", + "depth": 10, "iso_1_code": null, "iso_3_code": "lel", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6471", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6470", "native_tokenizers": [], @@ -15401,20 +17696,24 @@ }, { "name": "Bushoong (C.85)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Wongo", + "depth": 10, "iso_1_code": null, "iso_3_code": "won", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6473", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6472", "native_tokenizers": [], @@ -15422,20 +17721,24 @@ }, { "name": "Mboshi (C.21)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mboko", + "depth": 10, "iso_1_code": null, "iso_3_code": "mdu", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6475", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6474", "native_tokenizers": [], @@ -15443,20 +17746,24 @@ }, { "name": "Mboshi (C.22)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Akwa", + "depth": 10, "iso_1_code": null, "iso_3_code": "akw", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6477", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6476", "native_tokenizers": [], @@ -15464,20 +17771,24 @@ }, { "name": "Mboshi (C.24)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Koyo", + "depth": 10, "iso_1_code": null, "iso_3_code": "koh", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6479", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6478", "native_tokenizers": [], @@ -15485,20 +17796,24 @@ }, { "name": "Mboshi (C.25)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mbosi", + "depth": 10, "iso_1_code": null, "iso_3_code": "mdw", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6481", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6480", "native_tokenizers": [], @@ -15506,20 +17821,24 @@ }, { "name": "Mboshi (C.26)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Likwala", + "depth": 10, "iso_1_code": null, "iso_3_code": "kwc", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6483", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6482", "native_tokenizers": [], @@ -15527,20 +17846,24 @@ }, { "name": "Mboshi (C.27)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Likuba", + "depth": 10, "iso_1_code": null, "iso_3_code": "kxx", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6485", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6484", "native_tokenizers": [], @@ -15548,14 +17871,17 @@ }, { "name": "Mongo-Nkundo (C.61)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mongo-Nkundu", + "depth": 10, "iso_1_code": null, "iso_3_code": "lol", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -15572,6 +17898,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -15587,20 +17914,24 @@ }, { "name": "Mongo-Nkundo (C.62)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Lalia", + "depth": 10, "iso_1_code": null, "iso_3_code": "lal", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6489", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6488", "native_tokenizers": [], @@ -15608,14 +17939,17 @@ }, { "name": "Mongo-Nkundo (C.63)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ngando", + "depth": 10, "iso_1_code": null, "iso_3_code": "nxd", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -15632,6 +17966,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -15647,20 +17982,24 @@ }, { "name": "Ngombe (C.401)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Pagibete", + "depth": 10, "iso_1_code": null, "iso_3_code": "pae", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6493", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6492", "native_tokenizers": [], @@ -15668,20 +18007,24 @@ }, { "name": "Ngombe (C.403)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kango", + "depth": 10, "iso_1_code": null, "iso_3_code": "kty", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6495", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6494", "native_tokenizers": [], @@ -15689,14 +18032,17 @@ }, { "name": "Ngombe (C.41)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ngombe", + "depth": 10, "iso_1_code": null, "iso_3_code": "ngc", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -15713,6 +18059,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -15728,20 +18075,24 @@ }, { "name": "Ngombe (C.411)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bomboma", + "depth": 10, "iso_1_code": null, "iso_3_code": "bws", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6499", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6498", "native_tokenizers": [], @@ -15749,20 +18100,24 @@ }, { "name": "Ngombe (C.412)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bamwe", + "depth": 10, "iso_1_code": null, "iso_3_code": "bmg", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6501", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6500", "native_tokenizers": [], @@ -15770,20 +18125,24 @@ }, { "name": "Ngombe (C.413)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dzando", + "depth": 10, "iso_1_code": null, "iso_3_code": "dzn", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6503", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6502", "native_tokenizers": [], @@ -15791,20 +18150,24 @@ }, { "name": "Ngombe (C.414)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ligenza", + "depth": 10, "iso_1_code": null, "iso_3_code": "lgz", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6505", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6504", "native_tokenizers": [], @@ -15812,20 +18175,24 @@ }, { "name": "Ngombe (C.42)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bwela", + "depth": 10, "iso_1_code": null, "iso_3_code": "bwl", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6507", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6506", "native_tokenizers": [], @@ -15833,20 +18200,24 @@ }, { "name": "Ngombe (C.44)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bwa", + "depth": 10, "iso_1_code": null, "iso_3_code": "bww", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6509", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6508", "native_tokenizers": [], @@ -15854,20 +18225,24 @@ }, { "name": "Ngombe (C.441)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Babango", + "depth": 10, "iso_1_code": null, "iso_3_code": "bbm", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6511", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6510", "native_tokenizers": [], @@ -15875,20 +18250,24 @@ }, { "name": "Ngombe (C.45)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ngelima", + "depth": 10, "iso_1_code": null, "iso_3_code": "agh", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6513", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6512", "native_tokenizers": [], @@ -15896,20 +18275,24 @@ }, { "name": "Ngondi (C.101)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dibole", + "depth": 10, "iso_1_code": null, "iso_3_code": "bvx", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6515", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6514", "native_tokenizers": [], @@ -15917,20 +18300,24 @@ }, { "name": "Ngondi (C.102)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ngando", + "depth": 10, "iso_1_code": null, "iso_3_code": "ngd", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6517", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6516", "native_tokenizers": [], @@ -15938,20 +18325,24 @@ }, { "name": "Ngondi (C.104)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Yaka", + "depth": 10, "iso_1_code": null, "iso_3_code": "axk", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6519", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6518", "native_tokenizers": [], @@ -15959,20 +18350,24 @@ }, { "name": "Ngondi (C.11)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ngundi", + "depth": 10, "iso_1_code": null, "iso_3_code": "ndn", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6521", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6520", "native_tokenizers": [], @@ -15980,20 +18375,24 @@ }, { "name": "Ngondi (C.12)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Pande", + "depth": 10, "iso_1_code": null, "iso_3_code": "bkj", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6523", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6522", "native_tokenizers": [], @@ -16001,20 +18400,24 @@ }, { "name": "Ngondi (C.13)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mbati", + "depth": 10, "iso_1_code": null, "iso_3_code": "mdn", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6525", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6524", "native_tokenizers": [], @@ -16022,20 +18425,24 @@ }, { "name": "Ngondi (C.14)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bomitaba", + "depth": 10, "iso_1_code": null, "iso_3_code": "zmx", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6527", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6526", "native_tokenizers": [], @@ -16043,20 +18450,24 @@ }, { "name": "Ngondi (C.143)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bonjo", + "depth": 10, "iso_1_code": null, "iso_3_code": "bok", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6529", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6528", "native_tokenizers": [], @@ -16064,20 +18475,24 @@ }, { "name": "Ngondi (C.15)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bongili", + "depth": 10, "iso_1_code": null, "iso_3_code": "bui", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6531", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6530", "native_tokenizers": [], @@ -16085,14 +18500,17 @@ }, { "name": "Ngondi (C.16)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Boko", + "depth": 10, "iso_1_code": null, "iso_3_code": "bkp", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6533", "native_tokenizers": [], @@ -16100,9 +18518,11 @@ }, { "name": "Lobala", + "depth": 10, "iso_1_code": null, "iso_3_code": "loq", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -16119,6 +18539,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -16134,20 +18555,24 @@ }, { "name": "Ngondi (C.161)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bomboli", + "depth": 10, "iso_1_code": null, "iso_3_code": "bml", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6536", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6535", "native_tokenizers": [], @@ -16155,20 +18580,24 @@ }, { "name": "Ngondi (C.162)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bozaba", + "depth": 10, "iso_1_code": null, "iso_3_code": "bzo", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6538", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6537", "native_tokenizers": [], @@ -16176,20 +18605,24 @@ }, { "name": "Soko-Kele (C.51)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mbesa", + "depth": 10, "iso_1_code": null, "iso_3_code": "zms", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6540", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6539", "native_tokenizers": [], @@ -16197,20 +18630,24 @@ }, { "name": "Soko-Kele (C.52)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "So", + "depth": 10, "iso_1_code": null, "iso_3_code": "soc", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6542", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6541", "native_tokenizers": [], @@ -16218,20 +18655,24 @@ }, { "name": "Soko-Kele (C.53)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Poke", + "depth": 10, "iso_1_code": null, "iso_3_code": "pof", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6544", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6543", "native_tokenizers": [], @@ -16239,20 +18680,24 @@ }, { "name": "Soko-Kele (C.54)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Lombo", + "depth": 10, "iso_1_code": null, "iso_3_code": "loo", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6546", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6545", "native_tokenizers": [], @@ -16260,14 +18705,17 @@ }, { "name": "Soko-Kele (C.55)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kele", + "depth": 10, "iso_1_code": null, "iso_3_code": "khy", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -16284,6 +18732,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -16299,20 +18748,24 @@ }, { "name": "Soko-Kele (C.56)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Foma", + "depth": 10, "iso_1_code": null, "iso_3_code": "fom", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6550", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6549", "native_tokenizers": [], @@ -16320,14 +18773,17 @@ }, { "name": "Tetela (C.71)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Hamba", + "depth": 10, "iso_1_code": null, "iso_3_code": "hba", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6552", "native_tokenizers": [], @@ -16335,9 +18791,11 @@ }, { "name": "Tetela", + "depth": 10, "iso_1_code": null, "iso_3_code": "tll", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -16354,6 +18812,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -16369,20 +18828,24 @@ }, { "name": "Tetela (C.72)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kusu", + "depth": 10, "iso_1_code": null, "iso_3_code": "ksv", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6555", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6554", "native_tokenizers": [], @@ -16390,20 +18853,24 @@ }, { "name": "Tetela (C.73)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nkutu", + "depth": 10, "iso_1_code": null, "iso_3_code": "nkw", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6557", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6556", "native_tokenizers": [], @@ -16411,9 +18878,11 @@ }, { "name": "Tetela (C.74)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -16429,20 +18898,24 @@ }, { "name": "Tetela (C.75)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kela", + "depth": 10, "iso_1_code": null, "iso_3_code": "kel", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6560", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6559", "native_tokenizers": [], @@ -16450,26 +18923,31 @@ }, { "name": "Tetela (C.76)", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ombo", + "depth": 10, "iso_1_code": null, "iso_3_code": "oml", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6562", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6561", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -16484,6 +18962,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -16498,6 +18977,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -16513,20 +18993,24 @@ }, { "name": "Ndemli", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ndemli", + "depth": 7, "iso_1_code": null, "iso_3_code": "nml", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6564", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6563", "native_tokenizers": [], @@ -16534,14 +19018,17 @@ }, { "name": "Tikar", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tikar", + "depth": 7, "iso_1_code": null, "iso_3_code": "tik", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -16558,6 +19045,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -16573,14 +19061,17 @@ }, { "name": "Tivoid", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Abon", + "depth": 7, "iso_1_code": null, "iso_3_code": "abo", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6568", "native_tokenizers": [], @@ -16588,9 +19079,11 @@ }, { "name": "Esimbi", + "depth": 7, "iso_1_code": null, "iso_3_code": "ags", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6569", "native_tokenizers": [], @@ -16598,9 +19091,11 @@ }, { "name": "Ambo", + "depth": 7, "iso_1_code": null, "iso_3_code": "amb", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6570", "native_tokenizers": [], @@ -16608,9 +19103,11 @@ }, { "name": "Ipulo", + "depth": 7, "iso_1_code": null, "iso_3_code": "ass", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6571", "native_tokenizers": [], @@ -16618,9 +19115,11 @@ }, { "name": "Iceve-Maci", + "depth": 7, "iso_1_code": null, "iso_3_code": "bec", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6572", "native_tokenizers": [], @@ -16628,9 +19127,11 @@ }, { "name": "Balo", + "depth": 7, "iso_1_code": null, "iso_3_code": "bqo", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6573", "native_tokenizers": [], @@ -16638,9 +19139,11 @@ }, { "name": "Bitare", + "depth": 7, "iso_1_code": null, "iso_3_code": "brt", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6574", "native_tokenizers": [], @@ -16648,9 +19151,11 @@ }, { "name": "Batu", + "depth": 7, "iso_1_code": null, "iso_3_code": "btu", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6575", "native_tokenizers": [], @@ -16658,9 +19163,11 @@ }, { "name": "Evant", + "depth": 7, "iso_1_code": null, "iso_3_code": "bzz", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6576", "native_tokenizers": [], @@ -16668,9 +19175,11 @@ }, { "name": "Caka", + "depth": 7, "iso_1_code": null, "iso_3_code": "ckx", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6577", "native_tokenizers": [], @@ -16678,9 +19187,11 @@ }, { "name": "Eman", + "depth": 7, "iso_1_code": null, "iso_3_code": "emn", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6578", "native_tokenizers": [], @@ -16688,9 +19199,11 @@ }, { "name": "Mesaka", + "depth": 7, "iso_1_code": null, "iso_3_code": "iyo", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6579", "native_tokenizers": [], @@ -16698,9 +19211,11 @@ }, { "name": "Manta", + "depth": 7, "iso_1_code": null, "iso_3_code": "myg", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6580", "native_tokenizers": [], @@ -16708,9 +19223,11 @@ }, { "name": "Osatu", + "depth": 7, "iso_1_code": null, "iso_3_code": "ost", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6581", "native_tokenizers": [], @@ -16718,9 +19235,11 @@ }, { "name": "Tiv", + "depth": 7, "iso_1_code": null, "iso_3_code": "tiv", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -16738,9 +19257,11 @@ }, { "name": "Iyive", + "depth": 7, "iso_1_code": null, "iso_3_code": "uiv", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6583", "native_tokenizers": [], @@ -16748,15 +19269,18 @@ }, { "name": "Itang", + "depth": 7, "iso_1_code": null, "iso_3_code": "uta", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6584", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -16772,14 +19296,17 @@ }, { "name": "Unclassified", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Busuu", + "depth": 7, "iso_1_code": null, "iso_3_code": "bju", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6586", "native_tokenizers": [], @@ -16787,9 +19314,11 @@ }, { "name": "Bishuo", + "depth": 7, "iso_1_code": null, "iso_3_code": "bwh", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6587", "native_tokenizers": [], @@ -16797,9 +19326,11 @@ }, { "name": "Bikya", + "depth": 7, "iso_1_code": null, "iso_3_code": "byb", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6588", "native_tokenizers": [], @@ -16807,15 +19338,18 @@ }, { "name": "Moingi", + "depth": 7, "iso_1_code": null, "iso_3_code": "mwz", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6589", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6585", "native_tokenizers": [], @@ -16823,25 +19357,30 @@ }, { "name": "Wide Grassfields", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Menchum", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Befang", + "depth": 8, "iso_1_code": null, "iso_3_code": "bby", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6592", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6591", "native_tokenizers": [], @@ -16849,14 +19388,17 @@ }, { "name": "Narrow Grassfields", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Fum", + "depth": 8, "iso_1_code": null, "iso_3_code": "fum", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6594", "native_tokenizers": [], @@ -16864,19 +19406,23 @@ }, { "name": "Mbam-Nkam", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bamileke", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ghom\u00e1l\u00e1\u2019", + "depth": 10, "iso_1_code": null, "iso_3_code": "bbj", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -16894,9 +19440,11 @@ }, { "name": "Kwa\u2019", + "depth": 10, "iso_1_code": null, "iso_3_code": "bko", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6598", "native_tokenizers": [], @@ -16904,9 +19452,11 @@ }, { "name": "Fe\u2019fe\u2019", + "depth": 10, "iso_1_code": null, "iso_3_code": "fmp", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6599", "native_tokenizers": [], @@ -16914,9 +19464,11 @@ }, { "name": "Ngomba", + "depth": 10, "iso_1_code": null, "iso_3_code": "jgo", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6600", "native_tokenizers": [], @@ -16924,9 +19476,11 @@ }, { "name": "Ngombale", + "depth": 10, "iso_1_code": null, "iso_3_code": "nla", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -16944,9 +19498,11 @@ }, { "name": "Ngiemboon", + "depth": 10, "iso_1_code": null, "iso_3_code": "nnh", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -16964,9 +19520,11 @@ }, { "name": "Nda\u2019nda\u2019", + "depth": 10, "iso_1_code": null, "iso_3_code": "nnz", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6603", "native_tokenizers": [], @@ -16974,9 +19532,11 @@ }, { "name": "Ngwe", + "depth": 10, "iso_1_code": null, "iso_3_code": "nwe", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6604", "native_tokenizers": [], @@ -16984,9 +19544,11 @@ }, { "name": "Mengaka", + "depth": 10, "iso_1_code": null, "iso_3_code": "xmg", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6605", "native_tokenizers": [], @@ -16994,9 +19556,11 @@ }, { "name": "Yemba", + "depth": 10, "iso_1_code": null, "iso_3_code": "ybb", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -17013,6 +19577,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -17028,14 +19593,17 @@ }, { "name": "Ngemba", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Awing", + "depth": 10, "iso_1_code": null, "iso_3_code": "azo", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6608", "native_tokenizers": [], @@ -17043,9 +19611,11 @@ }, { "name": "Bambili-Bambui", + "depth": 10, "iso_1_code": null, "iso_3_code": "baw", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6609", "native_tokenizers": [], @@ -17053,9 +19623,11 @@ }, { "name": "Bafut", + "depth": 10, "iso_1_code": null, "iso_3_code": "bfd", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -17073,9 +19645,11 @@ }, { "name": "Beba", + "depth": 10, "iso_1_code": null, "iso_3_code": "bfp", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6611", "native_tokenizers": [], @@ -17083,9 +19657,11 @@ }, { "name": "Mankong", + "depth": 10, "iso_1_code": null, "iso_3_code": "bqt", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6612", "native_tokenizers": [], @@ -17093,9 +19669,11 @@ }, { "name": "Kpati", + "depth": 10, "iso_1_code": null, "iso_3_code": "koc", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6613", "native_tokenizers": [], @@ -17103,9 +19681,11 @@ }, { "name": "Mendankwe-Nkwen", + "depth": 10, "iso_1_code": null, "iso_3_code": "mfd", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6614", "native_tokenizers": [], @@ -17113,9 +19693,11 @@ }, { "name": "Ngemba", + "depth": 10, "iso_1_code": null, "iso_3_code": "nge", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6615", "native_tokenizers": [], @@ -17123,9 +19705,11 @@ }, { "name": "Pinyin", + "depth": 10, "iso_1_code": null, "iso_3_code": "pny", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -17142,6 +19726,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -17157,14 +19742,17 @@ }, { "name": "Nkambe", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Lidzonka", + "depth": 10, "iso_1_code": null, "iso_3_code": "add", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6618", "native_tokenizers": [], @@ -17172,9 +19760,11 @@ }, { "name": "Kwaja", + "depth": 10, "iso_1_code": null, "iso_3_code": "kdz", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6619", "native_tokenizers": [], @@ -17182,9 +19772,11 @@ }, { "name": "Limbum", + "depth": 10, "iso_1_code": null, "iso_3_code": "lmp", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -17202,9 +19794,11 @@ }, { "name": "Mbo\u2019", + "depth": 10, "iso_1_code": null, "iso_3_code": "mtk", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6621", "native_tokenizers": [], @@ -17212,9 +19806,11 @@ }, { "name": "Mfumte", + "depth": 10, "iso_1_code": null, "iso_3_code": "nfu", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6622", "native_tokenizers": [], @@ -17222,9 +19818,11 @@ }, { "name": "Yamba", + "depth": 10, "iso_1_code": null, "iso_3_code": "yam", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -17241,6 +19839,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -17256,14 +19855,17 @@ }, { "name": "Nun", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bamun", + "depth": 10, "iso_1_code": null, "iso_3_code": "bax", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6625", "native_tokenizers": [], @@ -17271,9 +19873,11 @@ }, { "name": "Chopechop", + "depth": 10, "iso_1_code": null, "iso_3_code": "bbq", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6626", "native_tokenizers": [], @@ -17281,9 +19885,11 @@ }, { "name": "Supapya", + "depth": 10, "iso_1_code": null, "iso_3_code": "bbw", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6627", "native_tokenizers": [], @@ -17291,9 +19897,11 @@ }, { "name": "Mengambo", + "depth": 10, "iso_1_code": null, "iso_3_code": "bce", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6628", "native_tokenizers": [], @@ -17301,9 +19909,11 @@ }, { "name": "Chufie\u2019", + "depth": 10, "iso_1_code": null, "iso_3_code": "bfj", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6629", "native_tokenizers": [], @@ -17311,9 +19921,11 @@ }, { "name": "Mendenkye", + "depth": 10, "iso_1_code": null, "iso_3_code": "bgj", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6630", "native_tokenizers": [], @@ -17321,9 +19933,11 @@ }, { "name": "Chrambo", + "depth": 10, "iso_1_code": null, "iso_3_code": "bmo", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6631", "native_tokenizers": [], @@ -17331,9 +19945,11 @@ }, { "name": "Medumba", + "depth": 10, "iso_1_code": null, "iso_3_code": "byv", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -17351,15 +19967,18 @@ }, { "name": "Mungaka", + "depth": 10, "iso_1_code": null, "iso_3_code": "mhk", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6633", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -17374,6 +19993,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -17389,14 +20009,17 @@ }, { "name": "Momo", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Menka", + "depth": 9, "iso_1_code": null, "iso_3_code": "mea", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6635", "native_tokenizers": [], @@ -17404,9 +20027,11 @@ }, { "name": "Meta\u2019", + "depth": 9, "iso_1_code": null, "iso_3_code": "mgo", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -17424,9 +20049,11 @@ }, { "name": "Mundani", + "depth": 9, "iso_1_code": null, "iso_3_code": "mnf", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -17444,9 +20071,11 @@ }, { "name": "Ngamambo", + "depth": 9, "iso_1_code": null, "iso_3_code": "nbv", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6638", "native_tokenizers": [], @@ -17454,9 +20083,11 @@ }, { "name": "Ngie", + "depth": 9, "iso_1_code": null, "iso_3_code": "ngj", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6639", "native_tokenizers": [], @@ -17464,9 +20095,11 @@ }, { "name": "Ngwo", + "depth": 9, "iso_1_code": null, "iso_3_code": "ngn", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6640", "native_tokenizers": [], @@ -17474,9 +20107,11 @@ }, { "name": "Njen", + "depth": 9, "iso_1_code": null, "iso_3_code": "njj", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6641", "native_tokenizers": [], @@ -17484,15 +20119,18 @@ }, { "name": "Ngoshie", + "depth": 9, "iso_1_code": null, "iso_3_code": "nsh", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6642", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -17508,19 +20146,23 @@ }, { "name": "Ring", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Center", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Babanki", + "depth": 10, "iso_1_code": null, "iso_3_code": "bbk", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -17538,9 +20180,11 @@ }, { "name": "Mmen", + "depth": 10, "iso_1_code": null, "iso_3_code": "bfm", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6646", "native_tokenizers": [], @@ -17548,9 +20192,11 @@ }, { "name": "Kom", + "depth": 10, "iso_1_code": null, "iso_3_code": "bkm", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6647", "native_tokenizers": [], @@ -17558,9 +20204,11 @@ }, { "name": "Bum", + "depth": 10, "iso_1_code": null, "iso_3_code": "bmv", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -17578,9 +20226,11 @@ }, { "name": "Mbessa", + "depth": 10, "iso_1_code": null, "iso_3_code": "emz", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6649", "native_tokenizers": [], @@ -17588,9 +20238,11 @@ }, { "name": "Kung", + "depth": 10, "iso_1_code": null, "iso_3_code": "kfl", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6650", "native_tokenizers": [], @@ -17598,9 +20250,11 @@ }, { "name": "Kuk", + "depth": 10, "iso_1_code": null, "iso_3_code": "kfn", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6651", "native_tokenizers": [], @@ -17608,9 +20262,11 @@ }, { "name": "Oku", + "depth": 10, "iso_1_code": null, "iso_3_code": "oku", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -17627,6 +20283,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -17642,20 +20299,24 @@ }, { "name": "East", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Lamnso\u02bc", + "depth": 10, "iso_1_code": null, "iso_3_code": "lns", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6654", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6653", "native_tokenizers": [], @@ -17663,14 +20324,17 @@ }, { "name": "South", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Vengo", + "depth": 10, "iso_1_code": null, "iso_3_code": "bav", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -17688,9 +20352,11 @@ }, { "name": "Wushi", + "depth": 10, "iso_1_code": null, "iso_3_code": "bse", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6657", "native_tokenizers": [], @@ -17698,9 +20364,11 @@ }, { "name": "Ngiemekohke", + "depth": 10, "iso_1_code": null, "iso_3_code": "bvm", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6658", "native_tokenizers": [], @@ -17708,15 +20376,18 @@ }, { "name": "Kenswei Nsei", + "depth": 10, "iso_1_code": null, "iso_3_code": "ndb", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6659", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -17732,14 +20403,17 @@ }, { "name": "West", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Aghem", + "depth": 10, "iso_1_code": null, "iso_3_code": "agq", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6661", "native_tokenizers": [], @@ -17747,9 +20421,11 @@ }, { "name": "Isu", + "depth": 10, "iso_1_code": null, "iso_3_code": "isu", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6662", "native_tokenizers": [], @@ -17757,9 +20433,11 @@ }, { "name": "Laimbue", + "depth": 10, "iso_1_code": null, "iso_3_code": "lmx", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6663", "native_tokenizers": [], @@ -17767,9 +20445,11 @@ }, { "name": "Weh", + "depth": 10, "iso_1_code": null, "iso_3_code": "weh", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6664", "native_tokenizers": [], @@ -17777,21 +20457,25 @@ }, { "name": "Zhoa", + "depth": 10, "iso_1_code": null, "iso_3_code": "zhw", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6665", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6660", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -17807,14 +20491,17 @@ }, { "name": "Unclassified", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nde-Gbite", + "depth": 9, "iso_1_code": null, "iso_3_code": "ned", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6667", "native_tokenizers": [], @@ -17822,21 +20509,25 @@ }, { "name": "Viti", + "depth": 9, "iso_1_code": null, "iso_3_code": "vit", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6668", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6666", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -17852,14 +20543,17 @@ }, { "name": "Western Momo", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ambele", + "depth": 8, "iso_1_code": null, "iso_3_code": "ael", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6670", "native_tokenizers": [], @@ -17867,9 +20561,11 @@ }, { "name": "Atong", + "depth": 8, "iso_1_code": null, "iso_3_code": "ato", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6671", "native_tokenizers": [], @@ -17877,21 +20573,25 @@ }, { "name": "Busam", + "depth": 8, "iso_1_code": null, "iso_3_code": "bxs", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6672", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6669", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -17907,14 +20607,17 @@ }, { "name": "Yemne-Kimbi", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mundabli", + "depth": 7, "iso_1_code": null, "iso_3_code": "boe", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6674", "native_tokenizers": [], @@ -17922,9 +20625,11 @@ }, { "name": "Fang", + "depth": 7, "iso_1_code": null, "iso_3_code": "fak", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6675", "native_tokenizers": [], @@ -17932,9 +20637,11 @@ }, { "name": "Koshin", + "depth": 7, "iso_1_code": null, "iso_3_code": "kid", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6676", "native_tokenizers": [], @@ -17942,9 +20649,11 @@ }, { "name": "Mungbam", + "depth": 7, "iso_1_code": null, "iso_3_code": "mij", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6677", "native_tokenizers": [], @@ -17952,21 +20661,25 @@ }, { "name": "Ajumbu", + "depth": 7, "iso_1_code": null, "iso_3_code": "muc", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6678", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6673", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -17982,14 +20695,17 @@ }, { "name": "Unclassified", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "\u00c1nc\u00e1", + "depth": 6, "iso_1_code": null, "iso_3_code": "acb", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6680", "native_tokenizers": [], @@ -17997,21 +20713,25 @@ }, { "name": "Buru", + "depth": 6, "iso_1_code": null, "iso_3_code": "bqw", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6681", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6679", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -18027,19 +20747,23 @@ }, { "name": "Cross River", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bendi", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Utugwang-Irungene-Afrike", + "depth": 6, "iso_1_code": null, "iso_3_code": "afe", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6684", "native_tokenizers": [], @@ -18047,9 +20771,11 @@ }, { "name": "Elege", + "depth": 6, "iso_1_code": null, "iso_3_code": "alf", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6685", "native_tokenizers": [], @@ -18057,9 +20783,11 @@ }, { "name": "Bekwarra", + "depth": 6, "iso_1_code": null, "iso_3_code": "bkv", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -18077,9 +20805,11 @@ }, { "name": "Bokyi", + "depth": 6, "iso_1_code": null, "iso_3_code": "bky", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6687", "native_tokenizers": [], @@ -18087,9 +20817,11 @@ }, { "name": "Bete-Bendi", + "depth": 6, "iso_1_code": null, "iso_3_code": "btt", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -18107,9 +20839,11 @@ }, { "name": "Bumaji", + "depth": 6, "iso_1_code": null, "iso_3_code": "byp", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6689", "native_tokenizers": [], @@ -18117,9 +20851,11 @@ }, { "name": "Abanglekuo", + "depth": 6, "iso_1_code": null, "iso_3_code": "bzy", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6690", "native_tokenizers": [], @@ -18127,9 +20863,11 @@ }, { "name": "Ubang", + "depth": 6, "iso_1_code": null, "iso_3_code": "uba", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6691", "native_tokenizers": [], @@ -18137,15 +20875,18 @@ }, { "name": "Bukpe", + "depth": 6, "iso_1_code": null, "iso_3_code": "ukp", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6692", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -18161,19 +20902,23 @@ }, { "name": "Delta Cross", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Central Delta", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Abureni", + "depth": 7, "iso_1_code": null, "iso_3_code": "mgj", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6695", "native_tokenizers": [], @@ -18181,9 +20926,11 @@ }, { "name": "Obulom", + "depth": 7, "iso_1_code": null, "iso_3_code": "obu", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6696", "native_tokenizers": [], @@ -18191,9 +20938,11 @@ }, { "name": "Ogbia", + "depth": 7, "iso_1_code": null, "iso_3_code": "ogb", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6697", "native_tokenizers": [], @@ -18201,9 +20950,11 @@ }, { "name": "Ogbogolo", + "depth": 7, "iso_1_code": null, "iso_3_code": "ogg", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6698", "native_tokenizers": [], @@ -18211,9 +20962,11 @@ }, { "name": "Ogbronuagum", + "depth": 7, "iso_1_code": null, "iso_3_code": "ogu", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6699", "native_tokenizers": [], @@ -18221,9 +20974,11 @@ }, { "name": "O\u2019chi\u2019chi\u2019", + "depth": 7, "iso_1_code": null, "iso_3_code": "xoc", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6700", "native_tokenizers": [], @@ -18231,14 +20986,17 @@ }, { "name": "Abua-Odual", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Abua", + "depth": 8, "iso_1_code": null, "iso_3_code": "abn", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -18256,15 +21014,18 @@ }, { "name": "Odual", + "depth": 8, "iso_1_code": null, "iso_3_code": "odu", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6703", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -18280,26 +21041,31 @@ }, { "name": "Kugbo", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kugbo", + "depth": 8, "iso_1_code": null, "iso_3_code": "kes", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6705", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6704", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -18315,19 +21081,23 @@ }, { "name": "Lower Cross", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Obolo", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Obolo", + "depth": 8, "iso_1_code": null, "iso_3_code": "ann", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -18345,9 +21115,11 @@ }, { "name": "Eki", + "depth": 8, "iso_1_code": null, "iso_3_code": "eki", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6709", "native_tokenizers": [], @@ -18355,9 +21127,11 @@ }, { "name": "Idere", + "depth": 8, "iso_1_code": null, "iso_3_code": "ide", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6710", "native_tokenizers": [], @@ -18365,20 +21139,24 @@ }, { "name": "Ebughu", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ebughu", + "depth": 9, "iso_1_code": null, "iso_3_code": "ebg", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6712", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6711", "native_tokenizers": [], @@ -18386,20 +21164,24 @@ }, { "name": "Efai", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Efai", + "depth": 9, "iso_1_code": null, "iso_3_code": "efa", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6714", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6713", "native_tokenizers": [], @@ -18407,14 +21189,17 @@ }, { "name": "Efik", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Anaang", + "depth": 9, "iso_1_code": null, "iso_3_code": "anw", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6716", "native_tokenizers": [], @@ -18422,9 +21207,11 @@ }, { "name": "Efik", + "depth": 9, "iso_1_code": null, "iso_3_code": "efi", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -18442,9 +21229,11 @@ }, { "name": "Ibibio", + "depth": 9, "iso_1_code": null, "iso_3_code": "ibb", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6718", "native_tokenizers": [], @@ -18452,15 +21241,18 @@ }, { "name": "Ukwa", + "depth": 9, "iso_1_code": null, "iso_3_code": "ukq", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6719", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -18476,14 +21268,17 @@ }, { "name": "Ekit", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ekit", + "depth": 9, "iso_1_code": null, "iso_3_code": "eke", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6721", "native_tokenizers": [], @@ -18491,15 +21286,18 @@ }, { "name": "Etebi", + "depth": 9, "iso_1_code": null, "iso_3_code": "etb", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6722", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6720", "native_tokenizers": [], @@ -18507,14 +21305,17 @@ }, { "name": "Enwang-Uda", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Enwan", + "depth": 9, "iso_1_code": null, "iso_3_code": "enw", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6724", "native_tokenizers": [], @@ -18522,15 +21323,18 @@ }, { "name": "Uda", + "depth": 9, "iso_1_code": null, "iso_3_code": "uda", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6725", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6723", "native_tokenizers": [], @@ -18538,20 +21342,24 @@ }, { "name": "Ibino", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ibino", + "depth": 9, "iso_1_code": null, "iso_3_code": "ibn", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6727", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6726", "native_tokenizers": [], @@ -18559,14 +21367,17 @@ }, { "name": "Ibuoro", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ibuoro", + "depth": 9, "iso_1_code": null, "iso_3_code": "ibr", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6729", "native_tokenizers": [], @@ -18574,9 +21385,11 @@ }, { "name": "Itu Mbon Uzo", + "depth": 9, "iso_1_code": null, "iso_3_code": "itm", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6730", "native_tokenizers": [], @@ -18584,9 +21397,11 @@ }, { "name": "Ito", + "depth": 9, "iso_1_code": null, "iso_3_code": "itw", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6731", "native_tokenizers": [], @@ -18594,15 +21409,18 @@ }, { "name": "Nkari", + "depth": 9, "iso_1_code": null, "iso_3_code": "nkz", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6732", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6728", "native_tokenizers": [], @@ -18610,20 +21428,24 @@ }, { "name": "Iko", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Iko", + "depth": 9, "iso_1_code": null, "iso_3_code": "iki", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6734", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6733", "native_tokenizers": [], @@ -18631,20 +21453,24 @@ }, { "name": "Ilue", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ilue", + "depth": 9, "iso_1_code": null, "iso_3_code": "ilv", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6736", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6735", "native_tokenizers": [], @@ -18652,20 +21478,24 @@ }, { "name": "Okobo", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Okobo", + "depth": 9, "iso_1_code": null, "iso_3_code": "okb", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6738", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6737", "native_tokenizers": [], @@ -18673,20 +21503,24 @@ }, { "name": "Oro", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Oro", + "depth": 9, "iso_1_code": null, "iso_3_code": "orx", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6740", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6739", "native_tokenizers": [], @@ -18694,26 +21528,31 @@ }, { "name": "Usaghade", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Usaghade", + "depth": 9, "iso_1_code": null, "iso_3_code": "usk", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6742", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6741", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -18728,6 +21567,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -18743,19 +21583,23 @@ }, { "name": "Ogoni", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "East", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Gokana", + "depth": 8, "iso_1_code": null, "iso_3_code": "gkn", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -18773,9 +21617,11 @@ }, { "name": "Khana", + "depth": 8, "iso_1_code": null, "iso_3_code": "ogo", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -18793,15 +21639,18 @@ }, { "name": "T\u00e8\u00e8\u0323 \u0323", + "depth": 8, "iso_1_code": null, "iso_3_code": "tkq", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6747", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -18817,14 +21666,17 @@ }, { "name": "West", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Baan", + "depth": 8, "iso_1_code": null, "iso_3_code": "bvj", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6749", "native_tokenizers": [], @@ -18832,21 +21684,25 @@ }, { "name": "Eleme", + "depth": 8, "iso_1_code": null, "iso_3_code": "elm", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6750", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6748", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -18862,19 +21718,23 @@ }, { "name": "Upper Cross", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Agoi-Doko-Iyoniyong", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Iyongiyong", + "depth": 8, "iso_1_code": null, "iso_3_code": "bbs", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6753", "native_tokenizers": [], @@ -18882,9 +21742,11 @@ }, { "name": "Robambami", + "depth": 8, "iso_1_code": null, "iso_3_code": "ibm", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6754", "native_tokenizers": [], @@ -18892,15 +21754,18 @@ }, { "name": "Deko-Dusanga", + "depth": 8, "iso_1_code": null, "iso_3_code": "uya", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6755", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6752", "native_tokenizers": [], @@ -18908,20 +21773,24 @@ }, { "name": "Akpet", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ukpet-Ehom", + "depth": 8, "iso_1_code": null, "iso_3_code": "akd", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6757", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6756", "native_tokenizers": [], @@ -18929,30 +21798,36 @@ }, { "name": "Central", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "East-West", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ikom", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Olulumo-Ikom", + "depth": 10, "iso_1_code": null, "iso_3_code": "iko", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6761", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6760", "native_tokenizers": [], @@ -18960,14 +21835,17 @@ }, { "name": "Loko", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Lubila", + "depth": 10, "iso_1_code": null, "iso_3_code": "kcc", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6763", "native_tokenizers": [], @@ -18975,9 +21853,11 @@ }, { "name": "Nkukoli", + "depth": 10, "iso_1_code": null, "iso_3_code": "nbo", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6764", "native_tokenizers": [], @@ -18985,9 +21865,11 @@ }, { "name": "Lokaa", + "depth": 10, "iso_1_code": null, "iso_3_code": "yaz", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -19004,6 +21886,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -19019,19 +21902,23 @@ }, { "name": "Mbembe-Legbo", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Legbo", + "depth": 10, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Legbo", + "depth": 11, "iso_1_code": null, "iso_3_code": "agb", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6768", "native_tokenizers": [], @@ -19039,9 +21926,11 @@ }, { "name": "Leyigha", + "depth": 11, "iso_1_code": null, "iso_3_code": "ayi", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6769", "native_tokenizers": [], @@ -19049,15 +21938,18 @@ }, { "name": "Lenyima", + "depth": 11, "iso_1_code": null, "iso_3_code": "ldg", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6770", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6767", "native_tokenizers": [], @@ -19065,32 +21957,38 @@ }, { "name": "Mbembe", + "depth": 10, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mbembe, Cross River", + "depth": 11, "iso_1_code": null, "iso_3_code": "mfn", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6772", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6771", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6766", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -19106,30 +22004,36 @@ }, { "name": "North-South", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Koring-Kukele", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Koring", + "depth": 10, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Oring", + "depth": 11, "iso_1_code": null, "iso_3_code": "org", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6776", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6775", "native_tokenizers": [], @@ -19137,14 +22041,17 @@ }, { "name": "Kukele", + "depth": 10, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Uzekwe", + "depth": 11, "iso_1_code": null, "iso_3_code": "eze", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6778", "native_tokenizers": [], @@ -19152,9 +22059,11 @@ }, { "name": "Kukele", + "depth": 11, "iso_1_code": null, "iso_3_code": "kez", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -19171,6 +22080,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -19185,6 +22095,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -19200,19 +22111,23 @@ }, { "name": "Ubaghara-Kohumono", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kohumono", + "depth": 10, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Hohumono", + "depth": 11, "iso_1_code": null, "iso_3_code": "bcs", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6782", "native_tokenizers": [], @@ -19220,9 +22135,11 @@ }, { "name": "Umon", + "depth": 11, "iso_1_code": null, "iso_3_code": "umm", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6783", "native_tokenizers": [], @@ -19230,15 +22147,18 @@ }, { "name": "Agwagwune", + "depth": 11, "iso_1_code": null, "iso_3_code": "yay", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6784", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6781", "native_tokenizers": [], @@ -19246,32 +22166,38 @@ }, { "name": "Ubaghara", + "depth": 10, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ubaghara", + "depth": 11, "iso_1_code": null, "iso_3_code": "byc", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6786", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6785", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6780", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -19286,6 +22212,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -19301,14 +22228,17 @@ }, { "name": "Kiong-Korop", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kiong", + "depth": 8, "iso_1_code": null, "iso_3_code": "kkm", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6788", "native_tokenizers": [], @@ -19316,9 +22246,11 @@ }, { "name": "Durop", + "depth": 8, "iso_1_code": null, "iso_3_code": "krp", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6789", "native_tokenizers": [], @@ -19326,21 +22258,25 @@ }, { "name": "Odut", + "depth": 8, "iso_1_code": null, "iso_3_code": "oda", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6790", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6787", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -19355,6 +22291,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -19369,6 +22306,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -19384,25 +22322,30 @@ }, { "name": "Defoid", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Akokoid", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Arigidi", + "depth": 6, "iso_1_code": null, "iso_3_code": "aqg", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6793", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6792", "native_tokenizers": [], @@ -19410,14 +22353,17 @@ }, { "name": "Ayere-Ahan", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "\u00c0h\u00e0n", + "depth": 6, "iso_1_code": null, "iso_3_code": "ahn", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6795", "native_tokenizers": [], @@ -19425,15 +22371,18 @@ }, { "name": "Ayere", + "depth": 6, "iso_1_code": null, "iso_3_code": "aye", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6796", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6794", "native_tokenizers": [], @@ -19441,19 +22390,23 @@ }, { "name": "Yoruboid", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Edekiri", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ede Cabe", + "depth": 7, "iso_1_code": null, "iso_3_code": "cbj", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6799", "native_tokenizers": [], @@ -19461,9 +22414,11 @@ }, { "name": "Ede Ica", + "depth": 7, "iso_1_code": null, "iso_3_code": "ica", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6800", "native_tokenizers": [], @@ -19471,9 +22426,11 @@ }, { "name": "Ede Idaca", + "depth": 7, "iso_1_code": null, "iso_3_code": "idd", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6801", "native_tokenizers": [], @@ -19481,9 +22438,11 @@ }, { "name": "If\u00e8", + "depth": 7, "iso_1_code": null, "iso_3_code": "ife", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"yo\")", @@ -19501,9 +22460,11 @@ }, { "name": "Ede Ije", + "depth": 7, "iso_1_code": null, "iso_3_code": "ijj", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6803", "native_tokenizers": [], @@ -19511,9 +22472,11 @@ }, { "name": "Isekiri", + "depth": 7, "iso_1_code": null, "iso_3_code": "its", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6804", "native_tokenizers": [], @@ -19521,9 +22484,11 @@ }, { "name": "Lucumi", + "depth": 7, "iso_1_code": null, "iso_3_code": "luq", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6805", "native_tokenizers": [], @@ -19531,9 +22496,11 @@ }, { "name": "Mokole", + "depth": 7, "iso_1_code": null, "iso_3_code": "mkl", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"yo\")", @@ -19551,9 +22518,11 @@ }, { "name": "Nago, Southern", + "depth": 7, "iso_1_code": null, "iso_3_code": "nqg", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6807", "native_tokenizers": [], @@ -19561,9 +22530,11 @@ }, { "name": "Ede Nago, Kura", + "depth": 7, "iso_1_code": null, "iso_3_code": "nqk", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6808", "native_tokenizers": [], @@ -19571,9 +22542,11 @@ }, { "name": "Ulukwumi", + "depth": 7, "iso_1_code": null, "iso_3_code": "ulb", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6809", "native_tokenizers": [], @@ -19581,9 +22554,11 @@ }, { "name": "Nago, Northern", + "depth": 7, "iso_1_code": null, "iso_3_code": "xkb", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6810", "native_tokenizers": [], @@ -19591,9 +22566,11 @@ }, { "name": "Yoruba", + "depth": 7, "iso_1_code": "yo", "iso_3_code": "yor", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"yo\")", @@ -19612,6 +22589,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"yo\")", @@ -19627,26 +22605,31 @@ }, { "name": "Igala", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Igala", + "depth": 7, "iso_1_code": null, "iso_3_code": "igl", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6813", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6812", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"yo\")", @@ -19661,6 +22644,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"yo\")", @@ -19676,19 +22660,23 @@ }, { "name": "Edoid", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Delta", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Degema", + "depth": 6, "iso_1_code": null, "iso_3_code": "deg", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6816", "native_tokenizers": [], @@ -19696,9 +22684,11 @@ }, { "name": "Engenni", + "depth": 6, "iso_1_code": null, "iso_3_code": "enn", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6817", "native_tokenizers": [], @@ -19706,15 +22696,18 @@ }, { "name": "Epie", + "depth": 6, "iso_1_code": null, "iso_3_code": "epi", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6818", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6815", "native_tokenizers": [], @@ -19722,14 +22715,17 @@ }, { "name": "North-Central", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ihievbe", + "depth": 6, "iso_1_code": null, "iso_3_code": "ihi", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6820", "native_tokenizers": [], @@ -19737,9 +22733,11 @@ }, { "name": "Ikhin-Aokho", + "depth": 6, "iso_1_code": null, "iso_3_code": "ikh", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6821", "native_tokenizers": [], @@ -19747,14 +22745,17 @@ }, { "name": "Edo-Esan-Ora", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Edo", + "depth": 7, "iso_1_code": null, "iso_3_code": "bin", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -19772,9 +22773,11 @@ }, { "name": "Emai-Iuleha-Ora", + "depth": 7, "iso_1_code": null, "iso_3_code": "ema", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6824", "native_tokenizers": [], @@ -19782,9 +22785,11 @@ }, { "name": "Esan", + "depth": 7, "iso_1_code": null, "iso_3_code": "ish", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -19801,6 +22806,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -19816,14 +22822,17 @@ }, { "name": "Ghotuo-Uneme-Yekhee", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ghotuo", + "depth": 7, "iso_1_code": null, "iso_3_code": "aaa", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6827", "native_tokenizers": [], @@ -19831,9 +22840,11 @@ }, { "name": "Ivbie North-Okpela-Arhe", + "depth": 7, "iso_1_code": null, "iso_3_code": "atg", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -19851,9 +22862,11 @@ }, { "name": "Enwan", + "depth": 7, "iso_1_code": null, "iso_3_code": "env", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6829", "native_tokenizers": [], @@ -19861,9 +22874,11 @@ }, { "name": "Etsako", + "depth": 7, "iso_1_code": null, "iso_3_code": "ets", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6830", "native_tokenizers": [], @@ -19871,9 +22886,11 @@ }, { "name": "Igwe", + "depth": 7, "iso_1_code": null, "iso_3_code": "igw", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6831", "native_tokenizers": [], @@ -19881,9 +22898,11 @@ }, { "name": "Ikpeshi", + "depth": 7, "iso_1_code": null, "iso_3_code": "ikp", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6832", "native_tokenizers": [], @@ -19891,9 +22910,11 @@ }, { "name": "Ososo", + "depth": 7, "iso_1_code": null, "iso_3_code": "oso", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6833", "native_tokenizers": [], @@ -19901,9 +22922,11 @@ }, { "name": "Sasaru", + "depth": 7, "iso_1_code": null, "iso_3_code": "sxs", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6834", "native_tokenizers": [], @@ -19911,15 +22934,18 @@ }, { "name": "Uneme", + "depth": 7, "iso_1_code": null, "iso_3_code": "une", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6835", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -19934,6 +22960,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -19949,14 +22976,17 @@ }, { "name": "Northwestern", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Aduge", + "depth": 6, "iso_1_code": null, "iso_3_code": "adu", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6837", "native_tokenizers": [], @@ -19964,14 +22994,17 @@ }, { "name": "Osse", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ehueun", + "depth": 7, "iso_1_code": null, "iso_3_code": "ehu", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6839", "native_tokenizers": [], @@ -19979,9 +23012,11 @@ }, { "name": "Iyayu", + "depth": 7, "iso_1_code": null, "iso_3_code": "iya", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6840", "native_tokenizers": [], @@ -19989,9 +23024,11 @@ }, { "name": "Uhami", + "depth": 7, "iso_1_code": null, "iso_3_code": "uha", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6841", "native_tokenizers": [], @@ -19999,15 +23036,18 @@ }, { "name": "Ukue", + "depth": 7, "iso_1_code": null, "iso_3_code": "uku", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6842", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6838", "native_tokenizers": [], @@ -20015,14 +23055,17 @@ }, { "name": "Southern", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Akuku", + "depth": 7, "iso_1_code": null, "iso_3_code": "ayk", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6844", "native_tokenizers": [], @@ -20030,9 +23073,11 @@ }, { "name": "Idesa", + "depth": 7, "iso_1_code": null, "iso_3_code": "ids", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6845", "native_tokenizers": [], @@ -20040,9 +23085,11 @@ }, { "name": "Okpe", + "depth": 7, "iso_1_code": null, "iso_3_code": "okx", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6846", "native_tokenizers": [], @@ -20050,9 +23097,11 @@ }, { "name": "Oloma", + "depth": 7, "iso_1_code": null, "iso_3_code": "olm", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6847", "native_tokenizers": [], @@ -20060,21 +23109,25 @@ }, { "name": "Okpamheri", + "depth": 7, "iso_1_code": null, "iso_3_code": "opa", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6848", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6843", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6836", "native_tokenizers": [], @@ -20082,14 +23135,17 @@ }, { "name": "Southwestern", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Eruwa", + "depth": 6, "iso_1_code": null, "iso_3_code": "erh", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6850", "native_tokenizers": [], @@ -20097,9 +23153,11 @@ }, { "name": "Uvbie", + "depth": 6, "iso_1_code": null, "iso_3_code": "evh", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6851", "native_tokenizers": [], @@ -20107,9 +23165,11 @@ }, { "name": "Isoko", + "depth": 6, "iso_1_code": null, "iso_3_code": "iso", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -20127,9 +23187,11 @@ }, { "name": "Okpe", + "depth": 6, "iso_1_code": null, "iso_3_code": "oke", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -20147,9 +23209,11 @@ }, { "name": "Urhobo", + "depth": 6, "iso_1_code": null, "iso_3_code": "urh", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -20166,6 +23230,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -20180,6 +23245,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -20195,30 +23261,36 @@ }, { "name": "Idomoid", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Akweya", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Eloyi", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ajiri", + "depth": 7, "iso_1_code": null, "iso_3_code": "afo", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6858", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6857", "native_tokenizers": [], @@ -20226,25 +23298,30 @@ }, { "name": "Etulo-Idoma", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Etulo", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Etulo", + "depth": 8, "iso_1_code": null, "iso_3_code": "utr", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6861", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6860", "native_tokenizers": [], @@ -20252,14 +23329,17 @@ }, { "name": "Idoma", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Agatu", + "depth": 8, "iso_1_code": null, "iso_3_code": "agc", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6863", "native_tokenizers": [], @@ -20267,9 +23347,11 @@ }, { "name": "Alago", + "depth": 8, "iso_1_code": null, "iso_3_code": "ala", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6864", "native_tokenizers": [], @@ -20277,9 +23359,11 @@ }, { "name": "Idoma", + "depth": 8, "iso_1_code": null, "iso_3_code": "idu", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -20297,9 +23381,11 @@ }, { "name": "Igede", + "depth": 8, "iso_1_code": null, "iso_3_code": "ige", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -20317,15 +23403,18 @@ }, { "name": "Yala", + "depth": 8, "iso_1_code": null, "iso_3_code": "yba", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6867", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -20340,6 +23429,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -20354,6 +23444,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -20369,14 +23460,17 @@ }, { "name": "Yatye-Akpa", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Akweya", + "depth": 6, "iso_1_code": null, "iso_3_code": "akf", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6869", "native_tokenizers": [], @@ -20384,21 +23478,25 @@ }, { "name": "Yace", + "depth": 6, "iso_1_code": null, "iso_3_code": "ekr", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6870", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6868", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -20414,25 +23512,30 @@ }, { "name": "Igboid", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ekpeye", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ekpeye", + "depth": 6, "iso_1_code": null, "iso_3_code": "ekp", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6873", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6872", "native_tokenizers": [], @@ -20440,14 +23543,17 @@ }, { "name": "Igbo", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ezaa", + "depth": 6, "iso_1_code": null, "iso_3_code": "eza", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -20465,9 +23571,11 @@ }, { "name": "Mgbolizhia", + "depth": 6, "iso_1_code": null, "iso_3_code": "gmz", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6876", "native_tokenizers": [], @@ -20475,9 +23583,11 @@ }, { "name": "Igbo", + "depth": 6, "iso_1_code": "ig", "iso_3_code": "ibo", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -20495,9 +23605,11 @@ }, { "name": "Ika", + "depth": 6, "iso_1_code": null, "iso_3_code": "ikk", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -20515,9 +23627,11 @@ }, { "name": "Ikwere", + "depth": 6, "iso_1_code": null, "iso_3_code": "ikw", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -20535,9 +23649,11 @@ }, { "name": "Ikwo", + "depth": 6, "iso_1_code": null, "iso_3_code": "iqw", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -20555,9 +23671,11 @@ }, { "name": "Izii", + "depth": 6, "iso_1_code": null, "iso_3_code": "izz", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -20575,9 +23693,11 @@ }, { "name": "Ogbah", + "depth": 6, "iso_1_code": null, "iso_3_code": "ogc", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6882", "native_tokenizers": [], @@ -20585,15 +23705,18 @@ }, { "name": "Ukwuani-Aboh-Ndoni", + "depth": 6, "iso_1_code": null, "iso_3_code": "ukw", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6883", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -20608,6 +23731,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -20623,14 +23747,17 @@ }, { "name": "Jukunoid", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bete", + "depth": 5, "iso_1_code": null, "iso_3_code": "byf", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6885", "native_tokenizers": [], @@ -20638,24 +23765,29 @@ }, { "name": "Central", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Jukun-Mbembe-Wurbo", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Jukun", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Jukun Takum", + "depth": 8, "iso_1_code": null, "iso_3_code": "jbu", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -20673,9 +23805,11 @@ }, { "name": "Jibu", + "depth": 8, "iso_1_code": null, "iso_3_code": "jib", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6890", "native_tokenizers": [], @@ -20683,9 +23817,11 @@ }, { "name": "H\u00f5ne", + "depth": 8, "iso_1_code": null, "iso_3_code": "juh", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6891", "native_tokenizers": [], @@ -20693,15 +23829,18 @@ }, { "name": "W\u00e3pha", + "depth": 8, "iso_1_code": null, "iso_3_code": "juw", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6892", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -20717,14 +23856,17 @@ }, { "name": "Kororofa", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Wannu", + "depth": 8, "iso_1_code": null, "iso_3_code": "jub", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6894", "native_tokenizers": [], @@ -20732,9 +23874,11 @@ }, { "name": "Wapan", + "depth": 8, "iso_1_code": null, "iso_3_code": "juk", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6895", "native_tokenizers": [], @@ -20742,15 +23886,18 @@ }, { "name": "Jiba", + "depth": 8, "iso_1_code": null, "iso_3_code": "juo", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6896", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6893", "native_tokenizers": [], @@ -20758,14 +23905,17 @@ }, { "name": "Mbembe", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mbembe, Tigon", + "depth": 8, "iso_1_code": null, "iso_3_code": "nza", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -20782,6 +23932,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -20797,20 +23948,24 @@ }, { "name": "Unclassified", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Shoo-Minda-Nye", + "depth": 8, "iso_1_code": null, "iso_3_code": "bcv", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6900", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6899", "native_tokenizers": [], @@ -20818,14 +23973,17 @@ }, { "name": "Wurbo", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Karimjo", + "depth": 8, "iso_1_code": null, "iso_3_code": "cfg", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6902", "native_tokenizers": [], @@ -20833,9 +23991,11 @@ }, { "name": "Jiru", + "depth": 8, "iso_1_code": null, "iso_3_code": "jrr", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6903", "native_tokenizers": [], @@ -20843,21 +24003,25 @@ }, { "name": "Tita", + "depth": 8, "iso_1_code": null, "iso_3_code": "tdq", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6904", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6901", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -20873,14 +24037,17 @@ }, { "name": "Kpan-Icen", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Etkywan", + "depth": 7, "iso_1_code": null, "iso_3_code": "ich", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6906", "native_tokenizers": [], @@ -20888,21 +24055,25 @@ }, { "name": "Kpan", + "depth": 7, "iso_1_code": null, "iso_3_code": "kpk", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6907", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6905", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -20918,14 +24089,17 @@ }, { "name": "Yukuben-Kuteb", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Akum", + "depth": 6, "iso_1_code": null, "iso_3_code": "aku", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6909", "native_tokenizers": [], @@ -20933,9 +24107,11 @@ }, { "name": "Beezen", + "depth": 6, "iso_1_code": null, "iso_3_code": "bnz", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6910", "native_tokenizers": [], @@ -20943,9 +24119,11 @@ }, { "name": "Kapya", + "depth": 6, "iso_1_code": null, "iso_3_code": "klo", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6911", "native_tokenizers": [], @@ -20953,9 +24131,11 @@ }, { "name": "Kutep", + "depth": 6, "iso_1_code": null, "iso_3_code": "kub", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -20973,15 +24153,18 @@ }, { "name": "Yukuben", + "depth": 6, "iso_1_code": null, "iso_3_code": "ybl", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6913", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -20996,6 +24179,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -21011,30 +24195,36 @@ }, { "name": "Kainji", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Eastern", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Amo", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Amo", + "depth": 7, "iso_1_code": null, "iso_3_code": "amo", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6917", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6916", "native_tokenizers": [], @@ -21042,14 +24232,17 @@ }, { "name": "Northern Jos", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Panawa", + "depth": 7, "iso_1_code": null, "iso_3_code": "pwb", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6919", "native_tokenizers": [], @@ -21057,14 +24250,17 @@ }, { "name": "Jera", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Gamo-Ningi", + "depth": 8, "iso_1_code": null, "iso_3_code": "bte", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6921", "native_tokenizers": [], @@ -21072,9 +24268,11 @@ }, { "name": "Izora", + "depth": 8, "iso_1_code": null, "iso_3_code": "cbo", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6922", "native_tokenizers": [], @@ -21082,9 +24280,11 @@ }, { "name": "Tunzuii", + "depth": 8, "iso_1_code": null, "iso_3_code": "dza", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6923", "native_tokenizers": [], @@ -21092,9 +24292,11 @@ }, { "name": "Lere", + "depth": 8, "iso_1_code": null, "iso_3_code": "gnh", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6924", "native_tokenizers": [], @@ -21102,9 +24304,11 @@ }, { "name": "Gyem", + "depth": 8, "iso_1_code": null, "iso_3_code": "gye", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6925", "native_tokenizers": [], @@ -21112,9 +24316,11 @@ }, { "name": "Jere", + "depth": 8, "iso_1_code": null, "iso_3_code": "jer", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6926", "native_tokenizers": [], @@ -21122,9 +24328,11 @@ }, { "name": "Janji", + "depth": 8, "iso_1_code": null, "iso_3_code": "jni", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6927", "native_tokenizers": [], @@ -21132,9 +24340,11 @@ }, { "name": "Kudu-Camo", + "depth": 8, "iso_1_code": null, "iso_3_code": "kov", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6928", "native_tokenizers": [], @@ -21142,9 +24352,11 @@ }, { "name": "Lemoro", + "depth": 8, "iso_1_code": null, "iso_3_code": "ldj", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6929", "native_tokenizers": [], @@ -21152,9 +24364,11 @@ }, { "name": "Iguta", + "depth": 8, "iso_1_code": null, "iso_3_code": "nar", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6930", "native_tokenizers": [], @@ -21162,9 +24376,11 @@ }, { "name": "Sheni", + "depth": 8, "iso_1_code": null, "iso_3_code": "scv", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6931", "native_tokenizers": [], @@ -21172,9 +24388,11 @@ }, { "name": "Shau", + "depth": 8, "iso_1_code": null, "iso_3_code": "sqh", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6932", "native_tokenizers": [], @@ -21182,15 +24400,18 @@ }, { "name": "Sanga", + "depth": 8, "iso_1_code": null, "iso_3_code": "xsn", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6933", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6920", "native_tokenizers": [], @@ -21198,14 +24419,17 @@ }, { "name": "Kauru", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bina", + "depth": 8, "iso_1_code": null, "iso_3_code": "byj", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6935", "native_tokenizers": [], @@ -21213,9 +24437,11 @@ }, { "name": "Dungu", + "depth": 8, "iso_1_code": null, "iso_3_code": "dbv", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6936", "native_tokenizers": [], @@ -21223,9 +24449,11 @@ }, { "name": "Tugbiri-Niragu", + "depth": 8, "iso_1_code": null, "iso_3_code": "grh", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6937", "native_tokenizers": [], @@ -21233,9 +24461,11 @@ }, { "name": "Kizamani", + "depth": 8, "iso_1_code": null, "iso_3_code": "izm", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6938", "native_tokenizers": [], @@ -21243,9 +24473,11 @@ }, { "name": "Kaivi", + "depth": 8, "iso_1_code": null, "iso_3_code": "kce", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6939", "native_tokenizers": [], @@ -21253,9 +24485,11 @@ }, { "name": "Vono", + "depth": 8, "iso_1_code": null, "iso_3_code": "kch", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6940", "native_tokenizers": [], @@ -21263,9 +24497,11 @@ }, { "name": "Kinuku", + "depth": 8, "iso_1_code": null, "iso_3_code": "kkd", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6941", "native_tokenizers": [], @@ -21273,9 +24509,11 @@ }, { "name": "Tumi", + "depth": 8, "iso_1_code": null, "iso_3_code": "kku", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6942", "native_tokenizers": [], @@ -21283,9 +24521,11 @@ }, { "name": "Kono", + "depth": 8, "iso_1_code": null, "iso_3_code": "klk", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6943", "native_tokenizers": [], @@ -21293,9 +24533,11 @@ }, { "name": "Kurama", + "depth": 8, "iso_1_code": null, "iso_3_code": "krh", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6944", "native_tokenizers": [], @@ -21303,9 +24545,11 @@ }, { "name": "Rishiwa", + "depth": 8, "iso_1_code": null, "iso_3_code": "rsw", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6945", "native_tokenizers": [], @@ -21313,9 +24557,11 @@ }, { "name": "Mala", + "depth": 8, "iso_1_code": null, "iso_3_code": "ruy", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6946", "native_tokenizers": [], @@ -21323,9 +24569,11 @@ }, { "name": "Ruma", + "depth": 8, "iso_1_code": null, "iso_3_code": "ruz", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6947", "native_tokenizers": [], @@ -21333,21 +24581,25 @@ }, { "name": "Vori", + "depth": 8, "iso_1_code": null, "iso_3_code": "sde", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6948", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6934", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6918", "native_tokenizers": [], @@ -21355,14 +24607,17 @@ }, { "name": "Piti-Atsam", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Atsam", + "depth": 7, "iso_1_code": null, "iso_3_code": "cch", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6950", "native_tokenizers": [], @@ -21370,21 +24625,25 @@ }, { "name": "Abishi", + "depth": 7, "iso_1_code": null, "iso_3_code": "pcn", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6951", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6949", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6915", "native_tokenizers": [], @@ -21392,19 +24651,23 @@ }, { "name": "Western", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Basa", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Basa-Gumna", + "depth": 7, "iso_1_code": null, "iso_3_code": "bsl", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6954", "native_tokenizers": [], @@ -21412,9 +24675,11 @@ }, { "name": "Bassa-Kontagora", + "depth": 7, "iso_1_code": null, "iso_3_code": "bsr", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6955", "native_tokenizers": [], @@ -21422,9 +24687,11 @@ }, { "name": "Basa-Gurmana", + "depth": 7, "iso_1_code": null, "iso_3_code": "buj", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6956", "native_tokenizers": [], @@ -21432,15 +24699,18 @@ }, { "name": "Basa", + "depth": 7, "iso_1_code": null, "iso_3_code": "bzw", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6957", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6953", "native_tokenizers": [], @@ -21448,14 +24718,17 @@ }, { "name": "Baushi-Gurmana", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bauchi", + "depth": 7, "iso_1_code": null, "iso_3_code": "bsf", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6959", "native_tokenizers": [], @@ -21463,15 +24736,18 @@ }, { "name": "Gurmana", + "depth": 7, "iso_1_code": null, "iso_3_code": "gvm", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6960", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6958", "native_tokenizers": [], @@ -21479,14 +24755,17 @@ }, { "name": "Duka", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Gwamhi-Wuri", + "depth": 7, "iso_1_code": null, "iso_3_code": "bga", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6962", "native_tokenizers": [], @@ -21494,9 +24773,11 @@ }, { "name": "Damakawa", + "depth": 7, "iso_1_code": null, "iso_3_code": "dam", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6963", "native_tokenizers": [], @@ -21504,9 +24785,11 @@ }, { "name": "C\u2019Lela", + "depth": 7, "iso_1_code": null, "iso_3_code": "dri", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6964", "native_tokenizers": [], @@ -21514,9 +24797,11 @@ }, { "name": "ut-Ma\u2019in", + "depth": 7, "iso_1_code": null, "iso_3_code": "gel", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6965", "native_tokenizers": [], @@ -21524,9 +24809,11 @@ }, { "name": "us-Saare", + "depth": 7, "iso_1_code": null, "iso_3_code": "uss", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6966", "native_tokenizers": [], @@ -21534,9 +24821,11 @@ }, { "name": "ut-Hun", + "depth": 7, "iso_1_code": null, "iso_3_code": "uth", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -21553,6 +24842,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -21568,14 +24858,17 @@ }, { "name": "Kainji Lake", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tsucuba", + "depth": 7, "iso_1_code": null, "iso_3_code": "cbq", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6969", "native_tokenizers": [], @@ -21583,9 +24876,11 @@ }, { "name": "Laru", + "depth": 7, "iso_1_code": null, "iso_3_code": "lan", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6970", "native_tokenizers": [], @@ -21593,15 +24888,18 @@ }, { "name": "Lopa", + "depth": 7, "iso_1_code": null, "iso_3_code": "lop", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6971", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6968", "native_tokenizers": [], @@ -21609,14 +24907,17 @@ }, { "name": "Kambari", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Cishingini", + "depth": 7, "iso_1_code": null, "iso_3_code": "asg", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -21634,9 +24935,11 @@ }, { "name": "Baangi", + "depth": 7, "iso_1_code": null, "iso_3_code": "bqx", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6974", "native_tokenizers": [], @@ -21644,9 +24947,11 @@ }, { "name": "Tsikimba", + "depth": 7, "iso_1_code": null, "iso_3_code": "kdl", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -21664,9 +24969,11 @@ }, { "name": "Tsishingini", + "depth": 7, "iso_1_code": null, "iso_3_code": "tsw", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -21684,15 +24991,18 @@ }, { "name": "Tsuvadi", + "depth": 7, "iso_1_code": null, "iso_3_code": "tvd", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6977", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -21708,14 +25018,17 @@ }, { "name": "Kamuku", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Acipa, Eastern", + "depth": 7, "iso_1_code": null, "iso_3_code": "acp", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6979", "native_tokenizers": [], @@ -21723,9 +25036,11 @@ }, { "name": "Cicipu", + "depth": 7, "iso_1_code": null, "iso_3_code": "awc", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6980", "native_tokenizers": [], @@ -21733,9 +25048,11 @@ }, { "name": "Kamuku", + "depth": 7, "iso_1_code": null, "iso_3_code": "cdr", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6981", "native_tokenizers": [], @@ -21743,9 +25060,11 @@ }, { "name": "Cahungwarya", + "depth": 7, "iso_1_code": null, "iso_3_code": "nat", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6982", "native_tokenizers": [], @@ -21753,9 +25072,11 @@ }, { "name": "Pangu", + "depth": 7, "iso_1_code": null, "iso_3_code": "png", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6983", "native_tokenizers": [], @@ -21763,9 +25084,11 @@ }, { "name": "Rogo", + "depth": 7, "iso_1_code": null, "iso_3_code": "rod", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6984", "native_tokenizers": [], @@ -21773,9 +25096,11 @@ }, { "name": "Shama-Sambuga", + "depth": 7, "iso_1_code": null, "iso_3_code": "sqa", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6985", "native_tokenizers": [], @@ -21783,15 +25108,18 @@ }, { "name": "Fungwa", + "depth": 7, "iso_1_code": null, "iso_3_code": "ula", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6986", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6978", "native_tokenizers": [], @@ -21799,26 +25127,31 @@ }, { "name": "Reshe", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Reshe", + "depth": 7, "iso_1_code": null, "iso_3_code": "res", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6988", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6987", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -21833,6 +25166,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -21848,19 +25182,23 @@ }, { "name": "Nupoid", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ebira-Gade", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Gade", + "depth": 6, "iso_1_code": null, "iso_3_code": "ged", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6991", "native_tokenizers": [], @@ -21868,15 +25206,18 @@ }, { "name": "Ebira", + "depth": 6, "iso_1_code": null, "iso_3_code": "igb", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6992", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6990", "native_tokenizers": [], @@ -21884,14 +25225,17 @@ }, { "name": "Nupe-Gbagyi", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dibo", + "depth": 6, "iso_1_code": null, "iso_3_code": "dio", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6994", "native_tokenizers": [], @@ -21899,14 +25243,17 @@ }, { "name": "Gbagyi-Gbari", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Gbagyi", + "depth": 7, "iso_1_code": null, "iso_3_code": "gbr", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -21924,15 +25271,18 @@ }, { "name": "Gbari", + "depth": 7, "iso_1_code": null, "iso_3_code": "gby", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6997", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -21948,14 +25298,17 @@ }, { "name": "Nupe", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Asu", + "depth": 7, "iso_1_code": null, "iso_3_code": "aum", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6999", "native_tokenizers": [], @@ -21963,9 +25316,11 @@ }, { "name": "Gupa-Abawa", + "depth": 7, "iso_1_code": null, "iso_3_code": "gpa", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7000", "native_tokenizers": [], @@ -21973,9 +25328,11 @@ }, { "name": "Kakanda", + "depth": 7, "iso_1_code": null, "iso_3_code": "kka", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7001", "native_tokenizers": [], @@ -21983,9 +25340,11 @@ }, { "name": "Kami", + "depth": 7, "iso_1_code": null, "iso_3_code": "kmi", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7002", "native_tokenizers": [], @@ -21993,9 +25352,11 @@ }, { "name": "Kupa", + "depth": 7, "iso_1_code": null, "iso_3_code": "kug", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7003", "native_tokenizers": [], @@ -22003,21 +25364,25 @@ }, { "name": "Nupe-Nupe-Tako", + "depth": 7, "iso_1_code": null, "iso_3_code": "nup", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7004", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "6998", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -22032,6 +25397,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -22047,20 +25413,24 @@ }, { "name": "Oko", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Oko-Eni-Osayen", + "depth": 5, "iso_1_code": null, "iso_3_code": "oks", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7006", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7005", "native_tokenizers": [], @@ -22068,14 +25438,17 @@ }, { "name": "Plateau", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Atoro", + "depth": 5, "iso_1_code": null, "iso_3_code": "tdv", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7008", "native_tokenizers": [], @@ -22083,20 +25456,24 @@ }, { "name": "Alumic", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Arum", + "depth": 6, "iso_1_code": null, "iso_3_code": "aab", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7010", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7009", "native_tokenizers": [], @@ -22104,20 +25481,24 @@ }, { "name": "Ayu", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ayu", + "depth": 6, "iso_1_code": null, "iso_3_code": "ayu", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7012", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7011", "native_tokenizers": [], @@ -22125,14 +25506,17 @@ }, { "name": "Beromic", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Berom", + "depth": 6, "iso_1_code": null, "iso_3_code": "bom", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -22150,9 +25534,11 @@ }, { "name": "Iten", + "depth": 6, "iso_1_code": null, "iso_3_code": "etx", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7015", "native_tokenizers": [], @@ -22160,15 +25546,18 @@ }, { "name": "Shall-Zwall", + "depth": 6, "iso_1_code": null, "iso_3_code": "sha", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7016", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -22184,25 +25573,30 @@ }, { "name": "Central", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "North-Central", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Cara", + "depth": 7, "iso_1_code": null, "iso_3_code": "cfd", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7019", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7018", "native_tokenizers": [], @@ -22210,14 +25604,17 @@ }, { "name": "South-Central", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ibaas", + "depth": 7, "iso_1_code": null, "iso_3_code": "cen", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7021", "native_tokenizers": [], @@ -22225,9 +25622,11 @@ }, { "name": "Firan", + "depth": 7, "iso_1_code": null, "iso_3_code": "fir", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7022", "native_tokenizers": [], @@ -22235,9 +25634,11 @@ }, { "name": "Ganang", + "depth": 7, "iso_1_code": null, "iso_3_code": "gne", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7023", "native_tokenizers": [], @@ -22245,9 +25646,11 @@ }, { "name": "Rigwe", + "depth": 7, "iso_1_code": null, "iso_3_code": "iri", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -22265,9 +25668,11 @@ }, { "name": "Izere", + "depth": 7, "iso_1_code": null, "iso_3_code": "izr", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -22285,9 +25690,11 @@ }, { "name": "Jju", + "depth": 7, "iso_1_code": null, "iso_3_code": "kaj", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7026", "native_tokenizers": [], @@ -22295,9 +25702,11 @@ }, { "name": "Tyap", + "depth": 7, "iso_1_code": null, "iso_3_code": "kcg", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -22314,6 +25723,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -22329,26 +25739,31 @@ }, { "name": "West-Central", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ahwai", + "depth": 7, "iso_1_code": null, "iso_3_code": "nfd", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7029", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7028", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -22364,14 +25779,17 @@ }, { "name": "Northern", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ejuele", + "depth": 6, "iso_1_code": null, "iso_3_code": "dbi", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7031", "native_tokenizers": [], @@ -22379,9 +25797,11 @@ }, { "name": "Ajiya", + "depth": 6, "iso_1_code": null, "iso_3_code": "idc", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7032", "native_tokenizers": [], @@ -22389,9 +25809,11 @@ }, { "name": "Ikulu", + "depth": 6, "iso_1_code": null, "iso_3_code": "ikl", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7033", "native_tokenizers": [], @@ -22399,9 +25821,11 @@ }, { "name": "Iku-Gora-Ankwa", + "depth": 6, "iso_1_code": null, "iso_3_code": "ikv", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7034", "native_tokenizers": [], @@ -22409,9 +25833,11 @@ }, { "name": "Adara", + "depth": 6, "iso_1_code": null, "iso_3_code": "kad", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7035", "native_tokenizers": [], @@ -22419,15 +25845,18 @@ }, { "name": "Kuturmi", + "depth": 6, "iso_1_code": null, "iso_3_code": "khj", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7036", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7030", "native_tokenizers": [], @@ -22435,14 +25864,17 @@ }, { "name": "Southeastern", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Horom", + "depth": 6, "iso_1_code": null, "iso_3_code": "hoe", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7038", "native_tokenizers": [], @@ -22450,9 +25882,11 @@ }, { "name": "Bo-Rukul", + "depth": 6, "iso_1_code": null, "iso_3_code": "mae", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7039", "native_tokenizers": [], @@ -22460,15 +25894,18 @@ }, { "name": "Pyam", + "depth": 6, "iso_1_code": null, "iso_3_code": "pym", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7040", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7037", "native_tokenizers": [], @@ -22476,14 +25913,17 @@ }, { "name": "Southern", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Migili", + "depth": 6, "iso_1_code": null, "iso_3_code": "mgi", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7042", "native_tokenizers": [], @@ -22491,9 +25931,11 @@ }, { "name": "Rjili", + "depth": 6, "iso_1_code": null, "iso_3_code": "uji", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7043", "native_tokenizers": [], @@ -22501,9 +25943,11 @@ }, { "name": "Koro Nulu", + "depth": 6, "iso_1_code": null, "iso_3_code": "vkn", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7044", "native_tokenizers": [], @@ -22511,15 +25955,18 @@ }, { "name": "Koro Zuba", + "depth": 6, "iso_1_code": null, "iso_3_code": "vkz", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7045", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7041", "native_tokenizers": [], @@ -22527,14 +25974,17 @@ }, { "name": "Tarokoid", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Yangkam", + "depth": 6, "iso_1_code": null, "iso_3_code": "bsx", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7047", "native_tokenizers": [], @@ -22542,9 +25992,11 @@ }, { "name": "Pye", + "depth": 6, "iso_1_code": null, "iso_3_code": "pai", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7048", "native_tokenizers": [], @@ -22552,9 +26004,11 @@ }, { "name": "Kusur-Myet", + "depth": 6, "iso_1_code": null, "iso_3_code": "tdl", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7049", "native_tokenizers": [], @@ -22562,15 +26016,18 @@ }, { "name": "Tarok", + "depth": 6, "iso_1_code": null, "iso_3_code": "yer", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7050", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7046", "native_tokenizers": [], @@ -22578,24 +26035,29 @@ }, { "name": "Western", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Northwestern", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Hyamic", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kyoli", + "depth": 8, "iso_1_code": null, "iso_3_code": "cry", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7054", "native_tokenizers": [], @@ -22603,9 +26065,11 @@ }, { "name": "Hyam", + "depth": 8, "iso_1_code": null, "iso_3_code": "jab", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7055", "native_tokenizers": [], @@ -22613,9 +26077,11 @@ }, { "name": "Gyong", + "depth": 8, "iso_1_code": null, "iso_3_code": "kdm", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7056", "native_tokenizers": [], @@ -22623,9 +26089,11 @@ }, { "name": "Shamang", + "depth": 8, "iso_1_code": null, "iso_3_code": "xsh", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7057", "native_tokenizers": [], @@ -22633,15 +26101,18 @@ }, { "name": "Zhire", + "depth": 8, "iso_1_code": null, "iso_3_code": "zhi", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7058", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7053", "native_tokenizers": [], @@ -22649,14 +26120,17 @@ }, { "name": "Koro", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ashe", + "depth": 8, "iso_1_code": null, "iso_3_code": "ahs", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7060", "native_tokenizers": [], @@ -22664,9 +26138,11 @@ }, { "name": "Koro Wachi", + "depth": 8, "iso_1_code": null, "iso_3_code": "bqv", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7061", "native_tokenizers": [], @@ -22674,9 +26150,11 @@ }, { "name": "Duya", + "depth": 8, "iso_1_code": null, "iso_3_code": "ldb", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7062", "native_tokenizers": [], @@ -22684,21 +26162,25 @@ }, { "name": "Nyankpa", + "depth": 8, "iso_1_code": null, "iso_3_code": "yes", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7063", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7059", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7052", "native_tokenizers": [], @@ -22706,19 +26188,23 @@ }, { "name": "Southwestern", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "A", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Aninka", + "depth": 8, "iso_1_code": null, "iso_3_code": "aqk", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7066", "native_tokenizers": [], @@ -22726,9 +26212,11 @@ }, { "name": "Kadung", + "depth": 8, "iso_1_code": null, "iso_3_code": "dkg", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7067", "native_tokenizers": [], @@ -22736,9 +26224,11 @@ }, { "name": "Bijim", + "depth": 8, "iso_1_code": null, "iso_3_code": "jbm", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7068", "native_tokenizers": [], @@ -22746,9 +26236,11 @@ }, { "name": "Bu", + "depth": 8, "iso_1_code": null, "iso_3_code": "jid", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7069", "native_tokenizers": [], @@ -22756,9 +26248,11 @@ }, { "name": "Kamantan", + "depth": 8, "iso_1_code": null, "iso_3_code": "kci", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7070", "native_tokenizers": [], @@ -22766,9 +26260,11 @@ }, { "name": "Nikyob-Nindem", + "depth": 8, "iso_1_code": null, "iso_3_code": "kdp", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -22786,9 +26282,11 @@ }, { "name": "Kanufi", + "depth": 8, "iso_1_code": null, "iso_3_code": "kni", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7072", "native_tokenizers": [], @@ -22796,9 +26294,11 @@ }, { "name": "Mada", + "depth": 8, "iso_1_code": null, "iso_3_code": "mda", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -22816,9 +26316,11 @@ }, { "name": "Numana", + "depth": 8, "iso_1_code": null, "iso_3_code": "nbr", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7074", "native_tokenizers": [], @@ -22826,9 +26328,11 @@ }, { "name": "Ninzo", + "depth": 8, "iso_1_code": null, "iso_3_code": "nin", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -22846,9 +26350,11 @@ }, { "name": "Nungu", + "depth": 8, "iso_1_code": null, "iso_3_code": "rin", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7076", "native_tokenizers": [], @@ -22856,9 +26362,11 @@ }, { "name": "Kuce", + "depth": 8, "iso_1_code": null, "iso_3_code": "ruk", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7077", "native_tokenizers": [], @@ -22866,15 +26374,18 @@ }, { "name": "Tiyaa", + "depth": 8, "iso_1_code": null, "iso_3_code": "tyy", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7078", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -22890,14 +26401,17 @@ }, { "name": "B", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Akye", + "depth": 8, "iso_1_code": null, "iso_3_code": "aik", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7080", "native_tokenizers": [], @@ -22905,9 +26419,11 @@ }, { "name": "Eggon", + "depth": 8, "iso_1_code": null, "iso_3_code": "ego", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7081", "native_tokenizers": [], @@ -22915,9 +26431,11 @@ }, { "name": "Sambe", + "depth": 8, "iso_1_code": null, "iso_3_code": "xab", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7082", "native_tokenizers": [], @@ -22925,21 +26443,25 @@ }, { "name": "Hasha", + "depth": 8, "iso_1_code": null, "iso_3_code": "ybj", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7083", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7079", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -22954,6 +26476,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -22968,6 +26491,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -22983,20 +26507,24 @@ }, { "name": "Ukaan", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ukaan", + "depth": 5, "iso_1_code": null, "iso_3_code": "kcf", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7085", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7084", "native_tokenizers": [], @@ -23004,26 +26532,31 @@ }, { "name": "Unclassified", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Fali of Baissa", + "depth": 5, "iso_1_code": null, "iso_3_code": "fah", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7087", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7086", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -23039,14 +26572,17 @@ }, { "name": "Dogon", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dogon, Ampari", + "depth": 4, "iso_1_code": null, "iso_3_code": "aqd", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7089", "native_tokenizers": [], @@ -23054,9 +26590,11 @@ }, { "name": "Dogon, Dogul Dom", + "depth": 4, "iso_1_code": null, "iso_3_code": "dbg", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7090", "native_tokenizers": [], @@ -23064,9 +26602,11 @@ }, { "name": "Dogon, Ben Tey", + "depth": 4, "iso_1_code": null, "iso_3_code": "dbt", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7091", "native_tokenizers": [], @@ -23074,9 +26614,11 @@ }, { "name": "Dogon, Bondum Dom", + "depth": 4, "iso_1_code": null, "iso_3_code": "dbu", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7092", "native_tokenizers": [], @@ -23084,9 +26626,11 @@ }, { "name": "Dogon, Bankan Tey", + "depth": 4, "iso_1_code": null, "iso_3_code": "dbw", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7093", "native_tokenizers": [], @@ -23094,9 +26638,11 @@ }, { "name": "Dogon, Donno So", + "depth": 4, "iso_1_code": null, "iso_3_code": "dds", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7094", "native_tokenizers": [], @@ -23104,9 +26650,11 @@ }, { "name": "Dogon, Bunoge", + "depth": 4, "iso_1_code": null, "iso_3_code": "dgb", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7095", "native_tokenizers": [], @@ -23114,9 +26662,11 @@ }, { "name": "Dogon, Jamsay", + "depth": 4, "iso_1_code": null, "iso_3_code": "djm", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7096", "native_tokenizers": [], @@ -23124,9 +26674,11 @@ }, { "name": "Dogon, Mombo", + "depth": 4, "iso_1_code": null, "iso_3_code": "dmb", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7097", "native_tokenizers": [], @@ -23134,9 +26686,11 @@ }, { "name": "Dogon, Ana Tinga", + "depth": 4, "iso_1_code": null, "iso_3_code": "dti", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7098", "native_tokenizers": [], @@ -23144,9 +26698,11 @@ }, { "name": "Dogon, Tene Kan", + "depth": 4, "iso_1_code": null, "iso_3_code": "dtk", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7099", "native_tokenizers": [], @@ -23154,9 +26710,11 @@ }, { "name": "Dogon, Tomo Kan", + "depth": 4, "iso_1_code": null, "iso_3_code": "dtm", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7100", "native_tokenizers": [], @@ -23164,9 +26722,11 @@ }, { "name": "Dogon, Tommo So", + "depth": 4, "iso_1_code": null, "iso_3_code": "dto", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7101", "native_tokenizers": [], @@ -23174,9 +26734,11 @@ }, { "name": "Dogon, Toro So", + "depth": 4, "iso_1_code": null, "iso_3_code": "dts", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -23194,9 +26756,11 @@ }, { "name": "Dogon, Toro Tegu", + "depth": 4, "iso_1_code": null, "iso_3_code": "dtt", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7103", "native_tokenizers": [], @@ -23204,9 +26768,11 @@ }, { "name": "Dogon, Tebul Ure", + "depth": 4, "iso_1_code": null, "iso_3_code": "dtu", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7104", "native_tokenizers": [], @@ -23214,9 +26780,11 @@ }, { "name": "Dogon, Yanda Dom", + "depth": 4, "iso_1_code": null, "iso_3_code": "dym", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7105", "native_tokenizers": [], @@ -23224,9 +26792,11 @@ }, { "name": "Dogon, Nanga Dama", + "depth": 4, "iso_1_code": null, "iso_3_code": "nzz", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7106", "native_tokenizers": [], @@ -23234,15 +26804,18 @@ }, { "name": "Dogon, Tiranige Diga", + "depth": 4, "iso_1_code": null, "iso_3_code": "tde", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7107", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -23258,19 +26831,23 @@ }, { "name": "Kru", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Aizi", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Aizi, Tiagbamrin", + "depth": 5, "iso_1_code": null, "iso_3_code": "ahi", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7110", "native_tokenizers": [], @@ -23278,9 +26855,11 @@ }, { "name": "Aizi, Mobumrin", + "depth": 5, "iso_1_code": null, "iso_3_code": "ahm", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7111", "native_tokenizers": [], @@ -23288,15 +26867,18 @@ }, { "name": "Aizi, Aproumu", + "depth": 5, "iso_1_code": null, "iso_3_code": "ahp", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7112", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7109", "native_tokenizers": [], @@ -23304,19 +26886,23 @@ }, { "name": "Eastern", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bakwe", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bakw\u00e9", + "depth": 6, "iso_1_code": null, "iso_3_code": "bjw", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7115", "native_tokenizers": [], @@ -23324,15 +26910,18 @@ }, { "name": "Wan\u00e9", + "depth": 6, "iso_1_code": null, "iso_3_code": "hwa", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7116", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7114", "native_tokenizers": [], @@ -23340,19 +26929,23 @@ }, { "name": "Bete", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Eastern", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "B\u00e9t\u00e9, Gagnoa", + "depth": 7, "iso_1_code": null, "iso_3_code": "btg", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7119", "native_tokenizers": [], @@ -23360,9 +26953,11 @@ }, { "name": "Kouya", + "depth": 7, "iso_1_code": null, "iso_3_code": "kyf", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -23379,6 +26974,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -23394,14 +26990,17 @@ }, { "name": "Western", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "B\u00e9t\u00e9, Guiberoua", + "depth": 7, "iso_1_code": null, "iso_3_code": "bet", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7122", "native_tokenizers": [], @@ -23409,9 +27008,11 @@ }, { "name": "B\u00e9t\u00e9, Daloa", + "depth": 7, "iso_1_code": null, "iso_3_code": "bev", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7123", "native_tokenizers": [], @@ -23419,21 +27020,25 @@ }, { "name": "Godi\u00e9", + "depth": 7, "iso_1_code": null, "iso_3_code": "god", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7124", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7121", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -23449,14 +27054,17 @@ }, { "name": "Dida", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dida, Lakota", + "depth": 6, "iso_1_code": null, "iso_3_code": "dic", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7126", "native_tokenizers": [], @@ -23464,9 +27072,11 @@ }, { "name": "Gu\u00e9bie", + "depth": 6, "iso_1_code": null, "iso_3_code": "gie", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7127", "native_tokenizers": [], @@ -23474,9 +27084,11 @@ }, { "name": "Dida, Yocobou\u00e9", + "depth": 6, "iso_1_code": null, "iso_3_code": "gud", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -23494,15 +27106,18 @@ }, { "name": "Neyo", + "depth": 6, "iso_1_code": null, "iso_3_code": "ney", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7129", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -23518,26 +27133,31 @@ }, { "name": "Kwadia", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kodia", + "depth": 6, "iso_1_code": null, "iso_3_code": "kwp", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7131", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7130", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -23553,14 +27173,17 @@ }, { "name": "Kuwaa", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kuwaa", + "depth": 5, "iso_1_code": null, "iso_3_code": "blh", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -23577,6 +27200,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -23592,20 +27216,24 @@ }, { "name": "Seme", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Siamou", + "depth": 5, "iso_1_code": null, "iso_3_code": "sif", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7135", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7134", "native_tokenizers": [], @@ -23613,19 +27241,23 @@ }, { "name": "Western", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bassa", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bassa", + "depth": 6, "iso_1_code": null, "iso_3_code": "bsq", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -23643,9 +27275,11 @@ }, { "name": "Dewoin", + "depth": 6, "iso_1_code": null, "iso_3_code": "dee", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7139", "native_tokenizers": [], @@ -23653,15 +27287,18 @@ }, { "name": "Gbii", + "depth": 6, "iso_1_code": null, "iso_3_code": "ggb", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7140", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -23677,25 +27314,30 @@ }, { "name": "Grebo", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Glio-Oubi", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Glio-Oubi", + "depth": 7, "iso_1_code": null, "iso_3_code": "oub", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7143", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7142", "native_tokenizers": [], @@ -23703,14 +27345,17 @@ }, { "name": "Ivorian", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Krumen, Plapo", + "depth": 7, "iso_1_code": null, "iso_3_code": "ktj", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -23728,9 +27373,11 @@ }, { "name": "Krumen, Pye", + "depth": 7, "iso_1_code": null, "iso_3_code": "pye", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7146", "native_tokenizers": [], @@ -23738,9 +27385,11 @@ }, { "name": "Krumen, Tepo", + "depth": 7, "iso_1_code": null, "iso_3_code": "ted", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -23757,6 +27406,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -23772,14 +27422,17 @@ }, { "name": "Liberian", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Grebo, Northern", + "depth": 7, "iso_1_code": null, "iso_3_code": "gbo", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -23797,9 +27450,11 @@ }, { "name": "Grebo, Gboloo", + "depth": 7, "iso_1_code": null, "iso_3_code": "gec", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7150", "native_tokenizers": [], @@ -23807,9 +27462,11 @@ }, { "name": "Grebo, Southern", + "depth": 7, "iso_1_code": null, "iso_3_code": "grj", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7151", "native_tokenizers": [], @@ -23817,9 +27474,11 @@ }, { "name": "Grebo, Central", + "depth": 7, "iso_1_code": null, "iso_3_code": "grv", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7152", "native_tokenizers": [], @@ -23827,15 +27486,18 @@ }, { "name": "Grebo, Barclayville", + "depth": 7, "iso_1_code": null, "iso_3_code": "gry", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7153", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -23850,6 +27512,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -23865,14 +27528,17 @@ }, { "name": "Klao", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Klao", + "depth": 6, "iso_1_code": null, "iso_3_code": "klu", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7155", "native_tokenizers": [], @@ -23880,15 +27546,18 @@ }, { "name": "Tajuasohn", + "depth": 6, "iso_1_code": null, "iso_3_code": "tja", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7156", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7154", "native_tokenizers": [], @@ -23896,19 +27565,23 @@ }, { "name": "Wee", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Guere-Krahn", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Daho-Doo", + "depth": 7, "iso_1_code": null, "iso_3_code": "das", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7159", "native_tokenizers": [], @@ -23916,9 +27589,11 @@ }, { "name": "Glaro-Twabo", + "depth": 7, "iso_1_code": null, "iso_3_code": "glr", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7160", "native_tokenizers": [], @@ -23926,9 +27601,11 @@ }, { "name": "W\u00e8 Southern", + "depth": 7, "iso_1_code": null, "iso_3_code": "gxx", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7161", "native_tokenizers": [], @@ -23936,9 +27613,11 @@ }, { "name": "Sapo", + "depth": 7, "iso_1_code": null, "iso_3_code": "krn", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7162", "native_tokenizers": [], @@ -23946,9 +27625,11 @@ }, { "name": "Krahn, Western", + "depth": 7, "iso_1_code": null, "iso_3_code": "krw", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7163", "native_tokenizers": [], @@ -23956,15 +27637,18 @@ }, { "name": "W\u00e8 Western", + "depth": 7, "iso_1_code": null, "iso_3_code": "wec", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7164", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7158", "native_tokenizers": [], @@ -23972,14 +27656,17 @@ }, { "name": "Konobo", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Krahn, Eastern", + "depth": 7, "iso_1_code": null, "iso_3_code": "kqo", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -23996,6 +27683,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -24011,14 +27699,17 @@ }, { "name": "Nyabwa", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nyabwa", + "depth": 7, "iso_1_code": null, "iso_3_code": "nwb", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -24035,6 +27726,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -24050,14 +27742,17 @@ }, { "name": "Wobe", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "W\u00e8 Northern", + "depth": 7, "iso_1_code": null, "iso_3_code": "wob", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -24074,6 +27769,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -24088,6 +27784,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -24102,6 +27799,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -24116,6 +27814,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -24131,14 +27830,17 @@ }, { "name": "Kwa", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Esuma", + "depth": 4, "iso_1_code": null, "iso_3_code": "esm", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7172", "native_tokenizers": [], @@ -24146,9 +27848,11 @@ }, { "name": "Boro", + "depth": 4, "iso_1_code": null, "iso_3_code": "xxb", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7173", "native_tokenizers": [], @@ -24156,19 +27860,23 @@ }, { "name": "Left Bank", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Avatime-Nyangbo", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Avatime", + "depth": 6, "iso_1_code": null, "iso_3_code": "avn", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -24186,9 +27894,11 @@ }, { "name": "Nyagbo", + "depth": 6, "iso_1_code": null, "iso_3_code": "nyb", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7177", "native_tokenizers": [], @@ -24196,15 +27906,18 @@ }, { "name": "Tafi", + "depth": 6, "iso_1_code": null, "iso_3_code": "tcd", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7178", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -24220,14 +27933,17 @@ }, { "name": "Gbe", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Aguna", + "depth": 6, "iso_1_code": null, "iso_3_code": "aug", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7180", "native_tokenizers": [], @@ -24235,9 +27951,11 @@ }, { "name": "Gbe, Ci", + "depth": 6, "iso_1_code": null, "iso_3_code": "cib", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7181", "native_tokenizers": [], @@ -24245,9 +27963,11 @@ }, { "name": "\u00c9w\u00e9", + "depth": 6, "iso_1_code": "ee", "iso_3_code": "ewe", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -24265,9 +27985,11 @@ }, { "name": "Gbe, Gbesi", + "depth": 6, "iso_1_code": null, "iso_3_code": "gbs", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7183", "native_tokenizers": [], @@ -24275,9 +27997,11 @@ }, { "name": "Gbe, Eastern Xwla", + "depth": 6, "iso_1_code": null, "iso_3_code": "gbx", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7184", "native_tokenizers": [], @@ -24285,9 +28009,11 @@ }, { "name": "Kpessi", + "depth": 6, "iso_1_code": null, "iso_3_code": "kef", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7185", "native_tokenizers": [], @@ -24295,9 +28021,11 @@ }, { "name": "Gbe, Kotafon", + "depth": 6, "iso_1_code": null, "iso_3_code": "kqk", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7186", "native_tokenizers": [], @@ -24305,9 +28033,11 @@ }, { "name": "Gbe, Saxwe", + "depth": 6, "iso_1_code": null, "iso_3_code": "sxw", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7187", "native_tokenizers": [], @@ -24315,9 +28045,11 @@ }, { "name": "Gbe, Waci", + "depth": 6, "iso_1_code": null, "iso_3_code": "wci", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7188", "native_tokenizers": [], @@ -24325,9 +28057,11 @@ }, { "name": "Wudu", + "depth": 6, "iso_1_code": null, "iso_3_code": "wud", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7189", "native_tokenizers": [], @@ -24335,9 +28069,11 @@ }, { "name": "Gbe, Xwela", + "depth": 6, "iso_1_code": null, "iso_3_code": "xwe", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7190", "native_tokenizers": [], @@ -24345,9 +28081,11 @@ }, { "name": "Gbe, Western Xwla", + "depth": 6, "iso_1_code": null, "iso_3_code": "xwl", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7191", "native_tokenizers": [], @@ -24355,14 +28093,17 @@ }, { "name": "Aja", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Aja", + "depth": 7, "iso_1_code": null, "iso_3_code": "ajg", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -24380,9 +28121,11 @@ }, { "name": "Gbe, Ayizo", + "depth": 7, "iso_1_code": null, "iso_3_code": "ayb", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7194", "native_tokenizers": [], @@ -24390,9 +28133,11 @@ }, { "name": "Gbe, Defi", + "depth": 7, "iso_1_code": null, "iso_3_code": "gbh", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7195", "native_tokenizers": [], @@ -24400,9 +28145,11 @@ }, { "name": "Gun", + "depth": 7, "iso_1_code": null, "iso_3_code": "guw", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -24420,9 +28167,11 @@ }, { "name": "Gbe, Tofin", + "depth": 7, "iso_1_code": null, "iso_3_code": "tfi", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7197", "native_tokenizers": [], @@ -24430,15 +28179,18 @@ }, { "name": "Gbe, Weme", + "depth": 7, "iso_1_code": null, "iso_3_code": "wem", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7198", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -24454,14 +28206,17 @@ }, { "name": "Fon", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Fon", + "depth": 7, "iso_1_code": null, "iso_3_code": "fon", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -24479,15 +28234,18 @@ }, { "name": "Gbe, Maxi", + "depth": 7, "iso_1_code": null, "iso_3_code": "mxl", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7201", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -24503,14 +28261,17 @@ }, { "name": "Mina", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Gen", + "depth": 7, "iso_1_code": null, "iso_3_code": "gej", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -24527,6 +28288,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -24541,6 +28303,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -24556,14 +28319,17 @@ }, { "name": "Kebu-Animere", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Animere", + "depth": 6, "iso_1_code": null, "iso_3_code": "anf", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7205", "native_tokenizers": [], @@ -24571,15 +28337,18 @@ }, { "name": "Akebu", + "depth": 6, "iso_1_code": null, "iso_3_code": "keu", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7206", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7204", "native_tokenizers": [], @@ -24587,14 +28356,17 @@ }, { "name": "Kposo-Ahlo-Bowili", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Adangbe", + "depth": 6, "iso_1_code": null, "iso_3_code": "adq", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7208", "native_tokenizers": [], @@ -24602,9 +28374,11 @@ }, { "name": "Igo", + "depth": 6, "iso_1_code": null, "iso_3_code": "ahl", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7209", "native_tokenizers": [], @@ -24612,9 +28386,11 @@ }, { "name": "Tuwuli", + "depth": 6, "iso_1_code": null, "iso_3_code": "bov", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -24632,15 +28408,18 @@ }, { "name": "Ikposo", + "depth": 6, "iso_1_code": null, "iso_3_code": "kpo", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7211", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -24655,6 +28434,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -24670,19 +28450,23 @@ }, { "name": "Nyo", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Agneby", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ab\u00e9", + "depth": 6, "iso_1_code": null, "iso_3_code": "aba", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -24700,9 +28484,11 @@ }, { "name": "Abidji", + "depth": 6, "iso_1_code": null, "iso_3_code": "abi", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -24720,9 +28506,11 @@ }, { "name": "Adioukrou", + "depth": 6, "iso_1_code": null, "iso_3_code": "adj", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -24739,6 +28527,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -24754,14 +28543,17 @@ }, { "name": "Attie", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Atti\u00e9", + "depth": 6, "iso_1_code": null, "iso_3_code": "ati", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -24778,6 +28570,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -24793,14 +28586,17 @@ }, { "name": "Avikam-Alladian", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Alladian", + "depth": 6, "iso_1_code": null, "iso_3_code": "ald", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -24818,15 +28614,18 @@ }, { "name": "Avikam", + "depth": 6, "iso_1_code": null, "iso_3_code": "avi", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7221", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -24842,14 +28641,17 @@ }, { "name": "Ga-Dangme", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dangme", + "depth": 6, "iso_1_code": null, "iso_3_code": "ada", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -24867,9 +28669,11 @@ }, { "name": "Ga", + "depth": 6, "iso_1_code": null, "iso_3_code": "gaa", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -24886,6 +28690,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -24901,19 +28706,23 @@ }, { "name": "Potou-Tano", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Basila-Adele", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Adele", + "depth": 7, "iso_1_code": null, "iso_3_code": "ade", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -24931,15 +28740,18 @@ }, { "name": "Anii", + "depth": 7, "iso_1_code": null, "iso_3_code": "blo", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7228", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -24955,20 +28767,24 @@ }, { "name": "Ega", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ega", + "depth": 7, "iso_1_code": null, "iso_3_code": "ega", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7230", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7229", "native_tokenizers": [], @@ -24976,19 +28792,23 @@ }, { "name": "Lelemi", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Lelemi-Akpafu", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Siwu", + "depth": 8, "iso_1_code": null, "iso_3_code": "akp", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -25006,9 +28826,11 @@ }, { "name": "Lelemi", + "depth": 8, "iso_1_code": null, "iso_3_code": "lef", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -25025,6 +28847,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -25040,14 +28863,17 @@ }, { "name": "Likpe-Santrokofi", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Sekpele", + "depth": 8, "iso_1_code": null, "iso_3_code": "lip", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -25065,9 +28891,11 @@ }, { "name": "Selee", + "depth": 8, "iso_1_code": null, "iso_3_code": "snw", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -25084,6 +28912,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -25098,6 +28927,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -25113,20 +28943,24 @@ }, { "name": "Logba", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Logba", + "depth": 7, "iso_1_code": null, "iso_3_code": "lgq", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7239", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7238", "native_tokenizers": [], @@ -25134,14 +28968,17 @@ }, { "name": "Potou", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tchaman", + "depth": 7, "iso_1_code": null, "iso_3_code": "ebr", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7241", "native_tokenizers": [], @@ -25149,15 +28986,18 @@ }, { "name": "Mbato", + "depth": 7, "iso_1_code": null, "iso_3_code": "gwa", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7242", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7240", "native_tokenizers": [], @@ -25165,24 +29005,29 @@ }, { "name": "Tano", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Central", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Akan", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Abron", + "depth": 9, "iso_1_code": null, "iso_3_code": "abr", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7246", "native_tokenizers": [], @@ -25190,9 +29035,11 @@ }, { "name": "Akan", + "depth": 9, "iso_1_code": "ak", "iso_3_code": "aka", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7247", "native_tokenizers": [], @@ -25200,15 +29047,18 @@ }, { "name": "Wasa", + "depth": 9, "iso_1_code": null, "iso_3_code": "wss", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7248", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7245", "native_tokenizers": [], @@ -25216,19 +29066,23 @@ }, { "name": "Bia", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Northern", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Anyin", + "depth": 10, "iso_1_code": null, "iso_3_code": "any", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -25246,9 +29100,11 @@ }, { "name": "Baoul\u00e9", + "depth": 10, "iso_1_code": null, "iso_3_code": "bci", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -25266,9 +29122,11 @@ }, { "name": "Anufo", + "depth": 10, "iso_1_code": null, "iso_3_code": "cko", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -25286,9 +29144,11 @@ }, { "name": "Anyin Morofo", + "depth": 10, "iso_1_code": null, "iso_3_code": "mtb", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7254", "native_tokenizers": [], @@ -25296,9 +29156,11 @@ }, { "name": "Esahie", + "depth": 10, "iso_1_code": null, "iso_3_code": "sfw", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -25315,6 +29177,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -25330,14 +29193,17 @@ }, { "name": "Southern", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ahanta", + "depth": 10, "iso_1_code": null, "iso_3_code": "aha", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -25355,9 +29221,11 @@ }, { "name": "Jwira-Pepesa", + "depth": 10, "iso_1_code": null, "iso_3_code": "jwi", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7258", "native_tokenizers": [], @@ -25365,9 +29233,11 @@ }, { "name": "Nzema", + "depth": 10, "iso_1_code": null, "iso_3_code": "nzi", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -25384,6 +29254,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -25398,6 +29269,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -25412,6 +29284,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -25427,19 +29300,23 @@ }, { "name": "Guang", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "North Guang", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Gikyode", + "depth": 9, "iso_1_code": null, "iso_3_code": "acd", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -25457,9 +29334,11 @@ }, { "name": "Ginyanga", + "depth": 9, "iso_1_code": null, "iso_3_code": "ayg", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7263", "native_tokenizers": [], @@ -25467,9 +29346,11 @@ }, { "name": "Tchumbuli", + "depth": 9, "iso_1_code": null, "iso_3_code": "bqa", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7264", "native_tokenizers": [], @@ -25477,9 +29358,11 @@ }, { "name": "Dompo", + "depth": 9, "iso_1_code": null, "iso_3_code": "doy", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7265", "native_tokenizers": [], @@ -25487,9 +29370,11 @@ }, { "name": "Foodo", + "depth": 9, "iso_1_code": null, "iso_3_code": "fod", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7266", "native_tokenizers": [], @@ -25497,9 +29382,11 @@ }, { "name": "Gonja", + "depth": 9, "iso_1_code": null, "iso_3_code": "gjn", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -25517,9 +29404,11 @@ }, { "name": "Kplang", + "depth": 9, "iso_1_code": null, "iso_3_code": "kph", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7268", "native_tokenizers": [], @@ -25527,9 +29416,11 @@ }, { "name": "Krache", + "depth": 9, "iso_1_code": null, "iso_3_code": "kye", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7269", "native_tokenizers": [], @@ -25537,9 +29428,11 @@ }, { "name": "Nawuri", + "depth": 9, "iso_1_code": null, "iso_3_code": "naw", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -25557,9 +29450,11 @@ }, { "name": "Chumburung", + "depth": 9, "iso_1_code": null, "iso_3_code": "ncu", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -25577,9 +29472,11 @@ }, { "name": "Nkonya", + "depth": 9, "iso_1_code": null, "iso_3_code": "nko", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -25597,9 +29494,11 @@ }, { "name": "Nkami", + "depth": 9, "iso_1_code": null, "iso_3_code": "nkq", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7273", "native_tokenizers": [], @@ -25607,9 +29506,11 @@ }, { "name": "Nchumbulu", + "depth": 9, "iso_1_code": null, "iso_3_code": "nlu", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7274", "native_tokenizers": [], @@ -25617,15 +29518,18 @@ }, { "name": "Dwang", + "depth": 9, "iso_1_code": null, "iso_3_code": "nnu", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7275", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -25641,14 +29545,17 @@ }, { "name": "South Guang", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Awutu", + "depth": 9, "iso_1_code": null, "iso_3_code": "afu", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7277", "native_tokenizers": [], @@ -25656,9 +29563,11 @@ }, { "name": "Cherepon", + "depth": 9, "iso_1_code": null, "iso_3_code": "cpn", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7278", "native_tokenizers": [], @@ -25666,9 +29575,11 @@ }, { "name": "Gua", + "depth": 9, "iso_1_code": null, "iso_3_code": "gwx", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7279", "native_tokenizers": [], @@ -25676,21 +29587,25 @@ }, { "name": "Larteh", + "depth": 9, "iso_1_code": null, "iso_3_code": "lar", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7280", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7276", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -25706,20 +29621,24 @@ }, { "name": "Krobu", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Krobu", + "depth": 8, "iso_1_code": null, "iso_3_code": "kxb", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7282", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7281", "native_tokenizers": [], @@ -25727,14 +29646,17 @@ }, { "name": "Western", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Abure", + "depth": 8, "iso_1_code": null, "iso_3_code": "abu", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7284", "native_tokenizers": [], @@ -25742,21 +29664,25 @@ }, { "name": "Beti", + "depth": 8, "iso_1_code": null, "iso_3_code": "eot", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7285", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7283", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -25771,6 +29697,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -25785,6 +29712,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -25799,6 +29727,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -25814,29 +29743,35 @@ }, { "name": "North", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Adamawa-Ubangi", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Adamawa", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Fali", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Fali, South", + "depth": 7, "iso_1_code": null, "iso_3_code": "fal", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -25854,15 +29789,18 @@ }, { "name": "Fali, North", + "depth": 7, "iso_1_code": null, "iso_3_code": "fll", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7291", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -25878,20 +29816,24 @@ }, { "name": "Kam", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kam", + "depth": 7, "iso_1_code": null, "iso_3_code": "kdx", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7293", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7292", "native_tokenizers": [], @@ -25899,20 +29841,24 @@ }, { "name": "Kwa", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kwa", + "depth": 7, "iso_1_code": null, "iso_3_code": "kwb", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7295", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7294", "native_tokenizers": [], @@ -25920,20 +29866,24 @@ }, { "name": "La\u2019bi", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "La\u2019bi", + "depth": 7, "iso_1_code": null, "iso_3_code": "lbi", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7297", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7296", "native_tokenizers": [], @@ -25941,24 +29891,29 @@ }, { "name": "Leko-Nimbari", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Duru", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dii", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Duupa", + "depth": 9, "iso_1_code": null, "iso_3_code": "dae", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7301", "native_tokenizers": [], @@ -25966,9 +29921,11 @@ }, { "name": "Dii", + "depth": 9, "iso_1_code": null, "iso_3_code": "dur", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -25986,15 +29943,18 @@ }, { "name": "Dugun", + "depth": 9, "iso_1_code": null, "iso_3_code": "ndu", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7303", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -26010,20 +29970,24 @@ }, { "name": "Duli", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Duli-Gey", + "depth": 9, "iso_1_code": null, "iso_3_code": "duz", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7305", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7304", "native_tokenizers": [], @@ -26031,19 +29995,23 @@ }, { "name": "Voko-Dowayo", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kutin", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Pere", + "depth": 10, "iso_1_code": null, "iso_3_code": "pfe", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -26060,6 +30028,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -26075,19 +30044,23 @@ }, { "name": "Vere-Dowayo", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dowayo", + "depth": 10, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Doyayo", + "depth": 11, "iso_1_code": null, "iso_3_code": "dow", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -26104,6 +30077,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -26119,19 +30093,23 @@ }, { "name": "Vere-Gimme", + "depth": 10, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Gimme", + "depth": 11, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Gimnime", + "depth": 12, "iso_1_code": null, "iso_3_code": "gmn", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7314", "native_tokenizers": [], @@ -26139,15 +30117,18 @@ }, { "name": "Gimme", + "depth": 12, "iso_1_code": null, "iso_3_code": "kmp", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7315", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7313", "native_tokenizers": [], @@ -26155,14 +30136,17 @@ }, { "name": "Vere", + "depth": 11, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Koma", + "depth": 12, "iso_1_code": null, "iso_3_code": "kmy", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -26180,15 +30164,18 @@ }, { "name": "Verre", + "depth": 12, "iso_1_code": null, "iso_3_code": "ver", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7318", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -26203,6 +30190,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -26217,6 +30205,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -26232,26 +30221,31 @@ }, { "name": "Voko", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Longto", + "depth": 10, "iso_1_code": null, "iso_3_code": "wok", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7320", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7319", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -26266,6 +30260,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -26281,14 +30276,17 @@ }, { "name": "Leko", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kolbila", + "depth": 8, "iso_1_code": null, "iso_3_code": "klc", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7322", "native_tokenizers": [], @@ -26296,9 +30294,11 @@ }, { "name": "Mubako", + "depth": 8, "iso_1_code": null, "iso_3_code": "muo", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7323", "native_tokenizers": [], @@ -26306,9 +30306,11 @@ }, { "name": "Samba Leko", + "depth": 8, "iso_1_code": null, "iso_3_code": "ndi", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -26326,15 +30328,18 @@ }, { "name": "Wom", + "depth": 8, "iso_1_code": null, "iso_3_code": "wom", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7325", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -26350,19 +30355,23 @@ }, { "name": "Mumuye-Yandang", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mumuye", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Gengle", + "depth": 9, "iso_1_code": null, "iso_3_code": "geg", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7328", "native_tokenizers": [], @@ -26370,9 +30379,11 @@ }, { "name": "Kumba", + "depth": 9, "iso_1_code": null, "iso_3_code": "ksm", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7329", "native_tokenizers": [], @@ -26380,9 +30391,11 @@ }, { "name": "Mumuye", + "depth": 9, "iso_1_code": null, "iso_3_code": "mzm", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -26400,9 +30413,11 @@ }, { "name": "Pangseng", + "depth": 9, "iso_1_code": null, "iso_3_code": "pgs", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7331", "native_tokenizers": [], @@ -26410,9 +30425,11 @@ }, { "name": "Rang", + "depth": 9, "iso_1_code": null, "iso_3_code": "rax", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7332", "native_tokenizers": [], @@ -26420,9 +30437,11 @@ }, { "name": "Teme", + "depth": 9, "iso_1_code": null, "iso_3_code": "tdo", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7333", "native_tokenizers": [], @@ -26430,15 +30449,18 @@ }, { "name": "Waka", + "depth": 9, "iso_1_code": null, "iso_3_code": "wav", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7334", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -26454,14 +30476,17 @@ }, { "name": "Yandang", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bali", + "depth": 9, "iso_1_code": null, "iso_3_code": "bcn", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7336", "native_tokenizers": [], @@ -26469,9 +30494,11 @@ }, { "name": "Kugama", + "depth": 9, "iso_1_code": null, "iso_3_code": "kow", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7337", "native_tokenizers": [], @@ -26479,9 +30506,11 @@ }, { "name": "Kpasham", + "depth": 9, "iso_1_code": null, "iso_3_code": "pbn", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7338", "native_tokenizers": [], @@ -26489,9 +30518,11 @@ }, { "name": "Yendang", + "depth": 9, "iso_1_code": null, "iso_3_code": "ynq", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7339", "native_tokenizers": [], @@ -26499,21 +30530,25 @@ }, { "name": "Yotti", + "depth": 9, "iso_1_code": null, "iso_3_code": "yot", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7340", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7335", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -26529,26 +30564,31 @@ }, { "name": "Nimbari", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nimbari", + "depth": 8, "iso_1_code": null, "iso_3_code": "nmr", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7342", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7341", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -26564,19 +30604,23 @@ }, { "name": "Mbum-Day", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bua", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bua", + "depth": 8, "iso_1_code": null, "iso_3_code": "bub", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7345", "native_tokenizers": [], @@ -26584,9 +30628,11 @@ }, { "name": "Bolgo", + "depth": 8, "iso_1_code": null, "iso_3_code": "bvo", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7346", "native_tokenizers": [], @@ -26594,9 +30640,11 @@ }, { "name": "Fania", + "depth": 8, "iso_1_code": null, "iso_3_code": "fni", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7347", "native_tokenizers": [], @@ -26604,9 +30652,11 @@ }, { "name": "Bon Gula", + "depth": 8, "iso_1_code": null, "iso_3_code": "glc", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7348", "native_tokenizers": [], @@ -26614,9 +30664,11 @@ }, { "name": "Gula Iro", + "depth": 8, "iso_1_code": null, "iso_3_code": "glj", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7349", "native_tokenizers": [], @@ -26624,9 +30676,11 @@ }, { "name": "Koke", + "depth": 8, "iso_1_code": null, "iso_3_code": "kou", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7350", "native_tokenizers": [], @@ -26634,9 +30688,11 @@ }, { "name": "Niellim", + "depth": 8, "iso_1_code": null, "iso_3_code": "nie", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7351", "native_tokenizers": [], @@ -26644,9 +30700,11 @@ }, { "name": "Noy", + "depth": 8, "iso_1_code": null, "iso_3_code": "noy", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7352", "native_tokenizers": [], @@ -26654,9 +30712,11 @@ }, { "name": "Tunia", + "depth": 8, "iso_1_code": null, "iso_3_code": "tug", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7353", "native_tokenizers": [], @@ -26664,15 +30724,18 @@ }, { "name": "Zan Gula", + "depth": 8, "iso_1_code": null, "iso_3_code": "zna", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7354", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7344", "native_tokenizers": [], @@ -26680,20 +30743,24 @@ }, { "name": "Day", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Day", + "depth": 8, "iso_1_code": null, "iso_3_code": "dai", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7356", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7355", "native_tokenizers": [], @@ -26701,14 +30768,17 @@ }, { "name": "Kim", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Besme", + "depth": 8, "iso_1_code": null, "iso_3_code": "bes", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7358", "native_tokenizers": [], @@ -26716,9 +30786,11 @@ }, { "name": "Goundo", + "depth": 8, "iso_1_code": null, "iso_3_code": "goy", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7359", "native_tokenizers": [], @@ -26726,9 +30798,11 @@ }, { "name": "Kim", + "depth": 8, "iso_1_code": null, "iso_3_code": "kia", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -26745,6 +30819,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -26760,24 +30835,29 @@ }, { "name": "Mbum", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Eastern Mbum", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Karang", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kare", + "depth": 10, "iso_1_code": null, "iso_3_code": "kbn", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7364", "native_tokenizers": [], @@ -26785,9 +30865,11 @@ }, { "name": "Karang", + "depth": 10, "iso_1_code": null, "iso_3_code": "kzr", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7365", "native_tokenizers": [], @@ -26795,9 +30877,11 @@ }, { "name": "Nzakambay", + "depth": 10, "iso_1_code": null, "iso_3_code": "nzy", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7366", "native_tokenizers": [], @@ -26805,15 +30889,18 @@ }, { "name": "Pana", + "depth": 10, "iso_1_code": null, "iso_3_code": "pnz", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7367", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7363", "native_tokenizers": [], @@ -26821,14 +30908,17 @@ }, { "name": "Koh", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kuo", + "depth": 10, "iso_1_code": null, "iso_3_code": "xuo", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -26845,6 +30935,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -26859,6 +30950,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -26874,19 +30966,23 @@ }, { "name": "Northern", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dama-Galke", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dama", + "depth": 10, "iso_1_code": null, "iso_3_code": "dmm", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7372", "native_tokenizers": [], @@ -26894,9 +30990,11 @@ }, { "name": "Ndai", + "depth": 10, "iso_1_code": null, "iso_3_code": "gke", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7373", "native_tokenizers": [], @@ -26904,15 +31002,18 @@ }, { "name": "Mono", + "depth": 10, "iso_1_code": null, "iso_3_code": "mru", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7374", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7371", "native_tokenizers": [], @@ -26920,14 +31021,17 @@ }, { "name": "Tupuri-Mambai", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mambai", + "depth": 10, "iso_1_code": null, "iso_3_code": "mcs", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7376", "native_tokenizers": [], @@ -26935,9 +31039,11 @@ }, { "name": "Mundang", + "depth": 10, "iso_1_code": null, "iso_3_code": "mua", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -26955,9 +31061,11 @@ }, { "name": "Tupuri", + "depth": 10, "iso_1_code": null, "iso_3_code": "tui", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -26974,6 +31082,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -26988,6 +31097,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -27003,20 +31113,24 @@ }, { "name": "Southern", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mbum", + "depth": 9, "iso_1_code": null, "iso_3_code": "mdd", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7380", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7379", "native_tokenizers": [], @@ -27024,14 +31138,17 @@ }, { "name": "Unclassified", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dek", + "depth": 9, "iso_1_code": null, "iso_3_code": "dek", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7382", "native_tokenizers": [], @@ -27039,9 +31156,11 @@ }, { "name": "Pam", + "depth": 9, "iso_1_code": null, "iso_3_code": "pmn", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7383", "native_tokenizers": [], @@ -27049,21 +31168,25 @@ }, { "name": "To", + "depth": 9, "iso_1_code": null, "iso_3_code": "toz", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7384", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7381", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -27078,6 +31201,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -27093,20 +31217,24 @@ }, { "name": "Unclassified", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Oblo", + "depth": 7, "iso_1_code": null, "iso_3_code": "obl", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7386", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7385", "native_tokenizers": [], @@ -27114,19 +31242,23 @@ }, { "name": "Waja-Jen", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Jen", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kyak", + "depth": 8, "iso_1_code": null, "iso_3_code": "bka", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7389", "native_tokenizers": [], @@ -27134,9 +31266,11 @@ }, { "name": "Burak", + "depth": 8, "iso_1_code": null, "iso_3_code": "bys", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7390", "native_tokenizers": [], @@ -27144,9 +31278,11 @@ }, { "name": "M\u00e1ghd\u00ec", + "depth": 8, "iso_1_code": null, "iso_3_code": "gmd", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7391", "native_tokenizers": [], @@ -27154,9 +31290,11 @@ }, { "name": "Moo", + "depth": 8, "iso_1_code": null, "iso_3_code": "gwg", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7392", "native_tokenizers": [], @@ -27164,9 +31302,11 @@ }, { "name": "Dza", + "depth": 8, "iso_1_code": null, "iso_3_code": "jen", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7393", "native_tokenizers": [], @@ -27174,9 +31314,11 @@ }, { "name": "Leelau", + "depth": 8, "iso_1_code": null, "iso_3_code": "ldk", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7394", "native_tokenizers": [], @@ -27184,9 +31326,11 @@ }, { "name": "Loo", + "depth": 8, "iso_1_code": null, "iso_3_code": "ldo", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7395", "native_tokenizers": [], @@ -27194,9 +31338,11 @@ }, { "name": "Mingang Doso", + "depth": 8, "iso_1_code": null, "iso_3_code": "mko", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7396", "native_tokenizers": [], @@ -27204,9 +31350,11 @@ }, { "name": "Mak", + "depth": 8, "iso_1_code": null, "iso_3_code": "pbl", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7397", "native_tokenizers": [], @@ -27214,15 +31362,18 @@ }, { "name": "Tha", + "depth": 8, "iso_1_code": null, "iso_3_code": "thy", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7398", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7388", "native_tokenizers": [], @@ -27230,20 +31381,24 @@ }, { "name": "Longuda", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Longuda", + "depth": 8, "iso_1_code": null, "iso_3_code": "lnu", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7400", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7399", "native_tokenizers": [], @@ -27251,19 +31406,23 @@ }, { "name": "Waja", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Awak", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Awak", + "depth": 9, "iso_1_code": null, "iso_3_code": "awo", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7403", "native_tokenizers": [], @@ -27271,15 +31430,18 @@ }, { "name": "Kamo", + "depth": 9, "iso_1_code": null, "iso_3_code": "kcq", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7404", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7402", "native_tokenizers": [], @@ -27287,14 +31449,17 @@ }, { "name": "Cham-Mona", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Cham", + "depth": 9, "iso_1_code": null, "iso_3_code": "cfa", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7406", "native_tokenizers": [], @@ -27302,15 +31467,18 @@ }, { "name": "Tso", + "depth": 9, "iso_1_code": null, "iso_3_code": "ldp", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7407", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7405", "native_tokenizers": [], @@ -27318,20 +31486,24 @@ }, { "name": "Dadiya", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dadiya", + "depth": 9, "iso_1_code": null, "iso_3_code": "dbd", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7409", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7408", "native_tokenizers": [], @@ -27339,14 +31511,17 @@ }, { "name": "Tula", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bangwinji", + "depth": 9, "iso_1_code": null, "iso_3_code": "bsj", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7411", "native_tokenizers": [], @@ -27354,9 +31529,11 @@ }, { "name": "Tula", + "depth": 9, "iso_1_code": null, "iso_3_code": "tul", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -27374,15 +31551,18 @@ }, { "name": "Waja", + "depth": 9, "iso_1_code": null, "iso_3_code": "wja", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7413", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -27397,6 +31577,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -27412,25 +31593,30 @@ }, { "name": "Yungur", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Libo", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kaan", + "depth": 9, "iso_1_code": null, "iso_3_code": "ldl", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7416", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7415", "native_tokenizers": [], @@ -27438,20 +31624,24 @@ }, { "name": "Mboi", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mboi", + "depth": 9, "iso_1_code": null, "iso_3_code": "moi", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7418", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7417", "native_tokenizers": [], @@ -27459,14 +31649,17 @@ }, { "name": "Yungur-Roba", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Lala-Roba", + "depth": 9, "iso_1_code": null, "iso_3_code": "lla", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7420", "native_tokenizers": [], @@ -27474,9 +31667,11 @@ }, { "name": "Voro", + "depth": 9, "iso_1_code": null, "iso_3_code": "vor", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7421", "native_tokenizers": [], @@ -27484,27 +31679,32 @@ }, { "name": "Bena", + "depth": 9, "iso_1_code": null, "iso_3_code": "yun", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7422", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7419", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7414", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -27519,6 +31719,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -27534,40 +31735,48 @@ }, { "name": "Ubangi", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Banda", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Central", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Central Core", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Banda-Bambari", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Banda-Bambari", + "depth": 10, "iso_1_code": null, "iso_3_code": "liy", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7428", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7427", "native_tokenizers": [], @@ -27575,20 +31784,24 @@ }, { "name": "Banda-Banda", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Banda-Banda", + "depth": 10, "iso_1_code": null, "iso_3_code": "bpd", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7430", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7429", "native_tokenizers": [], @@ -27596,20 +31809,24 @@ }, { "name": "Banda-Mbres", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Banda-Mbr\u00e8s", + "depth": 10, "iso_1_code": null, "iso_3_code": "bqk", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7432", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7431", "native_tokenizers": [], @@ -27617,20 +31834,24 @@ }, { "name": "Banda-Ndele", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Banda-Nd\u00e9l\u00e9", + "depth": 10, "iso_1_code": null, "iso_3_code": "bfl", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7434", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7433", "native_tokenizers": [], @@ -27638,14 +31859,17 @@ }, { "name": "Mid-Southern", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Banda, Mid-Southern", + "depth": 10, "iso_1_code": null, "iso_3_code": "bjo", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7436", "native_tokenizers": [], @@ -27653,9 +31877,11 @@ }, { "name": "Gobu", + "depth": 10, "iso_1_code": null, "iso_3_code": "gox", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7437", "native_tokenizers": [], @@ -27663,9 +31889,11 @@ }, { "name": "Kpagua", + "depth": 10, "iso_1_code": null, "iso_3_code": "kuw", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7438", "native_tokenizers": [], @@ -27673,9 +31901,11 @@ }, { "name": "Mono", + "depth": 10, "iso_1_code": null, "iso_3_code": "mnh", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7439", "native_tokenizers": [], @@ -27683,15 +31913,18 @@ }, { "name": "Ngundu", + "depth": 10, "iso_1_code": null, "iso_3_code": "nue", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7440", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7435", "native_tokenizers": [], @@ -27699,26 +31932,31 @@ }, { "name": "Togbo-Vara", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Banda, Togbo-Vara", + "depth": 10, "iso_1_code": null, "iso_3_code": "tor", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7442", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7441", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7426", "native_tokenizers": [], @@ -27726,26 +31964,31 @@ }, { "name": "Western", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Banda-Yangere", + "depth": 9, "iso_1_code": null, "iso_3_code": "yaj", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7444", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7443", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7425", "native_tokenizers": [], @@ -27753,14 +31996,17 @@ }, { "name": "South Central", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Langbashe", + "depth": 8, "iso_1_code": null, "iso_3_code": "lna", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7446", "native_tokenizers": [], @@ -27768,15 +32014,18 @@ }, { "name": "Banda, South Central", + "depth": 8, "iso_1_code": null, "iso_3_code": "lnl", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7447", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7445", "native_tokenizers": [], @@ -27784,20 +32033,24 @@ }, { "name": "Southern", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mbandja", + "depth": 8, "iso_1_code": null, "iso_3_code": "zmz", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7449", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7448", "native_tokenizers": [], @@ -27805,20 +32058,24 @@ }, { "name": "Southwestern", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ngbundu", + "depth": 8, "iso_1_code": null, "iso_3_code": "nuu", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7451", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7450", "native_tokenizers": [], @@ -27826,26 +32083,31 @@ }, { "name": "West Central", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Banda, West Central", + "depth": 8, "iso_1_code": null, "iso_3_code": "bbp", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7453", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7452", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7424", "native_tokenizers": [], @@ -27853,14 +32115,17 @@ }, { "name": "Gbaya-Manza-Ngbaka", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Suma", + "depth": 7, "iso_1_code": null, "iso_3_code": "sqm", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7455", "native_tokenizers": [], @@ -27868,14 +32133,17 @@ }, { "name": "Central", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bhogoto", + "depth": 8, "iso_1_code": null, "iso_3_code": "bdt", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7457", "native_tokenizers": [], @@ -27883,9 +32151,11 @@ }, { "name": "Gbaya-Bossangoa", + "depth": 8, "iso_1_code": null, "iso_3_code": "gbp", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7458", "native_tokenizers": [], @@ -27893,9 +32163,11 @@ }, { "name": "Gbaya-Bozoum", + "depth": 8, "iso_1_code": null, "iso_3_code": "gbq", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7459", "native_tokenizers": [], @@ -27903,15 +32175,18 @@ }, { "name": "Gbanu", + "depth": 8, "iso_1_code": null, "iso_3_code": "gbv", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7460", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7456", "native_tokenizers": [], @@ -27919,14 +32194,17 @@ }, { "name": "East", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ali", + "depth": 8, "iso_1_code": null, "iso_3_code": "aiy", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7462", "native_tokenizers": [], @@ -27934,9 +32212,11 @@ }, { "name": "Bofi", + "depth": 8, "iso_1_code": null, "iso_3_code": "bff", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7463", "native_tokenizers": [], @@ -27944,9 +32224,11 @@ }, { "name": "Mandja", + "depth": 8, "iso_1_code": null, "iso_3_code": "mzv", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7464", "native_tokenizers": [], @@ -27954,9 +32236,11 @@ }, { "name": "Ngbaka", + "depth": 8, "iso_1_code": null, "iso_3_code": "nga", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7465", "native_tokenizers": [], @@ -27964,15 +32248,18 @@ }, { "name": "Ngbaka Manza", + "depth": 8, "iso_1_code": null, "iso_3_code": "ngg", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7466", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7461", "native_tokenizers": [], @@ -27980,14 +32267,17 @@ }, { "name": "Northwest", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Gbaya, Northwest", + "depth": 8, "iso_1_code": null, "iso_3_code": "gya", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -28004,6 +32294,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -28019,14 +32310,17 @@ }, { "name": "Southwest", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bangandu", + "depth": 8, "iso_1_code": null, "iso_3_code": "bgf", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7470", "native_tokenizers": [], @@ -28034,9 +32328,11 @@ }, { "name": "Gbaya-Mbodomo", + "depth": 8, "iso_1_code": null, "iso_3_code": "gmm", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7471", "native_tokenizers": [], @@ -28044,9 +32340,11 @@ }, { "name": "Gbaya, Southwest", + "depth": 8, "iso_1_code": null, "iso_3_code": "gso", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -28064,15 +32362,18 @@ }, { "name": "Ngombe", + "depth": 8, "iso_1_code": null, "iso_3_code": "nmj", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7473", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -28087,6 +32388,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -28102,14 +32404,17 @@ }, { "name": "Ngbandi", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dendi", + "depth": 7, "iso_1_code": null, "iso_3_code": "deq", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7475", "native_tokenizers": [], @@ -28117,9 +32422,11 @@ }, { "name": "Gbayi", + "depth": 7, "iso_1_code": null, "iso_3_code": "gyg", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7476", "native_tokenizers": [], @@ -28127,9 +32434,11 @@ }, { "name": "Mbangi", + "depth": 7, "iso_1_code": null, "iso_3_code": "mgn", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7477", "native_tokenizers": [], @@ -28137,9 +32446,11 @@ }, { "name": "Ngbandi, Southern", + "depth": 7, "iso_1_code": null, "iso_3_code": "nbw", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7478", "native_tokenizers": [], @@ -28147,9 +32458,11 @@ }, { "name": "Ngbandi, Northern", + "depth": 7, "iso_1_code": null, "iso_3_code": "ngb", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -28167,15 +32480,18 @@ }, { "name": "Yakoma", + "depth": 7, "iso_1_code": null, "iso_3_code": "yky", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7480", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -28191,24 +32507,29 @@ }, { "name": "Sere-Ngbaka-Mba", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ngbaka-Mba", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mba", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dongo", + "depth": 9, "iso_1_code": null, "iso_3_code": "doo", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7484", "native_tokenizers": [], @@ -28216,9 +32537,11 @@ }, { "name": "Mba", + "depth": 9, "iso_1_code": null, "iso_3_code": "mfc", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7485", "native_tokenizers": [], @@ -28226,9 +32549,11 @@ }, { "name": "Ma", + "depth": 9, "iso_1_code": null, "iso_3_code": "msj", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7486", "native_tokenizers": [], @@ -28236,15 +32561,18 @@ }, { "name": "Ndunga", + "depth": 9, "iso_1_code": null, "iso_3_code": "ndt", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7487", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7483", "native_tokenizers": [], @@ -28252,24 +32580,29 @@ }, { "name": "Ngbaka", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Eastern", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mayogo-Bangba", + "depth": 10, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bangba", + "depth": 11, "iso_1_code": null, "iso_3_code": "bbe", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7491", "native_tokenizers": [], @@ -28277,15 +32610,18 @@ }, { "name": "Mayogo", + "depth": 11, "iso_1_code": null, "iso_3_code": "mdm", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7492", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7490", "native_tokenizers": [], @@ -28293,14 +32629,17 @@ }, { "name": "Mundu", + "depth": 10, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "M\u00fcnd\u00fc", + "depth": 11, "iso_1_code": null, "iso_3_code": "muh", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -28317,6 +32656,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -28331,6 +32671,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -28346,19 +32687,23 @@ }, { "name": "Western", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Baka-Gundi", + "depth": 10, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Baka", + "depth": 11, "iso_1_code": null, "iso_3_code": "bkc", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7497", "native_tokenizers": [], @@ -28366,9 +32711,11 @@ }, { "name": "Limassa", + "depth": 11, "iso_1_code": null, "iso_3_code": "bme", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7498", "native_tokenizers": [], @@ -28376,9 +32723,11 @@ }, { "name": "Gundi", + "depth": 11, "iso_1_code": null, "iso_3_code": "gdi", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7499", "native_tokenizers": [], @@ -28386,15 +32735,18 @@ }, { "name": "Ganzi", + "depth": 11, "iso_1_code": null, "iso_3_code": "gnz", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7500", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7496", "native_tokenizers": [], @@ -28402,14 +32754,17 @@ }, { "name": "Bwaka", + "depth": 10, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Gilima", + "depth": 11, "iso_1_code": null, "iso_3_code": "gix", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7502", "native_tokenizers": [], @@ -28417,15 +32772,18 @@ }, { "name": "Ngbaka Ma\u2019bo", + "depth": 11, "iso_1_code": null, "iso_3_code": "nbm", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7503", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7501", "native_tokenizers": [], @@ -28433,14 +32791,17 @@ }, { "name": "Gbanzili", + "depth": 10, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Buraka", + "depth": 11, "iso_1_code": null, "iso_3_code": "bkg", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7505", "native_tokenizers": [], @@ -28448,15 +32809,18 @@ }, { "name": "Gbanziri", + "depth": 11, "iso_1_code": null, "iso_3_code": "gbg", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7506", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7504", "native_tokenizers": [], @@ -28464,14 +32828,17 @@ }, { "name": "Monzombo", + "depth": 10, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kpala", + "depth": 11, "iso_1_code": null, "iso_3_code": "kpl", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7508", "native_tokenizers": [], @@ -28479,9 +32846,11 @@ }, { "name": "Monzombo", + "depth": 11, "iso_1_code": null, "iso_3_code": "moj", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7509", "native_tokenizers": [], @@ -28489,27 +32858,32 @@ }, { "name": "Yango", + "depth": 11, "iso_1_code": null, "iso_3_code": "yng", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7510", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7507", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7495", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -28524,6 +32898,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -28539,19 +32914,23 @@ }, { "name": "Sere", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Feroge-Mangaya", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Feroge", + "depth": 9, "iso_1_code": null, "iso_3_code": "fer", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7513", "native_tokenizers": [], @@ -28559,15 +32938,18 @@ }, { "name": "Mangayat", + "depth": 9, "iso_1_code": null, "iso_3_code": "myj", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7514", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7512", "native_tokenizers": [], @@ -28575,14 +32957,17 @@ }, { "name": "Indri-Togoyo", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Indri", + "depth": 9, "iso_1_code": null, "iso_3_code": "idr", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7516", "native_tokenizers": [], @@ -28590,15 +32975,18 @@ }, { "name": "Togoyo", + "depth": 9, "iso_1_code": null, "iso_3_code": "tgy", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7517", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7515", "native_tokenizers": [], @@ -28606,19 +32994,23 @@ }, { "name": "Sere-Bviri", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bai-Viri", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bai", + "depth": 10, "iso_1_code": null, "iso_3_code": "bdj", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7520", "native_tokenizers": [], @@ -28626,15 +33018,18 @@ }, { "name": "Belanda Viri", + "depth": 10, "iso_1_code": null, "iso_3_code": "bvi", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7521", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7519", "native_tokenizers": [], @@ -28642,14 +33037,17 @@ }, { "name": "Ndogo-Sere", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ndogo", + "depth": 10, "iso_1_code": null, "iso_3_code": "ndz", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -28667,9 +33065,11 @@ }, { "name": "Sere", + "depth": 10, "iso_1_code": null, "iso_3_code": "swf", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7524", "native_tokenizers": [], @@ -28677,15 +33077,18 @@ }, { "name": "Tagbu", + "depth": 10, "iso_1_code": null, "iso_3_code": "tbm", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7525", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -28700,6 +33103,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -28714,6 +33118,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -28728,6 +33133,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -28743,19 +33149,23 @@ }, { "name": "Zande", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Barambo-Pambia", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Barambu", + "depth": 8, "iso_1_code": null, "iso_3_code": "brm", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7528", "native_tokenizers": [], @@ -28763,15 +33173,18 @@ }, { "name": "Pambia", + "depth": 8, "iso_1_code": null, "iso_3_code": "pmb", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7529", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7527", "native_tokenizers": [], @@ -28779,14 +33192,17 @@ }, { "name": "Zande-Nzakara", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Geme", + "depth": 8, "iso_1_code": null, "iso_3_code": "geq", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7531", "native_tokenizers": [], @@ -28794,9 +33210,11 @@ }, { "name": "Kpatili", + "depth": 8, "iso_1_code": null, "iso_3_code": "kym", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7532", "native_tokenizers": [], @@ -28804,9 +33222,11 @@ }, { "name": "Nzakara", + "depth": 8, "iso_1_code": null, "iso_3_code": "nzk", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7533", "native_tokenizers": [], @@ -28814,9 +33234,11 @@ }, { "name": "Zande", + "depth": 8, "iso_1_code": null, "iso_3_code": "zne", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -28833,6 +33255,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -28847,6 +33270,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -28861,6 +33285,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -28875,6 +33300,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -28890,19 +33316,23 @@ }, { "name": "Gur", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bariba", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Baatonum", + "depth": 6, "iso_1_code": null, "iso_3_code": "bba", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -28919,6 +33349,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -28934,24 +33365,29 @@ }, { "name": "Central", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Northern", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bwamu", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bomu", + "depth": 8, "iso_1_code": null, "iso_3_code": "bmq", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -28969,9 +33405,11 @@ }, { "name": "Buamu", + "depth": 8, "iso_1_code": null, "iso_3_code": "box", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -28989,9 +33427,11 @@ }, { "name": "Bwamu, L\u00e1\u00e1 L\u00e1\u00e1", + "depth": 8, "iso_1_code": null, "iso_3_code": "bwj", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7543", "native_tokenizers": [], @@ -28999,15 +33439,18 @@ }, { "name": "Bwamu, Cwi", + "depth": 8, "iso_1_code": null, "iso_3_code": "bwy", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7544", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -29023,20 +33466,24 @@ }, { "name": "Kurumfe", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Koromf\u00e9", + "depth": 8, "iso_1_code": null, "iso_3_code": "kfz", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7546", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7545", "native_tokenizers": [], @@ -29044,19 +33491,23 @@ }, { "name": "Oti-Volta", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Buli-Koma", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Buli", + "depth": 9, "iso_1_code": null, "iso_3_code": "bwu", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -29074,9 +33525,11 @@ }, { "name": "Konni", + "depth": 9, "iso_1_code": null, "iso_3_code": "kma", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -29093,6 +33546,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -29108,14 +33562,17 @@ }, { "name": "Eastern", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Biali", + "depth": 9, "iso_1_code": null, "iso_3_code": "beh", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7552", "native_tokenizers": [], @@ -29123,9 +33580,11 @@ }, { "name": "Mbelime", + "depth": 9, "iso_1_code": null, "iso_3_code": "mql", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7553", "native_tokenizers": [], @@ -29133,9 +33592,11 @@ }, { "name": "Ditammari", + "depth": 9, "iso_1_code": null, "iso_3_code": "tbz", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -29153,9 +33614,11 @@ }, { "name": "Waama", + "depth": 9, "iso_1_code": null, "iso_3_code": "wwa", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -29172,6 +33635,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -29187,14 +33651,17 @@ }, { "name": "Gurma", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ngangam", + "depth": 9, "iso_1_code": null, "iso_3_code": "gng", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -29212,9 +33679,11 @@ }, { "name": "Gourmanch\u00e9ma", + "depth": 9, "iso_1_code": null, "iso_3_code": "gux", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -29232,9 +33701,11 @@ }, { "name": "Nateni", + "depth": 9, "iso_1_code": null, "iso_3_code": "ntm", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7559", "native_tokenizers": [], @@ -29242,9 +33713,11 @@ }, { "name": "Miyobe", + "depth": 9, "iso_1_code": null, "iso_3_code": "soy", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -29262,9 +33735,11 @@ }, { "name": "Konkomba", + "depth": 9, "iso_1_code": null, "iso_3_code": "xon", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -29282,14 +33757,17 @@ }, { "name": "Moba", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bimoba", + "depth": 10, "iso_1_code": null, "iso_3_code": "bim", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -29307,9 +33785,11 @@ }, { "name": "Moba", + "depth": 10, "iso_1_code": null, "iso_3_code": "mfq", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -29326,6 +33806,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -29341,14 +33822,17 @@ }, { "name": "Ntcham", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Akaselem", + "depth": 10, "iso_1_code": null, "iso_3_code": "aks", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7566", "native_tokenizers": [], @@ -29356,9 +33840,11 @@ }, { "name": "Ntcham", + "depth": 10, "iso_1_code": null, "iso_3_code": "bud", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -29375,6 +33861,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -29389,6 +33876,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -29404,25 +33892,30 @@ }, { "name": "Western", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nootre", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Notre", + "depth": 10, "iso_1_code": null, "iso_3_code": "bly", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7570", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7569", "native_tokenizers": [], @@ -29430,14 +33923,17 @@ }, { "name": "Northwest", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Farefare", + "depth": 10, "iso_1_code": null, "iso_3_code": "gur", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -29455,9 +33951,11 @@ }, { "name": "Moore", + "depth": 10, "iso_1_code": null, "iso_3_code": "mos", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -29475,9 +33973,11 @@ }, { "name": "Safaliba", + "depth": 10, "iso_1_code": null, "iso_3_code": "saf", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7574", "native_tokenizers": [], @@ -29485,9 +33985,11 @@ }, { "name": "Wali", + "depth": 10, "iso_1_code": null, "iso_3_code": "wlx", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -29505,19 +34007,23 @@ }, { "name": "Dagaari-Birifor", + "depth": 10, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Birifor", + "depth": 11, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Birifor, Malba", + "depth": 12, "iso_1_code": null, "iso_3_code": "bfo", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -29535,9 +34041,11 @@ }, { "name": "Birifor, Southern", + "depth": 12, "iso_1_code": null, "iso_3_code": "biv", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -29554,6 +34062,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -29569,14 +34078,17 @@ }, { "name": "Dagaari", + "depth": 11, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dagaare, Southern", + "depth": 12, "iso_1_code": null, "iso_3_code": "dga", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -29594,9 +34106,11 @@ }, { "name": "Dagaari Dioula", + "depth": 12, "iso_1_code": null, "iso_3_code": "dgd", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7582", "native_tokenizers": [], @@ -29604,9 +34118,11 @@ }, { "name": "Dagara, Northern", + "depth": 12, "iso_1_code": null, "iso_3_code": "dgi", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -29623,6 +34139,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -29637,6 +34154,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -29651,6 +34169,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -29666,14 +34185,17 @@ }, { "name": "Southeast", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dagbani", + "depth": 10, "iso_1_code": null, "iso_3_code": "dag", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -29691,9 +34213,11 @@ }, { "name": "Hanga", + "depth": 10, "iso_1_code": null, "iso_3_code": "hag", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -29711,9 +34235,11 @@ }, { "name": "Kamara", + "depth": 10, "iso_1_code": null, "iso_3_code": "jmr", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7587", "native_tokenizers": [], @@ -29721,9 +34247,11 @@ }, { "name": "Kusaal", + "depth": 10, "iso_1_code": null, "iso_3_code": "kus", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -29741,9 +34269,11 @@ }, { "name": "Mampruli", + "depth": 10, "iso_1_code": null, "iso_3_code": "maw", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -29761,15 +34291,18 @@ }, { "name": "Kantosi", + "depth": 10, "iso_1_code": null, "iso_3_code": "xkt", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7590", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -29784,6 +34317,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -29799,14 +34333,17 @@ }, { "name": "Yom-Nawdm", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nawdm", + "depth": 9, "iso_1_code": null, "iso_3_code": "nmz", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -29824,15 +34361,18 @@ }, { "name": "Yom", + "depth": 9, "iso_1_code": null, "iso_3_code": "pil", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7593", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -29847,6 +34387,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -29861,6 +34402,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -29876,19 +34418,23 @@ }, { "name": "Southern", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dogoso-Khe", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dogoso", + "depth": 8, "iso_1_code": null, "iso_3_code": "dgs", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7596", "native_tokenizers": [], @@ -29896,15 +34442,18 @@ }, { "name": "Khe", + "depth": 8, "iso_1_code": null, "iso_3_code": "kqg", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7597", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7595", "native_tokenizers": [], @@ -29912,20 +34461,24 @@ }, { "name": "Dyan", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dyan", + "depth": 8, "iso_1_code": null, "iso_3_code": "dya", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7599", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7598", "native_tokenizers": [], @@ -29933,14 +34486,17 @@ }, { "name": "Gan-Dogose", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dogos\u00e9", + "depth": 8, "iso_1_code": null, "iso_3_code": "dos", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -29958,9 +34514,11 @@ }, { "name": "Kaansa", + "depth": 8, "iso_1_code": null, "iso_3_code": "gna", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -29978,15 +34536,18 @@ }, { "name": "Khisa", + "depth": 8, "iso_1_code": null, "iso_3_code": "kqm", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7603", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -30002,19 +34563,23 @@ }, { "name": "Grusi", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Eastern", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bago-Kusuntu", + "depth": 9, "iso_1_code": null, "iso_3_code": "bqg", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7606", "native_tokenizers": [], @@ -30022,9 +34587,11 @@ }, { "name": "Chala", + "depth": 9, "iso_1_code": null, "iso_3_code": "cll", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7607", "native_tokenizers": [], @@ -30032,9 +34599,11 @@ }, { "name": "Lukpa", + "depth": 9, "iso_1_code": null, "iso_3_code": "dop", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -30052,9 +34621,11 @@ }, { "name": "Kabiy\u00e8", + "depth": 9, "iso_1_code": null, "iso_3_code": "kbp", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -30072,9 +34643,11 @@ }, { "name": "Tem", + "depth": 9, "iso_1_code": null, "iso_3_code": "kdh", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -30092,9 +34665,11 @@ }, { "name": "Lama", + "depth": 9, "iso_1_code": null, "iso_3_code": "las", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -30112,9 +34687,11 @@ }, { "name": "Delo", + "depth": 9, "iso_1_code": null, "iso_3_code": "ntr", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -30131,6 +34708,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -30146,14 +34724,17 @@ }, { "name": "Northern", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kalams\u00e9", + "depth": 9, "iso_1_code": null, "iso_3_code": "knz", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7614", "native_tokenizers": [], @@ -30161,9 +34742,11 @@ }, { "name": "Ly\u00e9l\u00e9", + "depth": 9, "iso_1_code": null, "iso_3_code": "lee", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -30181,9 +34764,11 @@ }, { "name": "Nuni, Southern", + "depth": 9, "iso_1_code": null, "iso_3_code": "nnw", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -30201,9 +34786,11 @@ }, { "name": "Nuni, Northern", + "depth": 9, "iso_1_code": null, "iso_3_code": "nuv", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7617", "native_tokenizers": [], @@ -30211,9 +34798,11 @@ }, { "name": "Pana", + "depth": 9, "iso_1_code": null, "iso_3_code": "pnq", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7618", "native_tokenizers": [], @@ -30221,9 +34810,11 @@ }, { "name": "Kasem", + "depth": 9, "iso_1_code": null, "iso_3_code": "xsm", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -30240,6 +34831,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -30255,14 +34847,17 @@ }, { "name": "Western", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chakali", + "depth": 9, "iso_1_code": null, "iso_3_code": "cli", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7621", "native_tokenizers": [], @@ -30270,9 +34865,11 @@ }, { "name": "Winy\u00e9", + "depth": 9, "iso_1_code": null, "iso_3_code": "kst", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7622", "native_tokenizers": [], @@ -30280,9 +34877,11 @@ }, { "name": "Deg", + "depth": 9, "iso_1_code": null, "iso_3_code": "mzw", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -30300,9 +34899,11 @@ }, { "name": "Phuie", + "depth": 9, "iso_1_code": null, "iso_3_code": "pug", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7624", "native_tokenizers": [], @@ -30310,9 +34911,11 @@ }, { "name": "Paasaal", + "depth": 9, "iso_1_code": null, "iso_3_code": "sig", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -30330,9 +34933,11 @@ }, { "name": "Sisaala, Tumulung", + "depth": 9, "iso_1_code": null, "iso_3_code": "sil", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -30350,9 +34955,11 @@ }, { "name": "Sissala", + "depth": 9, "iso_1_code": null, "iso_3_code": "sld", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -30370,9 +34977,11 @@ }, { "name": "Sisaala, Western", + "depth": 9, "iso_1_code": null, "iso_3_code": "ssl", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7628", "native_tokenizers": [], @@ -30380,9 +34989,11 @@ }, { "name": "Tampulma", + "depth": 9, "iso_1_code": null, "iso_3_code": "tpm", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -30400,9 +35011,11 @@ }, { "name": "Vagla", + "depth": 9, "iso_1_code": null, "iso_3_code": "vag", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -30419,6 +35032,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -30433,6 +35047,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -30448,14 +35063,17 @@ }, { "name": "Kirma-Tyurama", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Cerma", + "depth": 8, "iso_1_code": null, "iso_3_code": "cme", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -30473,15 +35091,18 @@ }, { "name": "Turka", + "depth": 8, "iso_1_code": null, "iso_3_code": "tuz", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7633", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -30496,6 +35117,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -30510,6 +35132,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -30525,14 +35148,17 @@ }, { "name": "Kulango", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kulango, Bondoukou", + "depth": 6, "iso_1_code": null, "iso_3_code": "kzc", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7635", "native_tokenizers": [], @@ -30540,15 +35166,18 @@ }, { "name": "Kulango, Bouna", + "depth": 6, "iso_1_code": null, "iso_3_code": "nku", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7636", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7634", "native_tokenizers": [], @@ -30556,14 +35185,17 @@ }, { "name": "Lobi", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Lobi", + "depth": 6, "iso_1_code": null, "iso_3_code": "lob", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -30580,6 +35212,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -30595,19 +35228,23 @@ }, { "name": "Senufo", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Karaboro", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Karaboro, Western", + "depth": 7, "iso_1_code": null, "iso_3_code": "kza", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7641", "native_tokenizers": [], @@ -30615,9 +35252,11 @@ }, { "name": "Karaboro, Eastern", + "depth": 7, "iso_1_code": null, "iso_3_code": "xrb", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -30634,6 +35273,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -30649,20 +35289,24 @@ }, { "name": "Kpalaga", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "S\u00e9noufo, Palaka", + "depth": 7, "iso_1_code": null, "iso_3_code": "plr", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7644", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7643", "native_tokenizers": [], @@ -30670,14 +35314,17 @@ }, { "name": "Nafaanra", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nafaanra", + "depth": 7, "iso_1_code": null, "iso_3_code": "nfr", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -30694,6 +35341,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -30709,14 +35357,17 @@ }, { "name": "Senari", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "S\u00e9noufo, Cebaara", + "depth": 7, "iso_1_code": null, "iso_3_code": "sef", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7648", "native_tokenizers": [], @@ -30724,9 +35375,11 @@ }, { "name": "S\u00e9noufo, Senara", + "depth": 7, "iso_1_code": null, "iso_3_code": "seq", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7649", "native_tokenizers": [], @@ -30734,15 +35387,18 @@ }, { "name": "S\u00e9noufo, Syenara", + "depth": 7, "iso_1_code": null, "iso_3_code": "shz", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7650", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7647", "native_tokenizers": [], @@ -30750,14 +35406,17 @@ }, { "name": "Suppire-Mamara", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "S\u00e9noufo, Mamara", + "depth": 7, "iso_1_code": null, "iso_3_code": "myk", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -30775,9 +35434,11 @@ }, { "name": "S\u00e9noufo, Shempire", + "depth": 7, "iso_1_code": null, "iso_3_code": "seb", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7653", "native_tokenizers": [], @@ -30785,9 +35446,11 @@ }, { "name": "S\u00e9noufo, Nanerig\u00e9", + "depth": 7, "iso_1_code": null, "iso_3_code": "sen", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7654", "native_tokenizers": [], @@ -30795,9 +35458,11 @@ }, { "name": "S\u00e9noufo, S\u00ecc\u00ect\u00e9", + "depth": 7, "iso_1_code": null, "iso_3_code": "sep", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7655", "native_tokenizers": [], @@ -30805,9 +35470,11 @@ }, { "name": "S\u00e9noufo, Supyire", + "depth": 7, "iso_1_code": null, "iso_3_code": "spp", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -30824,6 +35491,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -30839,14 +35507,17 @@ }, { "name": "Tagwana-Djimini", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "S\u00e9noufo, Djimini", + "depth": 7, "iso_1_code": null, "iso_3_code": "dyi", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -30864,9 +35535,11 @@ }, { "name": "S\u00e9noufo, Nyarafolo", + "depth": 7, "iso_1_code": null, "iso_3_code": "sev", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7659", "native_tokenizers": [], @@ -30874,15 +35547,18 @@ }, { "name": "S\u00e9noufo, Tagwana", + "depth": 7, "iso_1_code": null, "iso_3_code": "tgw", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7660", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -30897,6 +35573,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -30912,14 +35589,17 @@ }, { "name": "Teen", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Loma", + "depth": 6, "iso_1_code": null, "iso_3_code": "loi", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7662", "native_tokenizers": [], @@ -30927,15 +35607,18 @@ }, { "name": "T\u00e9\u00e9n", + "depth": 6, "iso_1_code": null, "iso_3_code": "lor", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7663", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7661", "native_tokenizers": [], @@ -30943,20 +35626,24 @@ }, { "name": "Tiefo", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ti\u00e9fo", + "depth": 6, "iso_1_code": null, "iso_3_code": "tiq", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7665", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7664", "native_tokenizers": [], @@ -30964,14 +35651,17 @@ }, { "name": "Tusia", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Toussian, Northern", + "depth": 6, "iso_1_code": null, "iso_3_code": "tsp", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7667", "native_tokenizers": [], @@ -30979,9 +35669,11 @@ }, { "name": "Toussian, Southern", + "depth": 6, "iso_1_code": null, "iso_3_code": "wib", "children": [], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -30998,6 +35690,7 @@ ] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -31013,20 +35706,24 @@ }, { "name": "Viemo", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Viemo", + "depth": 6, "iso_1_code": null, "iso_3_code": "vig", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7670", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7669", "native_tokenizers": [], @@ -31034,14 +35731,17 @@ }, { "name": "Wara-Natioro", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Natioro", + "depth": 6, "iso_1_code": null, "iso_3_code": "nti", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7672", "native_tokenizers": [], @@ -31049,9 +35749,11 @@ }, { "name": "Paleni", + "depth": 6, "iso_1_code": null, "iso_3_code": "pnl", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7673", "native_tokenizers": [], @@ -31059,21 +35761,25 @@ }, { "name": "Wara", + "depth": 6, "iso_1_code": null, "iso_3_code": "wbf", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7674", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7671", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -31088,6 +35794,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -31102,6 +35809,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -31116,6 +35824,7 @@ "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tn\")", @@ -31131,24 +35840,29 @@ }, { "name": "Kordofanian", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Heiban", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Eastern", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ko", + "depth": 4, "iso_1_code": null, "iso_3_code": "fuj", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7678", "native_tokenizers": [], @@ -31156,15 +35870,18 @@ }, { "name": "Warnang", + "depth": 4, "iso_1_code": null, "iso_3_code": "wrn", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7679", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7677", "native_tokenizers": [], @@ -31172,29 +35889,35 @@ }, { "name": "West-Central", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Central", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ebang-Logol", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ebang-Laru", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Heiban", + "depth": 7, "iso_1_code": null, "iso_3_code": "hbn", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7684", "native_tokenizers": [], @@ -31202,15 +35925,18 @@ }, { "name": "Laro", + "depth": 7, "iso_1_code": null, "iso_3_code": "lro", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7685", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7683", "native_tokenizers": [], @@ -31218,20 +35944,24 @@ }, { "name": "Logol", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Logol", + "depth": 7, "iso_1_code": null, "iso_3_code": "lof", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7687", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7686", "native_tokenizers": [], @@ -31239,26 +35969,31 @@ }, { "name": "Utoro", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Otoro", + "depth": 7, "iso_1_code": null, "iso_3_code": "otr", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7689", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7688", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7682", "native_tokenizers": [], @@ -31266,26 +36001,31 @@ }, { "name": "Rere", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Koalib", + "depth": 6, "iso_1_code": null, "iso_3_code": "kib", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7691", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7690", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7681", "native_tokenizers": [], @@ -31293,20 +36033,24 @@ }, { "name": "Shirumba", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Shwai", + "depth": 5, "iso_1_code": null, "iso_3_code": "shw", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7693", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7692", "native_tokenizers": [], @@ -31314,23 +36058,18 @@ }, { "name": "Western", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Moro", + "depth": 5, "iso_1_code": null, "iso_3_code": "mor", "children": [], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Niger-Congo", + "tokenizers": {}, "node_i": "7695", "native_tokenizers": [], "scripts": [ @@ -31339,66 +36078,50 @@ }, { "name": "Tira", + "depth": 5, "iso_1_code": null, "iso_3_code": "tic", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7696", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Niger-Congo", + "tokenizers": {}, "node_i": "7694", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Niger-Congo", + "tokenizers": {}, "node_i": "7680", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Niger-Congo", + "tokenizers": {}, "node_i": "7676", "native_tokenizers": [], "scripts": [] }, { "name": "Katla", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Katla", + "depth": 3, "iso_1_code": null, "iso_3_code": "kcr", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7698", "native_tokenizers": [], @@ -31406,15 +36129,18 @@ }, { "name": "Tima", + "depth": 3, "iso_1_code": null, "iso_3_code": "tms", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7699", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7697", "native_tokenizers": [], @@ -31422,14 +36148,17 @@ }, { "name": "Rashad", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tegali", + "depth": 3, "iso_1_code": null, "iso_3_code": "ras", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7701", "native_tokenizers": [], @@ -31437,15 +36166,18 @@ }, { "name": "Tagoi", + "depth": 3, "iso_1_code": null, "iso_3_code": "tag", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7702", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7700", "native_tokenizers": [], @@ -31453,30 +36185,36 @@ }, { "name": "Talodi", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Talodi Proper", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Jomang", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Talodi", + "depth": 5, "iso_1_code": null, "iso_3_code": "tlo", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7706", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7705", "native_tokenizers": [], @@ -31484,20 +36222,24 @@ }, { "name": "Nding", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nding", + "depth": 5, "iso_1_code": null, "iso_3_code": "eli", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7708", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7707", "native_tokenizers": [], @@ -31505,14 +36247,17 @@ }, { "name": "Ngile-Dengebu", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dagik", + "depth": 5, "iso_1_code": null, "iso_3_code": "dec", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7710", "native_tokenizers": [], @@ -31520,15 +36265,18 @@ }, { "name": "Ngile", + "depth": 5, "iso_1_code": null, "iso_3_code": "jle", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7711", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7709", "native_tokenizers": [], @@ -31536,14 +36284,17 @@ }, { "name": "Tocho", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Acheron", + "depth": 5, "iso_1_code": null, "iso_3_code": "acz", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7713", "native_tokenizers": [], @@ -31551,9 +36302,11 @@ }, { "name": "Lumun", + "depth": 5, "iso_1_code": null, "iso_3_code": "lmd", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7714", "native_tokenizers": [], @@ -31561,9 +36314,11 @@ }, { "name": "Tocho", + "depth": 5, "iso_1_code": null, "iso_3_code": "taz", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7715", "native_tokenizers": [], @@ -31571,21 +36326,25 @@ }, { "name": "Torona", + "depth": 5, "iso_1_code": null, "iso_3_code": "tqr", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7716", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7712", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7704", "native_tokenizers": [], @@ -31593,79 +36352,75 @@ }, { "name": "Tegem", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Lafofa", + "depth": 4, "iso_1_code": null, "iso_3_code": "laf", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7718", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7717", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7703", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Niger-Congo", + "tokenizers": {}, "node_i": "7675", "native_tokenizers": [], "scripts": [] }, { "name": "Mande", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Eastern", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Eastern", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bissa", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bisa", + "depth": 5, "iso_1_code": null, "iso_3_code": "bib", "children": [], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Niger-Congo", + "tokenizers": {}, "node_i": "7723", "native_tokenizers": [], "scripts": [ @@ -31673,38 +36428,26 @@ ] } ], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Niger-Congo", + "tokenizers": {}, "node_i": "7722", "native_tokenizers": [], "scripts": [] }, { "name": "Busa", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Boko", + "depth": 5, "iso_1_code": null, "iso_3_code": "bqc", "children": [], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Niger-Congo", + "tokenizers": {}, "node_i": "7725", "native_tokenizers": [], "scripts": [ @@ -31713,18 +36456,12 @@ }, { "name": "Bis\u00e3", + "depth": 5, "iso_1_code": null, "iso_3_code": "bqp", "children": [], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Niger-Congo", + "tokenizers": {}, "node_i": "7726", "native_tokenizers": [], "scripts": [ @@ -31733,18 +36470,12 @@ }, { "name": "Bokobaru", + "depth": 5, "iso_1_code": null, "iso_3_code": "bus", "children": [], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Niger-Congo", + "tokenizers": {}, "node_i": "7727", "native_tokenizers": [], "scripts": [ @@ -31752,29 +36483,25 @@ ] } ], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Niger-Congo", + "tokenizers": {}, "node_i": "7724", "native_tokenizers": [], "scripts": [] }, { "name": "Kyanga", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Shanga", + "depth": 5, "iso_1_code": null, "iso_3_code": "sho", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7729", "native_tokenizers": [], @@ -31782,15 +36509,18 @@ }, { "name": "Kyanga", + "depth": 5, "iso_1_code": null, "iso_3_code": "tye", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7730", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7728", "native_tokenizers": [], @@ -31798,23 +36528,18 @@ }, { "name": "Samo", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Samo, Southern", + "depth": 5, "iso_1_code": null, "iso_3_code": "sbd", "children": [], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Niger-Congo", + "tokenizers": {}, "node_i": "7732", "native_tokenizers": [], "scripts": [ @@ -31823,9 +36548,11 @@ }, { "name": "Samo, Matya", + "depth": 5, "iso_1_code": null, "iso_3_code": "stj", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7733", "native_tokenizers": [], @@ -31833,52 +36560,43 @@ }, { "name": "Samo, Maya", + "depth": 5, "iso_1_code": null, "iso_3_code": "sym", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7734", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Niger-Congo", + "tokenizers": {}, "node_i": "7731", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Niger-Congo", + "tokenizers": {}, "node_i": "7721", "native_tokenizers": [], "scripts": [] }, { "name": "Southeastern", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Gbin", + "depth": 4, "iso_1_code": null, "iso_3_code": "xgb", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7736", "native_tokenizers": [], @@ -31886,28 +36604,24 @@ }, { "name": "Guro-Tura", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Guro-Yaoure", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Guro", + "depth": 6, "iso_1_code": null, "iso_3_code": "goa", "children": [], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Niger-Congo", + "tokenizers": {}, "node_i": "7739", "native_tokenizers": [], "scripts": [ @@ -31916,18 +36630,12 @@ }, { "name": "Yaour\u00e9", + "depth": 6, "iso_1_code": null, "iso_3_code": "yre", "children": [], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Niger-Congo", + "tokenizers": {}, "node_i": "7740", "native_tokenizers": [], "scripts": [ @@ -31935,43 +36643,32 @@ ] } ], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Niger-Congo", + "tokenizers": {}, "node_i": "7738", "native_tokenizers": [], "scripts": [] }, { "name": "Tura-Dan-Mano", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mano", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Maan", + "depth": 7, "iso_1_code": null, "iso_3_code": "mev", "children": [], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Niger-Congo", + "tokenizers": {}, "node_i": "7743", "native_tokenizers": [], "scripts": [ @@ -31979,38 +36676,26 @@ ] } ], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Niger-Congo", + "tokenizers": {}, "node_i": "7742", "native_tokenizers": [], "scripts": [] }, { "name": "Tura-Dan", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dan", + "depth": 7, "iso_1_code": null, "iso_3_code": "dnj", "children": [], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Niger-Congo", + "tokenizers": {}, "node_i": "7745", "native_tokenizers": [], "scripts": [ @@ -32019,9 +36704,11 @@ }, { "name": "Goo", + "depth": 7, "iso_1_code": null, "iso_3_code": "gov", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7746", "native_tokenizers": [], @@ -32029,9 +36716,11 @@ }, { "name": "Kla-Dan", + "depth": 7, "iso_1_code": null, "iso_3_code": "lda", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7747", "native_tokenizers": [], @@ -32039,18 +36728,12 @@ }, { "name": "Toura", + "depth": 7, "iso_1_code": null, "iso_3_code": "neb", "children": [], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Niger-Congo", + "tokenizers": {}, "node_i": "7748", "native_tokenizers": [], "scripts": [ @@ -32058,62 +36741,45 @@ ] } ], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Niger-Congo", + "tokenizers": {}, "node_i": "7744", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Niger-Congo", + "tokenizers": {}, "node_i": "7741", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Niger-Congo", + "tokenizers": {}, "node_i": "7737", "native_tokenizers": [], "scripts": [] }, { "name": "Nwa-Ben", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ben-Gban", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Gban", + "depth": 6, "iso_1_code": null, "iso_3_code": "ggu", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7751", "native_tokenizers": [], @@ -32121,9 +36787,11 @@ }, { "name": "Ngen", + "depth": 6, "iso_1_code": null, "iso_3_code": "gnj", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7752", "native_tokenizers": [], @@ -32131,15 +36799,18 @@ }, { "name": "Beng", + "depth": 6, "iso_1_code": null, "iso_3_code": "nhb", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7753", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7750", "native_tokenizers": [], @@ -32147,23 +36818,18 @@ }, { "name": "Wan-Mwan", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mwan", + "depth": 6, "iso_1_code": null, "iso_3_code": "moa", "children": [], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Niger-Congo", + "tokenizers": {}, "node_i": "7755", "native_tokenizers": [], "scripts": [ @@ -32172,100 +36838,81 @@ }, { "name": "Wan", + "depth": 6, "iso_1_code": null, "iso_3_code": "wan", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7756", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Niger-Congo", + "tokenizers": {}, "node_i": "7754", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Niger-Congo", + "tokenizers": {}, "node_i": "7749", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Niger-Congo", + "tokenizers": {}, "node_i": "7735", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Niger-Congo", + "tokenizers": {}, "node_i": "7720", "native_tokenizers": [], "scripts": [] }, { "name": "Western", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Central-Southwestern", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Central", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Manding-Jogo", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Jogo-Jeri", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Jeri Kuo", + "depth": 7, "iso_1_code": null, "iso_3_code": "jek", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7762", "native_tokenizers": [], @@ -32273,20 +36920,24 @@ }, { "name": "Jeri-Jalkuna", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Jalkunan", + "depth": 8, "iso_1_code": null, "iso_3_code": "bxl", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7764", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7763", "native_tokenizers": [], @@ -32294,14 +36945,17 @@ }, { "name": "Jogo", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ligbi", + "depth": 8, "iso_1_code": null, "iso_3_code": "lig", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7766", "native_tokenizers": [], @@ -32309,21 +36963,25 @@ }, { "name": "Tonjon", + "depth": 8, "iso_1_code": null, "iso_3_code": "tjn", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7767", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7765", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7761", "native_tokenizers": [], @@ -32331,24 +36989,29 @@ }, { "name": "Manding-Vai", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Manding-Mokole", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Manding", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bolon", + "depth": 9, "iso_1_code": null, "iso_3_code": "bof", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7771", "native_tokenizers": [], @@ -32356,9 +37019,11 @@ }, { "name": "Jahanka", + "depth": 9, "iso_1_code": null, "iso_3_code": "jad", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7772", "native_tokenizers": [], @@ -32366,9 +37031,11 @@ }, { "name": "Sininkere", + "depth": 9, "iso_1_code": null, "iso_3_code": "skq", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7773", "native_tokenizers": [], @@ -32376,25 +37043,30 @@ }, { "name": "Manding-East", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Marka-Dafin", + "depth": 10, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Marka", + "depth": 11, "iso_1_code": null, "iso_3_code": "rkm", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7776", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7775", "native_tokenizers": [], @@ -32402,28 +37074,24 @@ }, { "name": "Northeastern Manding", + "depth": 10, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bamana", + "depth": 11, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bamanankan", + "depth": 12, "iso_1_code": "bm", "iso_3_code": "bam", "children": [], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Niger-Congo", + "tokenizers": {}, "node_i": "7779", "native_tokenizers": [], "scripts": [ @@ -32432,18 +37100,12 @@ }, { "name": "Jula", + "depth": 12, "iso_1_code": null, "iso_3_code": "dyu", "children": [], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Niger-Congo", + "tokenizers": {}, "node_i": "7780", "native_tokenizers": [], "scripts": [ @@ -32451,43 +37113,32 @@ ] } ], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Niger-Congo", + "tokenizers": {}, "node_i": "7778", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Niger-Congo", + "tokenizers": {}, "node_i": "7777", "native_tokenizers": [], "scripts": [] }, { "name": "Southeastern Manding", + "depth": 10, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Maninkakan, Eastern", + "depth": 11, "iso_1_code": null, "iso_3_code": "emk", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7782", "native_tokenizers": [], @@ -32495,9 +37146,11 @@ }, { "name": "Konyanka", + "depth": 11, "iso_1_code": null, "iso_3_code": "mku", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7783", "native_tokenizers": [], @@ -32505,18 +37158,12 @@ }, { "name": "Maninka, Sankaran", + "depth": 11, "iso_1_code": null, "iso_3_code": "msc", "children": [], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Niger-Congo", + "tokenizers": {}, "node_i": "7784", "native_tokenizers": [], "scripts": [ @@ -32525,9 +37172,11 @@ }, { "name": "Manya", + "depth": 11, "iso_1_code": null, "iso_3_code": "mzj", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7785", "native_tokenizers": [], @@ -32535,14 +37184,17 @@ }, { "name": "Maninka-Mori", + "depth": 11, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Wojenaka", + "depth": 12, "iso_1_code": null, "iso_3_code": "jod", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7787", "native_tokenizers": [], @@ -32550,9 +37202,11 @@ }, { "name": "Worodougou", + "depth": 12, "iso_1_code": null, "iso_3_code": "jud", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7788", "native_tokenizers": [], @@ -32560,9 +37214,11 @@ }, { "name": "Koro", + "depth": 12, "iso_1_code": null, "iso_3_code": "kfo", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7789", "native_tokenizers": [], @@ -32570,9 +37226,11 @@ }, { "name": "Koyaga", + "depth": 12, "iso_1_code": null, "iso_3_code": "kga", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7790", "native_tokenizers": [], @@ -32580,67 +37238,51 @@ }, { "name": "Mahou", + "depth": 12, "iso_1_code": null, "iso_3_code": "mxx", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7791", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7786", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Niger-Congo", + "tokenizers": {}, "node_i": "7781", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Niger-Congo", + "tokenizers": {}, "node_i": "7774", "native_tokenizers": [], "scripts": [] }, { "name": "Manding-West", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Xaasongaxango", + "depth": 10, "iso_1_code": null, "iso_3_code": "kao", "children": [], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Niger-Congo", + "tokenizers": {}, "node_i": "7793", "native_tokenizers": [], "scripts": [ @@ -32649,9 +37291,11 @@ }, { "name": "Maninkakan, Western", + "depth": 10, "iso_1_code": null, "iso_3_code": "mlq", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7794", "native_tokenizers": [], @@ -32659,18 +37303,12 @@ }, { "name": "Mandinka", + "depth": 10, "iso_1_code": null, "iso_3_code": "mnk", "children": [], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Niger-Congo", + "tokenizers": {}, "node_i": "7795", "native_tokenizers": [], "scripts": [ @@ -32679,9 +37317,11 @@ }, { "name": "Maninkakan, Kita", + "depth": 10, "iso_1_code": null, "iso_3_code": "mwk", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7796", "native_tokenizers": [], @@ -32689,52 +37329,43 @@ }, { "name": "Kagoro", + "depth": 10, "iso_1_code": null, "iso_3_code": "xkg", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7797", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Niger-Congo", + "tokenizers": {}, "node_i": "7792", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Niger-Congo", + "tokenizers": {}, "node_i": "7770", "native_tokenizers": [], "scripts": [] }, { "name": "Mokole", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kakabe", + "depth": 9, "iso_1_code": null, "iso_3_code": "kke", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7799", "native_tokenizers": [], @@ -32742,18 +37373,12 @@ }, { "name": "Kuranko", + "depth": 9, "iso_1_code": null, "iso_3_code": "knk", "children": [], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Niger-Congo", + "tokenizers": {}, "node_i": "7800", "native_tokenizers": [], "scripts": [ @@ -32762,9 +37387,11 @@ }, { "name": "Lele", + "depth": 9, "iso_1_code": null, "iso_3_code": "llc", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7801", "native_tokenizers": [], @@ -32772,18 +37399,12 @@ }, { "name": "Mogofin", + "depth": 9, "iso_1_code": null, "iso_3_code": "mfg", "children": [], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Niger-Congo", + "tokenizers": {}, "node_i": "7802", "native_tokenizers": [], "scripts": [ @@ -32791,52 +37412,33 @@ ] } ], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Niger-Congo", + "tokenizers": {}, "node_i": "7798", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Niger-Congo", + "tokenizers": {}, "node_i": "7769", "native_tokenizers": [], "scripts": [] }, { "name": "Vai-Kono", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kono", + "depth": 8, "iso_1_code": null, "iso_3_code": "kno", "children": [], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Niger-Congo", + "tokenizers": {}, "node_i": "7804", "native_tokenizers": [], "scripts": [ @@ -32845,75 +37447,51 @@ }, { "name": "Vai", + "depth": 8, "iso_1_code": null, "iso_3_code": "vai", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7805", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Niger-Congo", + "tokenizers": {}, "node_i": "7803", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Niger-Congo", + "tokenizers": {}, "node_i": "7768", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Niger-Congo", + "tokenizers": {}, "node_i": "7760", "native_tokenizers": [], "scripts": [] }, { "name": "Susu-Yalunka", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Susu", + "depth": 6, "iso_1_code": null, "iso_3_code": "sus", "children": [], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Niger-Congo", + "tokenizers": {}, "node_i": "7807", "native_tokenizers": [], "scripts": [ @@ -32923,18 +37501,12 @@ }, { "name": "Yalunka", + "depth": 6, "iso_1_code": null, "iso_3_code": "yal", "children": [], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Niger-Congo", + "tokenizers": {}, "node_i": "7808", "native_tokenizers": [], "scripts": [ @@ -32942,48 +37514,38 @@ ] } ], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Niger-Congo", + "tokenizers": {}, "node_i": "7806", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Niger-Congo", + "tokenizers": {}, "node_i": "7759", "native_tokenizers": [], "scripts": [] }, { "name": "Southwestern", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kpelle", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kpelle, Guinea", + "depth": 6, "iso_1_code": null, "iso_3_code": "gkp", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7811", "native_tokenizers": [], @@ -32991,9 +37553,11 @@ }, { "name": "Kono", + "depth": 6, "iso_1_code": null, "iso_3_code": "knu", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7812", "native_tokenizers": [], @@ -33001,15 +37565,18 @@ }, { "name": "Kpelle, Liberia", + "depth": 6, "iso_1_code": null, "iso_3_code": "xpe", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7813", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7810", "native_tokenizers": [], @@ -33017,14 +37584,17 @@ }, { "name": "Mende-Loma", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Zialo", + "depth": 6, "iso_1_code": null, "iso_3_code": "zil", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7815", "native_tokenizers": [], @@ -33032,23 +37602,18 @@ }, { "name": "Loma", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Loma", + "depth": 7, "iso_1_code": null, "iso_3_code": "lom", "children": [], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Niger-Congo", + "tokenizers": {}, "node_i": "7817", "native_tokenizers": [], "scripts": [ @@ -33057,18 +37622,12 @@ }, { "name": "Toma", + "depth": 7, "iso_1_code": null, "iso_3_code": "tod", "children": [], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Niger-Congo", + "tokenizers": {}, "node_i": "7818", "native_tokenizers": [], "scripts": [ @@ -33076,40 +37635,38 @@ ] } ], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Niger-Congo", + "tokenizers": {}, "node_i": "7816", "native_tokenizers": [], "scripts": [] }, { "name": "Mende-Bandi", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bandi", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bandi", + "depth": 8, "iso_1_code": null, "iso_3_code": "bza", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7821", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7820", "native_tokenizers": [], @@ -33117,23 +37674,18 @@ }, { "name": "Mende-Loko", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Loko", + "depth": 8, "iso_1_code": null, "iso_3_code": "lok", "children": [], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Niger-Congo", + "tokenizers": {}, "node_i": "7823", "native_tokenizers": [], "scripts": [ @@ -33142,18 +37694,12 @@ }, { "name": "Mende", + "depth": 8, "iso_1_code": null, "iso_3_code": "men", "children": [], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Niger-Congo", + "tokenizers": {}, "node_i": "7824", "native_tokenizers": [], "scripts": [ @@ -33161,85 +37707,53 @@ ] } ], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Niger-Congo", + "tokenizers": {}, "node_i": "7822", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Niger-Congo", + "tokenizers": {}, "node_i": "7819", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Niger-Congo", + "tokenizers": {}, "node_i": "7814", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Niger-Congo", + "tokenizers": {}, "node_i": "7809", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Niger-Congo", + "tokenizers": {}, "node_i": "7758", "native_tokenizers": [], "scripts": [] }, { "name": "Northwestern", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kpeego", + "depth": 4, "iso_1_code": null, "iso_3_code": "cpo", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7826", "native_tokenizers": [], @@ -33247,14 +37761,17 @@ }, { "name": "Samogo", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bankagooma", + "depth": 5, "iso_1_code": null, "iso_3_code": "bxw", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7828", "native_tokenizers": [], @@ -33262,9 +37779,11 @@ }, { "name": "Dz\u00f9\u00f9ngoo", + "depth": 5, "iso_1_code": null, "iso_3_code": "dnn", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7829", "native_tokenizers": [], @@ -33272,9 +37791,11 @@ }, { "name": "Duungooma", + "depth": 5, "iso_1_code": null, "iso_3_code": "dux", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7830", "native_tokenizers": [], @@ -33282,9 +37803,11 @@ }, { "name": "Jowulu", + "depth": 5, "iso_1_code": null, "iso_3_code": "jow", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7831", "native_tokenizers": [], @@ -33292,15 +37815,18 @@ }, { "name": "Seenku", + "depth": 5, "iso_1_code": null, "iso_3_code": "sos", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7832", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7827", "native_tokenizers": [], @@ -33308,28 +37834,24 @@ }, { "name": "Soninke-Bobo", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bobo", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Konab\u00e9r\u00e9", + "depth": 6, "iso_1_code": null, "iso_3_code": "bbo", "children": [], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Niger-Congo", + "tokenizers": {}, "node_i": "7835", "native_tokenizers": [], "scripts": [ @@ -33338,18 +37860,12 @@ }, { "name": "Bobo Madar\u00e9, Southern", + "depth": 6, "iso_1_code": null, "iso_3_code": "bwq", "children": [], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Niger-Congo", + "tokenizers": {}, "node_i": "7836", "native_tokenizers": [], "scripts": [ @@ -33357,39 +37873,37 @@ ] } ], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Niger-Congo", + "tokenizers": {}, "node_i": "7834", "native_tokenizers": [], "scripts": [] }, { "name": "Soninke-Boso", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Boso", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Eastern", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bozo, Tiemac\u00e8w\u00e8", + "depth": 8, "iso_1_code": null, "iso_3_code": "boo", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7840", "native_tokenizers": [], @@ -33397,9 +37911,11 @@ }, { "name": "Bozo, Tieyaxo", + "depth": 8, "iso_1_code": null, "iso_3_code": "boz", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7841", "native_tokenizers": [], @@ -33407,15 +37923,18 @@ }, { "name": "Bozo, Kelengaxo", + "depth": 8, "iso_1_code": null, "iso_3_code": "bzx", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7842", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7839", "native_tokenizers": [], @@ -33423,26 +37942,31 @@ }, { "name": "Jenaama", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bozo, Jenaama", + "depth": 8, "iso_1_code": null, "iso_3_code": "bze", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7844", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7843", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7838", "native_tokenizers": [], @@ -33450,118 +37974,92 @@ }, { "name": "Soninke", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Soninke", + "depth": 7, "iso_1_code": null, "iso_3_code": "snk", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7846", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7845", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7837", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Niger-Congo", + "tokenizers": {}, "node_i": "7833", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Niger-Congo", + "tokenizers": {}, "node_i": "7825", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Niger-Congo", + "tokenizers": {}, "node_i": "7757", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Niger-Congo", + "tokenizers": {}, "node_i": "7719", "native_tokenizers": [], "scripts": [] }, { "name": "Unclassified", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mbre", + "depth": 2, "iso_1_code": null, "iso_3_code": "mka", "children": [], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7848", "native_tokenizers": [], "scripts": [] } ], + "family": "Niger-Congo", "tokenizers": {}, "node_i": "7847", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tn\")", - "original_lang_name": "tswana", - "original_lang_code": "tsn", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Niger-Congo", + "tokenizers": {}, "node_i": "5320", "native_tokenizers": [], "scripts": [] diff --git a/data/Nilo-Saharan.json b/data/Nilo-Saharan.json index a720aab420156837e1db2415f013f2e734529263..52c452ce601ed896e0c5e650e57214097aef7929 100644 --- a/data/Nilo-Saharan.json +++ b/data/Nilo-Saharan.json @@ -1,29 +1,35 @@ { "name": "Nilo-Saharan", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kuliak", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ik", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ik", + "depth": 3, "iso_1_code": null, "iso_3_code": "ikx", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7852", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7851", "native_tokenizers": [], @@ -31,14 +37,17 @@ }, { "name": "Ngangea-So", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nyang\u2019i", + "depth": 3, "iso_1_code": null, "iso_3_code": "nyp", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7854", "native_tokenizers": [], @@ -46,21 +55,25 @@ }, { "name": "Soo", + "depth": 3, "iso_1_code": null, "iso_3_code": "teu", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7855", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7853", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7850", "native_tokenizers": [], @@ -68,19 +81,23 @@ }, { "name": "Saharan", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Eastern", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Berti", + "depth": 3, "iso_1_code": null, "iso_3_code": "byt", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7858", "native_tokenizers": [], @@ -88,15 +105,18 @@ }, { "name": "Zaghawa", + "depth": 3, "iso_1_code": null, "iso_3_code": "zag", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7859", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7857", "native_tokenizers": [], @@ -104,19 +124,23 @@ }, { "name": "Western", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kanuri", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kanuri, Bilma", + "depth": 4, "iso_1_code": null, "iso_3_code": "bms", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7862", "native_tokenizers": [], @@ -124,9 +148,11 @@ }, { "name": "Kanembu", + "depth": 4, "iso_1_code": null, "iso_3_code": "kbl", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7863", "native_tokenizers": [], @@ -134,9 +160,11 @@ }, { "name": "Kanuri, Manga", + "depth": 4, "iso_1_code": "kr", "iso_3_code": "kby", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7864", "native_tokenizers": [], @@ -146,9 +174,11 @@ }, { "name": "Kanuri, Yerwa", + "depth": 4, "iso_1_code": "kr", "iso_3_code": "knc", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7865", "native_tokenizers": [], @@ -159,9 +189,11 @@ }, { "name": "Kanuri, Tumari", + "depth": 4, "iso_1_code": "kr", "iso_3_code": "krt", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7866", "native_tokenizers": [], @@ -169,15 +201,18 @@ }, { "name": "Tarjumo", + "depth": 4, "iso_1_code": null, "iso_3_code": "txj", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7867", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7861", "native_tokenizers": [], @@ -185,14 +220,17 @@ }, { "name": "Tebu", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dazaga", + "depth": 4, "iso_1_code": null, "iso_3_code": "dzg", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7869", "native_tokenizers": [], @@ -200,27 +238,32 @@ }, { "name": "Tedaga", + "depth": 4, "iso_1_code": null, "iso_3_code": "tuq", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7870", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7868", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7860", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7856", "native_tokenizers": [], @@ -228,24 +271,29 @@ }, { "name": "Satellite-Core", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Core", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "B\u2019aga", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Daats\u02bci\u0301in", + "depth": 4, "iso_1_code": null, "iso_3_code": "dtn", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7874", "native_tokenizers": [], @@ -253,9 +301,11 @@ }, { "name": "Gumuz", + "depth": 4, "iso_1_code": null, "iso_3_code": "guk", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7875", "native_tokenizers": [], @@ -264,6 +314,7 @@ ] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7873", "native_tokenizers": [], @@ -271,30 +322,36 @@ }, { "name": "Eastern Sudanic", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Northern (k languages)", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nara", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nara", + "depth": 6, "iso_1_code": null, "iso_3_code": "nrb", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7879", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7878", "native_tokenizers": [], @@ -302,19 +359,23 @@ }, { "name": "Nubian", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Central", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mattokki", + "depth": 7, "iso_1_code": null, "iso_3_code": "xnz", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7882", "native_tokenizers": [], @@ -322,20 +383,24 @@ }, { "name": "Birked", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Birked", + "depth": 8, "iso_1_code": null, "iso_3_code": "brk", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7884", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7883", "native_tokenizers": [], @@ -343,20 +408,24 @@ }, { "name": "Dongolawi", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Andaandi", + "depth": 8, "iso_1_code": null, "iso_3_code": "dgl", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7886", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7885", "native_tokenizers": [], @@ -364,19 +433,23 @@ }, { "name": "Hill", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kadaru-Ghulfan", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ghulfan", + "depth": 9, "iso_1_code": null, "iso_3_code": "ghl", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7889", "native_tokenizers": [], @@ -384,15 +457,18 @@ }, { "name": "Kadaru", + "depth": 9, "iso_1_code": null, "iso_3_code": "kdu", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7890", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7888", "native_tokenizers": [], @@ -400,14 +476,17 @@ }, { "name": "Unclassified", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dilling", + "depth": 9, "iso_1_code": null, "iso_3_code": "dil", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7892", "native_tokenizers": [], @@ -415,9 +494,11 @@ }, { "name": "Dair", + "depth": 9, "iso_1_code": null, "iso_3_code": "drb", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7893", "native_tokenizers": [], @@ -425,9 +506,11 @@ }, { "name": "El Hugeirat", + "depth": 9, "iso_1_code": null, "iso_3_code": "elh", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7894", "native_tokenizers": [], @@ -435,9 +518,11 @@ }, { "name": "Karko", + "depth": 9, "iso_1_code": null, "iso_3_code": "kko", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7895", "native_tokenizers": [], @@ -445,27 +530,32 @@ }, { "name": "Wali", + "depth": 9, "iso_1_code": null, "iso_3_code": "wll", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7896", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7891", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7887", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7881", "native_tokenizers": [], @@ -473,20 +563,24 @@ }, { "name": "Northern", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nobiin", + "depth": 7, "iso_1_code": null, "iso_3_code": "fia", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7898", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7897", "native_tokenizers": [], @@ -494,26 +588,31 @@ }, { "name": "Western", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Midob", + "depth": 7, "iso_1_code": null, "iso_3_code": "mei", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7900", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7899", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7880", "native_tokenizers": [], @@ -521,14 +620,17 @@ }, { "name": "Nyimang", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Afitti", + "depth": 6, "iso_1_code": null, "iso_3_code": "aft", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7902", "native_tokenizers": [], @@ -536,15 +638,18 @@ }, { "name": "Ama", + "depth": 6, "iso_1_code": null, "iso_3_code": "nyi", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7903", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7901", "native_tokenizers": [], @@ -552,25 +657,30 @@ }, { "name": "Tama", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mararit", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mararit", + "depth": 7, "iso_1_code": null, "iso_3_code": "mgb", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7906", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7905", "native_tokenizers": [], @@ -578,14 +688,17 @@ }, { "name": "Tama-Sungor", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Assangori", + "depth": 7, "iso_1_code": null, "iso_3_code": "sjg", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7908", "native_tokenizers": [], @@ -593,27 +706,32 @@ }, { "name": "Tama", + "depth": 7, "iso_1_code": null, "iso_3_code": "tma", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7909", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7907", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7904", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7877", "native_tokenizers": [], @@ -621,24 +739,29 @@ }, { "name": "Southern (n languages)", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Daju", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Eastern Daju", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Logorik", + "depth": 7, "iso_1_code": null, "iso_3_code": "liu", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7913", "native_tokenizers": [], @@ -646,15 +769,18 @@ }, { "name": "Shatt", + "depth": 7, "iso_1_code": null, "iso_3_code": "shj", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7914", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7912", "native_tokenizers": [], @@ -662,14 +788,17 @@ }, { "name": "Western Daju", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Baygo", + "depth": 7, "iso_1_code": null, "iso_3_code": "byg", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7916", "native_tokenizers": [], @@ -677,9 +806,11 @@ }, { "name": "Daju, Dar Fur", + "depth": 7, "iso_1_code": null, "iso_3_code": "daj", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7917", "native_tokenizers": [], @@ -687,9 +818,11 @@ }, { "name": "Daju, Dar Sila", + "depth": 7, "iso_1_code": null, "iso_3_code": "dau", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7918", "native_tokenizers": [], @@ -697,9 +830,11 @@ }, { "name": "Daju, Dar Daju", + "depth": 7, "iso_1_code": null, "iso_3_code": "djc", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7919", "native_tokenizers": [], @@ -707,21 +842,25 @@ }, { "name": "Njalgulgule", + "depth": 7, "iso_1_code": null, "iso_3_code": "njl", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7920", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7915", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7911", "native_tokenizers": [], @@ -729,19 +868,23 @@ }, { "name": "Eastern Jebel", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Aka-Kelo-Molo", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Aka", + "depth": 7, "iso_1_code": null, "iso_3_code": "soh", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7923", "native_tokenizers": [], @@ -749,9 +892,11 @@ }, { "name": "Kelo", + "depth": 7, "iso_1_code": null, "iso_3_code": "xel", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7924", "native_tokenizers": [], @@ -759,15 +904,18 @@ }, { "name": "Molo", + "depth": 7, "iso_1_code": null, "iso_3_code": "zmo", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7925", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7922", "native_tokenizers": [], @@ -775,26 +923,31 @@ }, { "name": "Gaam", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Gaam", + "depth": 7, "iso_1_code": null, "iso_3_code": "tbi", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7927", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7926", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7921", "native_tokenizers": [], @@ -802,24 +955,29 @@ }, { "name": "Nilotic", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Eastern", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bari", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bari", + "depth": 8, "iso_1_code": null, "iso_3_code": "bfa", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7931", "native_tokenizers": [], @@ -827,9 +985,11 @@ }, { "name": "Kakwa", + "depth": 8, "iso_1_code": null, "iso_3_code": "keo", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7932", "native_tokenizers": [], @@ -839,9 +999,11 @@ }, { "name": "Mandari", + "depth": 8, "iso_1_code": null, "iso_3_code": "mqu", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7933", "native_tokenizers": [], @@ -849,15 +1011,18 @@ }, { "name": "Kuku", + "depth": 8, "iso_1_code": null, "iso_3_code": "ukv", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7934", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7930", "native_tokenizers": [], @@ -865,24 +1030,29 @@ }, { "name": "Lotuxo-Teso", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Lotuxo-Maa", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Lotuxo", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dongotono", + "depth": 10, "iso_1_code": null, "iso_3_code": "ddd", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7938", "native_tokenizers": [], @@ -890,9 +1060,11 @@ }, { "name": "Imotong", + "depth": 10, "iso_1_code": null, "iso_3_code": "imt", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7939", "native_tokenizers": [], @@ -900,9 +1072,11 @@ }, { "name": "Lango", + "depth": 10, "iso_1_code": null, "iso_3_code": "lgo", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7940", "native_tokenizers": [], @@ -910,9 +1084,11 @@ }, { "name": "Lokoya", + "depth": 10, "iso_1_code": null, "iso_3_code": "lky", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7941", "native_tokenizers": [], @@ -920,9 +1096,11 @@ }, { "name": "Otuho", + "depth": 10, "iso_1_code": null, "iso_3_code": "lot", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7942", "native_tokenizers": [], @@ -930,9 +1108,11 @@ }, { "name": "Lopit", + "depth": 10, "iso_1_code": null, "iso_3_code": "lpx", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7943", "native_tokenizers": [], @@ -940,9 +1120,11 @@ }, { "name": "Logir", + "depth": 10, "iso_1_code": null, "iso_3_code": "lqr", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7944", "native_tokenizers": [], @@ -950,15 +1132,18 @@ }, { "name": "Okolie", + "depth": 10, "iso_1_code": null, "iso_3_code": "oie", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7945", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7937", "native_tokenizers": [], @@ -966,14 +1151,17 @@ }, { "name": "Ongamo-Maa", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Maasai", + "depth": 10, "iso_1_code": null, "iso_3_code": "mas", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7947", "native_tokenizers": [], @@ -983,9 +1171,11 @@ }, { "name": "Ngasa", + "depth": 10, "iso_1_code": null, "iso_3_code": "nsg", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7948", "native_tokenizers": [], @@ -993,21 +1183,25 @@ }, { "name": "Samburu", + "depth": 10, "iso_1_code": null, "iso_3_code": "saq", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7949", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7946", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7936", "native_tokenizers": [], @@ -1015,19 +1209,23 @@ }, { "name": "Teso-Turkana", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Teso", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ateso", + "depth": 10, "iso_1_code": null, "iso_3_code": "teo", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7952", "native_tokenizers": [], @@ -1036,6 +1234,7 @@ ] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7951", "native_tokenizers": [], @@ -1043,14 +1242,17 @@ }, { "name": "Turkana", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ng\u2019akarimojong", + "depth": 10, "iso_1_code": null, "iso_3_code": "kdj", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7954", "native_tokenizers": [], @@ -1060,9 +1262,11 @@ }, { "name": "Nyangatom", + "depth": 10, "iso_1_code": null, "iso_3_code": "nnj", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7955", "native_tokenizers": [], @@ -1070,9 +1274,11 @@ }, { "name": "Toposa", + "depth": 10, "iso_1_code": null, "iso_3_code": "toq", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7956", "native_tokenizers": [], @@ -1080,9 +1286,11 @@ }, { "name": "Turkana", + "depth": 10, "iso_1_code": null, "iso_3_code": "tuv", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7957", "native_tokenizers": [], @@ -1091,24 +1299,28 @@ ] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7953", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7950", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7935", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7929", "native_tokenizers": [], @@ -1116,24 +1328,29 @@ }, { "name": "Southern", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kalenjin", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Elgon", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kupsapiiny", + "depth": 9, "iso_1_code": null, "iso_3_code": "kpz", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7961", "native_tokenizers": [], @@ -1143,9 +1360,11 @@ }, { "name": "Sabaot", + "depth": 9, "iso_1_code": null, "iso_3_code": "spy", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7962", "native_tokenizers": [], @@ -1154,6 +1373,7 @@ ] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7960", "native_tokenizers": [], @@ -1161,19 +1381,23 @@ }, { "name": "Nandi-Markweta", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kipsigis", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kipsigis", + "depth": 10, "iso_1_code": null, "iso_3_code": "sgc", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7965", "native_tokenizers": [], @@ -1182,6 +1406,7 @@ ] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7964", "native_tokenizers": [], @@ -1189,14 +1414,17 @@ }, { "name": "Markweta", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Markweeta", + "depth": 10, "iso_1_code": null, "iso_3_code": "enb", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7967", "native_tokenizers": [], @@ -1205,6 +1433,7 @@ ] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7966", "native_tokenizers": [], @@ -1212,14 +1441,17 @@ }, { "name": "Nandi", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Keiyo", + "depth": 10, "iso_1_code": null, "iso_3_code": "eyo", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7969", "native_tokenizers": [], @@ -1227,9 +1459,11 @@ }, { "name": "Kisankasa", + "depth": 10, "iso_1_code": null, "iso_3_code": "kqh", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7970", "native_tokenizers": [], @@ -1237,9 +1471,11 @@ }, { "name": "Nandi", + "depth": 10, "iso_1_code": null, "iso_3_code": "niq", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7971", "native_tokenizers": [], @@ -1249,9 +1485,11 @@ }, { "name": "Terik", + "depth": 10, "iso_1_code": null, "iso_3_code": "tec", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7972", "native_tokenizers": [], @@ -1259,21 +1497,25 @@ }, { "name": "Tugen", + "depth": 10, "iso_1_code": null, "iso_3_code": "tuy", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7973", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7968", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7963", "native_tokenizers": [], @@ -1281,20 +1523,24 @@ }, { "name": "Okiek", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Okiek", + "depth": 9, "iso_1_code": null, "iso_3_code": "oki", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7975", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7974", "native_tokenizers": [], @@ -1302,26 +1548,31 @@ }, { "name": "Pokot", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "P\u00f6koot", + "depth": 9, "iso_1_code": null, "iso_3_code": "pko", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7977", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7976", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7959", "native_tokenizers": [], @@ -1329,14 +1580,17 @@ }, { "name": "Tatoga", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Omotik", + "depth": 8, "iso_1_code": null, "iso_3_code": "omt", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7979", "native_tokenizers": [], @@ -1344,9 +1598,11 @@ }, { "name": "Datooga", + "depth": 8, "iso_1_code": null, "iso_3_code": "tcc", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7980", "native_tokenizers": [], @@ -1355,12 +1611,14 @@ ] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7978", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7958", "native_tokenizers": [], @@ -1368,24 +1626,29 @@ }, { "name": "Western", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dinka-Nuer", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dinka", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dinka, South Central", + "depth": 9, "iso_1_code": null, "iso_3_code": "dib", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7984", "native_tokenizers": [], @@ -1393,9 +1656,11 @@ }, { "name": "Dinka, Southwestern", + "depth": 9, "iso_1_code": null, "iso_3_code": "dik", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7985", "native_tokenizers": [], @@ -1405,9 +1670,11 @@ }, { "name": "Dinka, Northeastern", + "depth": 9, "iso_1_code": null, "iso_3_code": "dip", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7986", "native_tokenizers": [], @@ -1417,9 +1684,11 @@ }, { "name": "Dinka, Northwestern", + "depth": 9, "iso_1_code": null, "iso_3_code": "diw", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7987", "native_tokenizers": [], @@ -1427,9 +1696,11 @@ }, { "name": "Dinka, Southeastern", + "depth": 9, "iso_1_code": null, "iso_3_code": "dks", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7988", "native_tokenizers": [], @@ -1438,6 +1709,7 @@ ] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7983", "native_tokenizers": [], @@ -1445,14 +1717,17 @@ }, { "name": "Nuer", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Reel", + "depth": 9, "iso_1_code": null, "iso_3_code": "atu", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7990", "native_tokenizers": [], @@ -1460,9 +1735,11 @@ }, { "name": "Nuer", + "depth": 9, "iso_1_code": null, "iso_3_code": "nus", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7991", "native_tokenizers": [], @@ -1471,12 +1748,14 @@ ] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7989", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7982", "native_tokenizers": [], @@ -1484,30 +1763,36 @@ }, { "name": "Luo", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Northern", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Anuak", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Anuak", + "depth": 10, "iso_1_code": null, "iso_3_code": "anu", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7995", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7994", "native_tokenizers": [], @@ -1515,20 +1800,24 @@ }, { "name": "Bor", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Belanda Bor", + "depth": 10, "iso_1_code": null, "iso_3_code": "bxb", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7997", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7996", "native_tokenizers": [], @@ -1536,14 +1825,17 @@ }, { "name": "Jur", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Luwo", + "depth": 10, "iso_1_code": null, "iso_3_code": "lwo", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7999", "native_tokenizers": [], @@ -1552,6 +1844,7 @@ ] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7998", "native_tokenizers": [], @@ -1559,25 +1852,30 @@ }, { "name": "Mabaan-Burun", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Burun", + "depth": 10, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Burun", + "depth": 11, "iso_1_code": null, "iso_3_code": "bdi", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8002", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8001", "native_tokenizers": [], @@ -1585,14 +1883,17 @@ }, { "name": "Mabaan", + "depth": 10, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Jumjum", + "depth": 11, "iso_1_code": null, "iso_3_code": "jum", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8004", "native_tokenizers": [], @@ -1600,9 +1901,11 @@ }, { "name": "Mabaan", + "depth": 11, "iso_1_code": null, "iso_3_code": "mfz", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8005", "native_tokenizers": [], @@ -1611,12 +1914,14 @@ ] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8003", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8000", "native_tokenizers": [], @@ -1624,14 +1929,17 @@ }, { "name": "Shilluk", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Shilluk", + "depth": 10, "iso_1_code": null, "iso_3_code": "shk", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8007", "native_tokenizers": [], @@ -1640,6 +1948,7 @@ ] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8006", "native_tokenizers": [], @@ -1647,20 +1956,24 @@ }, { "name": "Thuri", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Thuri", + "depth": 10, "iso_1_code": null, "iso_3_code": "thu", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8009", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8008", "native_tokenizers": [], @@ -1668,26 +1981,31 @@ }, { "name": "Unclassified", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "P\u00e4ri", + "depth": 10, "iso_1_code": null, "iso_3_code": "lkr", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8011", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8010", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7993", "native_tokenizers": [], @@ -1695,19 +2013,23 @@ }, { "name": "Southern", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Adhola", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Jopadhola", + "depth": 10, "iso_1_code": null, "iso_3_code": "adh", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8014", "native_tokenizers": [], @@ -1716,6 +2038,7 @@ ] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8013", "native_tokenizers": [], @@ -1723,14 +2046,17 @@ }, { "name": "Kuman", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kumam", + "depth": 10, "iso_1_code": null, "iso_3_code": "kdi", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8016", "native_tokenizers": [], @@ -1739,6 +2065,7 @@ ] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8015", "native_tokenizers": [], @@ -1746,19 +2073,23 @@ }, { "name": "Luo-Acholi", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Alur-Acholi", + "depth": 10, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Thur", + "depth": 11, "iso_1_code": null, "iso_3_code": "lth", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8019", "native_tokenizers": [], @@ -1766,14 +2097,17 @@ }, { "name": "Alur", + "depth": 11, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Alur", + "depth": 12, "iso_1_code": null, "iso_3_code": "alz", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8021", "native_tokenizers": [], @@ -1782,6 +2116,7 @@ ] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8020", "native_tokenizers": [], @@ -1789,14 +2124,17 @@ }, { "name": "Lango-Acholi", + "depth": 11, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Acholi", + "depth": 12, "iso_1_code": null, "iso_3_code": "ach", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8023", "native_tokenizers": [], @@ -1806,9 +2144,11 @@ }, { "name": "Lango", + "depth": 12, "iso_1_code": null, "iso_3_code": "laj", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8024", "native_tokenizers": [], @@ -1817,12 +2157,14 @@ ] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8022", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8018", "native_tokenizers": [], @@ -1830,14 +2172,17 @@ }, { "name": "Luo", + "depth": 10, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dholuo", + "depth": 11, "iso_1_code": null, "iso_3_code": "luo", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8026", "native_tokenizers": [], @@ -1846,36 +2191,42 @@ ] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8025", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8017", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8012", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7992", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7981", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7928", "native_tokenizers": [], @@ -1883,36 +2234,43 @@ }, { "name": "Surmic", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "North", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Majang", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Majang", + "depth": 8, "iso_1_code": null, "iso_3_code": "mpe", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8030", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8029", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8028", "native_tokenizers": [], @@ -1920,30 +2278,36 @@ }, { "name": "South", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Southeast", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kwegu", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kwegu", + "depth": 9, "iso_1_code": null, "iso_3_code": "xwg", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8034", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8033", "native_tokenizers": [], @@ -1951,25 +2315,30 @@ }, { "name": "Pastoral", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Me\u2019en", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Me\u2019en", + "depth": 10, "iso_1_code": null, "iso_3_code": "mym", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8037", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8036", "native_tokenizers": [], @@ -1977,14 +2346,17 @@ }, { "name": "Suri", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mursi", + "depth": 10, "iso_1_code": null, "iso_3_code": "muz", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8039", "native_tokenizers": [], @@ -1992,27 +2364,32 @@ }, { "name": "Suri, Tirmaga-Chai", + "depth": 10, "iso_1_code": null, "iso_3_code": "suq", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8040", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8038", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8035", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8032", "native_tokenizers": [], @@ -2020,24 +2397,29 @@ }, { "name": "Southwest", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Didinga-Murle", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Didinga-Longarim", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Didinga", + "depth": 10, "iso_1_code": null, "iso_3_code": "did", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8044", "native_tokenizers": [], @@ -2047,15 +2429,18 @@ }, { "name": "Laarim", + "depth": 10, "iso_1_code": null, "iso_3_code": "loh", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8045", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8043", "native_tokenizers": [], @@ -2063,14 +2448,17 @@ }, { "name": "Murle", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Murle", + "depth": 10, "iso_1_code": null, "iso_3_code": "mur", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8047", "native_tokenizers": [], @@ -2079,6 +2467,7 @@ ] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8046", "native_tokenizers": [], @@ -2086,26 +2475,31 @@ }, { "name": "Tennet", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tennet", + "depth": 10, "iso_1_code": null, "iso_3_code": "tex", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8049", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8048", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8042", "native_tokenizers": [], @@ -2113,38 +2507,45 @@ }, { "name": "Kacipo-Balesi", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Suri, Kacipo-Bale", + "depth": 9, "iso_1_code": null, "iso_3_code": "koe", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8051", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8050", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8041", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8031", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8027", "native_tokenizers": [], @@ -2152,14 +2553,17 @@ }, { "name": "Temein", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tese", + "depth": 6, "iso_1_code": null, "iso_3_code": "keg", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8053", "native_tokenizers": [], @@ -2167,27 +2571,32 @@ }, { "name": "Temein", + "depth": 6, "iso_1_code": null, "iso_3_code": "teq", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8054", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8052", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7910", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7876", "native_tokenizers": [], @@ -2195,14 +2604,17 @@ }, { "name": "Kadugli-Krongo", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kanga", + "depth": 4, "iso_1_code": null, "iso_3_code": "kcp", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8056", "native_tokenizers": [], @@ -2210,9 +2622,11 @@ }, { "name": "Keiga", + "depth": 4, "iso_1_code": null, "iso_3_code": "kec", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8057", "native_tokenizers": [], @@ -2220,9 +2634,11 @@ }, { "name": "Krongo", + "depth": 4, "iso_1_code": null, "iso_3_code": "kgo", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8058", "native_tokenizers": [], @@ -2230,9 +2646,11 @@ }, { "name": "Tumtum", + "depth": 4, "iso_1_code": null, "iso_3_code": "tbr", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8059", "native_tokenizers": [], @@ -2240,9 +2658,11 @@ }, { "name": "Tulishi", + "depth": 4, "iso_1_code": null, "iso_3_code": "tey", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8060", "native_tokenizers": [], @@ -2250,15 +2670,18 @@ }, { "name": "Katcha-Kadugli-Miri", + "depth": 4, "iso_1_code": null, "iso_3_code": "xtc", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8061", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8055", "native_tokenizers": [], @@ -2266,14 +2689,17 @@ }, { "name": "Koman", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Gule", + "depth": 4, "iso_1_code": null, "iso_3_code": "gly", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8063", "native_tokenizers": [], @@ -2281,9 +2707,11 @@ }, { "name": "Gwama", + "depth": 4, "iso_1_code": null, "iso_3_code": "kmq", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8064", "native_tokenizers": [], @@ -2291,9 +2719,11 @@ }, { "name": "Opo", + "depth": 4, "iso_1_code": null, "iso_3_code": "lgn", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8065", "native_tokenizers": [], @@ -2301,9 +2731,11 @@ }, { "name": "Uduk", + "depth": 4, "iso_1_code": null, "iso_3_code": "udu", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8066", "native_tokenizers": [], @@ -2313,21 +2745,25 @@ }, { "name": "Komo", + "depth": 4, "iso_1_code": null, "iso_3_code": "xom", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8067", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8062", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7872", "native_tokenizers": [], @@ -2335,14 +2771,17 @@ }, { "name": "Satellites", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Berta", + "depth": 3, "iso_1_code": null, "iso_3_code": "wti", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8069", "native_tokenizers": [], @@ -2350,24 +2789,29 @@ }, { "name": "Central Sudanic", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "East", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Lendu", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ndrulo", + "depth": 6, "iso_1_code": null, "iso_3_code": "dno", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8073", "native_tokenizers": [], @@ -2375,9 +2819,11 @@ }, { "name": "Lendu", + "depth": 6, "iso_1_code": null, "iso_3_code": "led", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8074", "native_tokenizers": [], @@ -2387,9 +2833,11 @@ }, { "name": "Ngiti", + "depth": 6, "iso_1_code": null, "iso_3_code": "niy", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8075", "native_tokenizers": [], @@ -2398,6 +2846,7 @@ ] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8072", "native_tokenizers": [], @@ -2405,14 +2854,17 @@ }, { "name": "Mangbetu", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Asoa", + "depth": 6, "iso_1_code": null, "iso_3_code": "asv", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8077", "native_tokenizers": [], @@ -2420,9 +2872,11 @@ }, { "name": "Lombi", + "depth": 6, "iso_1_code": null, "iso_3_code": "lmi", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8078", "native_tokenizers": [], @@ -2430,15 +2884,18 @@ }, { "name": "Mangbetu", + "depth": 6, "iso_1_code": null, "iso_3_code": "mdj", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8079", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8076", "native_tokenizers": [], @@ -2446,14 +2903,17 @@ }, { "name": "Mangbutu-Efe", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bendi", + "depth": 6, "iso_1_code": null, "iso_3_code": "bct", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8081", "native_tokenizers": [], @@ -2461,9 +2921,11 @@ }, { "name": "Efe", + "depth": 6, "iso_1_code": null, "iso_3_code": "efe", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8082", "native_tokenizers": [], @@ -2471,9 +2933,11 @@ }, { "name": "Lese", + "depth": 6, "iso_1_code": null, "iso_3_code": "les", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8083", "native_tokenizers": [], @@ -2481,9 +2945,11 @@ }, { "name": "Mamvu", + "depth": 6, "iso_1_code": null, "iso_3_code": "mdi", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8084", "native_tokenizers": [], @@ -2491,9 +2957,11 @@ }, { "name": "Mangbutu", + "depth": 6, "iso_1_code": null, "iso_3_code": "mdk", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8085", "native_tokenizers": [], @@ -2501,9 +2969,11 @@ }, { "name": "Mvuba", + "depth": 6, "iso_1_code": null, "iso_3_code": "mxh", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8086", "native_tokenizers": [], @@ -2511,9 +2981,11 @@ }, { "name": "Kebu", + "depth": 6, "iso_1_code": null, "iso_3_code": "ndp", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8087", "native_tokenizers": [], @@ -2522,6 +2994,7 @@ ] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8080", "native_tokenizers": [], @@ -2529,19 +3002,23 @@ }, { "name": "Moru-Madi", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Central", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Avokaya", + "depth": 7, "iso_1_code": null, "iso_3_code": "avu", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8090", "native_tokenizers": [], @@ -2551,9 +3028,11 @@ }, { "name": "Keliko", + "depth": 7, "iso_1_code": null, "iso_3_code": "kbo", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8091", "native_tokenizers": [], @@ -2563,9 +3042,11 @@ }, { "name": "Lugbara", + "depth": 7, "iso_1_code": null, "iso_3_code": "lgg", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8092", "native_tokenizers": [], @@ -2575,9 +3056,11 @@ }, { "name": "Logo", + "depth": 7, "iso_1_code": null, "iso_3_code": "log", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8093", "native_tokenizers": [], @@ -2587,9 +3070,11 @@ }, { "name": "Aringa", + "depth": 7, "iso_1_code": null, "iso_3_code": "luc", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8094", "native_tokenizers": [], @@ -2599,15 +3084,18 @@ }, { "name": "Omi", + "depth": 7, "iso_1_code": null, "iso_3_code": "omi", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8095", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8089", "native_tokenizers": [], @@ -2615,20 +3103,24 @@ }, { "name": "Northern", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Moru", + "depth": 7, "iso_1_code": null, "iso_3_code": "mgd", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8097", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8096", "native_tokenizers": [], @@ -2636,14 +3128,17 @@ }, { "name": "Southern", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Olu\u2019bo", + "depth": 7, "iso_1_code": null, "iso_3_code": "lul", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8099", "native_tokenizers": [], @@ -2651,9 +3146,11 @@ }, { "name": "Ma\u2019di", + "depth": 7, "iso_1_code": null, "iso_3_code": "mhi", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8100", "native_tokenizers": [], @@ -2663,27 +3160,32 @@ }, { "name": "Ma\u2019di, Southern", + "depth": 7, "iso_1_code": null, "iso_3_code": "snm", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8101", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8098", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8088", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8071", "native_tokenizers": [], @@ -2691,24 +3193,29 @@ }, { "name": "West", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bongo-Bagirmi", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bongo-Baka", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Beli", + "depth": 7, "iso_1_code": null, "iso_3_code": "blm", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8105", "native_tokenizers": [], @@ -2716,14 +3223,17 @@ }, { "name": "Baka", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Baka", + "depth": 8, "iso_1_code": null, "iso_3_code": "bdh", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8107", "native_tokenizers": [], @@ -2732,6 +3242,7 @@ ] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8106", "native_tokenizers": [], @@ -2739,20 +3250,24 @@ }, { "name": "Bongo", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bongo", + "depth": 8, "iso_1_code": null, "iso_3_code": "bot", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8109", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8108", "native_tokenizers": [], @@ -2760,14 +3275,17 @@ }, { "name": "M\u00f6d\u00f6-Nyamusa", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Jur Modo", + "depth": 8, "iso_1_code": null, "iso_3_code": "bex", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8111", "native_tokenizers": [], @@ -2777,15 +3295,18 @@ }, { "name": "Nyamusa-Molo", + "depth": 8, "iso_1_code": null, "iso_3_code": "nwm", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8112", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8110", "native_tokenizers": [], @@ -2793,14 +3314,17 @@ }, { "name": "Morokodo-Mo\u2019da", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mo\u2019da", + "depth": 8, "iso_1_code": null, "iso_3_code": "gbn", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8114", "native_tokenizers": [], @@ -2808,9 +3332,11 @@ }, { "name": "Morokodo", + "depth": 8, "iso_1_code": null, "iso_3_code": "mgc", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8115", "native_tokenizers": [], @@ -2819,6 +3345,7 @@ ] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8113", "native_tokenizers": [], @@ -2826,26 +3353,31 @@ }, { "name": "Unclassified", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mittu", + "depth": 8, "iso_1_code": null, "iso_3_code": "mwu", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8117", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8116", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8104", "native_tokenizers": [], @@ -2853,14 +3385,17 @@ }, { "name": "Kara", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Fulu", + "depth": 7, "iso_1_code": null, "iso_3_code": "fuu", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8119", "native_tokenizers": [], @@ -2868,9 +3403,11 @@ }, { "name": "Gula", + "depth": 7, "iso_1_code": null, "iso_3_code": "kcm", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8120", "native_tokenizers": [], @@ -2878,15 +3415,18 @@ }, { "name": "Yulu", + "depth": 7, "iso_1_code": null, "iso_3_code": "yul", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8121", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8118", "native_tokenizers": [], @@ -2894,14 +3434,17 @@ }, { "name": "Sara-Bagirmi", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Birri", + "depth": 7, "iso_1_code": null, "iso_3_code": "bvq", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8123", "native_tokenizers": [], @@ -2909,9 +3452,11 @@ }, { "name": "Fongoro", + "depth": 7, "iso_1_code": null, "iso_3_code": "fgr", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8124", "native_tokenizers": [], @@ -2919,14 +3464,17 @@ }, { "name": "Bagirmi", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Morom", + "depth": 8, "iso_1_code": null, "iso_3_code": "bdo", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8126", "native_tokenizers": [], @@ -2934,9 +3482,11 @@ }, { "name": "Bagirmi", + "depth": 8, "iso_1_code": null, "iso_3_code": "bmi", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8127", "native_tokenizers": [], @@ -2944,9 +3494,11 @@ }, { "name": "Berakou", + "depth": 8, "iso_1_code": null, "iso_3_code": "bxv", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8128", "native_tokenizers": [], @@ -2954,9 +3506,11 @@ }, { "name": "Disa", + "depth": 8, "iso_1_code": null, "iso_3_code": "dsi", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8129", "native_tokenizers": [], @@ -2964,9 +3518,11 @@ }, { "name": "Gula", + "depth": 8, "iso_1_code": null, "iso_3_code": "glu", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8130", "native_tokenizers": [], @@ -2974,9 +3530,11 @@ }, { "name": "Jaya", + "depth": 8, "iso_1_code": null, "iso_3_code": "jyy", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8131", "native_tokenizers": [], @@ -2984,9 +3542,11 @@ }, { "name": "Kenga", + "depth": 8, "iso_1_code": null, "iso_3_code": "kyq", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8132", "native_tokenizers": [], @@ -2996,15 +3556,18 @@ }, { "name": "Naba", + "depth": 8, "iso_1_code": null, "iso_3_code": "mne", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8133", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8125", "native_tokenizers": [], @@ -3012,19 +3575,23 @@ }, { "name": "Sara", + "depth": 7, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Sara Proper", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bedjond", + "depth": 9, "iso_1_code": null, "iso_3_code": "bjv", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8136", "native_tokenizers": [], @@ -3034,9 +3601,11 @@ }, { "name": "Dagba", + "depth": 9, "iso_1_code": null, "iso_3_code": "dgk", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8137", "native_tokenizers": [], @@ -3044,9 +3613,11 @@ }, { "name": "Gor", + "depth": 9, "iso_1_code": null, "iso_3_code": "gqr", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8138", "native_tokenizers": [], @@ -3056,9 +3627,11 @@ }, { "name": "Gulay", + "depth": 9, "iso_1_code": null, "iso_3_code": "gvl", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8139", "native_tokenizers": [], @@ -3068,9 +3641,11 @@ }, { "name": "Horo", + "depth": 9, "iso_1_code": null, "iso_3_code": "hor", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8140", "native_tokenizers": [], @@ -3078,9 +3653,11 @@ }, { "name": "Kabba", + "depth": 9, "iso_1_code": null, "iso_3_code": "ksp", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8141", "native_tokenizers": [], @@ -3090,9 +3667,11 @@ }, { "name": "Laka", + "depth": 9, "iso_1_code": null, "iso_3_code": "lap", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8142", "native_tokenizers": [], @@ -3102,9 +3681,11 @@ }, { "name": "Mango", + "depth": 9, "iso_1_code": null, "iso_3_code": "mge", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8143", "native_tokenizers": [], @@ -3112,9 +3693,11 @@ }, { "name": "Sar", + "depth": 9, "iso_1_code": null, "iso_3_code": "mwm", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8144", "native_tokenizers": [], @@ -3124,9 +3707,11 @@ }, { "name": "Mbay", + "depth": 9, "iso_1_code": null, "iso_3_code": "myb", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8145", "native_tokenizers": [], @@ -3136,9 +3721,11 @@ }, { "name": "Ngam", + "depth": 9, "iso_1_code": null, "iso_3_code": "nmc", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8146", "native_tokenizers": [], @@ -3146,9 +3733,11 @@ }, { "name": "Ngambay", + "depth": 9, "iso_1_code": null, "iso_3_code": "sba", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8147", "native_tokenizers": [], @@ -3158,14 +3747,17 @@ }, { "name": "Sara Kaba", + "depth": 9, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kaba D\u00e9m\u00e9, Sara", + "depth": 10, "iso_1_code": null, "iso_3_code": "kwg", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8149", "native_tokenizers": [], @@ -3173,9 +3765,11 @@ }, { "name": "Kaba Naa, Sara", + "depth": 10, "iso_1_code": null, "iso_3_code": "kwv", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8150", "native_tokenizers": [], @@ -3183,9 +3777,11 @@ }, { "name": "Kulfa", + "depth": 10, "iso_1_code": null, "iso_3_code": "kxj", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8151", "native_tokenizers": [], @@ -3193,21 +3789,25 @@ }, { "name": "Sara Kaba", + "depth": 10, "iso_1_code": null, "iso_3_code": "sbz", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8152", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8148", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8135", "native_tokenizers": [], @@ -3215,14 +3815,17 @@ }, { "name": "Vale", + "depth": 8, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Luto", + "depth": 9, "iso_1_code": null, "iso_3_code": "ndy", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8154", "native_tokenizers": [], @@ -3232,27 +3835,32 @@ }, { "name": "Vale", + "depth": 9, "iso_1_code": null, "iso_3_code": "vae", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8155", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8153", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8134", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8122", "native_tokenizers": [], @@ -3260,26 +3868,31 @@ }, { "name": "Sinyar", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Sinyar", + "depth": 7, "iso_1_code": null, "iso_3_code": "sys", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8157", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8156", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8103", "native_tokenizers": [], @@ -3287,14 +3900,17 @@ }, { "name": "Kresh", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Aja", + "depth": 6, "iso_1_code": null, "iso_3_code": "aja", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8159", "native_tokenizers": [], @@ -3302,27 +3918,32 @@ }, { "name": "Gbaya", + "depth": 6, "iso_1_code": null, "iso_3_code": "krs", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8160", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8158", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8102", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8070", "native_tokenizers": [], @@ -3330,14 +3951,17 @@ }, { "name": "Fur", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Amdang", + "depth": 4, "iso_1_code": null, "iso_3_code": "amj", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8162", "native_tokenizers": [], @@ -3345,15 +3969,18 @@ }, { "name": "Fur", + "depth": 4, "iso_1_code": null, "iso_3_code": "fvr", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8163", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8161", "native_tokenizers": [], @@ -3361,20 +3988,24 @@ }, { "name": "Kunama", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kunama", + "depth": 4, "iso_1_code": null, "iso_3_code": "kun", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8165", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8164", "native_tokenizers": [], @@ -3382,14 +4013,17 @@ }, { "name": "Maban", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Karanga", + "depth": 4, "iso_1_code": null, "iso_3_code": "kth", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8167", "native_tokenizers": [], @@ -3397,20 +4031,24 @@ }, { "name": "Kendeje", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kendeje", + "depth": 5, "iso_1_code": null, "iso_3_code": "klf", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8169", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8168", "native_tokenizers": [], @@ -3418,14 +4056,17 @@ }, { "name": "Maba", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Maba", + "depth": 5, "iso_1_code": null, "iso_3_code": "mde", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8171", "native_tokenizers": [], @@ -3433,15 +4074,18 @@ }, { "name": "Marfa", + "depth": 5, "iso_1_code": null, "iso_3_code": "mvu", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8172", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8170", "native_tokenizers": [], @@ -3449,14 +4093,17 @@ }, { "name": "Masalit", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Massalat", + "depth": 5, "iso_1_code": null, "iso_3_code": "mdg", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8174", "native_tokenizers": [], @@ -3464,15 +4111,18 @@ }, { "name": "Masalit", + "depth": 5, "iso_1_code": null, "iso_3_code": "mls", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8175", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8173", "native_tokenizers": [], @@ -3480,14 +4130,17 @@ }, { "name": "Runga-Kibet", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kibet", + "depth": 5, "iso_1_code": null, "iso_3_code": "kie", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8177", "native_tokenizers": [], @@ -3495,15 +4148,18 @@ }, { "name": "Runga", + "depth": 5, "iso_1_code": null, "iso_3_code": "rou", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8178", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8176", "native_tokenizers": [], @@ -3511,38 +4167,45 @@ }, { "name": "Surbakhal", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Surbakhal", + "depth": 5, "iso_1_code": null, "iso_3_code": "sbj", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8180", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8179", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8166", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8068", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7871", "native_tokenizers": [], @@ -3550,14 +4213,17 @@ }, { "name": "Songhai", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Korandje", + "depth": 2, "iso_1_code": null, "iso_3_code": "kcy", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8182", "native_tokenizers": [], @@ -3565,14 +4231,17 @@ }, { "name": "Northern", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tadaksahak", + "depth": 3, "iso_1_code": null, "iso_3_code": "dsq", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8184", "native_tokenizers": [], @@ -3580,15 +4249,18 @@ }, { "name": "Tasawaq", + "depth": 3, "iso_1_code": null, "iso_3_code": "twq", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8185", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8183", "native_tokenizers": [], @@ -3596,14 +4268,17 @@ }, { "name": "Southern", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dendi", + "depth": 3, "iso_1_code": null, "iso_3_code": "ddn", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8187", "native_tokenizers": [], @@ -3613,9 +4288,11 @@ }, { "name": "Zarma", + "depth": 3, "iso_1_code": null, "iso_3_code": "dje", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8188", "native_tokenizers": [], @@ -3625,9 +4302,11 @@ }, { "name": "Songhay, Humburi Senni", + "depth": 3, "iso_1_code": null, "iso_3_code": "hmb", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8189", "native_tokenizers": [], @@ -3635,9 +4314,11 @@ }, { "name": "Songhay, Koyra Chiini", + "depth": 3, "iso_1_code": null, "iso_3_code": "khq", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8190", "native_tokenizers": [], @@ -3647,9 +4328,11 @@ }, { "name": "Songhay, Koyraboro Senni", + "depth": 3, "iso_1_code": null, "iso_3_code": "ses", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8191", "native_tokenizers": [], @@ -3659,27 +4342,32 @@ }, { "name": "Tondi Songway Kiini", + "depth": 3, "iso_1_code": null, "iso_3_code": "tst", "children": [], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8192", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8186", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "8181", "native_tokenizers": [], "scripts": [] } ], + "family": "Nilo-Saharan", "tokenizers": {}, "node_i": "7849", "native_tokenizers": [], diff --git a/data/Nimboran.json b/data/Nimboran.json index 17c08487da5b85ffe06ad98f2ae37acaafadf523..9fcf22008c247e4bacbda33f5ed8f0196bb0c2a7 100644 --- a/data/Nimboran.json +++ b/data/Nimboran.json @@ -1,13 +1,16 @@ { "name": "Nimboran", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Gresi", + "depth": 1, "iso_1_code": null, "iso_3_code": "grs", "children": [], + "family": "Nimboran", "tokenizers": {}, "node_i": "8194", "native_tokenizers": [], @@ -15,9 +18,11 @@ }, { "name": "Mlap", + "depth": 1, "iso_1_code": null, "iso_3_code": "kja", "children": [], + "family": "Nimboran", "tokenizers": {}, "node_i": "8195", "native_tokenizers": [], @@ -25,9 +30,11 @@ }, { "name": "Kemtuik", + "depth": 1, "iso_1_code": null, "iso_3_code": "kmt", "children": [], + "family": "Nimboran", "tokenizers": {}, "node_i": "8196", "native_tokenizers": [], @@ -35,9 +42,11 @@ }, { "name": "Mekwei", + "depth": 1, "iso_1_code": null, "iso_3_code": "msf", "children": [], + "family": "Nimboran", "tokenizers": {}, "node_i": "8197", "native_tokenizers": [], @@ -45,15 +54,18 @@ }, { "name": "Nimboran", + "depth": 1, "iso_1_code": null, "iso_3_code": "nir", "children": [], + "family": "Nimboran", "tokenizers": {}, "node_i": "8198", "native_tokenizers": [], "scripts": [] } ], + "family": "Nimboran", "tokenizers": {}, "node_i": "8193", "native_tokenizers": [], diff --git a/data/North Bougainville.json b/data/North Bougainville.json index ba29be4c4f3e118b178bb19b29724ec2b8f3f93d..dd2ad73cc148478b4db1e24d84bf3a752b7c600b 100644 --- a/data/North Bougainville.json +++ b/data/North Bougainville.json @@ -1,24 +1,29 @@ { "name": "North Bougainville", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Keriaka", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ramopa", + "depth": 2, "iso_1_code": null, "iso_3_code": "kjx", "children": [], + "family": "North Bougainville", "tokenizers": {}, "node_i": "8201", "native_tokenizers": [], "scripts": [] } ], + "family": "North Bougainville", "tokenizers": {}, "node_i": "8200", "native_tokenizers": [], @@ -26,20 +31,24 @@ }, { "name": "Konua", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Rapoisi", + "depth": 2, "iso_1_code": null, "iso_3_code": "kyx", "children": [], + "family": "North Bougainville", "tokenizers": {}, "node_i": "8203", "native_tokenizers": [], "scripts": [] } ], + "family": "North Bougainville", "tokenizers": {}, "node_i": "8202", "native_tokenizers": [], @@ -47,14 +56,17 @@ }, { "name": "Rotokas", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Askopan", + "depth": 2, "iso_1_code": null, "iso_3_code": "eiv", "children": [], + "family": "North Bougainville", "tokenizers": {}, "node_i": "8205", "native_tokenizers": [], @@ -62,9 +74,11 @@ }, { "name": "Rotokas", + "depth": 2, "iso_1_code": null, "iso_3_code": "roo", "children": [], + "family": "North Bougainville", "tokenizers": {}, "node_i": "8206", "native_tokenizers": [], @@ -73,12 +87,14 @@ ] } ], + "family": "North Bougainville", "tokenizers": {}, "node_i": "8204", "native_tokenizers": [], "scripts": [] } ], + "family": "North Bougainville", "tokenizers": {}, "node_i": "8199", "native_tokenizers": [], diff --git a/data/Otomanguean.json b/data/Otomanguean.json index 86cd24b64e5290bfe2b78b18ff67b37e980bd96b..73dd4b03f7f7e1d65a309aec0416b577a1aa4fc2 100644 --- a/data/Otomanguean.json +++ b/data/Otomanguean.json @@ -1,28 +1,34 @@ { "name": "Otomanguean", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Eastern Otomanguean", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Amuzgo-Mixtecan", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Amuzgo", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Amuzgo, Guerrero", + "depth": 4, "iso_1_code": null, "iso_3_code": "amu", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8211", "native_tokenizers": [], @@ -32,9 +38,11 @@ }, { "name": "Amuzgo, San Pedro Amuzgos", + "depth": 4, "iso_1_code": null, "iso_3_code": "azg", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8212", "native_tokenizers": [], @@ -44,15 +52,18 @@ }, { "name": "Amuzgo, Ipalapa", + "depth": 4, "iso_1_code": null, "iso_3_code": "azm", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8213", "native_tokenizers": [], "scripts": [] } ], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8210", "native_tokenizers": [], @@ -60,19 +71,23 @@ }, { "name": "Mixtecan", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Cuicatec", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Cuicatec, Teutila", + "depth": 5, "iso_1_code": null, "iso_3_code": "cut", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8216", "native_tokenizers": [], @@ -82,9 +97,11 @@ }, { "name": "Cuicatec, Tepeuxila", + "depth": 5, "iso_1_code": null, "iso_3_code": "cux", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8217", "native_tokenizers": [], @@ -93,6 +110,7 @@ ] } ], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8215", "native_tokenizers": [], @@ -100,14 +118,17 @@ }, { "name": "Mixtec", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mixtec, Western Juxtlahuaca", + "depth": 5, "iso_1_code": null, "iso_3_code": "jmx", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8219", "native_tokenizers": [], @@ -115,9 +136,11 @@ }, { "name": "Mixtec, Yutanduchi", + "depth": 5, "iso_1_code": null, "iso_3_code": "mab", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8220", "native_tokenizers": [], @@ -125,9 +148,11 @@ }, { "name": "Mixtec, Amoltepec", + "depth": 5, "iso_1_code": null, "iso_3_code": "mbz", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8221", "native_tokenizers": [], @@ -135,9 +160,11 @@ }, { "name": "Mixtec, Itundujia", + "depth": 5, "iso_1_code": null, "iso_3_code": "mce", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8222", "native_tokenizers": [], @@ -145,9 +172,11 @@ }, { "name": "Mixtec, Santa Luc\u00eda Monteverde", + "depth": 5, "iso_1_code": null, "iso_3_code": "mdv", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8223", "native_tokenizers": [], @@ -155,9 +184,11 @@ }, { "name": "Mixtec, Southwestern Tlaxiaco", + "depth": 5, "iso_1_code": null, "iso_3_code": "meh", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8224", "native_tokenizers": [], @@ -165,9 +196,11 @@ }, { "name": "Mixtec, Atatlahuca", + "depth": 5, "iso_1_code": null, "iso_3_code": "mib", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8225", "native_tokenizers": [], @@ -177,9 +210,11 @@ }, { "name": "Mixtec, Ocotepec", + "depth": 5, "iso_1_code": null, "iso_3_code": "mie", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8226", "native_tokenizers": [], @@ -189,9 +224,11 @@ }, { "name": "Mixtec, San Miguel el Grande", + "depth": 5, "iso_1_code": null, "iso_3_code": "mig", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8227", "native_tokenizers": [], @@ -201,9 +238,11 @@ }, { "name": "Mixtec, Chayuco", + "depth": 5, "iso_1_code": null, "iso_3_code": "mih", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8228", "native_tokenizers": [], @@ -213,9 +252,11 @@ }, { "name": "Mixtec, Chigmecatitl\u00e1n", + "depth": 5, "iso_1_code": null, "iso_3_code": "mii", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8229", "native_tokenizers": [], @@ -223,9 +264,11 @@ }, { "name": "Mixtec, Pe\u00f1oles", + "depth": 5, "iso_1_code": null, "iso_3_code": "mil", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8230", "native_tokenizers": [], @@ -235,9 +278,11 @@ }, { "name": "Mixtec, Alacatlatzala", + "depth": 5, "iso_1_code": null, "iso_3_code": "mim", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8231", "native_tokenizers": [], @@ -247,9 +292,11 @@ }, { "name": "Mixtec, Pinotepa Nacional", + "depth": 5, "iso_1_code": null, "iso_3_code": "mio", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8232", "native_tokenizers": [], @@ -259,9 +306,11 @@ }, { "name": "Mixtec, Apasco-Apoala", + "depth": 5, "iso_1_code": null, "iso_3_code": "mip", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8233", "native_tokenizers": [], @@ -271,9 +320,11 @@ }, { "name": "Mixtec, Southern Puebla", + "depth": 5, "iso_1_code": null, "iso_3_code": "mit", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8234", "native_tokenizers": [], @@ -283,9 +334,11 @@ }, { "name": "Mixtec, Cacaloxtepec", + "depth": 5, "iso_1_code": null, "iso_3_code": "miu", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8235", "native_tokenizers": [], @@ -293,9 +346,11 @@ }, { "name": "Mixtec, Mixtepec", + "depth": 5, "iso_1_code": null, "iso_3_code": "mix", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8236", "native_tokenizers": [], @@ -303,9 +358,11 @@ }, { "name": "Mixtec, Ayutla", + "depth": 5, "iso_1_code": null, "iso_3_code": "miy", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8237", "native_tokenizers": [], @@ -315,9 +372,11 @@ }, { "name": "Mixtec, Coatzospan", + "depth": 5, "iso_1_code": null, "iso_3_code": "miz", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8238", "native_tokenizers": [], @@ -327,9 +386,11 @@ }, { "name": "Mixtec, San Juan Colorado", + "depth": 5, "iso_1_code": null, "iso_3_code": "mjc", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8239", "native_tokenizers": [], @@ -339,9 +400,11 @@ }, { "name": "Mixtec, Silacayoapan", + "depth": 5, "iso_1_code": null, "iso_3_code": "mks", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8240", "native_tokenizers": [], @@ -351,9 +414,11 @@ }, { "name": "Mixtec, Yosond\u00faa", + "depth": 5, "iso_1_code": null, "iso_3_code": "mpm", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8241", "native_tokenizers": [], @@ -363,9 +428,11 @@ }, { "name": "Mixtec, Tlazoyaltepec", + "depth": 5, "iso_1_code": null, "iso_3_code": "mqh", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8242", "native_tokenizers": [], @@ -373,9 +440,11 @@ }, { "name": "Mixtec, Tututepec", + "depth": 5, "iso_1_code": null, "iso_3_code": "mtu", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8243", "native_tokenizers": [], @@ -383,9 +452,11 @@ }, { "name": "Mixtec, Tida\u00e1", + "depth": 5, "iso_1_code": null, "iso_3_code": "mtx", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8244", "native_tokenizers": [], @@ -393,9 +464,11 @@ }, { "name": "Mixtec, Yucua\u00f1e", + "depth": 5, "iso_1_code": null, "iso_3_code": "mvg", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8245", "native_tokenizers": [], @@ -403,9 +476,11 @@ }, { "name": "Mixtec, Northwest Oaxaca", + "depth": 5, "iso_1_code": null, "iso_3_code": "mxa", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8246", "native_tokenizers": [], @@ -413,9 +488,11 @@ }, { "name": "Mixtec, Tezoatl\u00e1n", + "depth": 5, "iso_1_code": null, "iso_3_code": "mxb", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8247", "native_tokenizers": [], @@ -425,9 +502,11 @@ }, { "name": "Mixtec, Huitepec", + "depth": 5, "iso_1_code": null, "iso_3_code": "mxs", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8248", "native_tokenizers": [], @@ -435,9 +514,11 @@ }, { "name": "Mixtec, Jamiltepec", + "depth": 5, "iso_1_code": null, "iso_3_code": "mxt", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8249", "native_tokenizers": [], @@ -447,9 +528,11 @@ }, { "name": "Mixtec, Metlat\u00f3noc", + "depth": 5, "iso_1_code": null, "iso_3_code": "mxv", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8250", "native_tokenizers": [], @@ -459,9 +542,11 @@ }, { "name": "Mixtec, Southeastern Nochixtl\u00e1n", + "depth": 5, "iso_1_code": null, "iso_3_code": "mxy", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8251", "native_tokenizers": [], @@ -469,9 +554,11 @@ }, { "name": "Mixtec, Santa Mar\u00eda Zacatepec", + "depth": 5, "iso_1_code": null, "iso_3_code": "mza", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8252", "native_tokenizers": [], @@ -481,9 +568,11 @@ }, { "name": "Mixtec, Juxtlahuaca", + "depth": 5, "iso_1_code": null, "iso_3_code": "vmc", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8253", "native_tokenizers": [], @@ -491,9 +580,11 @@ }, { "name": "Mixtec, Ixtayutla", + "depth": 5, "iso_1_code": null, "iso_3_code": "vmj", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8254", "native_tokenizers": [], @@ -501,9 +592,11 @@ }, { "name": "Mixtec, Mitlatongo", + "depth": 5, "iso_1_code": null, "iso_3_code": "vmm", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8255", "native_tokenizers": [], @@ -511,9 +604,11 @@ }, { "name": "Mixtec, Soyaltepec", + "depth": 5, "iso_1_code": null, "iso_3_code": "vmq", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8256", "native_tokenizers": [], @@ -521,9 +616,11 @@ }, { "name": "Mixtec, Tamazola", + "depth": 5, "iso_1_code": null, "iso_3_code": "vmx", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8257", "native_tokenizers": [], @@ -531,9 +628,11 @@ }, { "name": "Mixtec, Alcozauca", + "depth": 5, "iso_1_code": null, "iso_3_code": "xta", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8258", "native_tokenizers": [], @@ -541,9 +640,11 @@ }, { "name": "Mixtec, Chazumba", + "depth": 5, "iso_1_code": null, "iso_3_code": "xtb", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8259", "native_tokenizers": [], @@ -551,9 +652,11 @@ }, { "name": "Mixtec, Diuxi-Tilantongo", + "depth": 5, "iso_1_code": null, "iso_3_code": "xtd", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8260", "native_tokenizers": [], @@ -563,9 +666,11 @@ }, { "name": "Mixtec, Sinicahua", + "depth": 5, "iso_1_code": null, "iso_3_code": "xti", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8261", "native_tokenizers": [], @@ -573,9 +678,11 @@ }, { "name": "Mixtec, San Juan Teita", + "depth": 5, "iso_1_code": null, "iso_3_code": "xtj", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8262", "native_tokenizers": [], @@ -583,9 +690,11 @@ }, { "name": "Mixtec, Tijaltepec", + "depth": 5, "iso_1_code": null, "iso_3_code": "xtl", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8263", "native_tokenizers": [], @@ -593,9 +702,11 @@ }, { "name": "Mixtec, Magdalena Pe\u00f1asco", + "depth": 5, "iso_1_code": null, "iso_3_code": "xtm", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8264", "native_tokenizers": [], @@ -605,9 +716,11 @@ }, { "name": "Mixtec, Northern Tlaxiaco", + "depth": 5, "iso_1_code": null, "iso_3_code": "xtn", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8265", "native_tokenizers": [], @@ -617,9 +730,11 @@ }, { "name": "Mixtec, San Miguel Piedras", + "depth": 5, "iso_1_code": null, "iso_3_code": "xtp", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8266", "native_tokenizers": [], @@ -627,9 +742,11 @@ }, { "name": "Mixtec, Sindihui", + "depth": 5, "iso_1_code": null, "iso_3_code": "xts", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8267", "native_tokenizers": [], @@ -637,9 +754,11 @@ }, { "name": "Mixtec, Tacahua", + "depth": 5, "iso_1_code": null, "iso_3_code": "xtt", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8268", "native_tokenizers": [], @@ -647,9 +766,11 @@ }, { "name": "Mixtec, Cuyamecalco", + "depth": 5, "iso_1_code": null, "iso_3_code": "xtu", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8269", "native_tokenizers": [], @@ -657,15 +778,18 @@ }, { "name": "Mixtec, Yolox\u00f3chitl", + "depth": 5, "iso_1_code": null, "iso_3_code": "xty", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8270", "native_tokenizers": [], "scripts": [] } ], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8218", "native_tokenizers": [], @@ -673,14 +797,17 @@ }, { "name": "Trique", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Triqui, Copala", + "depth": 5, "iso_1_code": null, "iso_3_code": "trc", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8272", "native_tokenizers": [], @@ -690,9 +817,11 @@ }, { "name": "Triqui, San Mart\u00edn Itunyoso", + "depth": 5, "iso_1_code": null, "iso_3_code": "trq", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8273", "native_tokenizers": [], @@ -702,9 +831,11 @@ }, { "name": "Triqui, Chicahuaxtla", + "depth": 5, "iso_1_code": null, "iso_3_code": "trs", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8274", "native_tokenizers": [], @@ -713,18 +844,21 @@ ] } ], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8271", "native_tokenizers": [], "scripts": [] } ], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8214", "native_tokenizers": [], "scripts": [] } ], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8209", "native_tokenizers": [], @@ -732,19 +866,23 @@ }, { "name": "Popolocan-Zapotecan", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Popolocan", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chocholtec", + "depth": 4, "iso_1_code": null, "iso_3_code": "coz", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8277", "native_tokenizers": [], @@ -752,9 +890,11 @@ }, { "name": "Ixcatec", + "depth": 4, "iso_1_code": null, "iso_3_code": "ixc", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8278", "native_tokenizers": [], @@ -762,14 +902,17 @@ }, { "name": "Mazatec", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mazatec, San Jer\u00f3nimo Tec\u00f3atl", + "depth": 5, "iso_1_code": null, "iso_3_code": "maa", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8280", "native_tokenizers": [], @@ -779,9 +922,11 @@ }, { "name": "Mazatec, Jalapa de D\u00edaz", + "depth": 5, "iso_1_code": null, "iso_3_code": "maj", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8281", "native_tokenizers": [], @@ -791,9 +936,11 @@ }, { "name": "Mazatec, Chiquihuitl\u00e1n", + "depth": 5, "iso_1_code": null, "iso_3_code": "maq", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8282", "native_tokenizers": [], @@ -803,9 +950,11 @@ }, { "name": "Mazatec, Huautla", + "depth": 5, "iso_1_code": null, "iso_3_code": "mau", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8283", "native_tokenizers": [], @@ -815,9 +964,11 @@ }, { "name": "Mazatec, Ixcatl\u00e1n", + "depth": 5, "iso_1_code": null, "iso_3_code": "mzi", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8284", "native_tokenizers": [], @@ -825,9 +976,11 @@ }, { "name": "Mazatec, Puebla and Northeastern", + "depth": 5, "iso_1_code": null, "iso_3_code": "pbm", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8285", "native_tokenizers": [], @@ -835,9 +988,11 @@ }, { "name": "Mazatec, Soyaltepec", + "depth": 5, "iso_1_code": null, "iso_3_code": "vmp", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8286", "native_tokenizers": [], @@ -845,9 +1000,11 @@ }, { "name": "Mazatec, Ayautla", + "depth": 5, "iso_1_code": null, "iso_3_code": "vmy", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8287", "native_tokenizers": [], @@ -857,15 +1014,18 @@ }, { "name": "Mazatec, Mazatl\u00e1n", + "depth": 5, "iso_1_code": null, "iso_3_code": "vmz", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8288", "native_tokenizers": [], "scripts": [] } ], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8279", "native_tokenizers": [], @@ -873,14 +1033,17 @@ }, { "name": "Popoloca", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Popoloca, Mezontla", + "depth": 5, "iso_1_code": null, "iso_3_code": "pbe", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8290", "native_tokenizers": [], @@ -888,9 +1051,11 @@ }, { "name": "Popoloca, Coyotepec", + "depth": 5, "iso_1_code": null, "iso_3_code": "pbf", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8291", "native_tokenizers": [], @@ -898,9 +1063,11 @@ }, { "name": "Popoloca, Santa In\u00e9s Ahuatempan", + "depth": 5, "iso_1_code": null, "iso_3_code": "pca", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8292", "native_tokenizers": [], @@ -908,9 +1075,11 @@ }, { "name": "Popoloca, San Marcos Tlacoyalco", + "depth": 5, "iso_1_code": null, "iso_3_code": "pls", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8293", "native_tokenizers": [], @@ -920,9 +1089,11 @@ }, { "name": "Popoloca, San Juan Atzingo", + "depth": 5, "iso_1_code": null, "iso_3_code": "poe", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8294", "native_tokenizers": [], @@ -932,9 +1103,11 @@ }, { "name": "Popoloca, San Felipe Otlaltepec", + "depth": 5, "iso_1_code": null, "iso_3_code": "pow", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8295", "native_tokenizers": [], @@ -942,9 +1115,11 @@ }, { "name": "Popoloca, San Lu\u00eds Temalacayuca", + "depth": 5, "iso_1_code": null, "iso_3_code": "pps", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8296", "native_tokenizers": [], @@ -953,12 +1128,14 @@ ] } ], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8289", "native_tokenizers": [], "scripts": [] } ], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8276", "native_tokenizers": [], @@ -966,19 +1143,23 @@ }, { "name": "Zapotecan", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chatino", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chatino, Eastern Highland", + "depth": 5, "iso_1_code": null, "iso_3_code": "cly", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8299", "native_tokenizers": [], @@ -988,9 +1169,11 @@ }, { "name": "Chatino, Tataltepec", + "depth": 5, "iso_1_code": null, "iso_3_code": "cta", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8300", "native_tokenizers": [], @@ -1000,9 +1183,11 @@ }, { "name": "Chatino, Western Highland", + "depth": 5, "iso_1_code": null, "iso_3_code": "ctp", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8301", "native_tokenizers": [], @@ -1012,9 +1197,11 @@ }, { "name": "Chatino, Zacatepec", + "depth": 5, "iso_1_code": null, "iso_3_code": "ctz", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8302", "native_tokenizers": [], @@ -1022,9 +1209,11 @@ }, { "name": "Chatino, Nopala", + "depth": 5, "iso_1_code": null, "iso_3_code": "cya", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8303", "native_tokenizers": [], @@ -1034,15 +1223,18 @@ }, { "name": "Chatino, Zenzontepec", + "depth": 5, "iso_1_code": null, "iso_3_code": "czn", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8304", "native_tokenizers": [], "scripts": [] } ], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8298", "native_tokenizers": [], @@ -1050,14 +1242,17 @@ }, { "name": "Zapotec", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Zapotec, Sierra de Ju\u00e1rez", + "depth": 5, "iso_1_code": null, "iso_3_code": "zaa", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8306", "native_tokenizers": [], @@ -1067,9 +1262,11 @@ }, { "name": "Zapotec, Western Tlacolula Valley", + "depth": 5, "iso_1_code": null, "iso_3_code": "zab", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8307", "native_tokenizers": [], @@ -1079,9 +1276,11 @@ }, { "name": "Zapotec, Ocotl\u00e1n", + "depth": 5, "iso_1_code": null, "iso_3_code": "zac", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8308", "native_tokenizers": [], @@ -1091,9 +1290,11 @@ }, { "name": "Zapotec, Cajonos", + "depth": 5, "iso_1_code": null, "iso_3_code": "zad", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8309", "native_tokenizers": [], @@ -1103,9 +1304,11 @@ }, { "name": "Zapotec, Yareni", + "depth": 5, "iso_1_code": null, "iso_3_code": "zae", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8310", "native_tokenizers": [], @@ -1115,9 +1318,11 @@ }, { "name": "Zapotec, Ayoquesco", + "depth": 5, "iso_1_code": null, "iso_3_code": "zaf", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8311", "native_tokenizers": [], @@ -1125,9 +1330,11 @@ }, { "name": "Zapotec, Isthmus", + "depth": 5, "iso_1_code": null, "iso_3_code": "zai", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8312", "native_tokenizers": [], @@ -1137,9 +1344,11 @@ }, { "name": "Zapotec, Miahuatl\u00e1n", + "depth": 5, "iso_1_code": null, "iso_3_code": "zam", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8313", "native_tokenizers": [], @@ -1149,9 +1358,11 @@ }, { "name": "Zapotec, Ozolotepec", + "depth": 5, "iso_1_code": null, "iso_3_code": "zao", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8314", "native_tokenizers": [], @@ -1161,9 +1372,11 @@ }, { "name": "Zapotec, Alo\u00e1pam", + "depth": 5, "iso_1_code": null, "iso_3_code": "zaq", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8315", "native_tokenizers": [], @@ -1171,9 +1384,11 @@ }, { "name": "Zapotec, Rinc\u00f3n", + "depth": 5, "iso_1_code": null, "iso_3_code": "zar", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8316", "native_tokenizers": [], @@ -1183,9 +1398,11 @@ }, { "name": "Zapotec, Santo Domingo Albarradas", + "depth": 5, "iso_1_code": null, "iso_3_code": "zas", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8317", "native_tokenizers": [], @@ -1195,9 +1412,11 @@ }, { "name": "Zapotec, Tabaa", + "depth": 5, "iso_1_code": null, "iso_3_code": "zat", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8318", "native_tokenizers": [], @@ -1207,9 +1426,11 @@ }, { "name": "Zapotec, Yatzachi", + "depth": 5, "iso_1_code": null, "iso_3_code": "zav", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8319", "native_tokenizers": [], @@ -1219,9 +1440,11 @@ }, { "name": "Zapotec, Mitla", + "depth": 5, "iso_1_code": null, "iso_3_code": "zaw", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8320", "native_tokenizers": [], @@ -1231,9 +1454,11 @@ }, { "name": "Zapotec, Xadani", + "depth": 5, "iso_1_code": null, "iso_3_code": "zax", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8321", "native_tokenizers": [], @@ -1241,9 +1466,11 @@ }, { "name": "Zapotec, Coatecas Altas", + "depth": 5, "iso_1_code": null, "iso_3_code": "zca", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8322", "native_tokenizers": [], @@ -1253,9 +1480,11 @@ }, { "name": "Zapotec, Las Delicias", + "depth": 5, "iso_1_code": null, "iso_3_code": "zcd", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8323", "native_tokenizers": [], @@ -1263,9 +1492,11 @@ }, { "name": "Zapotec, Asunci\u00f3n Mixtepec", + "depth": 5, "iso_1_code": null, "iso_3_code": "zoo", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8324", "native_tokenizers": [], @@ -1273,9 +1504,11 @@ }, { "name": "Zapotec, Lachiguiri", + "depth": 5, "iso_1_code": null, "iso_3_code": "zpa", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8325", "native_tokenizers": [], @@ -1285,9 +1518,11 @@ }, { "name": "Zapotec, Yautepec", + "depth": 5, "iso_1_code": null, "iso_3_code": "zpb", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8326", "native_tokenizers": [], @@ -1295,9 +1530,11 @@ }, { "name": "Zapotec, Choapan", + "depth": 5, "iso_1_code": null, "iso_3_code": "zpc", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8327", "native_tokenizers": [], @@ -1307,9 +1544,11 @@ }, { "name": "Zapotec, Southeastern Ixtl\u00e1n", + "depth": 5, "iso_1_code": null, "iso_3_code": "zpd", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8328", "native_tokenizers": [], @@ -1317,9 +1556,11 @@ }, { "name": "Zapotec, Petapa", + "depth": 5, "iso_1_code": null, "iso_3_code": "zpe", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8329", "native_tokenizers": [], @@ -1327,9 +1568,11 @@ }, { "name": "Zapotec, San Pedro Quiatoni", + "depth": 5, "iso_1_code": null, "iso_3_code": "zpf", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8330", "native_tokenizers": [], @@ -1337,9 +1580,11 @@ }, { "name": "Zapotec, Guevea de Humboldt", + "depth": 5, "iso_1_code": null, "iso_3_code": "zpg", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8331", "native_tokenizers": [], @@ -1349,9 +1594,11 @@ }, { "name": "Zapotec, Totomachapan", + "depth": 5, "iso_1_code": null, "iso_3_code": "zph", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8332", "native_tokenizers": [], @@ -1359,9 +1606,11 @@ }, { "name": "Zapotec, Santa Mar\u00eda Quiegolani", + "depth": 5, "iso_1_code": null, "iso_3_code": "zpi", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8333", "native_tokenizers": [], @@ -1371,9 +1620,11 @@ }, { "name": "Zapotec, Quiavicuzas", + "depth": 5, "iso_1_code": null, "iso_3_code": "zpj", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8334", "native_tokenizers": [], @@ -1383,9 +1634,11 @@ }, { "name": "Zapotec, Tlacolulita", + "depth": 5, "iso_1_code": null, "iso_3_code": "zpk", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8335", "native_tokenizers": [], @@ -1393,9 +1646,11 @@ }, { "name": "Zapotec, Lachix\u00edo", + "depth": 5, "iso_1_code": null, "iso_3_code": "zpl", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8336", "native_tokenizers": [], @@ -1405,9 +1660,11 @@ }, { "name": "Zapotec, Mixtepec", + "depth": 5, "iso_1_code": null, "iso_3_code": "zpm", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8337", "native_tokenizers": [], @@ -1417,9 +1674,11 @@ }, { "name": "Zapotec, Santa In\u00e9s Yatzechi", + "depth": 5, "iso_1_code": null, "iso_3_code": "zpn", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8338", "native_tokenizers": [], @@ -1427,9 +1686,11 @@ }, { "name": "Zapotec, Amatl\u00e1n", + "depth": 5, "iso_1_code": null, "iso_3_code": "zpo", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8339", "native_tokenizers": [], @@ -1439,9 +1700,11 @@ }, { "name": "Zapotec, El Alto", + "depth": 5, "iso_1_code": null, "iso_3_code": "zpp", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8340", "native_tokenizers": [], @@ -1449,9 +1712,11 @@ }, { "name": "Zapotec, Zoogocho", + "depth": 5, "iso_1_code": null, "iso_3_code": "zpq", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8341", "native_tokenizers": [], @@ -1461,9 +1726,11 @@ }, { "name": "Zapotec, Santiago Xanica", + "depth": 5, "iso_1_code": null, "iso_3_code": "zpr", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8342", "native_tokenizers": [], @@ -1471,9 +1738,11 @@ }, { "name": "Zapotec, Coatl\u00e1n", + "depth": 5, "iso_1_code": null, "iso_3_code": "zps", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8343", "native_tokenizers": [], @@ -1481,9 +1750,11 @@ }, { "name": "Zapotec, San Vicente Coatl\u00e1n", + "depth": 5, "iso_1_code": null, "iso_3_code": "zpt", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8344", "native_tokenizers": [], @@ -1493,9 +1764,11 @@ }, { "name": "Zapotec, Yal\u00e1lag", + "depth": 5, "iso_1_code": null, "iso_3_code": "zpu", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8345", "native_tokenizers": [], @@ -1505,9 +1778,11 @@ }, { "name": "Zapotec, Chichicapan", + "depth": 5, "iso_1_code": null, "iso_3_code": "zpv", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8346", "native_tokenizers": [], @@ -1517,9 +1792,11 @@ }, { "name": "Zapotec, Zaniza", + "depth": 5, "iso_1_code": null, "iso_3_code": "zpw", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8347", "native_tokenizers": [], @@ -1527,9 +1804,11 @@ }, { "name": "Zapotec, San Baltazar Loxicha", + "depth": 5, "iso_1_code": null, "iso_3_code": "zpx", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8348", "native_tokenizers": [], @@ -1537,9 +1816,11 @@ }, { "name": "Zapotec, Mazaltepec", + "depth": 5, "iso_1_code": null, "iso_3_code": "zpy", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8349", "native_tokenizers": [], @@ -1547,9 +1828,11 @@ }, { "name": "Zapotec, Texmelucan", + "depth": 5, "iso_1_code": null, "iso_3_code": "zpz", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8350", "native_tokenizers": [], @@ -1559,9 +1842,11 @@ }, { "name": "Zapotec, Southern Rincon", + "depth": 5, "iso_1_code": null, "iso_3_code": "zsr", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8351", "native_tokenizers": [], @@ -1571,9 +1856,11 @@ }, { "name": "Zapotec, Elotepec", + "depth": 5, "iso_1_code": null, "iso_3_code": "zte", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8352", "native_tokenizers": [], @@ -1581,9 +1868,11 @@ }, { "name": "Zapotec, Xanagu\u00eda", + "depth": 5, "iso_1_code": null, "iso_3_code": "ztg", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8353", "native_tokenizers": [], @@ -1591,9 +1880,11 @@ }, { "name": "Zapotec, Lapagu\u00eda-Guivini", + "depth": 5, "iso_1_code": null, "iso_3_code": "ztl", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8354", "native_tokenizers": [], @@ -1601,9 +1892,11 @@ }, { "name": "Zapotec, San Agust\u00edn Mixtepec", + "depth": 5, "iso_1_code": null, "iso_3_code": "ztm", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8355", "native_tokenizers": [], @@ -1611,9 +1904,11 @@ }, { "name": "Zapotec, Santa Catarina Albarradas", + "depth": 5, "iso_1_code": null, "iso_3_code": "ztn", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8356", "native_tokenizers": [], @@ -1621,9 +1916,11 @@ }, { "name": "Zapotec, Loxicha", + "depth": 5, "iso_1_code": null, "iso_3_code": "ztp", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8357", "native_tokenizers": [], @@ -1631,9 +1928,11 @@ }, { "name": "Zapotec, Quioquitani-Quier\u00ed", + "depth": 5, "iso_1_code": null, "iso_3_code": "ztq", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8358", "native_tokenizers": [], @@ -1643,9 +1942,11 @@ }, { "name": "Zapotec, Tilquiapan", + "depth": 5, "iso_1_code": null, "iso_3_code": "zts", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8359", "native_tokenizers": [], @@ -1653,9 +1954,11 @@ }, { "name": "Zapotec, Tejalapan", + "depth": 5, "iso_1_code": null, "iso_3_code": "ztt", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8360", "native_tokenizers": [], @@ -1663,9 +1966,11 @@ }, { "name": "Zapotec, G\u00fcil\u00e1", + "depth": 5, "iso_1_code": null, "iso_3_code": "ztu", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8361", "native_tokenizers": [], @@ -1673,9 +1978,11 @@ }, { "name": "Zapotec, Zaachila", + "depth": 5, "iso_1_code": null, "iso_3_code": "ztx", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8362", "native_tokenizers": [], @@ -1683,9 +1990,11 @@ }, { "name": "Zapotec, Yatee", + "depth": 5, "iso_1_code": null, "iso_3_code": "zty", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8363", "native_tokenizers": [], @@ -1694,24 +2003,28 @@ ] } ], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8305", "native_tokenizers": [], "scripts": [] } ], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8297", "native_tokenizers": [], "scripts": [] } ], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8275", "native_tokenizers": [], "scripts": [] } ], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8208", "native_tokenizers": [], @@ -1719,24 +2032,29 @@ }, { "name": "Western Otomanguean", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Oto-Pame-Chinantecan", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chinantecan", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chinantec, Comaltepec", + "depth": 4, "iso_1_code": null, "iso_3_code": "cco", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8367", "native_tokenizers": [], @@ -1746,9 +2064,11 @@ }, { "name": "Chinantec, Ojitl\u00e1n", + "depth": 4, "iso_1_code": null, "iso_3_code": "chj", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8368", "native_tokenizers": [], @@ -1758,9 +2078,11 @@ }, { "name": "Chinantec, Quiotepec", + "depth": 4, "iso_1_code": null, "iso_3_code": "chq", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8369", "native_tokenizers": [], @@ -1770,9 +2092,11 @@ }, { "name": "Chinantec, Ozumac\u00edn", + "depth": 4, "iso_1_code": null, "iso_3_code": "chz", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8370", "native_tokenizers": [], @@ -1782,9 +2106,11 @@ }, { "name": "Chinantec, Lealao", + "depth": 4, "iso_1_code": null, "iso_3_code": "cle", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8371", "native_tokenizers": [], @@ -1794,9 +2120,11 @@ }, { "name": "Chinantec, Lalana", + "depth": 4, "iso_1_code": null, "iso_3_code": "cnl", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8372", "native_tokenizers": [], @@ -1806,9 +2134,11 @@ }, { "name": "Chinantec, Tepetotutla", + "depth": 4, "iso_1_code": null, "iso_3_code": "cnt", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8373", "native_tokenizers": [], @@ -1818,9 +2148,11 @@ }, { "name": "Chinantec, Palantla", + "depth": 4, "iso_1_code": null, "iso_3_code": "cpa", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8374", "native_tokenizers": [], @@ -1830,9 +2162,11 @@ }, { "name": "Chinantec, Chiltepec", + "depth": 4, "iso_1_code": null, "iso_3_code": "csa", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8375", "native_tokenizers": [], @@ -1840,9 +2174,11 @@ }, { "name": "Chinantec, Sochiapam", + "depth": 4, "iso_1_code": null, "iso_3_code": "cso", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8376", "native_tokenizers": [], @@ -1852,9 +2188,11 @@ }, { "name": "Chinantec, Tepinapa", + "depth": 4, "iso_1_code": null, "iso_3_code": "cte", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8377", "native_tokenizers": [], @@ -1862,9 +2200,11 @@ }, { "name": "Chinantec, Tlacoatzintepec", + "depth": 4, "iso_1_code": null, "iso_3_code": "ctl", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8378", "native_tokenizers": [], @@ -1872,9 +2212,11 @@ }, { "name": "Chinantec, Usila", + "depth": 4, "iso_1_code": null, "iso_3_code": "cuc", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8379", "native_tokenizers": [], @@ -1884,15 +2226,18 @@ }, { "name": "Chinantec, Valle Nacional", + "depth": 4, "iso_1_code": null, "iso_3_code": "cvn", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8380", "native_tokenizers": [], "scripts": [] } ], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8366", "native_tokenizers": [], @@ -1900,14 +2245,17 @@ }, { "name": "Oto-Pamean", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chichimeco-Jonaz", + "depth": 4, "iso_1_code": null, "iso_3_code": "pei", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8382", "native_tokenizers": [], @@ -1915,14 +2263,17 @@ }, { "name": "Matlatzinca-Ocuilteco", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Matlatzinca, San Francisco", + "depth": 5, "iso_1_code": null, "iso_3_code": "mat", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8384", "native_tokenizers": [], @@ -1930,15 +2281,18 @@ }, { "name": "Matlatzinca, Atzingo", + "depth": 5, "iso_1_code": null, "iso_3_code": "ocu", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8385", "native_tokenizers": [], "scripts": [] } ], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8383", "native_tokenizers": [], @@ -1946,14 +2300,17 @@ }, { "name": "Mazahua", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mazahua, Central", + "depth": 5, "iso_1_code": null, "iso_3_code": "maz", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8387", "native_tokenizers": [], @@ -1963,15 +2320,18 @@ }, { "name": "Mazahua, Michoac\u00e1n", + "depth": 5, "iso_1_code": null, "iso_3_code": "mmc", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8388", "native_tokenizers": [], "scripts": [] } ], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8386", "native_tokenizers": [], @@ -1979,14 +2339,17 @@ }, { "name": "Otomi", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Otomi, Mezquital", + "depth": 5, "iso_1_code": null, "iso_3_code": "ote", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8390", "native_tokenizers": [], @@ -1996,9 +2359,11 @@ }, { "name": "Otomi, Tilapa", + "depth": 5, "iso_1_code": null, "iso_3_code": "otl", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8391", "native_tokenizers": [], @@ -2006,9 +2371,11 @@ }, { "name": "Otomi, Eastern Highland", + "depth": 5, "iso_1_code": null, "iso_3_code": "otm", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8392", "native_tokenizers": [], @@ -2018,9 +2385,11 @@ }, { "name": "Otomi, Tenango", + "depth": 5, "iso_1_code": null, "iso_3_code": "otn", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8393", "native_tokenizers": [], @@ -2030,9 +2399,11 @@ }, { "name": "Otomi, Quer\u00e9taro", + "depth": 5, "iso_1_code": null, "iso_3_code": "otq", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8394", "native_tokenizers": [], @@ -2042,9 +2413,11 @@ }, { "name": "Otom\u00ed, Estado de M\u00e9xico", + "depth": 5, "iso_1_code": null, "iso_3_code": "ots", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8395", "native_tokenizers": [], @@ -2054,9 +2427,11 @@ }, { "name": "Otomi, Temoaya", + "depth": 5, "iso_1_code": null, "iso_3_code": "ott", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8396", "native_tokenizers": [], @@ -2064,9 +2439,11 @@ }, { "name": "Otomi, Texcatepec", + "depth": 5, "iso_1_code": null, "iso_3_code": "otx", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8397", "native_tokenizers": [], @@ -2074,15 +2451,18 @@ }, { "name": "Otomi, Ixtenco", + "depth": 5, "iso_1_code": null, "iso_3_code": "otz", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8398", "native_tokenizers": [], "scripts": [] } ], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8389", "native_tokenizers": [], @@ -2090,14 +2470,17 @@ }, { "name": "Pame", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Pame, Central", + "depth": 5, "iso_1_code": null, "iso_3_code": "pbs", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8400", "native_tokenizers": [], @@ -2105,9 +2488,11 @@ }, { "name": "Pame, Northern", + "depth": 5, "iso_1_code": null, "iso_3_code": "pmq", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8401", "native_tokenizers": [], @@ -2117,27 +2502,32 @@ }, { "name": "Pame, Southern", + "depth": 5, "iso_1_code": null, "iso_3_code": "pmz", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8402", "native_tokenizers": [], "scripts": [] } ], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8399", "native_tokenizers": [], "scripts": [] } ], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8381", "native_tokenizers": [], "scripts": [] } ], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8365", "native_tokenizers": [], @@ -2145,25 +2535,30 @@ }, { "name": "Tlapanec-Manguean", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Manguean", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chiapanec", + "depth": 4, "iso_1_code": null, "iso_3_code": "cip", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8405", "native_tokenizers": [], "scripts": [] } ], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8404", "native_tokenizers": [], @@ -2171,14 +2566,17 @@ }, { "name": "Tlapanec-Subtiaba", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Subtiaba", + "depth": 4, "iso_1_code": null, "iso_3_code": "sut", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8407", "native_tokenizers": [], @@ -2186,14 +2584,17 @@ }, { "name": "Tlapanec", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Me\u2019phaa, Malinaltepec", + "depth": 5, "iso_1_code": null, "iso_3_code": "tcf", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8409", "native_tokenizers": [], @@ -2203,9 +2604,11 @@ }, { "name": "Me\u2019phaa, Azoy\u00fa", + "depth": 5, "iso_1_code": null, "iso_3_code": "tpc", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8410", "native_tokenizers": [], @@ -2213,9 +2616,11 @@ }, { "name": "Me\u2019phaa, Tlacoapa", + "depth": 5, "iso_1_code": null, "iso_3_code": "tpl", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8411", "native_tokenizers": [], @@ -2223,39 +2628,46 @@ }, { "name": "Me\u2019phaa, Acatepec", + "depth": 5, "iso_1_code": null, "iso_3_code": "tpx", "children": [], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8412", "native_tokenizers": [], "scripts": [] } ], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8408", "native_tokenizers": [], "scripts": [] } ], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8406", "native_tokenizers": [], "scripts": [] } ], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8403", "native_tokenizers": [], "scripts": [] } ], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8364", "native_tokenizers": [], "scripts": [] } ], + "family": "Otomanguean", "tokenizers": {}, "node_i": "8207", "native_tokenizers": [], diff --git a/data/Paezan.json b/data/Paezan.json index c23c135f39032acd4506acae1cb95feea88b077e..f25781b94de0397d2e13a66842288ea0f1dc33b4 100644 --- a/data/Paezan.json +++ b/data/Paezan.json @@ -1,13 +1,16 @@ { "name": "Paezan", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Andaqui", + "depth": 1, "iso_1_code": null, "iso_3_code": "ana", "children": [], + "family": "Paezan", "tokenizers": {}, "node_i": "8414", "native_tokenizers": [], @@ -15,14 +18,17 @@ }, { "name": "Coconuco", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Anserma", + "depth": 2, "iso_1_code": null, "iso_3_code": "ans", "children": [], + "family": "Paezan", "tokenizers": {}, "node_i": "8416", "native_tokenizers": [], @@ -30,9 +36,11 @@ }, { "name": "Caramanta", + "depth": 2, "iso_1_code": null, "iso_3_code": "crf", "children": [], + "family": "Paezan", "tokenizers": {}, "node_i": "8417", "native_tokenizers": [], @@ -40,9 +48,11 @@ }, { "name": "Misak", + "depth": 2, "iso_1_code": null, "iso_3_code": "gum", "children": [], + "family": "Paezan", "tokenizers": {}, "node_i": "8418", "native_tokenizers": [], @@ -52,15 +62,18 @@ }, { "name": "Totoro", + "depth": 2, "iso_1_code": null, "iso_3_code": "ttk", "children": [], + "family": "Paezan", "tokenizers": {}, "node_i": "8419", "native_tokenizers": [], "scripts": [] } ], + "family": "Paezan", "tokenizers": {}, "node_i": "8415", "native_tokenizers": [], @@ -68,14 +81,17 @@ }, { "name": "Paezan", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nasa", + "depth": 2, "iso_1_code": null, "iso_3_code": "pbb", "children": [], + "family": "Paezan", "tokenizers": {}, "node_i": "8421", "native_tokenizers": [], @@ -84,12 +100,14 @@ ] } ], + "family": "Paezan", "tokenizers": {}, "node_i": "8420", "native_tokenizers": [], "scripts": [] } ], + "family": "Paezan", "tokenizers": {}, "node_i": "8413", "native_tokenizers": [], diff --git a/data/Palaihnihan.json b/data/Palaihnihan.json index 82c76bdbc3764bbbbfc93cf0bab3133d3744481b..537e595aca37ab9aaf69edb561c932f145e59b40 100644 --- a/data/Palaihnihan.json +++ b/data/Palaihnihan.json @@ -1,13 +1,16 @@ { "name": "Palaihnihan", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Achumawi", + "depth": 1, "iso_1_code": null, "iso_3_code": "acv", "children": [], + "family": "Palaihnihan", "tokenizers": {}, "node_i": "8423", "native_tokenizers": [], @@ -15,15 +18,18 @@ }, { "name": "Atsugewi", + "depth": 1, "iso_1_code": null, "iso_3_code": "atw", "children": [], + "family": "Palaihnihan", "tokenizers": {}, "node_i": "8424", "native_tokenizers": [], "scripts": [] } ], + "family": "Palaihnihan", "tokenizers": {}, "node_i": "8422", "native_tokenizers": [], diff --git a/data/Panoan.json b/data/Panoan.json index 12912d021e54a96d5e7b283a7fc208e4c021265b..d99b57302563965dc4cc1c5c54a39d132f723371 100644 --- a/data/Panoan.json +++ b/data/Panoan.json @@ -1,13 +1,16 @@ { "name": "Panoan", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kaxarar\u00ed", + "depth": 1, "iso_1_code": null, "iso_3_code": "ktx", "children": [], + "family": "Panoan", "tokenizers": {}, "node_i": "8426", "native_tokenizers": [], @@ -15,9 +18,11 @@ }, { "name": "Pisabo", + "depth": 1, "iso_1_code": null, "iso_3_code": "pig", "children": [], + "family": "Panoan", "tokenizers": {}, "node_i": "8427", "native_tokenizers": [], @@ -25,9 +30,11 @@ }, { "name": "Sensi", + "depth": 1, "iso_1_code": null, "iso_3_code": "sni", "children": [], + "family": "Panoan", "tokenizers": {}, "node_i": "8428", "native_tokenizers": [], @@ -35,9 +42,11 @@ }, { "name": "Kulina Pano", + "depth": 1, "iso_1_code": null, "iso_3_code": "xpk", "children": [], + "family": "Panoan", "tokenizers": {}, "node_i": "8429", "native_tokenizers": [], @@ -45,14 +54,17 @@ }, { "name": "Bolivian Panoan", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Pacahuara", + "depth": 2, "iso_1_code": null, "iso_3_code": "pcp", "children": [], + "family": "Panoan", "tokenizers": {}, "node_i": "8431", "native_tokenizers": [], @@ -60,14 +72,17 @@ }, { "name": "Ch\u00e1kobo", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ch\u00e1cobo", + "depth": 3, "iso_1_code": null, "iso_3_code": "cao", "children": [], + "family": "Panoan", "tokenizers": {}, "node_i": "8433", "native_tokenizers": [], @@ -76,12 +91,14 @@ ] } ], + "family": "Panoan", "tokenizers": {}, "node_i": "8432", "native_tokenizers": [], "scripts": [] } ], + "family": "Panoan", "tokenizers": {}, "node_i": "8430", "native_tokenizers": [], @@ -89,14 +106,17 @@ }, { "name": "Mainline", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Poyan\u00e1wa", + "depth": 2, "iso_1_code": null, "iso_3_code": "pyn", "children": [], + "family": "Panoan", "tokenizers": {}, "node_i": "8435", "native_tokenizers": [], @@ -104,9 +124,11 @@ }, { "name": "Tuxin\u00e1wa", + "depth": 2, "iso_1_code": null, "iso_3_code": "tux", "children": [], + "family": "Panoan", "tokenizers": {}, "node_i": "8436", "native_tokenizers": [], @@ -114,14 +136,17 @@ }, { "name": "Cashibo", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kakataibo-Kashibo", + "depth": 3, "iso_1_code": null, "iso_3_code": "cbr", "children": [], + "family": "Panoan", "tokenizers": {}, "node_i": "8438", "native_tokenizers": [], @@ -130,6 +155,7 @@ ] } ], + "family": "Panoan", "tokenizers": {}, "node_i": "8437", "native_tokenizers": [], @@ -137,20 +163,24 @@ }, { "name": "Pano", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Panobo", + "depth": 3, "iso_1_code": null, "iso_3_code": "pno", "children": [], + "family": "Panoan", "tokenizers": {}, "node_i": "8440", "native_tokenizers": [], "scripts": [] } ], + "family": "Panoan", "tokenizers": {}, "node_i": "8439", "native_tokenizers": [], @@ -158,14 +188,17 @@ }, { "name": "Shipibo", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Capanahua", + "depth": 3, "iso_1_code": null, "iso_3_code": "kaq", "children": [], + "family": "Panoan", "tokenizers": {}, "node_i": "8442", "native_tokenizers": [], @@ -175,9 +208,11 @@ }, { "name": "Katuk\u00edna, Panoan", + "depth": 3, "iso_1_code": null, "iso_3_code": "knt", "children": [], + "family": "Panoan", "tokenizers": {}, "node_i": "8443", "native_tokenizers": [], @@ -185,9 +220,11 @@ }, { "name": "Marubo", + "depth": 3, "iso_1_code": null, "iso_3_code": "mzr", "children": [], + "family": "Panoan", "tokenizers": {}, "node_i": "8444", "native_tokenizers": [], @@ -195,9 +232,11 @@ }, { "name": "Remo", + "depth": 3, "iso_1_code": null, "iso_3_code": "rem", "children": [], + "family": "Panoan", "tokenizers": {}, "node_i": "8445", "native_tokenizers": [], @@ -205,9 +244,11 @@ }, { "name": "Shipibo-Conibo", + "depth": 3, "iso_1_code": null, "iso_3_code": "shp", "children": [], + "family": "Panoan", "tokenizers": {}, "node_i": "8446", "native_tokenizers": [], @@ -216,6 +257,7 @@ ] } ], + "family": "Panoan", "tokenizers": {}, "node_i": "8441", "native_tokenizers": [], @@ -223,14 +265,17 @@ }, { "name": "Tri-State", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kashinawa", + "depth": 3, "iso_1_code": null, "iso_3_code": "cbs", "children": [], + "family": "Panoan", "tokenizers": {}, "node_i": "8448", "native_tokenizers": [], @@ -240,9 +285,11 @@ }, { "name": "Sharanahua", + "depth": 3, "iso_1_code": null, "iso_3_code": "mcd", "children": [], + "family": "Panoan", "tokenizers": {}, "node_i": "8449", "native_tokenizers": [], @@ -252,9 +299,11 @@ }, { "name": "Yaminahua", + "depth": 3, "iso_1_code": null, "iso_3_code": "yaa", "children": [], + "family": "Panoan", "tokenizers": {}, "node_i": "8450", "native_tokenizers": [], @@ -264,9 +313,11 @@ }, { "name": "Yawanawa", + "depth": 3, "iso_1_code": null, "iso_3_code": "ywn", "children": [], + "family": "Panoan", "tokenizers": {}, "node_i": "8451", "native_tokenizers": [], @@ -274,14 +325,17 @@ }, { "name": "Amawaka", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Amahuaca", + "depth": 4, "iso_1_code": null, "iso_3_code": "amc", "children": [], + "family": "Panoan", "tokenizers": {}, "node_i": "8453", "native_tokenizers": [], @@ -289,21 +343,25 @@ }, { "name": "Isconahua", + "depth": 4, "iso_1_code": null, "iso_3_code": "isc", "children": [], + "family": "Panoan", "tokenizers": {}, "node_i": "8454", "native_tokenizers": [], "scripts": [] } ], + "family": "Panoan", "tokenizers": {}, "node_i": "8452", "native_tokenizers": [], "scripts": [] } ], + "family": "Panoan", "tokenizers": {}, "node_i": "8447", "native_tokenizers": [], @@ -311,14 +369,17 @@ }, { "name": "Unclassified", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Atsahuaca", + "depth": 3, "iso_1_code": null, "iso_3_code": "atc", "children": [], + "family": "Panoan", "tokenizers": {}, "node_i": "8456", "native_tokenizers": [], @@ -326,9 +387,11 @@ }, { "name": "Yora", + "depth": 3, "iso_1_code": null, "iso_3_code": "mts", "children": [], + "family": "Panoan", "tokenizers": {}, "node_i": "8457", "native_tokenizers": [], @@ -336,21 +399,25 @@ }, { "name": "Nukuini", + "depth": 3, "iso_1_code": null, "iso_3_code": "nuc", "children": [], + "family": "Panoan", "tokenizers": {}, "node_i": "8458", "native_tokenizers": [], "scripts": [] } ], + "family": "Panoan", "tokenizers": {}, "node_i": "8455", "native_tokenizers": [], "scripts": [] } ], + "family": "Panoan", "tokenizers": {}, "node_i": "8434", "native_tokenizers": [], @@ -358,14 +425,17 @@ }, { "name": "Mayoruna-Mats\u00e9s", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Matses", + "depth": 2, "iso_1_code": null, "iso_3_code": "mcf", "children": [], + "family": "Panoan", "tokenizers": {}, "node_i": "8460", "native_tokenizers": [], @@ -375,9 +445,11 @@ }, { "name": "Mat\u00eds", + "depth": 2, "iso_1_code": null, "iso_3_code": "mpq", "children": [], + "family": "Panoan", "tokenizers": {}, "node_i": "8461", "native_tokenizers": [], @@ -385,21 +457,25 @@ }, { "name": "Korubo", + "depth": 2, "iso_1_code": null, "iso_3_code": "xor", "children": [], + "family": "Panoan", "tokenizers": {}, "node_i": "8462", "native_tokenizers": [], "scripts": [] } ], + "family": "Panoan", "tokenizers": {}, "node_i": "8459", "native_tokenizers": [], "scripts": [] } ], + "family": "Panoan", "tokenizers": {}, "node_i": "8425", "native_tokenizers": [], diff --git a/data/Pauwasi.json b/data/Pauwasi.json index f299e54d4074206ed45717ebadf76e9ff8bcc562..2b203375649c0d750f55920cfb1a498df3481467 100644 --- a/data/Pauwasi.json +++ b/data/Pauwasi.json @@ -1,18 +1,22 @@ { "name": "Pauwasi", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Eastern", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Emem", + "depth": 2, "iso_1_code": null, "iso_3_code": "enr", "children": [], + "family": "Pauwasi", "tokenizers": {}, "node_i": "8465", "native_tokenizers": [], @@ -20,9 +24,11 @@ }, { "name": "Zorop", + "depth": 2, "iso_1_code": null, "iso_3_code": "wfg", "children": [], + "family": "Pauwasi", "tokenizers": {}, "node_i": "8466", "native_tokenizers": [], @@ -30,9 +36,11 @@ }, { "name": "Karkar-Yuri", + "depth": 2, "iso_1_code": null, "iso_3_code": "yuj", "children": [], + "family": "Pauwasi", "tokenizers": {}, "node_i": "8467", "native_tokenizers": [], @@ -41,6 +49,7 @@ ] } ], + "family": "Pauwasi", "tokenizers": {}, "node_i": "8464", "native_tokenizers": [], @@ -48,14 +57,17 @@ }, { "name": "Western", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tebi", + "depth": 2, "iso_1_code": null, "iso_3_code": "dmu", "children": [], + "family": "Pauwasi", "tokenizers": {}, "node_i": "8469", "native_tokenizers": [], @@ -63,21 +75,25 @@ }, { "name": "Towei", + "depth": 2, "iso_1_code": null, "iso_3_code": "ttn", "children": [], + "family": "Pauwasi", "tokenizers": {}, "node_i": "8470", "native_tokenizers": [], "scripts": [] } ], + "family": "Pauwasi", "tokenizers": {}, "node_i": "8468", "native_tokenizers": [], "scripts": [] } ], + "family": "Pauwasi", "tokenizers": {}, "node_i": "8463", "native_tokenizers": [], diff --git a/data/Piawi.json b/data/Piawi.json index 2e0a4dadb646c26a6c2c2db76d90285ff329c2cf..b78688860c61377dc10e6e29b0f631713a2c75f4 100644 --- a/data/Piawi.json +++ b/data/Piawi.json @@ -1,13 +1,16 @@ { "name": "Piawi", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Pinai-Hagahai", + "depth": 1, "iso_1_code": null, "iso_3_code": "pnn", "children": [], + "family": "Piawi", "tokenizers": {}, "node_i": "8472", "native_tokenizers": [], @@ -15,9 +18,11 @@ }, { "name": "Haruai", + "depth": 1, "iso_1_code": null, "iso_3_code": "tmd", "children": [], + "family": "Piawi", "tokenizers": {}, "node_i": "8473", "native_tokenizers": [], @@ -26,6 +31,7 @@ ] } ], + "family": "Piawi", "tokenizers": {}, "node_i": "8471", "native_tokenizers": [], diff --git a/data/Pidgin.json b/data/Pidgin.json index 57ae7b2b345451d719e4a6dc499a5c9c6248410c..8c6a6626067c0fae8d5477841914e4840fac9fee 100644 --- a/data/Pidgin.json +++ b/data/Pidgin.json @@ -1,13 +1,16 @@ { "name": "Pidgin", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mobilian", + "depth": 1, "iso_1_code": null, "iso_3_code": "mod", "children": [], + "family": "Pidgin", "tokenizers": {}, "node_i": "8475", "native_tokenizers": [], @@ -15,9 +18,11 @@ }, { "name": "Ndyuka-Trio Pidgin", + "depth": 1, "iso_1_code": null, "iso_3_code": "njt", "children": [], + "family": "Pidgin", "tokenizers": {}, "node_i": "8476", "native_tokenizers": [], @@ -25,14 +30,17 @@ }, { "name": "Amerindian", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chinook Wawa", + "depth": 2, "iso_1_code": null, "iso_3_code": "chn", "children": [], + "family": "Pidgin", "tokenizers": {}, "node_i": "8478", "native_tokenizers": [], @@ -40,15 +48,18 @@ }, { "name": "Delaware, Pidgin", + "depth": 2, "iso_1_code": null, "iso_3_code": "dep", "children": [], + "family": "Pidgin", "tokenizers": {}, "node_i": "8479", "native_tokenizers": [], "scripts": [] } ], + "family": "Pidgin", "tokenizers": {}, "node_i": "8477", "native_tokenizers": [], @@ -56,20 +67,24 @@ }, { "name": "Assamese based", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nefamese", + "depth": 2, "iso_1_code": null, "iso_3_code": "nef", "children": [], + "family": "Pidgin", "tokenizers": {}, "node_i": "8481", "native_tokenizers": [], "scripts": [] } ], + "family": "Pidgin", "tokenizers": {}, "node_i": "8480", "native_tokenizers": [], @@ -77,25 +92,30 @@ }, { "name": "English based", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Atlantic", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Liberian English", + "depth": 3, "iso_1_code": null, "iso_3_code": "lir", "children": [], + "family": "Pidgin", "tokenizers": {}, "node_i": "8484", "native_tokenizers": [], "scripts": [] } ], + "family": "Pidgin", "tokenizers": {}, "node_i": "8483", "native_tokenizers": [], @@ -103,26 +123,31 @@ }, { "name": "Pacific", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chinese Pidgin English", + "depth": 3, "iso_1_code": null, "iso_3_code": "cpi", "children": [], + "family": "Pidgin", "tokenizers": {}, "node_i": "8486", "native_tokenizers": [], "scripts": [] } ], + "family": "Pidgin", "tokenizers": {}, "node_i": "8485", "native_tokenizers": [], "scripts": [] } ], + "family": "Pidgin", "tokenizers": {}, "node_i": "8482", "native_tokenizers": [], @@ -130,20 +155,24 @@ }, { "name": "French based", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tay Boi", + "depth": 2, "iso_1_code": null, "iso_3_code": "tas", "children": [], + "family": "Pidgin", "tokenizers": {}, "node_i": "8488", "native_tokenizers": [], "scripts": [] } ], + "family": "Pidgin", "tokenizers": {}, "node_i": "8487", "native_tokenizers": [], @@ -151,14 +180,17 @@ }, { "name": "Hausa based", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Barikanchi", + "depth": 2, "iso_1_code": null, "iso_3_code": "bxo", "children": [], + "family": "Pidgin", "tokenizers": {}, "node_i": "8490", "native_tokenizers": [], @@ -166,15 +198,18 @@ }, { "name": "Gibanawa", + "depth": 2, "iso_1_code": null, "iso_3_code": "gib", "children": [], + "family": "Pidgin", "tokenizers": {}, "node_i": "8491", "native_tokenizers": [], "scripts": [] } ], + "family": "Pidgin", "tokenizers": {}, "node_i": "8489", "native_tokenizers": [], @@ -182,20 +217,24 @@ }, { "name": "Iha based", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Iha Based Pidgin", + "depth": 2, "iso_1_code": null, "iso_3_code": "ihb", "children": [], + "family": "Pidgin", "tokenizers": {}, "node_i": "8493", "native_tokenizers": [], "scripts": [] } ], + "family": "Pidgin", "tokenizers": {}, "node_i": "8492", "native_tokenizers": [], @@ -203,20 +242,24 @@ }, { "name": "Malay based", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Broome Pearling Lugger Pidgin", + "depth": 2, "iso_1_code": null, "iso_3_code": "bpl", "children": [], + "family": "Pidgin", "tokenizers": {}, "node_i": "8495", "native_tokenizers": [], "scripts": [] } ], + "family": "Pidgin", "tokenizers": {}, "node_i": "8494", "native_tokenizers": [], @@ -224,14 +267,17 @@ }, { "name": "Motu based", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Motu, Hiri", + "depth": 2, "iso_1_code": "ho", "iso_3_code": "hmo", "children": [], + "family": "Pidgin", "tokenizers": {}, "node_i": "8497", "native_tokenizers": [], @@ -240,6 +286,7 @@ ] } ], + "family": "Pidgin", "tokenizers": {}, "node_i": "8496", "native_tokenizers": [], @@ -247,20 +294,24 @@ }, { "name": "Onin based", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Onin Based Pidgin", + "depth": 2, "iso_1_code": null, "iso_3_code": "onx", "children": [], + "family": "Pidgin", "tokenizers": {}, "node_i": "8499", "native_tokenizers": [], "scripts": [] } ], + "family": "Pidgin", "tokenizers": {}, "node_i": "8498", "native_tokenizers": [], @@ -268,20 +319,24 @@ }, { "name": "Romance based", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Lingua Franca", + "depth": 2, "iso_1_code": null, "iso_3_code": "pml", "children": [], + "family": "Pidgin", "tokenizers": {}, "node_i": "8501", "native_tokenizers": [], "scripts": [] } ], + "family": "Pidgin", "tokenizers": {}, "node_i": "8500", "native_tokenizers": [], @@ -289,20 +344,24 @@ }, { "name": "Swahili based", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Settla", + "depth": 2, "iso_1_code": null, "iso_3_code": "sta", "children": [], + "family": "Pidgin", "tokenizers": {}, "node_i": "8503", "native_tokenizers": [], "scripts": [] } ], + "family": "Pidgin", "tokenizers": {}, "node_i": "8502", "native_tokenizers": [], @@ -310,26 +369,31 @@ }, { "name": "Zulu based", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Pidgin Bantu", + "depth": 2, "iso_1_code": null, "iso_3_code": "fng", "children": [], + "family": "Pidgin", "tokenizers": {}, "node_i": "8505", "native_tokenizers": [], "scripts": [] } ], + "family": "Pidgin", "tokenizers": {}, "node_i": "8504", "native_tokenizers": [], "scripts": [] } ], + "family": "Pidgin", "tokenizers": {}, "node_i": "8474", "native_tokenizers": [], diff --git a/data/Pomoan.json b/data/Pomoan.json index 5d3e3b9450204c5855f581736c7d9772bae21cc8..11077a17d8c9533807b6781ed1f50bd19994af70 100644 --- a/data/Pomoan.json +++ b/data/Pomoan.json @@ -1,13 +1,16 @@ { "name": "Pomoan", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Pomo, Eastern", + "depth": 1, "iso_1_code": null, "iso_3_code": "peb", "children": [], + "family": "Pomoan", "tokenizers": {}, "node_i": "8507", "native_tokenizers": [], @@ -15,9 +18,11 @@ }, { "name": "Pomo, Northeastern", + "depth": 1, "iso_1_code": null, "iso_3_code": "pef", "children": [], + "family": "Pomoan", "tokenizers": {}, "node_i": "8508", "native_tokenizers": [], @@ -25,9 +30,11 @@ }, { "name": "Pomo, Southeastern", + "depth": 1, "iso_1_code": null, "iso_3_code": "pom", "children": [], + "family": "Pomoan", "tokenizers": {}, "node_i": "8509", "native_tokenizers": [], @@ -35,14 +42,17 @@ }, { "name": "Western", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Pomo, Northern", + "depth": 2, "iso_1_code": null, "iso_3_code": "pej", "children": [], + "family": "Pomoan", "tokenizers": {}, "node_i": "8511", "native_tokenizers": [], @@ -50,14 +60,17 @@ }, { "name": "Southern", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kashaya", + "depth": 3, "iso_1_code": null, "iso_3_code": "kju", "children": [], + "family": "Pomoan", "tokenizers": {}, "node_i": "8513", "native_tokenizers": [], @@ -65,9 +78,11 @@ }, { "name": "Pomo, Southern", + "depth": 3, "iso_1_code": null, "iso_3_code": "peq", "children": [], + "family": "Pomoan", "tokenizers": {}, "node_i": "8514", "native_tokenizers": [], @@ -75,27 +90,32 @@ }, { "name": "Pomo, Central", + "depth": 3, "iso_1_code": null, "iso_3_code": "poo", "children": [], + "family": "Pomoan", "tokenizers": {}, "node_i": "8515", "native_tokenizers": [], "scripts": [] } ], + "family": "Pomoan", "tokenizers": {}, "node_i": "8512", "native_tokenizers": [], "scripts": [] } ], + "family": "Pomoan", "tokenizers": {}, "node_i": "8510", "native_tokenizers": [], "scripts": [] } ], + "family": "Pomoan", "tokenizers": {}, "node_i": "8506", "native_tokenizers": [], diff --git a/data/Puinavean.json b/data/Puinavean.json index 69088b63fe56700fe31e0677073d0fa8e115397b..311f1ac14f6bc8d132a255fc075677a5b1990a06 100644 --- a/data/Puinavean.json +++ b/data/Puinavean.json @@ -1,13 +1,16 @@ { "name": "Puinavean", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "D\u00e2w", + "depth": 1, "iso_1_code": null, "iso_3_code": "kwa", "children": [], + "family": "Puinavean", "tokenizers": {}, "node_i": "8517", "native_tokenizers": [], @@ -15,9 +18,11 @@ }, { "name": "Puinave", + "depth": 1, "iso_1_code": null, "iso_3_code": "pui", "children": [], + "family": "Puinavean", "tokenizers": {}, "node_i": "8518", "native_tokenizers": [], @@ -27,14 +32,17 @@ }, { "name": "Cacua", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Cacua", + "depth": 2, "iso_1_code": null, "iso_3_code": "cbv", "children": [], + "family": "Puinavean", "tokenizers": {}, "node_i": "8520", "native_tokenizers": [], @@ -44,15 +52,18 @@ }, { "name": "Nukak Mak\u00fa", + "depth": 2, "iso_1_code": null, "iso_3_code": "mbr", "children": [], + "family": "Puinavean", "tokenizers": {}, "node_i": "8521", "native_tokenizers": [], "scripts": [] } ], + "family": "Puinavean", "tokenizers": {}, "node_i": "8519", "native_tokenizers": [], @@ -60,14 +71,17 @@ }, { "name": "Hupda", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Hupd\u00eb", + "depth": 2, "iso_1_code": null, "iso_3_code": "jup", "children": [], + "family": "Puinavean", "tokenizers": {}, "node_i": "8523", "native_tokenizers": [], @@ -75,15 +89,18 @@ }, { "name": "Yuhup", + "depth": 2, "iso_1_code": null, "iso_3_code": "yab", "children": [], + "family": "Puinavean", "tokenizers": {}, "node_i": "8524", "native_tokenizers": [], "scripts": [] } ], + "family": "Puinavean", "tokenizers": {}, "node_i": "8522", "native_tokenizers": [], @@ -91,14 +108,17 @@ }, { "name": "Kaburi", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nad\u00ebb", + "depth": 2, "iso_1_code": null, "iso_3_code": "mbj", "children": [], + "family": "Puinavean", "tokenizers": {}, "node_i": "8526", "native_tokenizers": [], @@ -107,12 +127,14 @@ ] } ], + "family": "Puinavean", "tokenizers": {}, "node_i": "8525", "native_tokenizers": [], "scripts": [] } ], + "family": "Puinavean", "tokenizers": {}, "node_i": "8516", "native_tokenizers": [], diff --git a/data/Purian.json b/data/Purian.json index 7146b2c89624b3e33661d43efca89d9f9073ec09..9f83d9b0cfd7a6def44bb35b5fcc169b47fec95f 100644 --- a/data/Purian.json +++ b/data/Purian.json @@ -1,13 +1,16 @@ { "name": "Purian", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Puri", + "depth": 1, "iso_1_code": null, "iso_3_code": "prr", "children": [], + "family": "Purian", "tokenizers": {}, "node_i": "8528", "native_tokenizers": [], @@ -15,15 +18,18 @@ }, { "name": "Korop\u00f3", + "depth": 1, "iso_1_code": null, "iso_3_code": "xxr", "children": [], + "family": "Purian", "tokenizers": {}, "node_i": "8529", "native_tokenizers": [], "scripts": [] } ], + "family": "Purian", "tokenizers": {}, "node_i": "8527", "native_tokenizers": [], diff --git a/data/Quechuan.json b/data/Quechuan.json index 8a5e36aa996858141cd9e5080bbfe4800f72c6ac..2f771cc221957c9cf9c00eaa711792da0e4344a2 100644 --- a/data/Quechuan.json +++ b/data/Quechuan.json @@ -1,18 +1,22 @@ { "name": "Quechuan", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Central Quechua", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Quechua, Pacaraos", + "depth": 2, "iso_1_code": "qu", "iso_3_code": "qvp", "children": [], + "family": "Quechuan", "tokenizers": {}, "node_i": "8532", "native_tokenizers": [], @@ -20,14 +24,17 @@ }, { "name": "Ap-am-ah", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Quechua, Huallaga", + "depth": 3, "iso_1_code": "qu", "iso_3_code": "qub", "children": [], + "family": "Quechuan", "tokenizers": {}, "node_i": "8534", "native_tokenizers": [], @@ -37,9 +44,11 @@ }, { "name": "Quechua, Ambo-Pasco", + "depth": 3, "iso_1_code": "qu", "iso_3_code": "qva", "children": [], + "family": "Quechuan", "tokenizers": {}, "node_i": "8535", "native_tokenizers": [], @@ -49,9 +58,11 @@ }, { "name": "Quechua, Panao", + "depth": 3, "iso_1_code": "qu", "iso_3_code": "qxh", "children": [], + "family": "Quechuan", "tokenizers": {}, "node_i": "8536", "native_tokenizers": [], @@ -61,14 +72,17 @@ }, { "name": "Alto Mara\u00f1\u00f3n", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Quechua, Huamal\u00edes-Dos de Mayo", + "depth": 4, "iso_1_code": "qu", "iso_3_code": "qvh", "children": [], + "family": "Quechuan", "tokenizers": {}, "node_i": "8538", "native_tokenizers": [], @@ -78,9 +92,11 @@ }, { "name": "Quechua, Margos-Yarowilca-Lauricocha", + "depth": 4, "iso_1_code": "qu", "iso_3_code": "qvm", "children": [], + "family": "Quechuan", "tokenizers": {}, "node_i": "8539", "native_tokenizers": [], @@ -89,6 +105,7 @@ ] } ], + "family": "Quechuan", "tokenizers": {}, "node_i": "8537", "native_tokenizers": [], @@ -96,14 +113,17 @@ }, { "name": "Alto Pativilca", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Quechua, Cajatambo North Lima", + "depth": 4, "iso_1_code": "qu", "iso_3_code": "qvl", "children": [], + "family": "Quechuan", "tokenizers": {}, "node_i": "8541", "native_tokenizers": [], @@ -111,21 +131,25 @@ }, { "name": "Quechua, Chiqui\u00e1n", + "depth": 4, "iso_1_code": "qu", "iso_3_code": "qxa", "children": [], + "family": "Quechuan", "tokenizers": {}, "node_i": "8542", "native_tokenizers": [], "scripts": [] } ], + "family": "Quechuan", "tokenizers": {}, "node_i": "8540", "native_tokenizers": [], "scripts": [] } ], + "family": "Quechuan", "tokenizers": {}, "node_i": "8533", "native_tokenizers": [], @@ -133,14 +157,17 @@ }, { "name": "Wankay", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Quechua, Chaupihuaranga", + "depth": 3, "iso_1_code": "qu", "iso_3_code": "qur", "children": [], + "family": "Quechuan", "tokenizers": {}, "node_i": "8544", "native_tokenizers": [], @@ -148,9 +175,11 @@ }, { "name": "Quechua, Yauyos", + "depth": 3, "iso_1_code": "qu", "iso_3_code": "qux", "children": [], + "family": "Quechuan", "tokenizers": {}, "node_i": "8545", "native_tokenizers": [], @@ -158,9 +187,11 @@ }, { "name": "Quechua, North Jun\u00edn", + "depth": 3, "iso_1_code": "qu", "iso_3_code": "qvn", "children": [], + "family": "Quechuan", "tokenizers": {}, "node_i": "8546", "native_tokenizers": [], @@ -170,9 +201,11 @@ }, { "name": "Quechua, Huaylla Wanca", + "depth": 3, "iso_1_code": "qu", "iso_3_code": "qvw", "children": [], + "family": "Quechuan", "tokenizers": {}, "node_i": "8547", "native_tokenizers": [], @@ -182,9 +215,11 @@ }, { "name": "Quechua, Chincha", + "depth": 3, "iso_1_code": "qu", "iso_3_code": "qxc", "children": [], + "family": "Quechuan", "tokenizers": {}, "node_i": "8548", "native_tokenizers": [], @@ -192,9 +227,11 @@ }, { "name": "Quechua, Santa Ana de Tusi Pasco", + "depth": 3, "iso_1_code": "qu", "iso_3_code": "qxt", "children": [], + "family": "Quechuan", "tokenizers": {}, "node_i": "8549", "native_tokenizers": [], @@ -202,15 +239,18 @@ }, { "name": "Quechua, Jauja Wanca", + "depth": 3, "iso_1_code": "qu", "iso_3_code": "qxw", "children": [], + "family": "Quechuan", "tokenizers": {}, "node_i": "8550", "native_tokenizers": [], "scripts": [] } ], + "family": "Quechuan", "tokenizers": {}, "node_i": "8543", "native_tokenizers": [], @@ -218,14 +258,17 @@ }, { "name": "Waylay", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Quechua, Corongo Ancash", + "depth": 3, "iso_1_code": "qu", "iso_3_code": "qwa", "children": [], + "family": "Quechuan", "tokenizers": {}, "node_i": "8552", "native_tokenizers": [], @@ -233,9 +276,11 @@ }, { "name": "Quechua, Huaylas Ancash", + "depth": 3, "iso_1_code": "qu", "iso_3_code": "qwh", "children": [], + "family": "Quechuan", "tokenizers": {}, "node_i": "8553", "native_tokenizers": [], @@ -245,9 +290,11 @@ }, { "name": "Quechua, Sihuas Ancash", + "depth": 3, "iso_1_code": "qu", "iso_3_code": "qws", "children": [], + "family": "Quechuan", "tokenizers": {}, "node_i": "8554", "native_tokenizers": [], @@ -255,14 +302,17 @@ }, { "name": "Conchucos", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Quechua, Northern Conchucos", + "depth": 4, "iso_1_code": "qu", "iso_3_code": "qxn", "children": [], + "family": "Quechuan", "tokenizers": {}, "node_i": "8556", "native_tokenizers": [], @@ -272,9 +322,11 @@ }, { "name": "Quechua, Southern Conchucos", + "depth": 4, "iso_1_code": "qu", "iso_3_code": "qxo", "children": [], + "family": "Quechuan", "tokenizers": {}, "node_i": "8557", "native_tokenizers": [], @@ -283,18 +335,21 @@ ] } ], + "family": "Quechuan", "tokenizers": {}, "node_i": "8555", "native_tokenizers": [], "scripts": [] } ], + "family": "Quechuan", "tokenizers": {}, "node_i": "8551", "native_tokenizers": [], "scripts": [] } ], + "family": "Quechuan", "tokenizers": {}, "node_i": "8531", "native_tokenizers": [], @@ -302,24 +357,29 @@ }, { "name": "Peripheral Quechua", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chinchay", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Northern Chinchay", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Inga", + "depth": 4, "iso_1_code": null, "iso_3_code": "inb", "children": [], + "family": "Quechuan", "tokenizers": {}, "node_i": "8561", "native_tokenizers": [], @@ -329,9 +389,11 @@ }, { "name": "Inga, Jungle", + "depth": 4, "iso_1_code": null, "iso_3_code": "inj", "children": [], + "family": "Quechuan", "tokenizers": {}, "node_i": "8562", "native_tokenizers": [], @@ -339,9 +401,11 @@ }, { "name": "Quichua, Calder\u00f3n Highland", + "depth": 4, "iso_1_code": "qu", "iso_3_code": "qud", "children": [], + "family": "Quechuan", "tokenizers": {}, "node_i": "8563", "native_tokenizers": [], @@ -349,9 +413,11 @@ }, { "name": "Quichua, Chimborazo Highland", + "depth": 4, "iso_1_code": "qu", "iso_3_code": "qug", "children": [], + "family": "Quechuan", "tokenizers": {}, "node_i": "8564", "native_tokenizers": [], @@ -361,9 +427,11 @@ }, { "name": "Quechua, Chachapoyas", + "depth": 4, "iso_1_code": "qu", "iso_3_code": "quk", "children": [], + "family": "Quechuan", "tokenizers": {}, "node_i": "8565", "native_tokenizers": [], @@ -371,9 +439,11 @@ }, { "name": "Quechua, Southern Pastaza", + "depth": 4, "iso_1_code": "qu", "iso_3_code": "qup", "children": [], + "family": "Quechuan", "tokenizers": {}, "node_i": "8566", "native_tokenizers": [], @@ -383,9 +453,11 @@ }, { "name": "Quichua, Tena Lowland", + "depth": 4, "iso_1_code": "qu", "iso_3_code": "quw", "children": [], + "family": "Quechuan", "tokenizers": {}, "node_i": "8567", "native_tokenizers": [], @@ -395,9 +467,11 @@ }, { "name": "Quichua, Imbabura Highland", + "depth": 4, "iso_1_code": "qu", "iso_3_code": "qvi", "children": [], + "family": "Quechuan", "tokenizers": {}, "node_i": "8568", "native_tokenizers": [], @@ -407,9 +481,11 @@ }, { "name": "Quichua, Loja Highland", + "depth": 4, "iso_1_code": "qu", "iso_3_code": "qvj", "children": [], + "family": "Quechuan", "tokenizers": {}, "node_i": "8569", "native_tokenizers": [], @@ -417,9 +493,11 @@ }, { "name": "Quichua, Napo", + "depth": 4, "iso_1_code": "qu", "iso_3_code": "qvo", "children": [], + "family": "Quechuan", "tokenizers": {}, "node_i": "8570", "native_tokenizers": [], @@ -429,9 +507,11 @@ }, { "name": "Quechua, San Mart\u00edn", + "depth": 4, "iso_1_code": "qu", "iso_3_code": "qvs", "children": [], + "family": "Quechuan", "tokenizers": {}, "node_i": "8571", "native_tokenizers": [], @@ -441,9 +521,11 @@ }, { "name": "Quichua, Northern Pastaza", + "depth": 4, "iso_1_code": "qu", "iso_3_code": "qvz", "children": [], + "family": "Quechuan", "tokenizers": {}, "node_i": "8572", "native_tokenizers": [], @@ -453,9 +535,11 @@ }, { "name": "Quichua, Salasaca Highland", + "depth": 4, "iso_1_code": "qu", "iso_3_code": "qxl", "children": [], + "family": "Quechuan", "tokenizers": {}, "node_i": "8573", "native_tokenizers": [], @@ -465,9 +549,11 @@ }, { "name": "Quichua, Ca\u00f1ar Highland", + "depth": 4, "iso_1_code": "qu", "iso_3_code": "qxr", "children": [], + "family": "Quechuan", "tokenizers": {}, "node_i": "8574", "native_tokenizers": [], @@ -476,6 +562,7 @@ ] } ], + "family": "Quechuan", "tokenizers": {}, "node_i": "8560", "native_tokenizers": [], @@ -483,14 +570,17 @@ }, { "name": "Southern Chinchay", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Quechua, South Bolivian", + "depth": 4, "iso_1_code": "qu", "iso_3_code": "quh", "children": [], + "family": "Quechuan", "tokenizers": {}, "node_i": "8576", "native_tokenizers": [], @@ -500,9 +590,11 @@ }, { "name": "Quechua, North Bolivian", + "depth": 4, "iso_1_code": "qu", "iso_3_code": "qul", "children": [], + "family": "Quechuan", "tokenizers": {}, "node_i": "8577", "native_tokenizers": [], @@ -512,9 +604,11 @@ }, { "name": "Quichua, Santiago del Estero", + "depth": 4, "iso_1_code": "qu", "iso_3_code": "qus", "children": [], + "family": "Quechuan", "tokenizers": {}, "node_i": "8578", "native_tokenizers": [], @@ -524,14 +618,17 @@ }, { "name": "Southern Peruvian Quechua", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Quechua, Ayacucho", + "depth": 5, "iso_1_code": "qu", "iso_3_code": "quy", "children": [], + "family": "Quechuan", "tokenizers": {}, "node_i": "8580", "native_tokenizers": [], @@ -541,9 +638,11 @@ }, { "name": "Quechua, Cusco", + "depth": 5, "iso_1_code": "qu", "iso_3_code": "quz", "children": [], + "family": "Quechuan", "tokenizers": {}, "node_i": "8581", "native_tokenizers": [], @@ -553,9 +652,11 @@ }, { "name": "Quechua, Eastern Apur\u00edmac", + "depth": 5, "iso_1_code": "qu", "iso_3_code": "qve", "children": [], + "family": "Quechuan", "tokenizers": {}, "node_i": "8582", "native_tokenizers": [], @@ -565,9 +666,11 @@ }, { "name": "Quechua, Puno", + "depth": 5, "iso_1_code": "qu", "iso_3_code": "qxp", "children": [], + "family": "Quechuan", "tokenizers": {}, "node_i": "8583", "native_tokenizers": [], @@ -575,27 +678,32 @@ }, { "name": "Quechua, Arequipa-La Uni\u00f3n", + "depth": 5, "iso_1_code": "qu", "iso_3_code": "qxu", "children": [], + "family": "Quechuan", "tokenizers": {}, "node_i": "8584", "native_tokenizers": [], "scripts": [] } ], + "family": "Quechuan", "tokenizers": {}, "node_i": "8579", "native_tokenizers": [], "scripts": [] } ], + "family": "Quechuan", "tokenizers": {}, "node_i": "8575", "native_tokenizers": [], "scripts": [] } ], + "family": "Quechuan", "tokenizers": {}, "node_i": "8559", "native_tokenizers": [], @@ -603,19 +711,23 @@ }, { "name": "Yungay", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Northern", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Quechua, Lambayeque", + "depth": 4, "iso_1_code": "qu", "iso_3_code": "quf", "children": [], + "family": "Quechuan", "tokenizers": {}, "node_i": "8587", "native_tokenizers": [], @@ -625,9 +737,11 @@ }, { "name": "Quechua, Cajamarca", + "depth": 4, "iso_1_code": "qu", "iso_3_code": "qvc", "children": [], + "family": "Quechuan", "tokenizers": {}, "node_i": "8588", "native_tokenizers": [], @@ -636,24 +750,28 @@ ] } ], + "family": "Quechuan", "tokenizers": {}, "node_i": "8586", "native_tokenizers": [], "scripts": [] } ], + "family": "Quechuan", "tokenizers": {}, "node_i": "8585", "native_tokenizers": [], "scripts": [] } ], + "family": "Quechuan", "tokenizers": {}, "node_i": "8558", "native_tokenizers": [], "scripts": [] } ], + "family": "Quechuan", "tokenizers": {}, "node_i": "8530", "native_tokenizers": [], diff --git a/data/Ramu-Lower Sepik.json b/data/Ramu-Lower Sepik.json index 8688a689ddf04f9c351ff30fdb3e64a99de56ae2..393af7f0986cfce1801e3a653e2da691edf8d34f 100644 --- a/data/Ramu-Lower Sepik.json +++ b/data/Ramu-Lower Sepik.json @@ -1,24 +1,29 @@ { "name": "Ramu-Lower Sepik", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kambot", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ap Ma", + "depth": 2, "iso_1_code": null, "iso_3_code": "kbx", "children": [], + "family": "Ramu-Lower Sepik", "tokenizers": {}, "node_i": "8591", "native_tokenizers": [], "scripts": [] } ], + "family": "Ramu-Lower Sepik", "tokenizers": {}, "node_i": "8590", "native_tokenizers": [], @@ -26,25 +31,30 @@ }, { "name": "Lower Sepik", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Angoram", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Angoram", + "depth": 3, "iso_1_code": null, "iso_3_code": "aog", "children": [], + "family": "Ramu-Lower Sepik", "tokenizers": {}, "node_i": "8594", "native_tokenizers": [], "scripts": [] } ], + "family": "Ramu-Lower Sepik", "tokenizers": {}, "node_i": "8593", "native_tokenizers": [], @@ -52,20 +62,24 @@ }, { "name": "Chambri", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chambri", + "depth": 3, "iso_1_code": null, "iso_3_code": "can", "children": [], + "family": "Ramu-Lower Sepik", "tokenizers": {}, "node_i": "8596", "native_tokenizers": [], "scripts": [] } ], + "family": "Ramu-Lower Sepik", "tokenizers": {}, "node_i": "8595", "native_tokenizers": [], @@ -73,14 +87,17 @@ }, { "name": "Karawari", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Karawari", + "depth": 3, "iso_1_code": null, "iso_3_code": "tzx", "children": [], + "family": "Ramu-Lower Sepik", "tokenizers": {}, "node_i": "8598", "native_tokenizers": [], @@ -88,15 +105,18 @@ }, { "name": "Yimas", + "depth": 3, "iso_1_code": null, "iso_3_code": "yee", "children": [], + "family": "Ramu-Lower Sepik", "tokenizers": {}, "node_i": "8599", "native_tokenizers": [], "scripts": [] } ], + "family": "Ramu-Lower Sepik", "tokenizers": {}, "node_i": "8597", "native_tokenizers": [], @@ -104,14 +124,17 @@ }, { "name": "Nor", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Murik", + "depth": 3, "iso_1_code": null, "iso_3_code": "mtf", "children": [], + "family": "Ramu-Lower Sepik", "tokenizers": {}, "node_i": "8601", "native_tokenizers": [], @@ -119,21 +142,25 @@ }, { "name": "Kopar", + "depth": 3, "iso_1_code": null, "iso_3_code": "xop", "children": [], + "family": "Ramu-Lower Sepik", "tokenizers": {}, "node_i": "8602", "native_tokenizers": [], "scripts": [] } ], + "family": "Ramu-Lower Sepik", "tokenizers": {}, "node_i": "8600", "native_tokenizers": [], "scripts": [] } ], + "family": "Ramu-Lower Sepik", "tokenizers": {}, "node_i": "8592", "native_tokenizers": [], @@ -141,19 +168,23 @@ }, { "name": "Ramu", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Grass", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Abu", + "depth": 3, "iso_1_code": null, "iso_3_code": "ado", "children": [], + "family": "Ramu-Lower Sepik", "tokenizers": {}, "node_i": "8605", "native_tokenizers": [], @@ -161,9 +192,11 @@ }, { "name": "Ambakich", + "depth": 3, "iso_1_code": null, "iso_3_code": "aew", "children": [], + "family": "Ramu-Lower Sepik", "tokenizers": {}, "node_i": "8606", "native_tokenizers": [], @@ -171,9 +204,11 @@ }, { "name": "Waran", + "depth": 3, "iso_1_code": null, "iso_3_code": "byz", "children": [], + "family": "Ramu-Lower Sepik", "tokenizers": {}, "node_i": "8607", "native_tokenizers": [], @@ -181,15 +216,18 @@ }, { "name": "Gorovu", + "depth": 3, "iso_1_code": null, "iso_3_code": "grq", "children": [], + "family": "Ramu-Lower Sepik", "tokenizers": {}, "node_i": "8608", "native_tokenizers": [], "scripts": [] } ], + "family": "Ramu-Lower Sepik", "tokenizers": {}, "node_i": "8604", "native_tokenizers": [], @@ -197,14 +235,17 @@ }, { "name": "Middle Ramu", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Aiome", + "depth": 3, "iso_1_code": null, "iso_3_code": "aki", "children": [], + "family": "Ramu-Lower Sepik", "tokenizers": {}, "node_i": "8610", "native_tokenizers": [], @@ -212,9 +253,11 @@ }, { "name": "Anor", + "depth": 3, "iso_1_code": null, "iso_3_code": "anj", "children": [], + "family": "Ramu-Lower Sepik", "tokenizers": {}, "node_i": "8611", "native_tokenizers": [], @@ -222,15 +265,18 @@ }, { "name": "Rao", + "depth": 3, "iso_1_code": null, "iso_3_code": "rao", "children": [], + "family": "Ramu-Lower Sepik", "tokenizers": {}, "node_i": "8612", "native_tokenizers": [], "scripts": [] } ], + "family": "Ramu-Lower Sepik", "tokenizers": {}, "node_i": "8609", "native_tokenizers": [], @@ -238,14 +284,17 @@ }, { "name": "Mikarew", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kire", + "depth": 3, "iso_1_code": null, "iso_3_code": "geb", "children": [], + "family": "Ramu-Lower Sepik", "tokenizers": {}, "node_i": "8614", "native_tokenizers": [], @@ -255,9 +304,11 @@ }, { "name": "Aruamu", + "depth": 3, "iso_1_code": null, "iso_3_code": "msy", "children": [], + "family": "Ramu-Lower Sepik", "tokenizers": {}, "node_i": "8615", "native_tokenizers": [], @@ -267,9 +318,11 @@ }, { "name": "Akukem", + "depth": 3, "iso_1_code": null, "iso_3_code": "spm", "children": [], + "family": "Ramu-Lower Sepik", "tokenizers": {}, "node_i": "8616", "native_tokenizers": [], @@ -278,6 +331,7 @@ ] } ], + "family": "Ramu-Lower Sepik", "tokenizers": {}, "node_i": "8613", "native_tokenizers": [], @@ -285,19 +339,23 @@ }, { "name": "Ottilien", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Borei", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mbore", + "depth": 4, "iso_1_code": null, "iso_3_code": "gai", "children": [], + "family": "Ramu-Lower Sepik", "tokenizers": {}, "node_i": "8619", "native_tokenizers": [], @@ -306,6 +364,7 @@ ] } ], + "family": "Ramu-Lower Sepik", "tokenizers": {}, "node_i": "8618", "native_tokenizers": [], @@ -313,14 +372,17 @@ }, { "name": "Bosmun-Awar", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Awar", + "depth": 4, "iso_1_code": null, "iso_3_code": "aya", "children": [], + "family": "Ramu-Lower Sepik", "tokenizers": {}, "node_i": "8621", "native_tokenizers": [], @@ -328,15 +390,18 @@ }, { "name": "Bosmun", + "depth": 4, "iso_1_code": null, "iso_3_code": "bqs", "children": [], + "family": "Ramu-Lower Sepik", "tokenizers": {}, "node_i": "8622", "native_tokenizers": [], "scripts": [] } ], + "family": "Ramu-Lower Sepik", "tokenizers": {}, "node_i": "8620", "native_tokenizers": [], @@ -344,14 +409,17 @@ }, { "name": "Watam", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kayan", + "depth": 4, "iso_1_code": null, "iso_3_code": "kct", "children": [], + "family": "Ramu-Lower Sepik", "tokenizers": {}, "node_i": "8624", "native_tokenizers": [], @@ -359,21 +427,25 @@ }, { "name": "Marangis", + "depth": 4, "iso_1_code": null, "iso_3_code": "wax", "children": [], + "family": "Ramu-Lower Sepik", "tokenizers": {}, "node_i": "8625", "native_tokenizers": [], "scripts": [] } ], + "family": "Ramu-Lower Sepik", "tokenizers": {}, "node_i": "8623", "native_tokenizers": [], "scripts": [] } ], + "family": "Ramu-Lower Sepik", "tokenizers": {}, "node_i": "8617", "native_tokenizers": [], @@ -381,14 +453,17 @@ }, { "name": "Tamolan", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chini", + "depth": 3, "iso_1_code": null, "iso_3_code": "afi", "children": [], + "family": "Ramu-Lower Sepik", "tokenizers": {}, "node_i": "8627", "native_tokenizers": [], @@ -396,9 +471,11 @@ }, { "name": "Breri", + "depth": 3, "iso_1_code": null, "iso_3_code": "brq", "children": [], + "family": "Ramu-Lower Sepik", "tokenizers": {}, "node_i": "8628", "native_tokenizers": [], @@ -406,9 +483,11 @@ }, { "name": "Igana", + "depth": 3, "iso_1_code": null, "iso_3_code": "igg", "children": [], + "family": "Ramu-Lower Sepik", "tokenizers": {}, "node_i": "8629", "native_tokenizers": [], @@ -416,9 +495,11 @@ }, { "name": "Inapang", + "depth": 3, "iso_1_code": null, "iso_3_code": "mzu", "children": [], + "family": "Ramu-Lower Sepik", "tokenizers": {}, "node_i": "8630", "native_tokenizers": [], @@ -426,9 +507,11 @@ }, { "name": "Romkun", + "depth": 3, "iso_1_code": null, "iso_3_code": "rmk", "children": [], + "family": "Ramu-Lower Sepik", "tokenizers": {}, "node_i": "8631", "native_tokenizers": [], @@ -436,15 +519,18 @@ }, { "name": "Kominimung", + "depth": 3, "iso_1_code": null, "iso_3_code": "xoi", "children": [], + "family": "Ramu-Lower Sepik", "tokenizers": {}, "node_i": "8632", "native_tokenizers": [], "scripts": [] } ], + "family": "Ramu-Lower Sepik", "tokenizers": {}, "node_i": "8626", "native_tokenizers": [], @@ -452,14 +538,17 @@ }, { "name": "Tanggu", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Andarum", + "depth": 3, "iso_1_code": null, "iso_3_code": "aod", "children": [], + "family": "Ramu-Lower Sepik", "tokenizers": {}, "node_i": "8634", "native_tokenizers": [], @@ -467,9 +556,11 @@ }, { "name": "Kanggape", + "depth": 3, "iso_1_code": null, "iso_3_code": "igm", "children": [], + "family": "Ramu-Lower Sepik", "tokenizers": {}, "node_i": "8635", "native_tokenizers": [], @@ -477,9 +568,11 @@ }, { "name": "Tanguat", + "depth": 3, "iso_1_code": null, "iso_3_code": "tbs", "children": [], + "family": "Ramu-Lower Sepik", "tokenizers": {}, "node_i": "8636", "native_tokenizers": [], @@ -487,27 +580,32 @@ }, { "name": "Tanggu", + "depth": 3, "iso_1_code": null, "iso_3_code": "tgu", "children": [], + "family": "Ramu-Lower Sepik", "tokenizers": {}, "node_i": "8637", "native_tokenizers": [], "scripts": [] } ], + "family": "Ramu-Lower Sepik", "tokenizers": {}, "node_i": "8633", "native_tokenizers": [], "scripts": [] } ], + "family": "Ramu-Lower Sepik", "tokenizers": {}, "node_i": "8603", "native_tokenizers": [], "scripts": [] } ], + "family": "Ramu-Lower Sepik", "tokenizers": {}, "node_i": "8589", "native_tokenizers": [], diff --git a/data/Sahaptian.json b/data/Sahaptian.json index 684d06e055d38825a0ef4d02028bb465c2bcd35a..373c1477429e2e9054be3661032f26b3f7a65304 100644 --- a/data/Sahaptian.json +++ b/data/Sahaptian.json @@ -1,13 +1,16 @@ { "name": "Sahaptian", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nez Perce", + "depth": 1, "iso_1_code": null, "iso_3_code": "nez", "children": [], + "family": "Sahaptian", "tokenizers": {}, "node_i": "8639", "native_tokenizers": [], @@ -15,14 +18,17 @@ }, { "name": "Sahaptin", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tenino", + "depth": 2, "iso_1_code": null, "iso_3_code": "tqn", "children": [], + "family": "Sahaptian", "tokenizers": {}, "node_i": "8641", "native_tokenizers": [], @@ -30,9 +36,11 @@ }, { "name": "Umatilla", + "depth": 2, "iso_1_code": null, "iso_3_code": "uma", "children": [], + "family": "Sahaptian", "tokenizers": {}, "node_i": "8642", "native_tokenizers": [], @@ -40,9 +48,11 @@ }, { "name": "Walla Walla", + "depth": 2, "iso_1_code": null, "iso_3_code": "waa", "children": [], + "family": "Sahaptian", "tokenizers": {}, "node_i": "8643", "native_tokenizers": [], @@ -50,21 +60,25 @@ }, { "name": "Yakama", + "depth": 2, "iso_1_code": null, "iso_3_code": "yak", "children": [], + "family": "Sahaptian", "tokenizers": {}, "node_i": "8644", "native_tokenizers": [], "scripts": [] } ], + "family": "Sahaptian", "tokenizers": {}, "node_i": "8640", "native_tokenizers": [], "scripts": [] } ], + "family": "Sahaptian", "tokenizers": {}, "node_i": "8638", "native_tokenizers": [], diff --git a/data/Salish.json b/data/Salish.json index 12c6cbc8fd42aa2dc2bdb60df838cfab90916cc3..a887acb46ecf9200436d820a5e7a122c285ca61d 100644 --- a/data/Salish.json +++ b/data/Salish.json @@ -1,13 +1,16 @@ { "name": "Salish", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bella Coola", + "depth": 1, "iso_1_code": null, "iso_3_code": "blc", "children": [], + "family": "Salish", "tokenizers": {}, "node_i": "8646", "native_tokenizers": [], @@ -15,9 +18,11 @@ }, { "name": "Tillamook", + "depth": 1, "iso_1_code": null, "iso_3_code": "til", "children": [], + "family": "Salish", "tokenizers": {}, "node_i": "8647", "native_tokenizers": [], @@ -25,14 +30,17 @@ }, { "name": "Central Salish", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Clallam", + "depth": 2, "iso_1_code": null, "iso_3_code": "clm", "children": [], + "family": "Salish", "tokenizers": {}, "node_i": "8649", "native_tokenizers": [], @@ -40,9 +48,11 @@ }, { "name": "Comox", + "depth": 2, "iso_1_code": null, "iso_3_code": "coo", "children": [], + "family": "Salish", "tokenizers": {}, "node_i": "8650", "native_tokenizers": [], @@ -50,9 +60,11 @@ }, { "name": "Halkomelem", + "depth": 2, "iso_1_code": null, "iso_3_code": "hur", "children": [], + "family": "Salish", "tokenizers": {}, "node_i": "8651", "native_tokenizers": [], @@ -60,9 +72,11 @@ }, { "name": "Nooksack", + "depth": 2, "iso_1_code": null, "iso_3_code": "nok", "children": [], + "family": "Salish", "tokenizers": {}, "node_i": "8652", "native_tokenizers": [], @@ -70,9 +84,11 @@ }, { "name": "Pentlatch", + "depth": 2, "iso_1_code": null, "iso_3_code": "ptw", "children": [], + "family": "Salish", "tokenizers": {}, "node_i": "8653", "native_tokenizers": [], @@ -80,9 +96,11 @@ }, { "name": "Sechelt", + "depth": 2, "iso_1_code": null, "iso_3_code": "sec", "children": [], + "family": "Salish", "tokenizers": {}, "node_i": "8654", "native_tokenizers": [], @@ -90,9 +108,11 @@ }, { "name": "Squamish", + "depth": 2, "iso_1_code": null, "iso_3_code": "squ", "children": [], + "family": "Salish", "tokenizers": {}, "node_i": "8655", "native_tokenizers": [], @@ -100,9 +120,11 @@ }, { "name": "Northern Straits Salish", + "depth": 2, "iso_1_code": null, "iso_3_code": "str", "children": [], + "family": "Salish", "tokenizers": {}, "node_i": "8656", "native_tokenizers": [], @@ -110,9 +132,11 @@ }, { "name": "Twana", + "depth": 2, "iso_1_code": null, "iso_3_code": "twa", "children": [], + "family": "Salish", "tokenizers": {}, "node_i": "8657", "native_tokenizers": [], @@ -120,14 +144,17 @@ }, { "name": "Lushootseed", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Lushootseed", + "depth": 3, "iso_1_code": null, "iso_3_code": "lut", "children": [], + "family": "Salish", "tokenizers": {}, "node_i": "8659", "native_tokenizers": [], @@ -135,9 +162,11 @@ }, { "name": "Skagit", + "depth": 3, "iso_1_code": null, "iso_3_code": "ska", "children": [], + "family": "Salish", "tokenizers": {}, "node_i": "8660", "native_tokenizers": [], @@ -145,9 +174,11 @@ }, { "name": "Southern Lushootseed", + "depth": 3, "iso_1_code": null, "iso_3_code": "slh", "children": [], + "family": "Salish", "tokenizers": {}, "node_i": "8661", "native_tokenizers": [], @@ -155,21 +186,25 @@ }, { "name": "Snohomish", + "depth": 3, "iso_1_code": null, "iso_3_code": "sno", "children": [], + "family": "Salish", "tokenizers": {}, "node_i": "8662", "native_tokenizers": [], "scripts": [] } ], + "family": "Salish", "tokenizers": {}, "node_i": "8658", "native_tokenizers": [], "scripts": [] } ], + "family": "Salish", "tokenizers": {}, "node_i": "8648", "native_tokenizers": [], @@ -177,14 +212,17 @@ }, { "name": "Interior", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Lillooet", + "depth": 2, "iso_1_code": null, "iso_3_code": "lil", "children": [], + "family": "Salish", "tokenizers": {}, "node_i": "8664", "native_tokenizers": [], @@ -192,9 +230,11 @@ }, { "name": "Shuswap", + "depth": 2, "iso_1_code": null, "iso_3_code": "shs", "children": [], + "family": "Salish", "tokenizers": {}, "node_i": "8665", "native_tokenizers": [], @@ -202,20 +242,24 @@ }, { "name": "Northern", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Thompson", + "depth": 3, "iso_1_code": null, "iso_3_code": "thp", "children": [], + "family": "Salish", "tokenizers": {}, "node_i": "8667", "native_tokenizers": [], "scripts": [] } ], + "family": "Salish", "tokenizers": {}, "node_i": "8666", "native_tokenizers": [], @@ -223,14 +267,17 @@ }, { "name": "Southern", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Columbia-Wenatchi", + "depth": 3, "iso_1_code": null, "iso_3_code": "col", "children": [], + "family": "Salish", "tokenizers": {}, "node_i": "8669", "native_tokenizers": [], @@ -238,9 +285,11 @@ }, { "name": "Coeur d\u2019Alene", + "depth": 3, "iso_1_code": null, "iso_3_code": "crd", "children": [], + "family": "Salish", "tokenizers": {}, "node_i": "8670", "native_tokenizers": [], @@ -248,9 +297,11 @@ }, { "name": "Okanagan", + "depth": 3, "iso_1_code": null, "iso_3_code": "oka", "children": [], + "family": "Salish", "tokenizers": {}, "node_i": "8671", "native_tokenizers": [], @@ -258,14 +309,17 @@ }, { "name": "Kalispel", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kalispel-Pend d\u2019Oreille", + "depth": 4, "iso_1_code": null, "iso_3_code": "fla", "children": [], + "family": "Salish", "tokenizers": {}, "node_i": "8673", "native_tokenizers": [], @@ -273,27 +327,32 @@ }, { "name": "Spokane", + "depth": 4, "iso_1_code": null, "iso_3_code": "spo", "children": [], + "family": "Salish", "tokenizers": {}, "node_i": "8674", "native_tokenizers": [], "scripts": [] } ], + "family": "Salish", "tokenizers": {}, "node_i": "8672", "native_tokenizers": [], "scripts": [] } ], + "family": "Salish", "tokenizers": {}, "node_i": "8668", "native_tokenizers": [], "scripts": [] } ], + "family": "Salish", "tokenizers": {}, "node_i": "8663", "native_tokenizers": [], @@ -301,19 +360,23 @@ }, { "name": "Tsamosan", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Inland", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chehalis, Upper", + "depth": 3, "iso_1_code": null, "iso_3_code": "cjh", "children": [], + "family": "Salish", "tokenizers": {}, "node_i": "8677", "native_tokenizers": [], @@ -321,15 +384,18 @@ }, { "name": "Cowlitz", + "depth": 3, "iso_1_code": null, "iso_3_code": "cow", "children": [], + "family": "Salish", "tokenizers": {}, "node_i": "8678", "native_tokenizers": [], "scripts": [] } ], + "family": "Salish", "tokenizers": {}, "node_i": "8676", "native_tokenizers": [], @@ -337,14 +403,17 @@ }, { "name": "Maritime", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chehalis, Lower", + "depth": 3, "iso_1_code": null, "iso_3_code": "cea", "children": [], + "family": "Salish", "tokenizers": {}, "node_i": "8680", "native_tokenizers": [], @@ -352,27 +421,32 @@ }, { "name": "Quinault", + "depth": 3, "iso_1_code": null, "iso_3_code": "qun", "children": [], + "family": "Salish", "tokenizers": {}, "node_i": "8681", "native_tokenizers": [], "scripts": [] } ], + "family": "Salish", "tokenizers": {}, "node_i": "8679", "native_tokenizers": [], "scripts": [] } ], + "family": "Salish", "tokenizers": {}, "node_i": "8675", "native_tokenizers": [], "scripts": [] } ], + "family": "Salish", "tokenizers": {}, "node_i": "8645", "native_tokenizers": [], diff --git a/data/Senagi.json b/data/Senagi.json index c1672545f8686a54a0fe78aaa2680ac8ef0a3147..dc7ed03b3e5ce392080b22d29320a6eab2c9c864 100644 --- a/data/Senagi.json +++ b/data/Senagi.json @@ -1,13 +1,16 @@ { "name": "Senagi", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Angor", + "depth": 1, "iso_1_code": null, "iso_3_code": "agg", "children": [], + "family": "Senagi", "tokenizers": {}, "node_i": "8683", "native_tokenizers": [], @@ -17,15 +20,18 @@ }, { "name": "Dla", + "depth": 1, "iso_1_code": null, "iso_3_code": "kbv", "children": [], + "family": "Senagi", "tokenizers": {}, "node_i": "8684", "native_tokenizers": [], "scripts": [] } ], + "family": "Senagi", "tokenizers": {}, "node_i": "8682", "native_tokenizers": [], diff --git a/data/Sepik.json b/data/Sepik.json index ab884d0b5f5842a9a7b595c36e871423af3778e5..bc625eec9e78706f88008f40723d79346fb60e89 100644 --- a/data/Sepik.json +++ b/data/Sepik.json @@ -1,18 +1,22 @@ { "name": "Sepik", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Abau", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Abau", + "depth": 2, "iso_1_code": null, "iso_3_code": "aau", "children": [], + "family": "Sepik", "tokenizers": {}, "node_i": "8687", "native_tokenizers": [], @@ -21,6 +25,7 @@ ] } ], + "family": "Sepik", "tokenizers": {}, "node_i": "8686", "native_tokenizers": [], @@ -28,14 +33,17 @@ }, { "name": "Iwam", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Amal", + "depth": 2, "iso_1_code": null, "iso_3_code": "aad", "children": [], + "family": "Sepik", "tokenizers": {}, "node_i": "8689", "native_tokenizers": [], @@ -43,9 +51,11 @@ }, { "name": "Iwam", + "depth": 2, "iso_1_code": null, "iso_3_code": "iwm", "children": [], + "family": "Sepik", "tokenizers": {}, "node_i": "8690", "native_tokenizers": [], @@ -53,9 +63,11 @@ }, { "name": "Iwam, Sepik", + "depth": 2, "iso_1_code": null, "iso_3_code": "iws", "children": [], + "family": "Sepik", "tokenizers": {}, "node_i": "8691", "native_tokenizers": [], @@ -64,6 +76,7 @@ ] } ], + "family": "Sepik", "tokenizers": {}, "node_i": "8688", "native_tokenizers": [], @@ -71,14 +84,17 @@ }, { "name": "Leonhard Schultze", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Pefiyahe", + "depth": 2, "iso_1_code": null, "iso_3_code": "ppq", "children": [], + "family": "Sepik", "tokenizers": {}, "node_i": "8693", "native_tokenizers": [], @@ -86,9 +102,11 @@ }, { "name": "Tuwari", + "depth": 2, "iso_1_code": null, "iso_3_code": "tww", "children": [], + "family": "Sepik", "tokenizers": {}, "node_i": "8694", "native_tokenizers": [], @@ -96,9 +114,11 @@ }, { "name": "Walio", + "depth": 2, "iso_1_code": null, "iso_3_code": "wla", "children": [], + "family": "Sepik", "tokenizers": {}, "node_i": "8695", "native_tokenizers": [], @@ -106,15 +126,18 @@ }, { "name": "Yawiyo", + "depth": 2, "iso_1_code": null, "iso_3_code": "ybx", "children": [], + "family": "Sepik", "tokenizers": {}, "node_i": "8696", "native_tokenizers": [], "scripts": [] } ], + "family": "Sepik", "tokenizers": {}, "node_i": "8692", "native_tokenizers": [], @@ -122,14 +145,17 @@ }, { "name": "Ndu", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ambulas", + "depth": 2, "iso_1_code": null, "iso_3_code": "abt", "children": [], + "family": "Sepik", "tokenizers": {}, "node_i": "8698", "native_tokenizers": [], @@ -139,9 +165,11 @@ }, { "name": "Burui", + "depth": 2, "iso_1_code": null, "iso_3_code": "bry", "children": [], + "family": "Sepik", "tokenizers": {}, "node_i": "8699", "native_tokenizers": [], @@ -149,9 +177,11 @@ }, { "name": "Boikin", + "depth": 2, "iso_1_code": null, "iso_3_code": "bzf", "children": [], + "family": "Sepik", "tokenizers": {}, "node_i": "8700", "native_tokenizers": [], @@ -159,9 +189,11 @@ }, { "name": "Gaikundi", + "depth": 2, "iso_1_code": null, "iso_3_code": "gbf", "children": [], + "family": "Sepik", "tokenizers": {}, "node_i": "8701", "native_tokenizers": [], @@ -169,9 +201,11 @@ }, { "name": "Iatmul", + "depth": 2, "iso_1_code": null, "iso_3_code": "ian", "children": [], + "family": "Sepik", "tokenizers": {}, "node_i": "8702", "native_tokenizers": [], @@ -181,9 +215,11 @@ }, { "name": "Mevembet", + "depth": 2, "iso_1_code": null, "iso_3_code": "keh", "children": [], + "family": "Sepik", "tokenizers": {}, "node_i": "8703", "native_tokenizers": [], @@ -191,9 +227,11 @@ }, { "name": "Koiwat", + "depth": 2, "iso_1_code": null, "iso_3_code": "kxt", "children": [], + "family": "Sepik", "tokenizers": {}, "node_i": "8704", "native_tokenizers": [], @@ -201,9 +239,11 @@ }, { "name": "Manambu", + "depth": 2, "iso_1_code": null, "iso_3_code": "mle", "children": [], + "family": "Sepik", "tokenizers": {}, "node_i": "8705", "native_tokenizers": [], @@ -211,9 +251,11 @@ }, { "name": "Gala", + "depth": 2, "iso_1_code": null, "iso_3_code": "nud", "children": [], + "family": "Sepik", "tokenizers": {}, "node_i": "8706", "native_tokenizers": [], @@ -221,9 +263,11 @@ }, { "name": "Sos Kundi", + "depth": 2, "iso_1_code": null, "iso_3_code": "sdk", "children": [], + "family": "Sepik", "tokenizers": {}, "node_i": "8707", "native_tokenizers": [], @@ -231,9 +275,11 @@ }, { "name": "Sengo", + "depth": 2, "iso_1_code": null, "iso_3_code": "spk", "children": [], + "family": "Sepik", "tokenizers": {}, "node_i": "8708", "native_tokenizers": [], @@ -241,9 +287,11 @@ }, { "name": "Hanga Hundi", + "depth": 2, "iso_1_code": null, "iso_3_code": "wos", "children": [], + "family": "Sepik", "tokenizers": {}, "node_i": "8709", "native_tokenizers": [], @@ -253,15 +301,18 @@ }, { "name": "Yalaku", + "depth": 2, "iso_1_code": null, "iso_3_code": "ylg", "children": [], + "family": "Sepik", "tokenizers": {}, "node_i": "8710", "native_tokenizers": [], "scripts": [] } ], + "family": "Sepik", "tokenizers": {}, "node_i": "8697", "native_tokenizers": [], @@ -269,14 +320,17 @@ }, { "name": "Nukuma", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kwoma", + "depth": 2, "iso_1_code": null, "iso_3_code": "kmo", "children": [], + "family": "Sepik", "tokenizers": {}, "node_i": "8712", "native_tokenizers": [], @@ -286,9 +340,11 @@ }, { "name": "Kwanga", + "depth": 2, "iso_1_code": null, "iso_3_code": "kwj", "children": [], + "family": "Sepik", "tokenizers": {}, "node_i": "8713", "native_tokenizers": [], @@ -298,9 +354,11 @@ }, { "name": "Mende", + "depth": 2, "iso_1_code": null, "iso_3_code": "sim", "children": [], + "family": "Sepik", "tokenizers": {}, "node_i": "8714", "native_tokenizers": [], @@ -309,6 +367,7 @@ ] } ], + "family": "Sepik", "tokenizers": {}, "node_i": "8711", "native_tokenizers": [], @@ -316,14 +375,17 @@ }, { "name": "Ram", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Pouye", + "depth": 2, "iso_1_code": null, "iso_3_code": "bye", "children": [], + "family": "Sepik", "tokenizers": {}, "node_i": "8716", "native_tokenizers": [], @@ -331,9 +393,11 @@ }, { "name": "Awtuw", + "depth": 2, "iso_1_code": null, "iso_3_code": "kmn", "children": [], + "family": "Sepik", "tokenizers": {}, "node_i": "8717", "native_tokenizers": [], @@ -341,15 +405,18 @@ }, { "name": "Karawa", + "depth": 2, "iso_1_code": null, "iso_3_code": "xrw", "children": [], + "family": "Sepik", "tokenizers": {}, "node_i": "8718", "native_tokenizers": [], "scripts": [] } ], + "family": "Sepik", "tokenizers": {}, "node_i": "8715", "native_tokenizers": [], @@ -357,19 +424,23 @@ }, { "name": "Sepik Hill", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Alamblak", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Alamblak", + "depth": 3, "iso_1_code": null, "iso_3_code": "amp", "children": [], + "family": "Sepik", "tokenizers": {}, "node_i": "8721", "native_tokenizers": [], @@ -379,15 +450,18 @@ }, { "name": "Kaningra", + "depth": 3, "iso_1_code": null, "iso_3_code": "knr", "children": [], + "family": "Sepik", "tokenizers": {}, "node_i": "8722", "native_tokenizers": [], "scripts": [] } ], + "family": "Sepik", "tokenizers": {}, "node_i": "8720", "native_tokenizers": [], @@ -395,14 +469,17 @@ }, { "name": "Bahinemo", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Berinomo", + "depth": 3, "iso_1_code": null, "iso_3_code": "bit", "children": [], + "family": "Sepik", "tokenizers": {}, "node_i": "8724", "native_tokenizers": [], @@ -410,9 +487,11 @@ }, { "name": "Bahinemo", + "depth": 3, "iso_1_code": null, "iso_3_code": "bjh", "children": [], + "family": "Sepik", "tokenizers": {}, "node_i": "8725", "native_tokenizers": [], @@ -420,9 +499,11 @@ }, { "name": "Bisis", + "depth": 3, "iso_1_code": null, "iso_3_code": "bnw", "children": [], + "family": "Sepik", "tokenizers": {}, "node_i": "8726", "native_tokenizers": [], @@ -430,9 +511,11 @@ }, { "name": "Kapriman", + "depth": 3, "iso_1_code": null, "iso_3_code": "dju", "children": [], + "family": "Sepik", "tokenizers": {}, "node_i": "8727", "native_tokenizers": [], @@ -440,9 +523,11 @@ }, { "name": "Mari", + "depth": 3, "iso_1_code": null, "iso_3_code": "mbx", "children": [], + "family": "Sepik", "tokenizers": {}, "node_i": "8728", "native_tokenizers": [], @@ -450,9 +535,11 @@ }, { "name": "Sumariup", + "depth": 3, "iso_1_code": null, "iso_3_code": "siv", "children": [], + "family": "Sepik", "tokenizers": {}, "node_i": "8729", "native_tokenizers": [], @@ -460,15 +547,18 @@ }, { "name": "Watakataui", + "depth": 3, "iso_1_code": null, "iso_3_code": "wtk", "children": [], + "family": "Sepik", "tokenizers": {}, "node_i": "8730", "native_tokenizers": [], "scripts": [] } ], + "family": "Sepik", "tokenizers": {}, "node_i": "8723", "native_tokenizers": [], @@ -476,14 +566,17 @@ }, { "name": "Papi", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Baiyamo", + "depth": 3, "iso_1_code": null, "iso_3_code": "ppe", "children": [], + "family": "Sepik", "tokenizers": {}, "node_i": "8732", "native_tokenizers": [], @@ -491,15 +584,18 @@ }, { "name": "Asaba", + "depth": 3, "iso_1_code": null, "iso_3_code": "seo", "children": [], + "family": "Sepik", "tokenizers": {}, "node_i": "8733", "native_tokenizers": [], "scripts": [] } ], + "family": "Sepik", "tokenizers": {}, "node_i": "8731", "native_tokenizers": [], @@ -507,14 +603,17 @@ }, { "name": "Sanio", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Niksek", + "depth": 3, "iso_1_code": null, "iso_3_code": "gbe", "children": [], + "family": "Sepik", "tokenizers": {}, "node_i": "8735", "native_tokenizers": [], @@ -522,9 +621,11 @@ }, { "name": "Hewa", + "depth": 3, "iso_1_code": null, "iso_3_code": "ham", "children": [], + "family": "Sepik", "tokenizers": {}, "node_i": "8736", "native_tokenizers": [], @@ -532,9 +633,11 @@ }, { "name": "Piame", + "depth": 3, "iso_1_code": null, "iso_3_code": "pin", "children": [], + "family": "Sepik", "tokenizers": {}, "node_i": "8737", "native_tokenizers": [], @@ -542,9 +645,11 @@ }, { "name": "Saniyo-Hiyewe", + "depth": 3, "iso_1_code": null, "iso_3_code": "sny", "children": [], + "family": "Sepik", "tokenizers": {}, "node_i": "8738", "native_tokenizers": [], @@ -553,12 +658,14 @@ ] } ], + "family": "Sepik", "tokenizers": {}, "node_i": "8734", "native_tokenizers": [], "scripts": [] } ], + "family": "Sepik", "tokenizers": {}, "node_i": "8719", "native_tokenizers": [], @@ -566,14 +673,17 @@ }, { "name": "Tama", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ayi", + "depth": 2, "iso_1_code": null, "iso_3_code": "ayq", "children": [], + "family": "Sepik", "tokenizers": {}, "node_i": "8740", "native_tokenizers": [], @@ -581,9 +691,11 @@ }, { "name": "Pahi", + "depth": 2, "iso_1_code": null, "iso_3_code": "lgt", "children": [], + "family": "Sepik", "tokenizers": {}, "node_i": "8741", "native_tokenizers": [], @@ -591,9 +703,11 @@ }, { "name": "Mehek", + "depth": 2, "iso_1_code": null, "iso_3_code": "nux", "children": [], + "family": "Sepik", "tokenizers": {}, "node_i": "8742", "native_tokenizers": [], @@ -601,9 +715,11 @@ }, { "name": "Pasi", + "depth": 2, "iso_1_code": null, "iso_3_code": "psq", "children": [], + "family": "Sepik", "tokenizers": {}, "node_i": "8743", "native_tokenizers": [], @@ -611,9 +727,11 @@ }, { "name": "Yessan-Mayo", + "depth": 2, "iso_1_code": null, "iso_3_code": "yss", "children": [], + "family": "Sepik", "tokenizers": {}, "node_i": "8744", "native_tokenizers": [], @@ -623,15 +741,18 @@ }, { "name": "Kalou", + "depth": 2, "iso_1_code": null, "iso_3_code": "ywa", "children": [], + "family": "Sepik", "tokenizers": {}, "node_i": "8745", "native_tokenizers": [], "scripts": [] } ], + "family": "Sepik", "tokenizers": {}, "node_i": "8739", "native_tokenizers": [], @@ -639,14 +760,17 @@ }, { "name": "Wogamusin-Chenapian", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chenapian", + "depth": 2, "iso_1_code": null, "iso_3_code": "cjn", "children": [], + "family": "Sepik", "tokenizers": {}, "node_i": "8747", "native_tokenizers": [], @@ -654,15 +778,18 @@ }, { "name": "Wogamusin", + "depth": 2, "iso_1_code": null, "iso_3_code": "wog", "children": [], + "family": "Sepik", "tokenizers": {}, "node_i": "8748", "native_tokenizers": [], "scripts": [] } ], + "family": "Sepik", "tokenizers": {}, "node_i": "8746", "native_tokenizers": [], @@ -670,14 +797,17 @@ }, { "name": "Yellow River", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ak", + "depth": 2, "iso_1_code": null, "iso_3_code": "akq", "children": [], + "family": "Sepik", "tokenizers": {}, "node_i": "8750", "native_tokenizers": [], @@ -685,9 +815,11 @@ }, { "name": "Awun", + "depth": 2, "iso_1_code": null, "iso_3_code": "aww", "children": [], + "family": "Sepik", "tokenizers": {}, "node_i": "8751", "native_tokenizers": [], @@ -695,15 +827,18 @@ }, { "name": "Namia", + "depth": 2, "iso_1_code": null, "iso_3_code": "nnm", "children": [], + "family": "Sepik", "tokenizers": {}, "node_i": "8752", "native_tokenizers": [], "scripts": [] } ], + "family": "Sepik", "tokenizers": {}, "node_i": "8749", "native_tokenizers": [], @@ -711,26 +846,31 @@ }, { "name": "Yerakai", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Yerakai", + "depth": 2, "iso_1_code": null, "iso_3_code": "yra", "children": [], + "family": "Sepik", "tokenizers": {}, "node_i": "8754", "native_tokenizers": [], "scripts": [] } ], + "family": "Sepik", "tokenizers": {}, "node_i": "8753", "native_tokenizers": [], "scripts": [] } ], + "family": "Sepik", "tokenizers": {}, "node_i": "8685", "native_tokenizers": [], diff --git a/data/Sign language.json b/data/Sign language.json index 19fbc0ce3c200cb019f2d1be8abc79a2b58ba9df..275606108f0c135303529364afef27c60deaa3b6 100644 --- a/data/Sign language.json +++ b/data/Sign language.json @@ -1,13 +1,16 @@ { "name": "Sign language", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "International Sign", + "depth": 1, "iso_1_code": null, "iso_3_code": "ils", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8756", "native_tokenizers": [], @@ -15,14 +18,17 @@ }, { "name": "Deaf community sign language", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Argentine Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "aed", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8758", "native_tokenizers": [], @@ -30,9 +36,11 @@ }, { "name": "Armenian Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "aen", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8759", "native_tokenizers": [], @@ -40,9 +48,11 @@ }, { "name": "Afghan Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "afg", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8760", "native_tokenizers": [], @@ -50,9 +60,11 @@ }, { "name": "American Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "ase", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8761", "native_tokenizers": [], @@ -60,9 +72,11 @@ }, { "name": "Auslan", + "depth": 2, "iso_1_code": null, "iso_3_code": "asf", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8762", "native_tokenizers": [], @@ -70,9 +84,11 @@ }, { "name": "Algerian Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "asp", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8763", "native_tokenizers": [], @@ -80,9 +96,11 @@ }, { "name": "Austrian Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "asq", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8764", "native_tokenizers": [], @@ -90,9 +108,11 @@ }, { "name": "British Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "bfi", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8765", "native_tokenizers": [], @@ -100,9 +120,11 @@ }, { "name": "Malian Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "bog", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8766", "native_tokenizers": [], @@ -110,9 +132,11 @@ }, { "name": "Bulgarian Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "bqn", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8767", "native_tokenizers": [], @@ -120,9 +144,11 @@ }, { "name": "Bolivian Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "bvl", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8768", "native_tokenizers": [], @@ -130,9 +156,11 @@ }, { "name": "Brazilian Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "bzs", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8769", "native_tokenizers": [], @@ -140,9 +168,11 @@ }, { "name": "Chadian Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "cds", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8770", "native_tokenizers": [], @@ -150,9 +180,11 @@ }, { "name": "Catalan Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "csc", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8771", "native_tokenizers": [], @@ -160,9 +192,11 @@ }, { "name": "Chiangmai Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "csd", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8772", "native_tokenizers": [], @@ -170,9 +204,11 @@ }, { "name": "Czech Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "cse", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8773", "native_tokenizers": [], @@ -180,9 +216,11 @@ }, { "name": "Cuban Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "csf", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8774", "native_tokenizers": [], @@ -190,9 +228,11 @@ }, { "name": "Chilean Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "csg", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8775", "native_tokenizers": [], @@ -200,9 +240,11 @@ }, { "name": "Chinese Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "csl", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8776", "native_tokenizers": [], @@ -210,9 +252,11 @@ }, { "name": "Colombian Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "csn", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8777", "native_tokenizers": [], @@ -220,9 +264,11 @@ }, { "name": "Croatian Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "csq", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8778", "native_tokenizers": [], @@ -230,9 +276,11 @@ }, { "name": "Costa Rican Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "csr", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8779", "native_tokenizers": [], @@ -240,9 +288,11 @@ }, { "name": "Cambodian Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "csx", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8780", "native_tokenizers": [], @@ -250,9 +300,11 @@ }, { "name": "Dominican Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "doq", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8781", "native_tokenizers": [], @@ -260,9 +312,11 @@ }, { "name": "Sign Language of the Netherlands", + "depth": 2, "iso_1_code": null, "iso_3_code": "dse", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8782", "native_tokenizers": [], @@ -270,9 +324,11 @@ }, { "name": "Danish Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "dsl", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8783", "native_tokenizers": [], @@ -280,9 +336,11 @@ }, { "name": "Ecuadorian Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "ecs", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8784", "native_tokenizers": [], @@ -290,9 +348,11 @@ }, { "name": "Egyptian Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "esl", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8785", "native_tokenizers": [], @@ -300,9 +360,11 @@ }, { "name": "Salvadoran Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "esn", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8786", "native_tokenizers": [], @@ -310,9 +372,11 @@ }, { "name": "Estonian Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "eso", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8787", "native_tokenizers": [], @@ -320,9 +384,11 @@ }, { "name": "Ethiopian Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "eth", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8788", "native_tokenizers": [], @@ -330,9 +396,11 @@ }, { "name": "Quebec Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "fcs", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8789", "native_tokenizers": [], @@ -340,9 +408,11 @@ }, { "name": "Finnish Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "fse", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8790", "native_tokenizers": [], @@ -350,9 +420,11 @@ }, { "name": "French Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "fsl", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8791", "native_tokenizers": [], @@ -360,9 +432,11 @@ }, { "name": "Finland-Swedish Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "fss", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8792", "native_tokenizers": [], @@ -370,9 +444,11 @@ }, { "name": "Ghanaian Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "gse", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8793", "native_tokenizers": [], @@ -380,9 +456,11 @@ }, { "name": "German Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "gsg", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8794", "native_tokenizers": [], @@ -390,9 +468,11 @@ }, { "name": "Guatemalan Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "gsm", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8795", "native_tokenizers": [], @@ -400,9 +480,11 @@ }, { "name": "Greek Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "gss", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8796", "native_tokenizers": [], @@ -410,9 +492,11 @@ }, { "name": "Guinean Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "gus", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8797", "native_tokenizers": [], @@ -420,9 +504,11 @@ }, { "name": "Hanoi Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "hab", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8798", "native_tokenizers": [], @@ -430,9 +516,11 @@ }, { "name": "Haiphong Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "haf", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8799", "native_tokenizers": [], @@ -440,9 +528,11 @@ }, { "name": "Honduran Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "hds", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8800", "native_tokenizers": [], @@ -450,9 +540,11 @@ }, { "name": "Hong Kong Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "hks", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8801", "native_tokenizers": [], @@ -460,9 +552,11 @@ }, { "name": "Ho Chi Minh City Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "hos", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8802", "native_tokenizers": [], @@ -470,9 +564,11 @@ }, { "name": "Hawai\u2018i Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "hps", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8803", "native_tokenizers": [], @@ -480,9 +576,11 @@ }, { "name": "Hungarian Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "hsh", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8804", "native_tokenizers": [], @@ -490,9 +588,11 @@ }, { "name": "Hausa Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "hsl", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8805", "native_tokenizers": [], @@ -500,9 +600,11 @@ }, { "name": "Icelandic Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "icl", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8806", "native_tokenizers": [], @@ -510,9 +612,11 @@ }, { "name": "Indonesian Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "inl", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8807", "native_tokenizers": [], @@ -520,9 +624,11 @@ }, { "name": "Indian Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "ins", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8808", "native_tokenizers": [], @@ -530,9 +636,11 @@ }, { "name": "Italian Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "ise", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8809", "native_tokenizers": [], @@ -540,9 +648,11 @@ }, { "name": "Irish Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "isg", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8810", "native_tokenizers": [], @@ -550,9 +660,11 @@ }, { "name": "Israeli Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "isr", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8811", "native_tokenizers": [], @@ -560,9 +672,11 @@ }, { "name": "Jamaican Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "jls", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8812", "native_tokenizers": [], @@ -570,9 +684,11 @@ }, { "name": "Jordanian Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "jos", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8813", "native_tokenizers": [], @@ -580,9 +696,11 @@ }, { "name": "Japanese Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "jsl", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8814", "native_tokenizers": [], @@ -590,9 +708,11 @@ }, { "name": "Selangor Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "kgi", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8815", "native_tokenizers": [], @@ -600,9 +720,11 @@ }, { "name": "Korean Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "kvk", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8816", "native_tokenizers": [], @@ -610,9 +732,11 @@ }, { "name": "Libyan Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "lbs", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8817", "native_tokenizers": [], @@ -620,9 +744,11 @@ }, { "name": "Guinea-Bissau Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "lgs", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8818", "native_tokenizers": [], @@ -630,9 +756,11 @@ }, { "name": "Lithuanian Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "lls", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8819", "native_tokenizers": [], @@ -640,9 +768,11 @@ }, { "name": "Burundian Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "lsb", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8820", "native_tokenizers": [], @@ -650,9 +780,11 @@ }, { "name": "Latvian Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "lsl", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8821", "native_tokenizers": [], @@ -660,9 +792,11 @@ }, { "name": "Tibetan Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "lsn", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8822", "native_tokenizers": [], @@ -670,9 +804,11 @@ }, { "name": "Laos Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "lso", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8823", "native_tokenizers": [], @@ -680,9 +816,11 @@ }, { "name": "Panamanian Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "lsp", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8824", "native_tokenizers": [], @@ -690,9 +828,11 @@ }, { "name": "Trinidad and Tobago Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "lst", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8825", "native_tokenizers": [], @@ -700,9 +840,11 @@ }, { "name": "Seychelles Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "lsw", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8826", "native_tokenizers": [], @@ -710,9 +852,11 @@ }, { "name": "Mauritian Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "lsy", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8827", "native_tokenizers": [], @@ -720,9 +864,11 @@ }, { "name": "Malawian Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "lws", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8828", "native_tokenizers": [], @@ -730,9 +876,11 @@ }, { "name": "Maltese Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "mdl", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8829", "native_tokenizers": [], @@ -740,9 +888,11 @@ }, { "name": "Mexican Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "mfs", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8830", "native_tokenizers": [], @@ -750,9 +900,11 @@ }, { "name": "Mongolian Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "msr", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8831", "native_tokenizers": [], @@ -760,9 +912,11 @@ }, { "name": "Malagasy Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "mzc", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8832", "native_tokenizers": [], @@ -770,9 +924,11 @@ }, { "name": "Mozambican Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "mzy", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8833", "native_tokenizers": [], @@ -780,9 +936,11 @@ }, { "name": "Namibian Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "nbs", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8834", "native_tokenizers": [], @@ -790,9 +948,11 @@ }, { "name": "Nicaraguan Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "ncs", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8835", "native_tokenizers": [], @@ -800,9 +960,11 @@ }, { "name": "Nigerian Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "nsi", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8836", "native_tokenizers": [], @@ -810,9 +972,11 @@ }, { "name": "Norwegian Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "nsl", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8837", "native_tokenizers": [], @@ -820,9 +984,11 @@ }, { "name": "Nepalese Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "nsp", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8838", "native_tokenizers": [], @@ -830,9 +996,11 @@ }, { "name": "Maritime Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "nsr", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8839", "native_tokenizers": [], @@ -840,9 +1008,11 @@ }, { "name": "New Zealand Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "nzs", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8840", "native_tokenizers": [], @@ -850,9 +1020,11 @@ }, { "name": "Papua New Guinean Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "pgz", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8841", "native_tokenizers": [], @@ -860,9 +1032,11 @@ }, { "name": "Pakistan Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "pks", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8842", "native_tokenizers": [], @@ -870,9 +1044,11 @@ }, { "name": "Peruvian Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "prl", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8843", "native_tokenizers": [], @@ -880,9 +1056,11 @@ }, { "name": "Iranian Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "psc", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8844", "native_tokenizers": [], @@ -890,9 +1068,11 @@ }, { "name": "Penang Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "psg", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8845", "native_tokenizers": [], @@ -900,9 +1080,11 @@ }, { "name": "Puerto Rican Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "psl", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8846", "native_tokenizers": [], @@ -910,9 +1092,11 @@ }, { "name": "Polish Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "pso", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8847", "native_tokenizers": [], @@ -920,9 +1104,11 @@ }, { "name": "Filipino Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "psp", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8848", "native_tokenizers": [], @@ -930,9 +1116,11 @@ }, { "name": "Portuguese Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "psr", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8849", "native_tokenizers": [], @@ -940,9 +1128,11 @@ }, { "name": "Paraguayan Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "pys", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8850", "native_tokenizers": [], @@ -950,9 +1140,11 @@ }, { "name": "Romanian Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "rms", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8851", "native_tokenizers": [], @@ -960,9 +1152,11 @@ }, { "name": "Russian Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "rsl", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8852", "native_tokenizers": [], @@ -970,9 +1164,11 @@ }, { "name": "Rwandan Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "rsn", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8853", "native_tokenizers": [], @@ -980,9 +1176,11 @@ }, { "name": "Saudi Arabian Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "sdl", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8854", "native_tokenizers": [], @@ -990,9 +1188,11 @@ }, { "name": "French Belgian Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "sfb", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8855", "native_tokenizers": [], @@ -1000,9 +1200,11 @@ }, { "name": "South African Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "sfs", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8856", "native_tokenizers": [], @@ -1010,9 +1212,11 @@ }, { "name": "Swiss-German Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "sgg", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8857", "native_tokenizers": [], @@ -1020,9 +1224,11 @@ }, { "name": "Sierra Leone Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "sgx", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8858", "native_tokenizers": [], @@ -1030,9 +1236,11 @@ }, { "name": "Swiss-Italian Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "slf", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8859", "native_tokenizers": [], @@ -1040,9 +1248,11 @@ }, { "name": "Singapore Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "sls", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8860", "native_tokenizers": [], @@ -1050,9 +1260,11 @@ }, { "name": "Albanian Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "sqk", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8861", "native_tokenizers": [], @@ -1060,9 +1272,11 @@ }, { "name": "Sri Lankan Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "sqs", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8862", "native_tokenizers": [], @@ -1070,9 +1284,11 @@ }, { "name": "Spanish Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "ssp", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8863", "native_tokenizers": [], @@ -1080,9 +1296,11 @@ }, { "name": "Swiss-French Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "ssr", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8864", "native_tokenizers": [], @@ -1090,9 +1308,11 @@ }, { "name": "Slovakian Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "svk", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8865", "native_tokenizers": [], @@ -1100,9 +1320,11 @@ }, { "name": "Swedish Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "swl", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8866", "native_tokenizers": [], @@ -1110,9 +1332,11 @@ }, { "name": "Solomon Islands Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "szs", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8867", "native_tokenizers": [], @@ -1120,9 +1344,11 @@ }, { "name": "Tunisian Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "tse", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8868", "native_tokenizers": [], @@ -1130,9 +1356,11 @@ }, { "name": "Turkish Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "tsm", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8869", "native_tokenizers": [], @@ -1140,9 +1368,11 @@ }, { "name": "Thai Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "tsq", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8870", "native_tokenizers": [], @@ -1150,9 +1380,11 @@ }, { "name": "Taiwan Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "tss", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8871", "native_tokenizers": [], @@ -1160,9 +1392,11 @@ }, { "name": "Tanzanian Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "tza", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8872", "native_tokenizers": [], @@ -1170,9 +1404,11 @@ }, { "name": "Ugandan Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "ugn", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8873", "native_tokenizers": [], @@ -1180,9 +1416,11 @@ }, { "name": "Uruguayan Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "ugy", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8874", "native_tokenizers": [], @@ -1190,9 +1428,11 @@ }, { "name": "Ukrainian Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "ukl", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8875", "native_tokenizers": [], @@ -1200,9 +1440,11 @@ }, { "name": "Flemish Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "vgt", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8876", "native_tokenizers": [], @@ -1210,9 +1452,11 @@ }, { "name": "Moldova Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "vsi", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8877", "native_tokenizers": [], @@ -1220,9 +1464,11 @@ }, { "name": "Venezuelan Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "vsl", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8878", "native_tokenizers": [], @@ -1230,9 +1476,11 @@ }, { "name": "Valencian Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "vsv", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8879", "native_tokenizers": [], @@ -1240,9 +1488,11 @@ }, { "name": "West Bengal Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "wbs", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8880", "native_tokenizers": [], @@ -1250,9 +1500,11 @@ }, { "name": "Kenyan Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "xki", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8881", "native_tokenizers": [], @@ -1260,9 +1512,11 @@ }, { "name": "Malaysian Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "xml", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8882", "native_tokenizers": [], @@ -1270,9 +1524,11 @@ }, { "name": "Moroccan Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "xms", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8883", "native_tokenizers": [], @@ -1280,9 +1536,11 @@ }, { "name": "Slovenian Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "ysl", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8884", "native_tokenizers": [], @@ -1290,9 +1548,11 @@ }, { "name": "Myanmar Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "ysm", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8885", "native_tokenizers": [], @@ -1300,9 +1560,11 @@ }, { "name": "Zimbabwe Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "zib", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8886", "native_tokenizers": [], @@ -1310,15 +1572,18 @@ }, { "name": "Zambian Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "zsl", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8887", "native_tokenizers": [], "scripts": [] } ], + "family": "Sign language", "tokenizers": {}, "node_i": "8757", "native_tokenizers": [], @@ -1326,14 +1591,17 @@ }, { "name": "Shared sign language", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Adamorobe Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "ads", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8889", "native_tokenizers": [], @@ -1341,9 +1609,11 @@ }, { "name": "Algerian Jewish Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "ajs", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8890", "native_tokenizers": [], @@ -1351,9 +1621,11 @@ }, { "name": "Australian Aborigines Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "asw", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8891", "native_tokenizers": [], @@ -1361,9 +1633,11 @@ }, { "name": "Ban Khor Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "bfk", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8892", "native_tokenizers": [], @@ -1371,9 +1645,11 @@ }, { "name": "Kata Kolok", + "depth": 2, "iso_1_code": null, "iso_3_code": "bqy", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8893", "native_tokenizers": [], @@ -1381,9 +1657,11 @@ }, { "name": "Mardin Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "dsz", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8894", "native_tokenizers": [], @@ -1391,9 +1669,11 @@ }, { "name": "Miyakubo Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "ehs", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8895", "native_tokenizers": [], @@ -1401,9 +1681,11 @@ }, { "name": "Ghandruk Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "gds", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8896", "native_tokenizers": [], @@ -1411,9 +1693,11 @@ }, { "name": "Inuit Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "iks", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8897", "native_tokenizers": [], @@ -1421,9 +1705,11 @@ }, { "name": "Konchri Sain", + "depth": 2, "iso_1_code": null, "iso_3_code": "jcs", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8898", "native_tokenizers": [], @@ -1431,9 +1717,11 @@ }, { "name": "Jhyankot Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "jhs", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8899", "native_tokenizers": [], @@ -1441,9 +1729,11 @@ }, { "name": "Amami Koniya Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "jks", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8900", "native_tokenizers": [], @@ -1451,9 +1741,11 @@ }, { "name": "Jumli Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "jus", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8901", "native_tokenizers": [], @@ -1461,9 +1753,11 @@ }, { "name": "Albarradas Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "lsc", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8902", "native_tokenizers": [], @@ -1471,9 +1765,11 @@ }, { "name": "Sivia Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "lsv", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8903", "native_tokenizers": [], @@ -1481,9 +1777,11 @@ }, { "name": "Martha\u2019s Vineyard Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "mre", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8904", "native_tokenizers": [], @@ -1491,9 +1789,11 @@ }, { "name": "Yucatec Maya Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "msd", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8905", "native_tokenizers": [], @@ -1501,9 +1801,11 @@ }, { "name": "Old Kentish Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "okl", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8906", "native_tokenizers": [], @@ -1511,9 +1813,11 @@ }, { "name": "Providencia Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "prz", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8907", "native_tokenizers": [], @@ -1521,9 +1825,11 @@ }, { "name": "Plains Indian Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "psd", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8908", "native_tokenizers": [], @@ -1531,9 +1837,11 @@ }, { "name": "Bribri Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "rib", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8909", "native_tokenizers": [], @@ -1541,9 +1849,11 @@ }, { "name": "Brunca Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "rnb", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8910", "native_tokenizers": [], @@ -1551,9 +1861,11 @@ }, { "name": "Miriwoong Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "rsm", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8911", "native_tokenizers": [], @@ -1561,9 +1873,11 @@ }, { "name": "Kufr Qassem Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "sqx", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8912", "native_tokenizers": [], @@ -1571,9 +1885,11 @@ }, { "name": "Al-Sayyid Bedouin Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "syy", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8913", "native_tokenizers": [], @@ -1581,9 +1897,11 @@ }, { "name": "Tebul Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "tsy", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8914", "native_tokenizers": [], @@ -1591,9 +1909,11 @@ }, { "name": "Kaapor Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "uks", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8915", "native_tokenizers": [], @@ -1601,9 +1921,11 @@ }, { "name": "Yolngu Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "ygs", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8916", "native_tokenizers": [], @@ -1611,21 +1933,25 @@ }, { "name": "Yan-nhangu Sign Language", + "depth": 2, "iso_1_code": null, "iso_3_code": "yhs", "children": [], + "family": "Sign language", "tokenizers": {}, "node_i": "8917", "native_tokenizers": [], "scripts": [] } ], + "family": "Sign language", "tokenizers": {}, "node_i": "8888", "native_tokenizers": [], "scripts": [] } ], + "family": "Sign language", "tokenizers": {}, "node_i": "8755", "native_tokenizers": [], diff --git a/data/Sino-Tibetan.json b/data/Sino-Tibetan.json index 69760c71620287e5ca39effd41ef14c8ec3a4d76..69e8d0bbef303f5a8c9f4e2d9ca60ac78c6c1735 100644 --- a/data/Sino-Tibetan.json +++ b/data/Sino-Tibetan.json @@ -1,18 +1,22 @@ { "name": "Sino-Tibetan", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chinese", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chinese, Min Dong", + "depth": 2, "iso_1_code": "zh", "iso_3_code": "cdo", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "8920", "native_tokenizers": [], @@ -20,9 +24,11 @@ }, { "name": "Chinese, Jinyu", + "depth": 2, "iso_1_code": "zh", "iso_3_code": "cjy", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "8921", "native_tokenizers": [], @@ -30,9 +36,11 @@ }, { "name": "Chinese, Mandarin", + "depth": 2, "iso_1_code": "zh", "iso_3_code": "cmn", "children": [], + "family": "Sino-Tibetan", "tokenizers": { "Hani": { "full_object": "SpaCyTokenizer(\"zh\", {\"nlp\": {\"tokenizer\": {\"segmenter\": \"jieba\"}}})", @@ -52,9 +60,11 @@ }, { "name": "Pinghua, Northern", + "depth": 2, "iso_1_code": "zh", "iso_3_code": "cnp", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "8923", "native_tokenizers": [], @@ -62,9 +72,11 @@ }, { "name": "Chinese, Pu-Xian", + "depth": 2, "iso_1_code": "zh", "iso_3_code": "cpx", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "8924", "native_tokenizers": [], @@ -72,9 +84,11 @@ }, { "name": "Pinghua, Southern", + "depth": 2, "iso_1_code": "zh", "iso_3_code": "csp", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "8925", "native_tokenizers": [], @@ -82,9 +96,11 @@ }, { "name": "Chinese, Huizhou", + "depth": 2, "iso_1_code": "zh", "iso_3_code": "czh", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "8926", "native_tokenizers": [], @@ -92,9 +108,11 @@ }, { "name": "Chinese, Min Zhong", + "depth": 2, "iso_1_code": "zh", "iso_3_code": "czo", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "8927", "native_tokenizers": [], @@ -102,9 +120,11 @@ }, { "name": "Dungan", + "depth": 2, "iso_1_code": null, "iso_3_code": "dng", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "8928", "native_tokenizers": [], @@ -114,9 +134,11 @@ }, { "name": "Chinese, Gan", + "depth": 2, "iso_1_code": "zh", "iso_3_code": "gan", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "8929", "native_tokenizers": [], @@ -124,9 +146,11 @@ }, { "name": "Chinese, Hakka", + "depth": 2, "iso_1_code": "zh", "iso_3_code": "hak", "children": [], + "family": "Sino-Tibetan", "tokenizers": { "Hani": { "full_object": "SpaCyTokenizer(\"zh\", {\"nlp\": {\"tokenizer\": {\"segmenter\": \"jieba\"}}})", @@ -147,9 +171,11 @@ }, { "name": "Chinese, Xiang", + "depth": 2, "iso_1_code": "zh", "iso_3_code": "hsn", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "8931", "native_tokenizers": [], @@ -157,9 +183,11 @@ }, { "name": "Chinese, Classical", + "depth": 2, "iso_1_code": "zh", "iso_3_code": "lzh", "children": [], + "family": "Sino-Tibetan", "tokenizers": { "Hani": { "full_object": "StanzaTokenizer(\"lzh\")", @@ -179,9 +207,11 @@ }, { "name": "Chinese, Min Bei", + "depth": 2, "iso_1_code": "zh", "iso_3_code": "mnp", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "8933", "native_tokenizers": [], @@ -189,9 +219,11 @@ }, { "name": "Chinese, Min Nan", + "depth": 2, "iso_1_code": "zh", "iso_3_code": "nan", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "8934", "native_tokenizers": [], @@ -199,9 +231,11 @@ }, { "name": "Chinese, Wu", + "depth": 2, "iso_1_code": "zh", "iso_3_code": "wuu", "children": [], + "family": "Sino-Tibetan", "tokenizers": { "Hani": { "full_object": "SpaCyTokenizer(\"zh\", {\"nlp\": {\"tokenizer\": {\"segmenter\": \"jieba\"}}})", @@ -221,9 +255,11 @@ }, { "name": "Chinese, Yue", + "depth": 2, "iso_1_code": "zh", "iso_3_code": "yue", "children": [], + "family": "Sino-Tibetan", "tokenizers": { "Hani": { "full_object": "SpaCyTokenizer(\"zh\", {\"nlp\": {\"tokenizer\": {\"segmenter\": \"jieba\"}}})", @@ -242,6 +278,7 @@ ] } ], + "family": "Sino-Tibetan", "tokenizers": { "Hani": { "full_object": "SpaCyTokenizer(\"zh\", {\"nlp\": {\"tokenizer\": {\"segmenter\": \"jieba\"}}})", @@ -257,14 +294,17 @@ }, { "name": "Tibeto-Burman", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Meitei", + "depth": 2, "iso_1_code": null, "iso_3_code": "mni", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "8938", "native_tokenizers": [], @@ -276,14 +316,17 @@ }, { "name": "Angami-Pochuri", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Naga, Mao", + "depth": 3, "iso_1_code": null, "iso_3_code": "nbi", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "8940", "native_tokenizers": [], @@ -291,9 +334,11 @@ }, { "name": "Naga, Angami", + "depth": 3, "iso_1_code": null, "iso_3_code": "njm", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "8941", "native_tokenizers": [], @@ -303,9 +348,11 @@ }, { "name": "Naga, Khezha", + "depth": 3, "iso_1_code": null, "iso_3_code": "nkh", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "8942", "native_tokenizers": [], @@ -313,9 +360,11 @@ }, { "name": "Naga, Northern Rengma", + "depth": 3, "iso_1_code": null, "iso_3_code": "nnl", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "8943", "native_tokenizers": [], @@ -325,9 +374,11 @@ }, { "name": "Naga, Pochuri", + "depth": 3, "iso_1_code": null, "iso_3_code": "npo", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "8944", "native_tokenizers": [], @@ -337,9 +388,11 @@ }, { "name": "Naga, Southern Rengma", + "depth": 3, "iso_1_code": null, "iso_3_code": "nre", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "8945", "native_tokenizers": [], @@ -349,9 +402,11 @@ }, { "name": "Naga, Chokri", + "depth": 3, "iso_1_code": null, "iso_3_code": "nri", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "8946", "native_tokenizers": [], @@ -361,9 +416,11 @@ }, { "name": "Naga, Sumi", + "depth": 3, "iso_1_code": null, "iso_3_code": "nsm", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "8947", "native_tokenizers": [], @@ -373,9 +430,11 @@ }, { "name": "Naga, Poumai", + "depth": 3, "iso_1_code": null, "iso_3_code": "pmx", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "8948", "native_tokenizers": [], @@ -384,6 +443,7 @@ ] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "8939", "native_tokenizers": [], @@ -391,14 +451,17 @@ }, { "name": "Central Naga", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Naga, Lotha", + "depth": 3, "iso_1_code": null, "iso_3_code": "njh", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "8950", "native_tokenizers": [], @@ -406,9 +469,11 @@ }, { "name": "Naga, Ao", + "depth": 3, "iso_1_code": null, "iso_3_code": "njo", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "8951", "native_tokenizers": [], @@ -418,9 +483,11 @@ }, { "name": "Naga, Sangtam", + "depth": 3, "iso_1_code": null, "iso_3_code": "nsa", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "8952", "native_tokenizers": [], @@ -430,9 +497,11 @@ }, { "name": "Naga, Yimchungru", + "depth": 3, "iso_1_code": null, "iso_3_code": "yim", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "8953", "native_tokenizers": [], @@ -441,6 +510,7 @@ ] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "8949", "native_tokenizers": [], @@ -448,19 +518,23 @@ }, { "name": "Central Tibeto-Burman", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Digarish", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Idu-Mishmi", + "depth": 4, "iso_1_code": null, "iso_3_code": "clk", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "8956", "native_tokenizers": [], @@ -468,15 +542,18 @@ }, { "name": "Digaro-Mishmi", + "depth": 4, "iso_1_code": null, "iso_3_code": "mhu", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "8957", "native_tokenizers": [], "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "8955", "native_tokenizers": [], @@ -484,14 +561,17 @@ }, { "name": "Hrusish", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Hruso", + "depth": 4, "iso_1_code": null, "iso_3_code": "hru", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "8959", "native_tokenizers": [], @@ -499,15 +579,18 @@ }, { "name": "Miji", + "depth": 4, "iso_1_code": null, "iso_3_code": "sjl", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "8960", "native_tokenizers": [], "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "8958", "native_tokenizers": [], @@ -515,20 +598,24 @@ }, { "name": "Keman", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Zakhring", + "depth": 4, "iso_1_code": null, "iso_3_code": "zkr", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "8962", "native_tokenizers": [], "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "8961", "native_tokenizers": [], @@ -536,14 +623,17 @@ }, { "name": "Kho-Bwa", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bugun", + "depth": 4, "iso_1_code": null, "iso_3_code": "bgg", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "8964", "native_tokenizers": [], @@ -551,9 +641,11 @@ }, { "name": "Chug", + "depth": 4, "iso_1_code": null, "iso_3_code": "cvg", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "8965", "native_tokenizers": [], @@ -561,9 +653,11 @@ }, { "name": "Lish", + "depth": 4, "iso_1_code": null, "iso_3_code": "lsh", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "8966", "native_tokenizers": [], @@ -571,9 +665,11 @@ }, { "name": "Sartang", + "depth": 4, "iso_1_code": null, "iso_3_code": "onp", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "8967", "native_tokenizers": [], @@ -581,9 +677,11 @@ }, { "name": "Sherdukpen", + "depth": 4, "iso_1_code": null, "iso_3_code": "sdp", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "8968", "native_tokenizers": [], @@ -591,15 +689,18 @@ }, { "name": "Puroik", + "depth": 4, "iso_1_code": null, "iso_3_code": "suv", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "8969", "native_tokenizers": [], "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "8963", "native_tokenizers": [], @@ -607,20 +708,24 @@ }, { "name": "Lepcha", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Lepcha", + "depth": 4, "iso_1_code": null, "iso_3_code": "lep", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "8971", "native_tokenizers": [], "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "8970", "native_tokenizers": [], @@ -628,20 +733,24 @@ }, { "name": "Mijish", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Miju-Mishmi", + "depth": 4, "iso_1_code": null, "iso_3_code": "mxj", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "8973", "native_tokenizers": [], "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "8972", "native_tokenizers": [], @@ -649,14 +758,17 @@ }, { "name": "Nungish", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Drung", + "depth": 4, "iso_1_code": null, "iso_3_code": "duu", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "8975", "native_tokenizers": [], @@ -664,9 +776,11 @@ }, { "name": "Anong", + "depth": 4, "iso_1_code": null, "iso_3_code": "nun", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "8976", "native_tokenizers": [], @@ -674,9 +788,11 @@ }, { "name": "Rawang", + "depth": 4, "iso_1_code": null, "iso_3_code": "raw", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "8977", "native_tokenizers": [], @@ -685,6 +801,7 @@ ] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "8974", "native_tokenizers": [], @@ -692,14 +809,17 @@ }, { "name": "Tani", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Adi", + "depth": 4, "iso_1_code": null, "iso_3_code": "adi", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "8979", "native_tokenizers": [], @@ -709,9 +829,11 @@ }, { "name": "Adi, Galo", + "depth": 4, "iso_1_code": null, "iso_3_code": "adl", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "8980", "native_tokenizers": [], @@ -721,9 +843,11 @@ }, { "name": "Apatani", + "depth": 4, "iso_1_code": null, "iso_3_code": "apt", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "8981", "native_tokenizers": [], @@ -733,9 +857,11 @@ }, { "name": "Mising", + "depth": 4, "iso_1_code": null, "iso_3_code": "mrg", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "8982", "native_tokenizers": [], @@ -745,9 +871,11 @@ }, { "name": "Na", + "depth": 4, "iso_1_code": null, "iso_3_code": "nbt", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "8983", "native_tokenizers": [], @@ -755,9 +883,11 @@ }, { "name": "Nyishi", + "depth": 4, "iso_1_code": null, "iso_3_code": "njz", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "8984", "native_tokenizers": [], @@ -767,21 +897,25 @@ }, { "name": "Tagin", + "depth": 4, "iso_1_code": null, "iso_3_code": "tgj", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "8985", "native_tokenizers": [], "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "8978", "native_tokenizers": [], "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "8954", "native_tokenizers": [], @@ -789,14 +923,17 @@ }, { "name": "Karbi", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Amri Karbi", + "depth": 3, "iso_1_code": null, "iso_3_code": "ajz", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "8987", "native_tokenizers": [], @@ -806,9 +943,11 @@ }, { "name": "Karbi", + "depth": 3, "iso_1_code": null, "iso_3_code": "mjw", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "8988", "native_tokenizers": [], @@ -817,6 +956,7 @@ ] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "8986", "native_tokenizers": [], @@ -824,19 +964,23 @@ }, { "name": "Karenic", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Central", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Karen, Bwe", + "depth": 4, "iso_1_code": null, "iso_3_code": "bwe", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "8991", "native_tokenizers": [], @@ -844,9 +988,11 @@ }, { "name": "Kayah, Eastern", + "depth": 4, "iso_1_code": null, "iso_3_code": "eky", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "8992", "native_tokenizers": [], @@ -854,9 +1000,11 @@ }, { "name": "Karen, Geko", + "depth": 4, "iso_1_code": null, "iso_3_code": "ghk", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "8993", "native_tokenizers": [], @@ -864,9 +1012,11 @@ }, { "name": "Kayaw", + "depth": 4, "iso_1_code": null, "iso_3_code": "kvl", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "8994", "native_tokenizers": [], @@ -874,9 +1024,11 @@ }, { "name": "Karen, Geba", + "depth": 4, "iso_1_code": null, "iso_3_code": "kvq", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "8995", "native_tokenizers": [], @@ -884,9 +1036,11 @@ }, { "name": "Kawyaw", + "depth": 4, "iso_1_code": null, "iso_3_code": "kxf", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "8996", "native_tokenizers": [], @@ -894,9 +1048,11 @@ }, { "name": "Kayah, Western", + "depth": 4, "iso_1_code": null, "iso_3_code": "kyu", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "8997", "native_tokenizers": [], @@ -907,6 +1063,7 @@ ] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "8990", "native_tokenizers": [], @@ -914,14 +1071,17 @@ }, { "name": "Northern", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Lahta", + "depth": 4, "iso_1_code": null, "iso_3_code": "kvt", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "8999", "native_tokenizers": [], @@ -929,9 +1089,11 @@ }, { "name": "Yinbaw", + "depth": 4, "iso_1_code": null, "iso_3_code": "kvu", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9000", "native_tokenizers": [], @@ -939,9 +1101,11 @@ }, { "name": "Yintale", + "depth": 4, "iso_1_code": null, "iso_3_code": "kvy", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9001", "native_tokenizers": [], @@ -949,9 +1113,11 @@ }, { "name": "Zayein", + "depth": 4, "iso_1_code": null, "iso_3_code": "kxk", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9002", "native_tokenizers": [], @@ -959,15 +1125,18 @@ }, { "name": "Kayan", + "depth": 4, "iso_1_code": null, "iso_3_code": "pdu", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9003", "native_tokenizers": [], "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "8998", "native_tokenizers": [], @@ -975,14 +1144,17 @@ }, { "name": "Peripheral", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Pa\u2019o", + "depth": 4, "iso_1_code": null, "iso_3_code": "blk", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9005", "native_tokenizers": [], @@ -992,9 +1164,11 @@ }, { "name": "Karen, Pwo Eastern", + "depth": 4, "iso_1_code": null, "iso_3_code": "kjp", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9006", "native_tokenizers": [], @@ -1002,9 +1176,11 @@ }, { "name": "Karen, Phrae Pwo", + "depth": 4, "iso_1_code": null, "iso_3_code": "kjt", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9007", "native_tokenizers": [], @@ -1012,9 +1188,11 @@ }, { "name": "Karen, Pwo Western", + "depth": 4, "iso_1_code": null, "iso_3_code": "pwo", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9008", "native_tokenizers": [], @@ -1022,9 +1200,11 @@ }, { "name": "Karen, Pwo Northern", + "depth": 4, "iso_1_code": null, "iso_3_code": "pww", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9009", "native_tokenizers": [], @@ -1033,6 +1213,7 @@ ] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9004", "native_tokenizers": [], @@ -1040,14 +1221,17 @@ }, { "name": "Southern", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Karen, Mobwa", + "depth": 4, "iso_1_code": null, "iso_3_code": "jkm", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9011", "native_tokenizers": [], @@ -1055,9 +1239,11 @@ }, { "name": "Karen, Paku", + "depth": 4, "iso_1_code": null, "iso_3_code": "jkp", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9012", "native_tokenizers": [], @@ -1065,9 +1251,11 @@ }, { "name": "Karen, S\u2019gaw", + "depth": 4, "iso_1_code": null, "iso_3_code": "ksw", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9013", "native_tokenizers": [], @@ -1077,21 +1265,25 @@ }, { "name": "Wewaw", + "depth": 4, "iso_1_code": null, "iso_3_code": "wea", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9014", "native_tokenizers": [], "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9010", "native_tokenizers": [], "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "8989", "native_tokenizers": [], @@ -1099,14 +1291,17 @@ }, { "name": "Kuki-Chin", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chin, Thaiphum", + "depth": 3, "iso_1_code": null, "iso_3_code": "cth", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9016", "native_tokenizers": [], @@ -1114,14 +1309,17 @@ }, { "name": "Central", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chin, Ngawn", + "depth": 4, "iso_1_code": null, "iso_3_code": "cnw", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9018", "native_tokenizers": [], @@ -1131,9 +1329,11 @@ }, { "name": "Pangkhua", + "depth": 4, "iso_1_code": null, "iso_3_code": "pkh", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9019", "native_tokenizers": [], @@ -1141,9 +1341,11 @@ }, { "name": "Chin, Tawr", + "depth": 4, "iso_1_code": null, "iso_3_code": "tcp", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9020", "native_tokenizers": [], @@ -1151,14 +1353,17 @@ }, { "name": "Lai", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chin, Bawm", + "depth": 5, "iso_1_code": null, "iso_3_code": "bgr", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9022", "native_tokenizers": [], @@ -1168,9 +1373,11 @@ }, { "name": "Chin, Bualkhaw", + "depth": 5, "iso_1_code": null, "iso_3_code": "cbl", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9023", "native_tokenizers": [], @@ -1178,9 +1385,11 @@ }, { "name": "Chin, Falam", + "depth": 5, "iso_1_code": null, "iso_3_code": "cfm", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9024", "native_tokenizers": [], @@ -1190,9 +1399,11 @@ }, { "name": "Chin, Hakha", + "depth": 5, "iso_1_code": null, "iso_3_code": "cnh", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9025", "native_tokenizers": [], @@ -1201,6 +1412,7 @@ ] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9021", "native_tokenizers": [], @@ -1208,14 +1420,17 @@ }, { "name": "Mizo", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Biate", + "depth": 5, "iso_1_code": null, "iso_3_code": "biu", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9027", "native_tokenizers": [], @@ -1225,9 +1440,11 @@ }, { "name": "Hmar", + "depth": 5, "iso_1_code": null, "iso_3_code": "hmr", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9028", "native_tokenizers": [], @@ -1237,9 +1454,11 @@ }, { "name": "Hrangkhol", + "depth": 5, "iso_1_code": null, "iso_3_code": "hra", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9029", "native_tokenizers": [], @@ -1249,9 +1468,11 @@ }, { "name": "Mizo", + "depth": 5, "iso_1_code": null, "iso_3_code": "lus", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9030", "native_tokenizers": [], @@ -1261,21 +1482,25 @@ }, { "name": "Sakachep", + "depth": 5, "iso_1_code": null, "iso_3_code": "sch", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9031", "native_tokenizers": [], "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9026", "native_tokenizers": [], "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9017", "native_tokenizers": [], @@ -1283,14 +1508,17 @@ }, { "name": "Maraic", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chin, Zotung", + "depth": 4, "iso_1_code": null, "iso_3_code": "czt", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9033", "native_tokenizers": [], @@ -1300,9 +1528,11 @@ }, { "name": "Chin, Senthang", + "depth": 4, "iso_1_code": null, "iso_3_code": "sez", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9034", "native_tokenizers": [], @@ -1310,9 +1540,11 @@ }, { "name": "Chin, Zyphe", + "depth": 4, "iso_1_code": null, "iso_3_code": "zyp", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9035", "native_tokenizers": [], @@ -1322,14 +1554,17 @@ }, { "name": "Mara", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chin, Lautu", + "depth": 5, "iso_1_code": null, "iso_3_code": "clt", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9037", "native_tokenizers": [], @@ -1337,21 +1572,25 @@ }, { "name": "Mara", + "depth": 5, "iso_1_code": null, "iso_3_code": "mrh", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9038", "native_tokenizers": [], "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9036", "native_tokenizers": [], "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9032", "native_tokenizers": [], @@ -1359,14 +1598,17 @@ }, { "name": "Northwestern", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Aimol", + "depth": 4, "iso_1_code": null, "iso_3_code": "aim", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9040", "native_tokenizers": [], @@ -1376,9 +1618,11 @@ }, { "name": "Anal", + "depth": 4, "iso_1_code": null, "iso_3_code": "anm", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9041", "native_tokenizers": [], @@ -1388,9 +1632,11 @@ }, { "name": "Chiru", + "depth": 4, "iso_1_code": null, "iso_3_code": "cdf", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9042", "native_tokenizers": [], @@ -1400,9 +1646,11 @@ }, { "name": "Naga, Kharam", + "depth": 4, "iso_1_code": null, "iso_3_code": "kfw", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9043", "native_tokenizers": [], @@ -1410,9 +1658,11 @@ }, { "name": "Kom", + "depth": 4, "iso_1_code": null, "iso_3_code": "kmm", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9044", "native_tokenizers": [], @@ -1422,9 +1672,11 @@ }, { "name": "Lamkang", + "depth": 4, "iso_1_code": null, "iso_3_code": "lmk", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9045", "native_tokenizers": [], @@ -1434,9 +1686,11 @@ }, { "name": "Naga, Chothe", + "depth": 4, "iso_1_code": null, "iso_3_code": "nct", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9046", "native_tokenizers": [], @@ -1446,9 +1700,11 @@ }, { "name": "Naga, Monsang", + "depth": 4, "iso_1_code": null, "iso_3_code": "nmh", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9047", "native_tokenizers": [], @@ -1458,9 +1714,11 @@ }, { "name": "Naga, Tarao", + "depth": 4, "iso_1_code": null, "iso_3_code": "tro", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9048", "native_tokenizers": [], @@ -1469,6 +1727,7 @@ ] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9039", "native_tokenizers": [], @@ -1476,19 +1735,23 @@ }, { "name": "Peripheral", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Northern", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Naga, Moyon", + "depth": 5, "iso_1_code": null, "iso_3_code": "nmo", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9051", "native_tokenizers": [], @@ -1498,9 +1761,11 @@ }, { "name": "Purum", + "depth": 5, "iso_1_code": null, "iso_3_code": "pub", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9052", "native_tokenizers": [], @@ -1508,9 +1773,11 @@ }, { "name": "Ralte", + "depth": 5, "iso_1_code": null, "iso_3_code": "ral", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9053", "native_tokenizers": [], @@ -1518,9 +1785,11 @@ }, { "name": "Simte", + "depth": 5, "iso_1_code": null, "iso_3_code": "smt", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9054", "native_tokenizers": [], @@ -1530,14 +1799,17 @@ }, { "name": "Sizang", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chin, Siyin", + "depth": 6, "iso_1_code": null, "iso_3_code": "csy", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9056", "native_tokenizers": [], @@ -1547,9 +1819,11 @@ }, { "name": "Gangte", + "depth": 6, "iso_1_code": null, "iso_3_code": "gnb", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9057", "native_tokenizers": [], @@ -1559,9 +1833,11 @@ }, { "name": "Vaiphei", + "depth": 6, "iso_1_code": null, "iso_3_code": "vap", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9058", "native_tokenizers": [], @@ -1571,9 +1847,11 @@ }, { "name": "Zo", + "depth": 6, "iso_1_code": null, "iso_3_code": "zom", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9059", "native_tokenizers": [], @@ -1582,6 +1860,7 @@ ] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9055", "native_tokenizers": [], @@ -1589,14 +1868,17 @@ }, { "name": "Thado", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chin, Tedim", + "depth": 6, "iso_1_code": null, "iso_3_code": "ctd", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9061", "native_tokenizers": [], @@ -1606,9 +1888,11 @@ }, { "name": "Chin, Paite", + "depth": 6, "iso_1_code": null, "iso_3_code": "pck", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9062", "native_tokenizers": [], @@ -1618,9 +1902,11 @@ }, { "name": "Chin, Thado", + "depth": 6, "iso_1_code": null, "iso_3_code": "tcz", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9063", "native_tokenizers": [], @@ -1629,12 +1915,14 @@ ] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9060", "native_tokenizers": [], "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9050", "native_tokenizers": [], @@ -1642,14 +1930,17 @@ }, { "name": "Southern", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chin, Eastern Khumi", + "depth": 5, "iso_1_code": null, "iso_3_code": "cek", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9065", "native_tokenizers": [], @@ -1659,9 +1950,11 @@ }, { "name": "Mro-Khimi", + "depth": 5, "iso_1_code": null, "iso_3_code": "cmr", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9066", "native_tokenizers": [], @@ -1671,9 +1964,11 @@ }, { "name": "Chin, Khumi", + "depth": 5, "iso_1_code": null, "iso_3_code": "cnk", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9067", "native_tokenizers": [], @@ -1683,9 +1978,11 @@ }, { "name": "Chin, Songlai", + "depth": 5, "iso_1_code": null, "iso_3_code": "csj", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9068", "native_tokenizers": [], @@ -1693,9 +1990,11 @@ }, { "name": "Chin, Sumtu", + "depth": 5, "iso_1_code": null, "iso_3_code": "csv", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9069", "native_tokenizers": [], @@ -1703,9 +2002,11 @@ }, { "name": "Chin, Rungtu", + "depth": 5, "iso_1_code": null, "iso_3_code": "rtc", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9070", "native_tokenizers": [], @@ -1713,9 +2014,11 @@ }, { "name": "Shendu", + "depth": 5, "iso_1_code": null, "iso_3_code": "shl", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9071", "native_tokenizers": [], @@ -1723,9 +2026,11 @@ }, { "name": "Chin, Rawngtu", + "depth": 5, "iso_1_code": null, "iso_3_code": "weu", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9072", "native_tokenizers": [], @@ -1733,19 +2038,23 @@ }, { "name": "Cho-Asho", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Asho", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chin, L\u00e4okt\u00fc", + "depth": 7, "iso_1_code": null, "iso_3_code": "cey", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9075", "native_tokenizers": [], @@ -1753,9 +2062,11 @@ }, { "name": "Chin, Laitu", + "depth": 7, "iso_1_code": null, "iso_3_code": "clj", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9076", "native_tokenizers": [], @@ -1763,15 +2074,18 @@ }, { "name": "Chin, Asho", + "depth": 7, "iso_1_code": null, "iso_3_code": "csh", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9077", "native_tokenizers": [], "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9074", "native_tokenizers": [], @@ -1779,14 +2093,17 @@ }, { "name": "Cho", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chin, Kaang", + "depth": 7, "iso_1_code": null, "iso_3_code": "ckn", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9079", "native_tokenizers": [], @@ -1794,9 +2111,11 @@ }, { "name": "Chin, Uppu", + "depth": 7, "iso_1_code": null, "iso_3_code": "cnb", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9080", "native_tokenizers": [], @@ -1804,9 +2123,11 @@ }, { "name": "Chin, Daai", + "depth": 7, "iso_1_code": null, "iso_3_code": "dao", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9081", "native_tokenizers": [], @@ -1814,9 +2135,11 @@ }, { "name": "Chin, Matu", + "depth": 7, "iso_1_code": null, "iso_3_code": "hlt", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9082", "native_tokenizers": [], @@ -1826,9 +2149,11 @@ }, { "name": "Chin, M\u00fc\u00fcn", + "depth": 7, "iso_1_code": null, "iso_3_code": "mwq", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9083", "native_tokenizers": [], @@ -1837,30 +2162,35 @@ ] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9078", "native_tokenizers": [], "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9073", "native_tokenizers": [], "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9064", "native_tokenizers": [], "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9049", "native_tokenizers": [], "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9015", "native_tokenizers": [], @@ -1868,24 +2198,29 @@ }, { "name": "Ngwi-Burmese", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Burmish", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Northern", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Achang", + "depth": 5, "iso_1_code": null, "iso_3_code": "acn", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9087", "native_tokenizers": [], @@ -1895,9 +2230,11 @@ }, { "name": "Zaiwa", + "depth": 5, "iso_1_code": null, "iso_3_code": "atb", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9088", "native_tokenizers": [], @@ -1907,9 +2244,11 @@ }, { "name": "Pela", + "depth": 5, "iso_1_code": null, "iso_3_code": "bxd", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9089", "native_tokenizers": [], @@ -1917,9 +2256,11 @@ }, { "name": "Hpon", + "depth": 5, "iso_1_code": null, "iso_3_code": "hpo", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9090", "native_tokenizers": [], @@ -1927,9 +2268,11 @@ }, { "name": "Lacid", + "depth": 5, "iso_1_code": null, "iso_3_code": "lsi", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9091", "native_tokenizers": [], @@ -1939,9 +2282,11 @@ }, { "name": "Lhao Vo", + "depth": 5, "iso_1_code": null, "iso_3_code": "mhx", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9092", "native_tokenizers": [], @@ -1950,6 +2295,7 @@ ] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9086", "native_tokenizers": [], @@ -1957,14 +2303,17 @@ }, { "name": "Southern", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Danu", + "depth": 5, "iso_1_code": null, "iso_3_code": "dnv", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9094", "native_tokenizers": [], @@ -1972,9 +2321,11 @@ }, { "name": "Intha", + "depth": 5, "iso_1_code": null, "iso_3_code": "int", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9095", "native_tokenizers": [], @@ -1982,9 +2333,11 @@ }, { "name": "Burmese", + "depth": 5, "iso_1_code": "my", "iso_3_code": "mya", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9096", "native_tokenizers": [], @@ -1994,9 +2347,11 @@ }, { "name": "Rakhine", + "depth": 5, "iso_1_code": null, "iso_3_code": "rki", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9097", "native_tokenizers": [], @@ -2004,9 +2359,11 @@ }, { "name": "Marma", + "depth": 5, "iso_1_code": null, "iso_3_code": "rmz", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9098", "native_tokenizers": [], @@ -2014,9 +2371,11 @@ }, { "name": "Taungyo", + "depth": 5, "iso_1_code": null, "iso_3_code": "tco", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9099", "native_tokenizers": [], @@ -2024,21 +2383,25 @@ }, { "name": "Tavoyan", + "depth": 5, "iso_1_code": null, "iso_3_code": "tvn", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9100", "native_tokenizers": [], "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9093", "native_tokenizers": [], "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9085", "native_tokenizers": [], @@ -2046,14 +2409,17 @@ }, { "name": "Mru", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chin, Anu-Khongso", + "depth": 4, "iso_1_code": null, "iso_3_code": "anl", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9102", "native_tokenizers": [], @@ -2061,15 +2427,18 @@ }, { "name": "Mru", + "depth": 4, "iso_1_code": null, "iso_3_code": "mro", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9103", "native_tokenizers": [], "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9101", "native_tokenizers": [], @@ -2077,19 +2446,23 @@ }, { "name": "Ngwi", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Central", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Hlersu", + "depth": 5, "iso_1_code": null, "iso_3_code": "hle", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9106", "native_tokenizers": [], @@ -2097,9 +2470,11 @@ }, { "name": "Jinuo, Youle", + "depth": 5, "iso_1_code": null, "iso_3_code": "jiu", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9107", "native_tokenizers": [], @@ -2107,9 +2482,11 @@ }, { "name": "Jinuo, Buyuan", + "depth": 5, "iso_1_code": null, "iso_3_code": "jiy", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9108", "native_tokenizers": [], @@ -2117,9 +2494,11 @@ }, { "name": "Lahu Shi", + "depth": 5, "iso_1_code": null, "iso_3_code": "lhi", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9109", "native_tokenizers": [], @@ -2129,9 +2508,11 @@ }, { "name": "Lahu", + "depth": 5, "iso_1_code": null, "iso_3_code": "lhu", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9110", "native_tokenizers": [], @@ -2141,9 +2522,11 @@ }, { "name": "Lisu", + "depth": 5, "iso_1_code": null, "iso_3_code": "lis", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9111", "native_tokenizers": [], @@ -2153,9 +2536,11 @@ }, { "name": "Kucong", + "depth": 5, "iso_1_code": null, "iso_3_code": "lkc", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9112", "native_tokenizers": [], @@ -2163,9 +2548,11 @@ }, { "name": "Lamu", + "depth": 5, "iso_1_code": null, "iso_3_code": "llh", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9113", "native_tokenizers": [], @@ -2173,9 +2560,11 @@ }, { "name": "Lipo", + "depth": 5, "iso_1_code": null, "iso_3_code": "lpo", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9114", "native_tokenizers": [], @@ -2183,9 +2572,11 @@ }, { "name": "Lawu", + "depth": 5, "iso_1_code": null, "iso_3_code": "lwu", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9115", "native_tokenizers": [], @@ -2193,9 +2584,11 @@ }, { "name": "Nusu", + "depth": 5, "iso_1_code": null, "iso_3_code": "nuf", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9116", "native_tokenizers": [], @@ -2203,9 +2596,11 @@ }, { "name": "Lolopo", + "depth": 5, "iso_1_code": null, "iso_3_code": "ycl", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9117", "native_tokenizers": [], @@ -2213,9 +2608,11 @@ }, { "name": "Lalo, Dongshanba", + "depth": 5, "iso_1_code": null, "iso_3_code": "yik", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9118", "native_tokenizers": [], @@ -2223,9 +2620,11 @@ }, { "name": "Miqie", + "depth": 5, "iso_1_code": null, "iso_3_code": "yiq", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9119", "native_tokenizers": [], @@ -2233,9 +2632,11 @@ }, { "name": "Lalu, Eastern", + "depth": 5, "iso_1_code": null, "iso_3_code": "yit", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9120", "native_tokenizers": [], @@ -2243,9 +2644,11 @@ }, { "name": "Limi", + "depth": 5, "iso_1_code": null, "iso_3_code": "ylm", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9121", "native_tokenizers": [], @@ -2253,9 +2656,11 @@ }, { "name": "Mili", + "depth": 5, "iso_1_code": null, "iso_3_code": "ymh", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9122", "native_tokenizers": [], @@ -2263,9 +2668,11 @@ }, { "name": "Lang\u2019e", + "depth": 5, "iso_1_code": null, "iso_3_code": "yne", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9123", "native_tokenizers": [], @@ -2273,9 +2680,11 @@ }, { "name": "Sani", + "depth": 5, "iso_1_code": null, "iso_3_code": "ysn", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9124", "native_tokenizers": [], @@ -2283,9 +2692,11 @@ }, { "name": "Lolopo, Southern", + "depth": 5, "iso_1_code": null, "iso_3_code": "ysp", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9125", "native_tokenizers": [], @@ -2293,9 +2704,11 @@ }, { "name": "Talu", + "depth": 5, "iso_1_code": null, "iso_3_code": "yta", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9126", "native_tokenizers": [], @@ -2303,9 +2716,11 @@ }, { "name": "Tanglang", + "depth": 5, "iso_1_code": null, "iso_3_code": "ytl", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9127", "native_tokenizers": [], @@ -2313,9 +2728,11 @@ }, { "name": "Lalu, Western", + "depth": 5, "iso_1_code": null, "iso_3_code": "ywl", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9128", "native_tokenizers": [], @@ -2323,9 +2740,11 @@ }, { "name": "Lalo, Central", + "depth": 5, "iso_1_code": null, "iso_3_code": "ywt", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9129", "native_tokenizers": [], @@ -2333,15 +2752,18 @@ }, { "name": "Zauzou", + "depth": 5, "iso_1_code": null, "iso_3_code": "zal", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9130", "native_tokenizers": [], "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9105", "native_tokenizers": [], @@ -2349,14 +2771,17 @@ }, { "name": "Northern", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nuosu", + "depth": 5, "iso_1_code": "ii", "iso_3_code": "iii", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9132", "native_tokenizers": [], @@ -2364,9 +2789,11 @@ }, { "name": "Katso", + "depth": 5, "iso_1_code": null, "iso_3_code": "kaf", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9133", "native_tokenizers": [], @@ -2374,9 +2801,11 @@ }, { "name": "Samei", + "depth": 5, "iso_1_code": null, "iso_3_code": "smh", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9134", "native_tokenizers": [], @@ -2384,9 +2813,11 @@ }, { "name": "Chesu", + "depth": 5, "iso_1_code": null, "iso_3_code": "ych", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9135", "native_tokenizers": [], @@ -2394,9 +2825,11 @@ }, { "name": "Gepo", + "depth": 5, "iso_1_code": null, "iso_3_code": "ygp", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9136", "native_tokenizers": [], @@ -2404,9 +2837,11 @@ }, { "name": "Nasu, Wusa", + "depth": 5, "iso_1_code": null, "iso_3_code": "yig", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9137", "native_tokenizers": [], @@ -2414,9 +2849,11 @@ }, { "name": "Awu", + "depth": 5, "iso_1_code": null, "iso_3_code": "yiu", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9138", "native_tokenizers": [], @@ -2424,9 +2861,11 @@ }, { "name": "Naluo", + "depth": 5, "iso_1_code": null, "iso_3_code": "ylo", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9139", "native_tokenizers": [], @@ -2434,9 +2873,11 @@ }, { "name": "Aluo", + "depth": 5, "iso_1_code": null, "iso_3_code": "yna", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9140", "native_tokenizers": [], @@ -2444,9 +2885,11 @@ }, { "name": "Samatao", + "depth": 5, "iso_1_code": null, "iso_3_code": "ysd", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9141", "native_tokenizers": [], @@ -2454,9 +2897,11 @@ }, { "name": "Sanie", + "depth": 5, "iso_1_code": null, "iso_3_code": "ysy", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9142", "native_tokenizers": [], @@ -2464,9 +2909,11 @@ }, { "name": "Yi, Wuding-Luquan", + "depth": 5, "iso_1_code": null, "iso_3_code": "ywq", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9143", "native_tokenizers": [], @@ -2474,9 +2921,11 @@ }, { "name": "Nasu, Wumeng", + "depth": 5, "iso_1_code": null, "iso_3_code": "ywu", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9144", "native_tokenizers": [], @@ -2484,15 +2933,18 @@ }, { "name": "Ayizi", + "depth": 5, "iso_1_code": null, "iso_3_code": "yyz", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9145", "native_tokenizers": [], "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9131", "native_tokenizers": [], @@ -2500,14 +2952,17 @@ }, { "name": "Southeastern", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Alugu", + "depth": 5, "iso_1_code": null, "iso_3_code": "aub", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9147", "native_tokenizers": [], @@ -2515,9 +2970,11 @@ }, { "name": "Azha", + "depth": 5, "iso_1_code": null, "iso_3_code": "aza", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9148", "native_tokenizers": [], @@ -2525,9 +2982,11 @@ }, { "name": "Laghuu", + "depth": 5, "iso_1_code": null, "iso_3_code": "lgh", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9149", "native_tokenizers": [], @@ -2535,9 +2994,11 @@ }, { "name": "Nisu, Eastern", + "depth": 5, "iso_1_code": null, "iso_3_code": "nos", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9150", "native_tokenizers": [], @@ -2545,9 +3006,11 @@ }, { "name": "Nisu, Southern", + "depth": 5, "iso_1_code": null, "iso_3_code": "nsd", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9151", "native_tokenizers": [], @@ -2555,9 +3018,11 @@ }, { "name": "Nisu, Northwestern", + "depth": 5, "iso_1_code": null, "iso_3_code": "nsf", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9152", "native_tokenizers": [], @@ -2565,9 +3030,11 @@ }, { "name": "Nisu, Southwestern", + "depth": 5, "iso_1_code": null, "iso_3_code": "nsv", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9153", "native_tokenizers": [], @@ -2575,9 +3042,11 @@ }, { "name": "Mantsi", + "depth": 5, "iso_1_code": null, "iso_3_code": "nty", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9154", "native_tokenizers": [], @@ -2585,9 +3054,11 @@ }, { "name": "Phula", + "depth": 5, "iso_1_code": null, "iso_3_code": "phh", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9155", "native_tokenizers": [], @@ -2595,9 +3066,11 @@ }, { "name": "Bokha", + "depth": 5, "iso_1_code": null, "iso_3_code": "ybk", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9156", "native_tokenizers": [], @@ -2605,9 +3078,11 @@ }, { "name": "Phowa, Hlepho", + "depth": 5, "iso_1_code": null, "iso_3_code": "yhl", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9157", "native_tokenizers": [], @@ -2615,9 +3090,11 @@ }, { "name": "Ache", + "depth": 5, "iso_1_code": null, "iso_3_code": "yif", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9158", "native_tokenizers": [], @@ -2625,9 +3102,11 @@ }, { "name": "Pholo", + "depth": 5, "iso_1_code": null, "iso_3_code": "yip", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9159", "native_tokenizers": [], @@ -2635,9 +3114,11 @@ }, { "name": "Nisu, Northern", + "depth": 5, "iso_1_code": null, "iso_3_code": "yiv", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9160", "native_tokenizers": [], @@ -2645,9 +3126,11 @@ }, { "name": "Axi", + "depth": 5, "iso_1_code": null, "iso_3_code": "yix", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9161", "native_tokenizers": [], @@ -2655,9 +3138,11 @@ }, { "name": "Azhe", + "depth": 5, "iso_1_code": null, "iso_3_code": "yiz", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9162", "native_tokenizers": [], @@ -2665,9 +3150,11 @@ }, { "name": "Khlula", + "depth": 5, "iso_1_code": null, "iso_3_code": "ykl", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9163", "native_tokenizers": [], @@ -2675,9 +3162,11 @@ }, { "name": "Kua-nsi", + "depth": 5, "iso_1_code": null, "iso_3_code": "ykn", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9164", "native_tokenizers": [], @@ -2685,9 +3174,11 @@ }, { "name": "Kathu", + "depth": 5, "iso_1_code": null, "iso_3_code": "ykt", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9165", "native_tokenizers": [], @@ -2695,9 +3186,11 @@ }, { "name": "Kuamasi", + "depth": 5, "iso_1_code": null, "iso_3_code": "yku", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9166", "native_tokenizers": [], @@ -2705,9 +3198,11 @@ }, { "name": "Muji, Southern", + "depth": 5, "iso_1_code": null, "iso_3_code": "ymc", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9167", "native_tokenizers": [], @@ -2715,9 +3210,11 @@ }, { "name": "Moji", + "depth": 5, "iso_1_code": null, "iso_3_code": "ymi", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9168", "native_tokenizers": [], @@ -2725,9 +3222,11 @@ }, { "name": "Muji, Qila", + "depth": 5, "iso_1_code": null, "iso_3_code": "ymq", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9169", "native_tokenizers": [], @@ -2735,9 +3234,11 @@ }, { "name": "Muji, Northern", + "depth": 5, "iso_1_code": null, "iso_3_code": "ymx", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9170", "native_tokenizers": [], @@ -2745,9 +3246,11 @@ }, { "name": "Muzi", + "depth": 5, "iso_1_code": null, "iso_3_code": "ymz", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9171", "native_tokenizers": [], @@ -2755,9 +3258,11 @@ }, { "name": "Phala", + "depth": 5, "iso_1_code": null, "iso_3_code": "ypa", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9172", "native_tokenizers": [], @@ -2765,9 +3270,11 @@ }, { "name": "Phowa, Labo", + "depth": 5, "iso_1_code": null, "iso_3_code": "ypb", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9173", "native_tokenizers": [], @@ -2775,9 +3282,11 @@ }, { "name": "Phola", + "depth": 5, "iso_1_code": null, "iso_3_code": "ypg", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9174", "native_tokenizers": [], @@ -2785,9 +3294,11 @@ }, { "name": "Phupha", + "depth": 5, "iso_1_code": null, "iso_3_code": "yph", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9175", "native_tokenizers": [], @@ -2795,9 +3306,11 @@ }, { "name": "Phuma", + "depth": 5, "iso_1_code": null, "iso_3_code": "ypm", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9176", "native_tokenizers": [], @@ -2805,9 +3318,11 @@ }, { "name": "Phowa, Ani", + "depth": 5, "iso_1_code": null, "iso_3_code": "ypn", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9177", "native_tokenizers": [], @@ -2815,9 +3330,11 @@ }, { "name": "Phola, Alo", + "depth": 5, "iso_1_code": null, "iso_3_code": "ypo", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9178", "native_tokenizers": [], @@ -2825,9 +3342,11 @@ }, { "name": "Phupa", + "depth": 5, "iso_1_code": null, "iso_3_code": "ypp", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9179", "native_tokenizers": [], @@ -2835,9 +3354,11 @@ }, { "name": "Phuza", + "depth": 5, "iso_1_code": null, "iso_3_code": "ypz", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9180", "native_tokenizers": [], @@ -2845,9 +3366,11 @@ }, { "name": "Sonaga", + "depth": 5, "iso_1_code": null, "iso_3_code": "ysg", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9181", "native_tokenizers": [], @@ -2855,9 +3378,11 @@ }, { "name": "Nisi", + "depth": 5, "iso_1_code": null, "iso_3_code": "yso", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9182", "native_tokenizers": [], @@ -2865,9 +3390,11 @@ }, { "name": "Thopho", + "depth": 5, "iso_1_code": null, "iso_3_code": "ytp", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9183", "native_tokenizers": [], @@ -2875,15 +3402,18 @@ }, { "name": "Zokhuo", + "depth": 5, "iso_1_code": null, "iso_3_code": "yzk", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9184", "native_tokenizers": [], "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9146", "native_tokenizers": [], @@ -2891,14 +3421,17 @@ }, { "name": "Southern", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Akeu", + "depth": 5, "iso_1_code": null, "iso_3_code": "aeu", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9186", "native_tokenizers": [], @@ -2908,9 +3441,11 @@ }, { "name": "Akha", + "depth": 5, "iso_1_code": null, "iso_3_code": "ahk", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9187", "native_tokenizers": [], @@ -2920,9 +3455,11 @@ }, { "name": "Biyo", + "depth": 5, "iso_1_code": null, "iso_3_code": "byo", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9188", "native_tokenizers": [], @@ -2930,9 +3467,11 @@ }, { "name": "C\u00f4\u00f4ng", + "depth": 5, "iso_1_code": null, "iso_3_code": "cnc", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9189", "native_tokenizers": [], @@ -2940,9 +3479,11 @@ }, { "name": "Enu", + "depth": 5, "iso_1_code": null, "iso_3_code": "enu", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9190", "native_tokenizers": [], @@ -2950,9 +3491,11 @@ }, { "name": "Hani", + "depth": 5, "iso_1_code": null, "iso_3_code": "hni", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9191", "native_tokenizers": [], @@ -2960,9 +3503,11 @@ }, { "name": "Honi", + "depth": 5, "iso_1_code": null, "iso_3_code": "how", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9192", "native_tokenizers": [], @@ -2970,9 +3515,11 @@ }, { "name": "Kaduo", + "depth": 5, "iso_1_code": null, "iso_3_code": "ktp", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9193", "native_tokenizers": [], @@ -2980,9 +3527,11 @@ }, { "name": "Lopi", + "depth": 5, "iso_1_code": null, "iso_3_code": "lov", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9194", "native_tokenizers": [], @@ -2990,9 +3539,11 @@ }, { "name": "Mpi", + "depth": 5, "iso_1_code": null, "iso_3_code": "mpz", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9195", "native_tokenizers": [], @@ -3000,9 +3551,11 @@ }, { "name": "Phana\u2019", + "depth": 5, "iso_1_code": null, "iso_3_code": "phq", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9196", "native_tokenizers": [], @@ -3010,9 +3563,11 @@ }, { "name": "Sangkong", + "depth": 5, "iso_1_code": null, "iso_3_code": "sgk", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9197", "native_tokenizers": [], @@ -3020,9 +3575,11 @@ }, { "name": "Sila", + "depth": 5, "iso_1_code": null, "iso_3_code": "slt", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9198", "native_tokenizers": [], @@ -3030,9 +3587,11 @@ }, { "name": "Chepya", + "depth": 5, "iso_1_code": null, "iso_3_code": "ycp", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9199", "native_tokenizers": [], @@ -3040,9 +3599,11 @@ }, { "name": "Muda", + "depth": 5, "iso_1_code": null, "iso_3_code": "ymd", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9200", "native_tokenizers": [], @@ -3050,14 +3611,17 @@ }, { "name": "Bisoid", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bisu", + "depth": 6, "iso_1_code": null, "iso_3_code": "bzi", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9202", "native_tokenizers": [], @@ -3067,9 +3631,11 @@ }, { "name": "Laomian", + "depth": 6, "iso_1_code": null, "iso_3_code": "lwm", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9203", "native_tokenizers": [], @@ -3077,9 +3643,11 @@ }, { "name": "Phunoi", + "depth": 6, "iso_1_code": null, "iso_3_code": "pho", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9204", "native_tokenizers": [], @@ -3087,21 +3655,25 @@ }, { "name": "Pyen", + "depth": 6, "iso_1_code": null, "iso_3_code": "pyy", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9205", "native_tokenizers": [], "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9201", "native_tokenizers": [], "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9185", "native_tokenizers": [], @@ -3109,14 +3681,17 @@ }, { "name": "Unclassified", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Laopang", + "depth": 5, "iso_1_code": null, "iso_3_code": "lbg", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9207", "native_tokenizers": [], @@ -3124,27 +3699,32 @@ }, { "name": "Ugong", + "depth": 5, "iso_1_code": null, "iso_3_code": "ugo", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9208", "native_tokenizers": [], "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9206", "native_tokenizers": [], "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9104", "native_tokenizers": [], "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9084", "native_tokenizers": [], @@ -3152,19 +3732,23 @@ }, { "name": "Northeastern Tibeto-Burman", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bai", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bai, Central", + "depth": 4, "iso_1_code": null, "iso_3_code": "bca", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9211", "native_tokenizers": [], @@ -3172,9 +3756,11 @@ }, { "name": "Bai, Panyi", + "depth": 4, "iso_1_code": null, "iso_3_code": "bfc", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9212", "native_tokenizers": [], @@ -3182,9 +3768,11 @@ }, { "name": "Bai, Southern", + "depth": 4, "iso_1_code": null, "iso_3_code": "bfs", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9213", "native_tokenizers": [], @@ -3192,15 +3780,18 @@ }, { "name": "Bai, Lama", + "depth": 4, "iso_1_code": null, "iso_3_code": "lay", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9214", "native_tokenizers": [], "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9210", "native_tokenizers": [], @@ -3208,20 +3799,24 @@ }, { "name": "Baima", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Baima", + "depth": 4, "iso_1_code": null, "iso_3_code": "bqh", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9216", "native_tokenizers": [], "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9215", "native_tokenizers": [], @@ -3229,20 +3824,24 @@ }, { "name": "Ersuish", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ersu", + "depth": 4, "iso_1_code": null, "iso_3_code": "ers", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9218", "native_tokenizers": [], "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9217", "native_tokenizers": [], @@ -3250,14 +3849,17 @@ }, { "name": "Naic", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Namuyi", + "depth": 4, "iso_1_code": null, "iso_3_code": "nmy", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9220", "native_tokenizers": [], @@ -3265,9 +3867,11 @@ }, { "name": "Narua", + "depth": 4, "iso_1_code": null, "iso_3_code": "nru", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9221", "native_tokenizers": [], @@ -3275,9 +3879,11 @@ }, { "name": "Naxi", + "depth": 4, "iso_1_code": null, "iso_3_code": "nxq", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9222", "native_tokenizers": [], @@ -3285,15 +3891,18 @@ }, { "name": "Shuhi", + "depth": 4, "iso_1_code": null, "iso_3_code": "sxg", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9223", "native_tokenizers": [], "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9219", "native_tokenizers": [], @@ -3301,14 +3910,17 @@ }, { "name": "Qiangic", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Qiang, Northern", + "depth": 4, "iso_1_code": null, "iso_3_code": "cng", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9225", "native_tokenizers": [], @@ -3316,9 +3928,11 @@ }, { "name": "Minyag, Eastern", + "depth": 4, "iso_1_code": null, "iso_3_code": "emq", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9226", "native_tokenizers": [], @@ -3326,9 +3940,11 @@ }, { "name": "Guiqiong", + "depth": 4, "iso_1_code": null, "iso_3_code": "gqi", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9227", "native_tokenizers": [], @@ -3336,9 +3952,11 @@ }, { "name": "Pumi, Northern", + "depth": 4, "iso_1_code": null, "iso_3_code": "pmi", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9228", "native_tokenizers": [], @@ -3346,9 +3964,11 @@ }, { "name": "Pumi, Southern", + "depth": 4, "iso_1_code": null, "iso_3_code": "pmj", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9229", "native_tokenizers": [], @@ -3356,9 +3976,11 @@ }, { "name": "Queyu", + "depth": 4, "iso_1_code": null, "iso_3_code": "qvy", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9230", "native_tokenizers": [], @@ -3366,9 +3988,11 @@ }, { "name": "Qiang, Southern", + "depth": 4, "iso_1_code": null, "iso_3_code": "qxs", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9231", "native_tokenizers": [], @@ -3376,9 +4000,11 @@ }, { "name": "Minyag, Western", + "depth": 4, "iso_1_code": null, "iso_3_code": "wmg", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9232", "native_tokenizers": [], @@ -3386,15 +4012,18 @@ }, { "name": "Zhaba", + "depth": 4, "iso_1_code": null, "iso_3_code": "zhb", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9233", "native_tokenizers": [], "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9224", "native_tokenizers": [], @@ -3402,14 +4031,17 @@ }, { "name": "rGyalrongic", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Horpa", + "depth": 4, "iso_1_code": null, "iso_3_code": "ero", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9235", "native_tokenizers": [], @@ -3417,9 +4049,11 @@ }, { "name": "sTodsde", + "depth": 4, "iso_1_code": null, "iso_3_code": "jih", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9236", "native_tokenizers": [], @@ -3427,9 +4061,11 @@ }, { "name": "Lavrung", + "depth": 4, "iso_1_code": null, "iso_3_code": "jiq", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9237", "native_tokenizers": [], @@ -3437,15 +4073,18 @@ }, { "name": "Jiarong", + "depth": 4, "iso_1_code": null, "iso_3_code": "jya", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9238", "native_tokenizers": [], "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9234", "native_tokenizers": [], @@ -3453,14 +4092,17 @@ }, { "name": "Tujia", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tujia, Northern", + "depth": 4, "iso_1_code": null, "iso_3_code": "tji", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9240", "native_tokenizers": [], @@ -3468,21 +4110,25 @@ }, { "name": "Tujia, Southern", + "depth": 4, "iso_1_code": null, "iso_3_code": "tjs", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9241", "native_tokenizers": [], "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9239", "native_tokenizers": [], "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9209", "native_tokenizers": [], @@ -3490,19 +4136,23 @@ }, { "name": "Sal", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Boro-Garo", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Deori", + "depth": 4, "iso_1_code": null, "iso_3_code": "der", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9244", "native_tokenizers": [], @@ -3510,9 +4160,11 @@ }, { "name": "Garo", + "depth": 4, "iso_1_code": null, "iso_3_code": "grt", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9245", "native_tokenizers": [], @@ -3522,9 +4174,11 @@ }, { "name": "Megam", + "depth": 4, "iso_1_code": null, "iso_3_code": "mef", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9246", "native_tokenizers": [], @@ -3532,9 +4186,11 @@ }, { "name": "Tippera", + "depth": 4, "iso_1_code": null, "iso_3_code": "tpe", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9247", "native_tokenizers": [], @@ -3542,14 +4198,17 @@ }, { "name": "Boro-Tiwa", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tiwa", + "depth": 5, "iso_1_code": null, "iso_3_code": "lax", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9249", "native_tokenizers": [], @@ -3557,14 +4216,17 @@ }, { "name": "Boro", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Boro", + "depth": 6, "iso_1_code": null, "iso_3_code": "brx", "children": [], + "family": "Sino-Tibetan", "tokenizers": { "Deva": { "full_object": "IndicNLPTokenizer(\"hi\")", @@ -3585,15 +4247,18 @@ }, { "name": "Kachari", + "depth": 6, "iso_1_code": null, "iso_3_code": "xac", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9252", "native_tokenizers": [], "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": { "Deva": { "full_object": "IndicNLPTokenizer(\"hi\")", @@ -3608,6 +4273,7 @@ "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": { "Deva": { "full_object": "IndicNLPTokenizer(\"hi\")", @@ -3623,14 +4289,17 @@ }, { "name": "Dimasa-Kokborok", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dimasa", + "depth": 5, "iso_1_code": null, "iso_3_code": "dis", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9254", "native_tokenizers": [], @@ -3640,14 +4309,17 @@ }, { "name": "Kok Borok", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Riang", + "depth": 6, "iso_1_code": null, "iso_3_code": "ria", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9256", "native_tokenizers": [], @@ -3657,9 +4329,11 @@ }, { "name": "Kok Borok", + "depth": 6, "iso_1_code": null, "iso_3_code": "trp", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9257", "native_tokenizers": [], @@ -3669,21 +4343,25 @@ }, { "name": "Usoi", + "depth": 6, "iso_1_code": null, "iso_3_code": "usi", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9258", "native_tokenizers": [], "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9255", "native_tokenizers": [], "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9253", "native_tokenizers": [], @@ -3691,14 +4369,17 @@ }, { "name": "Koch", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Atong", + "depth": 5, "iso_1_code": null, "iso_3_code": "aot", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9260", "native_tokenizers": [], @@ -3706,9 +4387,11 @@ }, { "name": "Koch", + "depth": 5, "iso_1_code": null, "iso_3_code": "kdq", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9261", "native_tokenizers": [], @@ -3716,9 +4399,11 @@ }, { "name": "Rabha", + "depth": 5, "iso_1_code": null, "iso_3_code": "rah", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9262", "native_tokenizers": [], @@ -3726,15 +4411,18 @@ }, { "name": "Ruga", + "depth": 5, "iso_1_code": null, "iso_3_code": "ruh", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9263", "native_tokenizers": [], "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9259", "native_tokenizers": [], @@ -3742,14 +4430,17 @@ }, { "name": "Northern Naga", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Naga, Khiamniungan", + "depth": 5, "iso_1_code": null, "iso_3_code": "kix", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9265", "native_tokenizers": [], @@ -3759,9 +4450,11 @@ }, { "name": "Naga, Lainong", + "depth": 5, "iso_1_code": null, "iso_3_code": "lzn", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9266", "native_tokenizers": [], @@ -3769,9 +4462,11 @@ }, { "name": "Naga, Chang", + "depth": 5, "iso_1_code": null, "iso_3_code": "nbc", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9267", "native_tokenizers": [], @@ -3781,9 +4476,11 @@ }, { "name": "Naga, Konyak", + "depth": 5, "iso_1_code": null, "iso_3_code": "nbe", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9268", "native_tokenizers": [], @@ -3793,9 +4490,11 @@ }, { "name": "Naga, Nocte", + "depth": 5, "iso_1_code": null, "iso_3_code": "njb", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9269", "native_tokenizers": [], @@ -3805,9 +4504,11 @@ }, { "name": "Naga, Lao", + "depth": 5, "iso_1_code": null, "iso_3_code": "nlq", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9270", "native_tokenizers": [], @@ -3815,9 +4516,11 @@ }, { "name": "Naga, Wancho", + "depth": 5, "iso_1_code": null, "iso_3_code": "nnp", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9271", "native_tokenizers": [], @@ -3827,9 +4530,11 @@ }, { "name": "Naga, Ponyo-Gongwang", + "depth": 5, "iso_1_code": null, "iso_3_code": "npg", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9272", "native_tokenizers": [], @@ -3837,9 +4542,11 @@ }, { "name": "Naga, Phom", + "depth": 5, "iso_1_code": null, "iso_3_code": "nph", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9273", "native_tokenizers": [], @@ -3849,9 +4556,11 @@ }, { "name": "Naga, Chen-Kayu", + "depth": 5, "iso_1_code": null, "iso_3_code": "nqq", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9274", "native_tokenizers": [], @@ -3859,9 +4568,11 @@ }, { "name": "Naga, Tangshang", + "depth": 5, "iso_1_code": null, "iso_3_code": "nst", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9275", "native_tokenizers": [], @@ -3871,9 +4582,11 @@ }, { "name": "Naga, Tutsa", + "depth": 5, "iso_1_code": null, "iso_3_code": "tvt", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9276", "native_tokenizers": [], @@ -3881,21 +4594,25 @@ }, { "name": "Naga, Paungnyuan", + "depth": 5, "iso_1_code": null, "iso_3_code": "umn", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9277", "native_tokenizers": [], "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9264", "native_tokenizers": [], "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": { "Deva": { "full_object": "IndicNLPTokenizer(\"hi\")", @@ -3911,14 +4628,17 @@ }, { "name": "Dhimalish", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dhimal", + "depth": 4, "iso_1_code": null, "iso_3_code": "dhi", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9279", "native_tokenizers": [], @@ -3926,15 +4646,18 @@ }, { "name": "Toto", + "depth": 4, "iso_1_code": null, "iso_3_code": "txo", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9280", "native_tokenizers": [], "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9278", "native_tokenizers": [], @@ -3942,19 +4665,23 @@ }, { "name": "Jingppaw-Asakia", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Asakian", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chak", + "depth": 5, "iso_1_code": null, "iso_3_code": "ckh", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9283", "native_tokenizers": [], @@ -3962,9 +4689,11 @@ }, { "name": "Kadu", + "depth": 5, "iso_1_code": null, "iso_3_code": "zkd", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9284", "native_tokenizers": [], @@ -3972,15 +4701,18 @@ }, { "name": "Kanan", + "depth": 5, "iso_1_code": null, "iso_3_code": "zkn", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9285", "native_tokenizers": [], "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9282", "native_tokenizers": [], @@ -3988,14 +4720,17 @@ }, { "name": "Jingphaw", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Jingpho", + "depth": 5, "iso_1_code": null, "iso_3_code": "kac", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9287", "native_tokenizers": [], @@ -4005,9 +4740,11 @@ }, { "name": "Singpho", + "depth": 5, "iso_1_code": null, "iso_3_code": "sgp", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9288", "native_tokenizers": [], @@ -4015,9 +4752,11 @@ }, { "name": "Taman", + "depth": 5, "iso_1_code": null, "iso_3_code": "tcl", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9289", "native_tokenizers": [], @@ -4025,27 +4764,32 @@ }, { "name": "Turung", + "depth": 5, "iso_1_code": null, "iso_3_code": "try", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9290", "native_tokenizers": [], "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9286", "native_tokenizers": [], "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9281", "native_tokenizers": [], "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": { "Deva": { "full_object": "IndicNLPTokenizer(\"hi\")", @@ -4061,14 +4805,17 @@ }, { "name": "Tangkhulic", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Naga, Khoibu", + "depth": 3, "iso_1_code": null, "iso_3_code": "nkb", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9292", "native_tokenizers": [], @@ -4076,9 +4823,11 @@ }, { "name": "Naga, Tangkhul", + "depth": 3, "iso_1_code": null, "iso_3_code": "nmf", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9293", "native_tokenizers": [], @@ -4088,9 +4837,11 @@ }, { "name": "Naga, Maring", + "depth": 3, "iso_1_code": null, "iso_3_code": "nng", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9294", "native_tokenizers": [], @@ -4100,15 +4851,18 @@ }, { "name": "Naga, Tangkhul", + "depth": 3, "iso_1_code": null, "iso_3_code": "ntx", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9295", "native_tokenizers": [], "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9291", "native_tokenizers": [], @@ -4116,14 +4870,17 @@ }, { "name": "Unclassified", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Darlong", + "depth": 3, "iso_1_code": null, "iso_3_code": "dln", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9297", "native_tokenizers": [], @@ -4133,9 +4890,11 @@ }, { "name": "Koro", + "depth": 3, "iso_1_code": null, "iso_3_code": "jkr", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9298", "native_tokenizers": [], @@ -4143,9 +4902,11 @@ }, { "name": "Naga, Makuri", + "depth": 3, "iso_1_code": null, "iso_3_code": "jmn", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9299", "native_tokenizers": [], @@ -4153,9 +4914,11 @@ }, { "name": "Khamba", + "depth": 3, "iso_1_code": null, "iso_3_code": "kbg", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9300", "native_tokenizers": [], @@ -4163,9 +4926,11 @@ }, { "name": "Naga, Long Phuri", + "depth": 3, "iso_1_code": null, "iso_3_code": "lpn", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9301", "native_tokenizers": [], @@ -4173,9 +4938,11 @@ }, { "name": "Naga, Inpui", + "depth": 3, "iso_1_code": null, "iso_3_code": "nkf", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9302", "native_tokenizers": [], @@ -4185,9 +4952,11 @@ }, { "name": "Naga, Puimei", + "depth": 3, "iso_1_code": null, "iso_3_code": "npu", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9303", "native_tokenizers": [], @@ -4195,9 +4964,11 @@ }, { "name": "Naga, Akyaung Ari", + "depth": 3, "iso_1_code": null, "iso_3_code": "nqy", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9304", "native_tokenizers": [], @@ -4205,9 +4976,11 @@ }, { "name": "Naga, Kokak", + "depth": 3, "iso_1_code": null, "iso_3_code": "nxk", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9305", "native_tokenizers": [], @@ -4215,9 +4988,11 @@ }, { "name": "Naga, Jejara", + "depth": 3, "iso_1_code": null, "iso_3_code": "pzn", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9306", "native_tokenizers": [], @@ -4225,9 +5000,11 @@ }, { "name": "Ranglong", + "depth": 3, "iso_1_code": null, "iso_3_code": "rnl", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9307", "native_tokenizers": [], @@ -4236,6 +5013,7 @@ ] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9296", "native_tokenizers": [], @@ -4243,14 +5021,17 @@ }, { "name": "Western Naga", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Naga, Rongmei", + "depth": 3, "iso_1_code": null, "iso_3_code": "nbu", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9309", "native_tokenizers": [], @@ -4260,9 +5041,11 @@ }, { "name": "Naga, Liangmai", + "depth": 3, "iso_1_code": null, "iso_3_code": "njn", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9310", "native_tokenizers": [], @@ -4272,9 +5055,11 @@ }, { "name": "Koireng", + "depth": 3, "iso_1_code": null, "iso_3_code": "nkd", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9311", "native_tokenizers": [], @@ -4282,9 +5067,11 @@ }, { "name": "Naga, Thangal", + "depth": 3, "iso_1_code": null, "iso_3_code": "nki", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9312", "native_tokenizers": [], @@ -4294,9 +5081,11 @@ }, { "name": "Naga, Maram", + "depth": 3, "iso_1_code": null, "iso_3_code": "nma", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9313", "native_tokenizers": [], @@ -4306,9 +5095,11 @@ }, { "name": "Naga, Mzieme", + "depth": 3, "iso_1_code": null, "iso_3_code": "nme", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9314", "native_tokenizers": [], @@ -4316,9 +5107,11 @@ }, { "name": "Naga, Zeme", + "depth": 3, "iso_1_code": null, "iso_3_code": "nzm", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9315", "native_tokenizers": [], @@ -4327,6 +5120,7 @@ ] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9308", "native_tokenizers": [], @@ -4334,19 +5128,23 @@ }, { "name": "Western Tibeto-Burman", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bodish", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Gongduk", + "depth": 4, "iso_1_code": null, "iso_3_code": "goe", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9318", "native_tokenizers": [], @@ -4354,9 +5152,11 @@ }, { "name": "Monpa, Kalaktang", + "depth": 4, "iso_1_code": null, "iso_3_code": "kkf", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9319", "native_tokenizers": [], @@ -4364,9 +5164,11 @@ }, { "name": "Lhokpu", + "depth": 4, "iso_1_code": null, "iso_3_code": "lhp", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9320", "native_tokenizers": [], @@ -4374,9 +5176,11 @@ }, { "name": "Olekha", + "depth": 4, "iso_1_code": null, "iso_3_code": "ole", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9321", "native_tokenizers": [], @@ -4384,9 +5188,11 @@ }, { "name": "Tshangla", + "depth": 4, "iso_1_code": null, "iso_3_code": "tsj", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9322", "native_tokenizers": [], @@ -4394,14 +5200,17 @@ }, { "name": "Central Bodish", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Choni", + "depth": 5, "iso_1_code": null, "iso_3_code": "cda", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9324", "native_tokenizers": [], @@ -4409,9 +5218,11 @@ }, { "name": "Tseku", + "depth": 5, "iso_1_code": null, "iso_3_code": "tsk", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9325", "native_tokenizers": [], @@ -4419,20 +5230,24 @@ }, { "name": "Amdo", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tibetan, Amdo", + "depth": 6, "iso_1_code": null, "iso_3_code": "adx", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9327", "native_tokenizers": [], "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9326", "native_tokenizers": [], @@ -4440,14 +5255,17 @@ }, { "name": "Central", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tibetan, Central", + "depth": 6, "iso_1_code": "bo", "iso_3_code": "bod", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9329", "native_tokenizers": [], @@ -4457,14 +5275,17 @@ }, { "name": "gTsang", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dolpo", + "depth": 7, "iso_1_code": null, "iso_3_code": "dre", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9331", "native_tokenizers": [], @@ -4472,9 +5293,11 @@ }, { "name": "Gyalsumdo", + "depth": 7, "iso_1_code": null, "iso_3_code": "gyo", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9332", "native_tokenizers": [], @@ -4482,9 +5305,11 @@ }, { "name": "Humla", + "depth": 7, "iso_1_code": null, "iso_3_code": "hut", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9333", "native_tokenizers": [], @@ -4492,9 +5317,11 @@ }, { "name": "Jirel", + "depth": 7, "iso_1_code": null, "iso_3_code": "jul", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9334", "native_tokenizers": [], @@ -4502,9 +5329,11 @@ }, { "name": "Kyerung", + "depth": 7, "iso_1_code": null, "iso_3_code": "kgy", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9335", "native_tokenizers": [], @@ -4512,9 +5341,11 @@ }, { "name": "Nubri", + "depth": 7, "iso_1_code": null, "iso_3_code": "kte", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9336", "native_tokenizers": [], @@ -4522,9 +5353,11 @@ }, { "name": "Lhomi", + "depth": 7, "iso_1_code": null, "iso_3_code": "lhm", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9337", "native_tokenizers": [], @@ -4532,9 +5365,11 @@ }, { "name": "Lhowa", + "depth": 7, "iso_1_code": null, "iso_3_code": "loy", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9338", "native_tokenizers": [], @@ -4542,9 +5377,11 @@ }, { "name": "Mugom-Karmarong", + "depth": 7, "iso_1_code": null, "iso_3_code": "muk", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9339", "native_tokenizers": [], @@ -4552,9 +5389,11 @@ }, { "name": "Hyolmo", + "depth": 7, "iso_1_code": null, "iso_3_code": "scp", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9340", "native_tokenizers": [], @@ -4562,9 +5401,11 @@ }, { "name": "Syuba", + "depth": 7, "iso_1_code": null, "iso_3_code": "syw", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9341", "native_tokenizers": [], @@ -4572,9 +5413,11 @@ }, { "name": "Tichurong", + "depth": 7, "iso_1_code": null, "iso_3_code": "tcn", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9342", "native_tokenizers": [], @@ -4582,9 +5425,11 @@ }, { "name": "Tsum", + "depth": 7, "iso_1_code": null, "iso_3_code": "ttz", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9343", "native_tokenizers": [], @@ -4592,9 +5437,11 @@ }, { "name": "Sherpa", + "depth": 7, "iso_1_code": null, "iso_3_code": "xsr", "children": [], + "family": "Sino-Tibetan", "tokenizers": { "Deva": { "full_object": "IndicNLPTokenizer(\"hi\")", @@ -4611,6 +5458,7 @@ ] } ], + "family": "Sino-Tibetan", "tokenizers": { "Deva": { "full_object": "IndicNLPTokenizer(\"hi\")", @@ -4626,14 +5474,17 @@ }, { "name": "Southern", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Brokkat", + "depth": 7, "iso_1_code": null, "iso_3_code": "bro", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9346", "native_tokenizers": [], @@ -4641,9 +5492,11 @@ }, { "name": "Chocangacakha", + "depth": 7, "iso_1_code": null, "iso_3_code": "cgk", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9347", "native_tokenizers": [], @@ -4651,9 +5504,11 @@ }, { "name": "Dzongkha", + "depth": 7, "iso_1_code": "dz", "iso_3_code": "dzo", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9348", "native_tokenizers": [], @@ -4663,9 +5518,11 @@ }, { "name": "Groma", + "depth": 7, "iso_1_code": null, "iso_3_code": "gro", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9349", "native_tokenizers": [], @@ -4673,9 +5530,11 @@ }, { "name": "Lakha", + "depth": 7, "iso_1_code": null, "iso_3_code": "lkh", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9350", "native_tokenizers": [], @@ -4683,9 +5542,11 @@ }, { "name": "Lunanakha", + "depth": 7, "iso_1_code": null, "iso_3_code": "luk", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9351", "native_tokenizers": [], @@ -4693,9 +5554,11 @@ }, { "name": "Layakha", + "depth": 7, "iso_1_code": null, "iso_3_code": "lya", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9352", "native_tokenizers": [], @@ -4703,9 +5566,11 @@ }, { "name": "Brokpake", + "depth": 7, "iso_1_code": null, "iso_3_code": "sgt", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9353", "native_tokenizers": [], @@ -4713,15 +5578,18 @@ }, { "name": "Sikkimese", + "depth": 7, "iso_1_code": null, "iso_3_code": "sip", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9354", "native_tokenizers": [], "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9345", "native_tokenizers": [], @@ -4729,14 +5597,17 @@ }, { "name": "Western", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Jad", + "depth": 7, "iso_1_code": null, "iso_3_code": "jda", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9356", "native_tokenizers": [], @@ -4744,9 +5615,11 @@ }, { "name": "Stod Bhoti", + "depth": 7, "iso_1_code": null, "iso_3_code": "sbu", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9357", "native_tokenizers": [], @@ -4754,21 +5627,25 @@ }, { "name": "Spiti Bhoti", + "depth": 7, "iso_1_code": null, "iso_3_code": "spt", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9358", "native_tokenizers": [], "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9355", "native_tokenizers": [], "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": { "Deva": { "full_object": "IndicNLPTokenizer(\"hi\")", @@ -4784,20 +5661,24 @@ }, { "name": "Khams", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tibetan, Khams", + "depth": 6, "iso_1_code": null, "iso_3_code": "khg", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9360", "native_tokenizers": [], "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9359", "native_tokenizers": [], @@ -4805,14 +5686,17 @@ }, { "name": "Unclassified", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Naaba", + "depth": 6, "iso_1_code": null, "iso_3_code": "nao", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9362", "native_tokenizers": [], @@ -4820,15 +5704,18 @@ }, { "name": "Walungge", + "depth": 6, "iso_1_code": null, "iso_3_code": "ola", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9363", "native_tokenizers": [], "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9361", "native_tokenizers": [], @@ -4836,14 +5723,17 @@ }, { "name": "Western", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Balti", + "depth": 6, "iso_1_code": null, "iso_3_code": "bft", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9365", "native_tokenizers": [], @@ -4851,9 +5741,11 @@ }, { "name": "Changthang", + "depth": 6, "iso_1_code": null, "iso_3_code": "cna", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9366", "native_tokenizers": [], @@ -4861,9 +5753,11 @@ }, { "name": "Ladakhi", + "depth": 6, "iso_1_code": null, "iso_3_code": "lbj", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9367", "native_tokenizers": [], @@ -4873,9 +5767,11 @@ }, { "name": "Purig", + "depth": 6, "iso_1_code": null, "iso_3_code": "prx", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9368", "native_tokenizers": [], @@ -4883,21 +5779,25 @@ }, { "name": "Zangskari", + "depth": 6, "iso_1_code": null, "iso_3_code": "zau", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9369", "native_tokenizers": [], "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9364", "native_tokenizers": [], "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": { "Deva": { "full_object": "IndicNLPTokenizer(\"hi\")", @@ -4913,14 +5813,17 @@ }, { "name": "East Bodish", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dakpakha", + "depth": 5, "iso_1_code": null, "iso_3_code": "dka", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9371", "native_tokenizers": [], @@ -4928,9 +5831,11 @@ }, { "name": "Monpa, Tawang", + "depth": 5, "iso_1_code": null, "iso_3_code": "twm", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9372", "native_tokenizers": [], @@ -4938,14 +5843,17 @@ }, { "name": "Bumthang", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dzalakha", + "depth": 6, "iso_1_code": null, "iso_3_code": "dzl", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9374", "native_tokenizers": [], @@ -4953,9 +5861,11 @@ }, { "name": "Bumthangkha", + "depth": 6, "iso_1_code": null, "iso_3_code": "kjz", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9375", "native_tokenizers": [], @@ -4963,9 +5873,11 @@ }, { "name": "Nyenkha", + "depth": 6, "iso_1_code": null, "iso_3_code": "neh", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9376", "native_tokenizers": [], @@ -4973,9 +5885,11 @@ }, { "name": "Nupbikha", + "depth": 6, "iso_1_code": null, "iso_3_code": "npb", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9377", "native_tokenizers": [], @@ -4983,9 +5897,11 @@ }, { "name": "Chalikha", + "depth": 6, "iso_1_code": null, "iso_3_code": "tgf", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9378", "native_tokenizers": [], @@ -4993,9 +5909,11 @@ }, { "name": "Khengkha", + "depth": 6, "iso_1_code": null, "iso_3_code": "xkf", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9379", "native_tokenizers": [], @@ -5003,21 +5921,25 @@ }, { "name": "Kurtokha", + "depth": 6, "iso_1_code": null, "iso_3_code": "xkz", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9380", "native_tokenizers": [], "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9373", "native_tokenizers": [], "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9370", "native_tokenizers": [], @@ -5025,14 +5947,17 @@ }, { "name": "West Bodish", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dura", + "depth": 5, "iso_1_code": null, "iso_3_code": "drq", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9382", "native_tokenizers": [], @@ -5040,9 +5965,11 @@ }, { "name": "Kaike", + "depth": 5, "iso_1_code": null, "iso_3_code": "kzq", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9383", "native_tokenizers": [], @@ -5050,14 +5977,17 @@ }, { "name": "Ghale", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ghale, Southern", + "depth": 6, "iso_1_code": null, "iso_3_code": "ghe", "children": [], + "family": "Sino-Tibetan", "tokenizers": { "Deva": { "full_object": "IndicNLPTokenizer(\"hi\")", @@ -5075,9 +6005,11 @@ }, { "name": "Ghale, Northern", + "depth": 6, "iso_1_code": null, "iso_3_code": "ghh", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9386", "native_tokenizers": [], @@ -5085,15 +6017,18 @@ }, { "name": "Kuke", + "depth": 6, "iso_1_code": null, "iso_3_code": "ght", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9387", "native_tokenizers": [], "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": { "Deva": { "full_object": "IndicNLPTokenizer(\"hi\")", @@ -5109,19 +6044,23 @@ }, { "name": "Gurung-Tamang", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Gurungic", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chantyal", + "depth": 7, "iso_1_code": null, "iso_3_code": "chx", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9390", "native_tokenizers": [], @@ -5129,9 +6068,11 @@ }, { "name": "Gurung", + "depth": 7, "iso_1_code": null, "iso_3_code": "gvr", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9391", "native_tokenizers": [], @@ -5139,9 +6080,11 @@ }, { "name": "Nyeshangte", + "depth": 7, "iso_1_code": null, "iso_3_code": "nmm", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9392", "native_tokenizers": [], @@ -5149,9 +6092,11 @@ }, { "name": "Nar Phu", + "depth": 7, "iso_1_code": null, "iso_3_code": "npa", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9393", "native_tokenizers": [], @@ -5159,9 +6104,11 @@ }, { "name": "Seke", + "depth": 7, "iso_1_code": null, "iso_3_code": "skj", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9394", "native_tokenizers": [], @@ -5169,15 +6116,18 @@ }, { "name": "Thakali", + "depth": 7, "iso_1_code": null, "iso_3_code": "ths", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9395", "native_tokenizers": [], "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9389", "native_tokenizers": [], @@ -5185,14 +6135,17 @@ }, { "name": "Tamang", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tamang, Eastern", + "depth": 7, "iso_1_code": null, "iso_3_code": "taj", "children": [], + "family": "Sino-Tibetan", "tokenizers": { "Deva": { "full_object": "IndicNLPTokenizer(\"hi\")", @@ -5210,9 +6163,11 @@ }, { "name": "Tamang, Western", + "depth": 7, "iso_1_code": null, "iso_3_code": "tdg", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9398", "native_tokenizers": [], @@ -5220,15 +6175,18 @@ }, { "name": "Tamang, Eastern Gorkha", + "depth": 7, "iso_1_code": null, "iso_3_code": "tge", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9399", "native_tokenizers": [], "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": { "Deva": { "full_object": "IndicNLPTokenizer(\"hi\")", @@ -5243,6 +6201,7 @@ "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": { "Deva": { "full_object": "IndicNLPTokenizer(\"hi\")", @@ -5257,6 +6216,7 @@ "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": { "Deva": { "full_object": "IndicNLPTokenizer(\"hi\")", @@ -5272,19 +6232,23 @@ }, { "name": "West Himalayish", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Almora", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Byangsi", + "depth": 6, "iso_1_code": null, "iso_3_code": "bee", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9402", "native_tokenizers": [], @@ -5292,9 +6256,11 @@ }, { "name": "Chaudangsi", + "depth": 6, "iso_1_code": null, "iso_3_code": "cdn", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9403", "native_tokenizers": [], @@ -5302,9 +6268,11 @@ }, { "name": "Darmiya", + "depth": 6, "iso_1_code": null, "iso_3_code": "drd", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9404", "native_tokenizers": [], @@ -5312,15 +6280,18 @@ }, { "name": "Rangkas", + "depth": 6, "iso_1_code": null, "iso_3_code": "rgk", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9405", "native_tokenizers": [], "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9401", "native_tokenizers": [], @@ -5328,14 +6299,17 @@ }, { "name": "Kinauri", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Gahri", + "depth": 6, "iso_1_code": null, "iso_3_code": "bfu", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9407", "native_tokenizers": [], @@ -5343,9 +6317,11 @@ }, { "name": "Kinnauri, Chitkuli", + "depth": 6, "iso_1_code": null, "iso_3_code": "cik", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9408", "native_tokenizers": [], @@ -5353,9 +6329,11 @@ }, { "name": "Jangshung", + "depth": 6, "iso_1_code": null, "iso_3_code": "jna", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9409", "native_tokenizers": [], @@ -5363,9 +6341,11 @@ }, { "name": "Kinnauri", + "depth": 6, "iso_1_code": null, "iso_3_code": "kfk", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9410", "native_tokenizers": [], @@ -5373,9 +6353,11 @@ }, { "name": "Pattani", + "depth": 6, "iso_1_code": null, "iso_3_code": "lae", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9411", "native_tokenizers": [], @@ -5383,9 +6365,11 @@ }, { "name": "Tinani", + "depth": 6, "iso_1_code": null, "iso_3_code": "lbf", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9412", "native_tokenizers": [], @@ -5393,9 +6377,11 @@ }, { "name": "Kinnauri, Bhoti", + "depth": 6, "iso_1_code": null, "iso_3_code": "nes", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9413", "native_tokenizers": [], @@ -5403,9 +6389,11 @@ }, { "name": "Rongpo", + "depth": 6, "iso_1_code": null, "iso_3_code": "rnp", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9414", "native_tokenizers": [], @@ -5413,9 +6401,11 @@ }, { "name": "Shumcho", + "depth": 6, "iso_1_code": null, "iso_3_code": "scu", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9415", "native_tokenizers": [], @@ -5423,9 +6413,11 @@ }, { "name": "Sunam", + "depth": 6, "iso_1_code": null, "iso_3_code": "ssk", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9416", "native_tokenizers": [], @@ -5433,9 +6425,11 @@ }, { "name": "Kinnauri, Chhoyul", + "depth": 6, "iso_1_code": null, "iso_3_code": "tpq", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9417", "native_tokenizers": [], @@ -5443,27 +6437,32 @@ }, { "name": "Kanashi", + "depth": 6, "iso_1_code": null, "iso_3_code": "xns", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9418", "native_tokenizers": [], "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9406", "native_tokenizers": [], "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9400", "native_tokenizers": [], "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": { "Deva": { "full_object": "IndicNLPTokenizer(\"hi\")", @@ -5479,24 +6478,29 @@ }, { "name": "Himalayan", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Central Himalayan", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chepang-Bhujel", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bhujel", + "depth": 6, "iso_1_code": null, "iso_3_code": "byh", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9422", "native_tokenizers": [], @@ -5504,15 +6508,18 @@ }, { "name": "Chepang", + "depth": 6, "iso_1_code": null, "iso_3_code": "cdm", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9423", "native_tokenizers": [], "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9421", "native_tokenizers": [], @@ -5520,19 +6527,23 @@ }, { "name": "Kham-Magar", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kham", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kham, Gamal", + "depth": 7, "iso_1_code": null, "iso_3_code": "kgj", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9426", "native_tokenizers": [], @@ -5540,9 +6551,11 @@ }, { "name": "Kham, Eastern Parbate", + "depth": 7, "iso_1_code": null, "iso_3_code": "kif", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9427", "native_tokenizers": [], @@ -5550,9 +6563,11 @@ }, { "name": "Kham, Sheshi", + "depth": 7, "iso_1_code": null, "iso_3_code": "kip", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9428", "native_tokenizers": [], @@ -5560,15 +6575,18 @@ }, { "name": "Kham, Western Parbate", + "depth": 7, "iso_1_code": null, "iso_3_code": "kjl", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9429", "native_tokenizers": [], "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9425", "native_tokenizers": [], @@ -5576,14 +6594,17 @@ }, { "name": "Magar", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Magar, Eastern", + "depth": 7, "iso_1_code": null, "iso_3_code": "mgp", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9431", "native_tokenizers": [], @@ -5591,21 +6612,25 @@ }, { "name": "Magar, Western", + "depth": 7, "iso_1_code": null, "iso_3_code": "mrd", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9432", "native_tokenizers": [], "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9430", "native_tokenizers": [], "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9424", "native_tokenizers": [], @@ -5613,14 +6638,17 @@ }, { "name": "Newar", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Newar", + "depth": 6, "iso_1_code": null, "iso_3_code": "new", "children": [], + "family": "Sino-Tibetan", "tokenizers": { "Deva": { "full_object": "IndicNLPTokenizer(\"hi\")", @@ -5638,15 +6666,18 @@ }, { "name": "Pahari", + "depth": 6, "iso_1_code": null, "iso_3_code": "phj", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9435", "native_tokenizers": [], "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": { "Deva": { "full_object": "IndicNLPTokenizer(\"hi\")", @@ -5662,14 +6693,17 @@ }, { "name": "Raute-Raji", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Rawat", + "depth": 6, "iso_1_code": null, "iso_3_code": "jnl", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9437", "native_tokenizers": [], @@ -5677,9 +6711,11 @@ }, { "name": "Raute", + "depth": 6, "iso_1_code": null, "iso_3_code": "rau", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9438", "native_tokenizers": [], @@ -5687,15 +6723,18 @@ }, { "name": "Raji", + "depth": 6, "iso_1_code": null, "iso_3_code": "rji", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9439", "native_tokenizers": [], "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9436", "native_tokenizers": [], @@ -5703,14 +6742,17 @@ }, { "name": "Thangmi-Baraamu", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Baram", + "depth": 6, "iso_1_code": null, "iso_3_code": "brd", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9441", "native_tokenizers": [], @@ -5718,21 +6760,25 @@ }, { "name": "Thangmi", + "depth": 6, "iso_1_code": null, "iso_3_code": "thf", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9442", "native_tokenizers": [], "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9440", "native_tokenizers": [], "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": { "Deva": { "full_object": "IndicNLPTokenizer(\"hi\")", @@ -5748,19 +6794,23 @@ }, { "name": "Kiranti", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Eastern", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Athpariya", + "depth": 6, "iso_1_code": null, "iso_3_code": "aph", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9445", "native_tokenizers": [], @@ -5768,9 +6818,11 @@ }, { "name": "Bantawa", + "depth": 6, "iso_1_code": null, "iso_3_code": "bap", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9446", "native_tokenizers": [], @@ -5778,9 +6830,11 @@ }, { "name": "Belhariya", + "depth": 6, "iso_1_code": null, "iso_3_code": "byw", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9447", "native_tokenizers": [], @@ -5788,9 +6842,11 @@ }, { "name": "Chhintang", + "depth": 6, "iso_1_code": null, "iso_3_code": "ctn", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9448", "native_tokenizers": [], @@ -5798,9 +6854,11 @@ }, { "name": "Chhiling", + "depth": 6, "iso_1_code": null, "iso_3_code": "cur", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9449", "native_tokenizers": [], @@ -5808,9 +6866,11 @@ }, { "name": "Chukwa", + "depth": 6, "iso_1_code": null, "iso_3_code": "cuw", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9450", "native_tokenizers": [], @@ -5818,9 +6878,11 @@ }, { "name": "Mewahang, Eastern", + "depth": 6, "iso_1_code": null, "iso_3_code": "emg", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9451", "native_tokenizers": [], @@ -5828,9 +6890,11 @@ }, { "name": "Kulung", + "depth": 6, "iso_1_code": null, "iso_3_code": "kle", "children": [], + "family": "Sino-Tibetan", "tokenizers": { "Deva": { "full_object": "IndicNLPTokenizer(\"hi\")", @@ -5848,9 +6912,11 @@ }, { "name": "Lohorung", + "depth": 6, "iso_1_code": null, "iso_3_code": "lbr", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9453", "native_tokenizers": [], @@ -5858,9 +6924,11 @@ }, { "name": "Limbu", + "depth": 6, "iso_1_code": null, "iso_3_code": "lif", "children": [], + "family": "Sino-Tibetan", "tokenizers": { "Deva": { "full_object": "IndicNLPTokenizer(\"hi\")", @@ -5879,9 +6947,11 @@ }, { "name": "Mugali", + "depth": 6, "iso_1_code": null, "iso_3_code": "lmh", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9455", "native_tokenizers": [], @@ -5889,9 +6959,11 @@ }, { "name": "Yamphu, Southern", + "depth": 6, "iso_1_code": null, "iso_3_code": "lrr", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9456", "native_tokenizers": [], @@ -5899,9 +6971,11 @@ }, { "name": "Yakkha, Chhathare", + "depth": 6, "iso_1_code": null, "iso_3_code": "luu", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9457", "native_tokenizers": [], @@ -5909,9 +6983,11 @@ }, { "name": "Nachiring", + "depth": 6, "iso_1_code": null, "iso_3_code": "ncd", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9458", "native_tokenizers": [], @@ -5919,9 +6995,11 @@ }, { "name": "Phangduwali", + "depth": 6, "iso_1_code": null, "iso_3_code": "phw", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9459", "native_tokenizers": [], @@ -5929,9 +7007,11 @@ }, { "name": "Puma", + "depth": 6, "iso_1_code": null, "iso_3_code": "pum", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9460", "native_tokenizers": [], @@ -5939,9 +7019,11 @@ }, { "name": "Dungmali", + "depth": 6, "iso_1_code": null, "iso_3_code": "raa", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9461", "native_tokenizers": [], @@ -5949,9 +7031,11 @@ }, { "name": "Chamling", + "depth": 6, "iso_1_code": null, "iso_3_code": "rab", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9462", "native_tokenizers": [], @@ -5959,9 +7043,11 @@ }, { "name": "Mewahang, Western", + "depth": 6, "iso_1_code": null, "iso_3_code": "raf", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9463", "native_tokenizers": [], @@ -5969,9 +7055,11 @@ }, { "name": "Saam", + "depth": 6, "iso_1_code": null, "iso_3_code": "raq", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9464", "native_tokenizers": [], @@ -5979,9 +7067,11 @@ }, { "name": "Sampang", + "depth": 6, "iso_1_code": null, "iso_3_code": "rav", "children": [], + "family": "Sino-Tibetan", "tokenizers": { "Deva": { "full_object": "IndicNLPTokenizer(\"hi\")", @@ -5999,9 +7089,11 @@ }, { "name": "Yakkha", + "depth": 6, "iso_1_code": null, "iso_3_code": "ybh", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9466", "native_tokenizers": [], @@ -6009,15 +7101,18 @@ }, { "name": "Yamphu", + "depth": 6, "iso_1_code": null, "iso_3_code": "ybi", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9467", "native_tokenizers": [], "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": { "Deva": { "full_object": "IndicNLPTokenizer(\"hi\")", @@ -6033,14 +7128,17 @@ }, { "name": "Western", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bahing", + "depth": 6, "iso_1_code": null, "iso_3_code": "bhj", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9469", "native_tokenizers": [], @@ -6048,9 +7146,11 @@ }, { "name": "Dumi", + "depth": 6, "iso_1_code": null, "iso_3_code": "dus", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9470", "native_tokenizers": [], @@ -6058,9 +7158,11 @@ }, { "name": "Jerung", + "depth": 6, "iso_1_code": null, "iso_3_code": "jee", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9471", "native_tokenizers": [], @@ -6068,9 +7170,11 @@ }, { "name": "Koyee", + "depth": 6, "iso_1_code": null, "iso_3_code": "kkt", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9472", "native_tokenizers": [], @@ -6078,9 +7182,11 @@ }, { "name": "Khaling", + "depth": 6, "iso_1_code": null, "iso_3_code": "klr", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9473", "native_tokenizers": [], @@ -6088,9 +7194,11 @@ }, { "name": "Sunwar", + "depth": 6, "iso_1_code": null, "iso_3_code": "suz", "children": [], + "family": "Sino-Tibetan", "tokenizers": { "Deva": { "full_object": "IndicNLPTokenizer(\"hi\")", @@ -6108,9 +7216,11 @@ }, { "name": "Thulung", + "depth": 6, "iso_1_code": null, "iso_3_code": "tdh", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9475", "native_tokenizers": [], @@ -6118,9 +7228,11 @@ }, { "name": "Tilung", + "depth": 6, "iso_1_code": null, "iso_3_code": "tij", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9476", "native_tokenizers": [], @@ -6128,9 +7240,11 @@ }, { "name": "Wayu", + "depth": 6, "iso_1_code": null, "iso_3_code": "vay", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9477", "native_tokenizers": [], @@ -6138,15 +7252,18 @@ }, { "name": "Wambule", + "depth": 6, "iso_1_code": null, "iso_3_code": "wme", "children": [], + "family": "Sino-Tibetan", "tokenizers": {}, "node_i": "9478", "native_tokenizers": [], "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": { "Deva": { "full_object": "IndicNLPTokenizer(\"hi\")", @@ -6161,6 +7278,7 @@ "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": { "Deva": { "full_object": "IndicNLPTokenizer(\"hi\")", @@ -6175,6 +7293,7 @@ "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": { "Deva": { "full_object": "IndicNLPTokenizer(\"hi\")", @@ -6189,6 +7308,7 @@ "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": { "Deva": { "full_object": "IndicNLPTokenizer(\"hi\")", @@ -6203,6 +7323,7 @@ "scripts": [] } ], + "family": "Sino-Tibetan", "tokenizers": { "Deva": { "full_object": "IndicNLPTokenizer(\"hi\")", @@ -6217,22 +7338,8 @@ "scripts": [] } ], - "tokenizers": { - "Hani": { - "full_object": "SpaCyTokenizer(\"zh\", {\"nlp\": {\"tokenizer\": {\"segmenter\": \"jieba\"}}})", - "original_lang_name": "chinese", - "original_lang_code": "zho", - "script": "Hani", - "class_name": "SpaCyTokenizer" - }, - "Deva": { - "full_object": "IndicNLPTokenizer(\"hi\")", - "original_lang_name": "bodo", - "original_lang_code": "brx", - "script": "Deva", - "class_name": "IndicNLPTokenizer" - } - }, + "family": "Sino-Tibetan", + "tokenizers": {}, "node_i": "8918", "native_tokenizers": [], "scripts": [] diff --git a/data/Siouan-Catawban.json b/data/Siouan-Catawban.json index 7ffa8e9410cae81a3cdb6361b347b0677ff99c96..f518cd3c49629a22f498c8c382dbe9b84640cd23 100644 --- a/data/Siouan-Catawban.json +++ b/data/Siouan-Catawban.json @@ -1,18 +1,22 @@ { "name": "Siouan-Catawban", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Catawban", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Catawba", + "depth": 2, "iso_1_code": null, "iso_3_code": "chc", "children": [], + "family": "Siouan-Catawban", "tokenizers": {}, "node_i": "9481", "native_tokenizers": [], @@ -20,15 +24,18 @@ }, { "name": "Woccon", + "depth": 2, "iso_1_code": null, "iso_3_code": "xwc", "children": [], + "family": "Siouan-Catawban", "tokenizers": {}, "node_i": "9482", "native_tokenizers": [], "scripts": [] } ], + "family": "Siouan-Catawban", "tokenizers": {}, "node_i": "9480", "native_tokenizers": [], @@ -36,14 +43,17 @@ }, { "name": "Siouan", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mandan", + "depth": 2, "iso_1_code": null, "iso_3_code": "mhq", "children": [], + "family": "Siouan-Catawban", "tokenizers": {}, "node_i": "9484", "native_tokenizers": [], @@ -51,14 +61,17 @@ }, { "name": "Mississippi Valley-Ohio Valley Siouan", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Michigamea", + "depth": 3, "iso_1_code": null, "iso_3_code": "cmm", "children": [], + "family": "Siouan-Catawban", "tokenizers": {}, "node_i": "9486", "native_tokenizers": [], @@ -66,9 +79,11 @@ }, { "name": "Ofo", + "depth": 3, "iso_1_code": null, "iso_3_code": "ofo", "children": [], + "family": "Siouan-Catawban", "tokenizers": {}, "node_i": "9487", "native_tokenizers": [], @@ -76,9 +91,11 @@ }, { "name": "Tutelo", + "depth": 3, "iso_1_code": null, "iso_3_code": "tta", "children": [], + "family": "Siouan-Catawban", "tokenizers": {}, "node_i": "9488", "native_tokenizers": [], @@ -86,14 +103,17 @@ }, { "name": "Mississippi Valley Siouan", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Biloxi", + "depth": 4, "iso_1_code": null, "iso_3_code": "bll", "children": [], + "family": "Siouan-Catawban", "tokenizers": {}, "node_i": "9490", "native_tokenizers": [], @@ -101,14 +121,17 @@ }, { "name": "Chiwere-Winnebago", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Iowa-Oto", + "depth": 5, "iso_1_code": null, "iso_3_code": "iow", "children": [], + "family": "Siouan-Catawban", "tokenizers": {}, "node_i": "9492", "native_tokenizers": [], @@ -116,15 +139,18 @@ }, { "name": "Ho-Chunk", + "depth": 5, "iso_1_code": null, "iso_3_code": "win", "children": [], + "family": "Siouan-Catawban", "tokenizers": {}, "node_i": "9493", "native_tokenizers": [], "scripts": [] } ], + "family": "Siouan-Catawban", "tokenizers": {}, "node_i": "9491", "native_tokenizers": [], @@ -132,14 +158,17 @@ }, { "name": "Dakota", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Assiniboine", + "depth": 5, "iso_1_code": null, "iso_3_code": "asb", "children": [], + "family": "Siouan-Catawban", "tokenizers": {}, "node_i": "9495", "native_tokenizers": [], @@ -147,9 +176,11 @@ }, { "name": "Dakota", + "depth": 5, "iso_1_code": null, "iso_3_code": "dak", "children": [], + "family": "Siouan-Catawban", "tokenizers": {}, "node_i": "9496", "native_tokenizers": [], @@ -159,9 +190,11 @@ }, { "name": "Lakota", + "depth": 5, "iso_1_code": null, "iso_3_code": "lkt", "children": [], + "family": "Siouan-Catawban", "tokenizers": {}, "node_i": "9497", "native_tokenizers": [], @@ -169,15 +202,18 @@ }, { "name": "Stoney", + "depth": 5, "iso_1_code": null, "iso_3_code": "sto", "children": [], + "family": "Siouan-Catawban", "tokenizers": {}, "node_i": "9498", "native_tokenizers": [], "scripts": [] } ], + "family": "Siouan-Catawban", "tokenizers": {}, "node_i": "9494", "native_tokenizers": [], @@ -185,14 +221,17 @@ }, { "name": "Dhegihan", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kansa", + "depth": 5, "iso_1_code": null, "iso_3_code": "ksk", "children": [], + "family": "Siouan-Catawban", "tokenizers": {}, "node_i": "9500", "native_tokenizers": [], @@ -200,9 +239,11 @@ }, { "name": "Omaha-Ponca", + "depth": 5, "iso_1_code": null, "iso_3_code": "oma", "children": [], + "family": "Siouan-Catawban", "tokenizers": {}, "node_i": "9501", "native_tokenizers": [], @@ -210,9 +251,11 @@ }, { "name": "Osage", + "depth": 5, "iso_1_code": null, "iso_3_code": "osa", "children": [], + "family": "Siouan-Catawban", "tokenizers": {}, "node_i": "9502", "native_tokenizers": [], @@ -220,27 +263,32 @@ }, { "name": "Quapaw", + "depth": 5, "iso_1_code": null, "iso_3_code": "qua", "children": [], + "family": "Siouan-Catawban", "tokenizers": {}, "node_i": "9503", "native_tokenizers": [], "scripts": [] } ], + "family": "Siouan-Catawban", "tokenizers": {}, "node_i": "9499", "native_tokenizers": [], "scripts": [] } ], + "family": "Siouan-Catawban", "tokenizers": {}, "node_i": "9489", "native_tokenizers": [], "scripts": [] } ], + "family": "Siouan-Catawban", "tokenizers": {}, "node_i": "9485", "native_tokenizers": [], @@ -248,14 +296,17 @@ }, { "name": "Missouri River Siouan", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Crow", + "depth": 3, "iso_1_code": null, "iso_3_code": "cro", "children": [], + "family": "Siouan-Catawban", "tokenizers": {}, "node_i": "9505", "native_tokenizers": [], @@ -263,27 +314,32 @@ }, { "name": "Hidatsa", + "depth": 3, "iso_1_code": null, "iso_3_code": "hid", "children": [], + "family": "Siouan-Catawban", "tokenizers": {}, "node_i": "9506", "native_tokenizers": [], "scripts": [] } ], + "family": "Siouan-Catawban", "tokenizers": {}, "node_i": "9504", "native_tokenizers": [], "scripts": [] } ], + "family": "Siouan-Catawban", "tokenizers": {}, "node_i": "9483", "native_tokenizers": [], "scripts": [] } ], + "family": "Siouan-Catawban", "tokenizers": {}, "node_i": "9479", "native_tokenizers": [], diff --git a/data/Skou.json b/data/Skou.json index 29b9c480f7c39d92e7b33171a012630c446139ea..8cfaa5aa24bd02c5d99e7a2bd0fd1cb82afef414 100644 --- a/data/Skou.json +++ b/data/Skou.json @@ -1,24 +1,29 @@ { "name": "Skou", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "I\u2019saka", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "I\u2019saka", + "depth": 2, "iso_1_code": null, "iso_3_code": "ksi", "children": [], + "family": "Skou", "tokenizers": {}, "node_i": "9509", "native_tokenizers": [], "scripts": [] } ], + "family": "Skou", "tokenizers": {}, "node_i": "9508", "native_tokenizers": [], @@ -26,24 +31,29 @@ }, { "name": "Skou-Serra-Lagoon", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nuclear Skou", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Eastern Skou", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dumo", + "depth": 4, "iso_1_code": null, "iso_3_code": "vam", "children": [], + "family": "Skou", "tokenizers": {}, "node_i": "9513", "native_tokenizers": [], @@ -51,15 +61,18 @@ }, { "name": "Wutung", + "depth": 4, "iso_1_code": null, "iso_3_code": "wut", "children": [], + "family": "Skou", "tokenizers": {}, "node_i": "9514", "native_tokenizers": [], "scripts": [] } ], + "family": "Skou", "tokenizers": {}, "node_i": "9512", "native_tokenizers": [], @@ -67,26 +80,31 @@ }, { "name": "Skou", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Skou", + "depth": 4, "iso_1_code": null, "iso_3_code": "skv", "children": [], + "family": "Skou", "tokenizers": {}, "node_i": "9516", "native_tokenizers": [], "scripts": [] } ], + "family": "Skou", "tokenizers": {}, "node_i": "9515", "native_tokenizers": [], "scripts": [] } ], + "family": "Skou", "tokenizers": {}, "node_i": "9511", "native_tokenizers": [], @@ -94,19 +112,23 @@ }, { "name": "Serra Hills", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Lagoon", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bauni", + "depth": 4, "iso_1_code": null, "iso_3_code": "bpe", "children": [], + "family": "Skou", "tokenizers": {}, "node_i": "9519", "native_tokenizers": [], @@ -114,9 +136,11 @@ }, { "name": "Bouni", + "depth": 4, "iso_1_code": null, "iso_3_code": "suo", "children": [], + "family": "Skou", "tokenizers": {}, "node_i": "9520", "native_tokenizers": [], @@ -124,15 +148,18 @@ }, { "name": "Uni", + "depth": 4, "iso_1_code": null, "iso_3_code": "uni", "children": [], + "family": "Skou", "tokenizers": {}, "node_i": "9521", "native_tokenizers": [], "scripts": [] } ], + "family": "Skou", "tokenizers": {}, "node_i": "9518", "native_tokenizers": [], @@ -140,20 +167,24 @@ }, { "name": "Puari", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Puare", + "depth": 4, "iso_1_code": null, "iso_3_code": "pux", "children": [], + "family": "Skou", "tokenizers": {}, "node_i": "9523", "native_tokenizers": [], "scripts": [] } ], + "family": "Skou", "tokenizers": {}, "node_i": "9522", "native_tokenizers": [], @@ -161,25 +192,30 @@ }, { "name": "Rawo-Main Serra", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Main Serra", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Pin", + "depth": 5, "iso_1_code": null, "iso_3_code": "wmx", "children": [], + "family": "Skou", "tokenizers": {}, "node_i": "9526", "native_tokenizers": [], "scripts": [] } ], + "family": "Skou", "tokenizers": {}, "node_i": "9525", "native_tokenizers": [], @@ -187,44 +223,52 @@ }, { "name": "Rawo", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Rawo", + "depth": 5, "iso_1_code": null, "iso_3_code": "rwa", "children": [], + "family": "Skou", "tokenizers": {}, "node_i": "9528", "native_tokenizers": [], "scripts": [] } ], + "family": "Skou", "tokenizers": {}, "node_i": "9527", "native_tokenizers": [], "scripts": [] } ], + "family": "Skou", "tokenizers": {}, "node_i": "9524", "native_tokenizers": [], "scripts": [] } ], + "family": "Skou", "tokenizers": {}, "node_i": "9517", "native_tokenizers": [], "scripts": [] } ], + "family": "Skou", "tokenizers": {}, "node_i": "9510", "native_tokenizers": [], "scripts": [] } ], + "family": "Skou", "tokenizers": {}, "node_i": "9507", "native_tokenizers": [], diff --git a/data/Somahai.json b/data/Somahai.json index 8d2388998225919a1d3bb7592d9b3ed4720f2482..a0851094d3e352b5fda2664b0fef24a3c8b8b681 100644 --- a/data/Somahai.json +++ b/data/Somahai.json @@ -1,13 +1,16 @@ { "name": "Somahai", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Momina", + "depth": 1, "iso_1_code": null, "iso_3_code": "mmb", "children": [], + "family": "Somahai", "tokenizers": {}, "node_i": "9530", "native_tokenizers": [], @@ -15,15 +18,18 @@ }, { "name": "Momuna", + "depth": 1, "iso_1_code": null, "iso_3_code": "mqf", "children": [], + "family": "Somahai", "tokenizers": {}, "node_i": "9531", "native_tokenizers": [], "scripts": [] } ], + "family": "Somahai", "tokenizers": {}, "node_i": "9529", "native_tokenizers": [], diff --git a/data/South Bougainville.json b/data/South Bougainville.json index bd5f3a5ec5335142a90f163d99ae7306fea3ce02..e582d1a0c693549ec5612ba35e9942a2f5771a0f 100644 --- a/data/South Bougainville.json +++ b/data/South Bougainville.json @@ -1,18 +1,22 @@ { "name": "South Bougainville", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Buin", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Terei", + "depth": 2, "iso_1_code": null, "iso_3_code": "buo", "children": [], + "family": "South Bougainville", "tokenizers": {}, "node_i": "9564", "native_tokenizers": [], @@ -20,9 +24,11 @@ }, { "name": "Motuna", + "depth": 2, "iso_1_code": null, "iso_3_code": "siw", "children": [], + "family": "South Bougainville", "tokenizers": {}, "node_i": "9565", "native_tokenizers": [], @@ -30,15 +36,18 @@ }, { "name": "Uisai", + "depth": 2, "iso_1_code": null, "iso_3_code": "uis", "children": [], + "family": "South Bougainville", "tokenizers": {}, "node_i": "9566", "native_tokenizers": [], "scripts": [] } ], + "family": "South Bougainville", "tokenizers": {}, "node_i": "9563", "native_tokenizers": [], @@ -46,14 +55,17 @@ }, { "name": "Nasioi", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Koromira", + "depth": 2, "iso_1_code": null, "iso_3_code": "kqj", "children": [], + "family": "South Bougainville", "tokenizers": {}, "node_i": "9568", "native_tokenizers": [], @@ -61,9 +73,11 @@ }, { "name": "Daantanai\u2019", + "depth": 2, "iso_1_code": null, "iso_3_code": "lni", "children": [], + "family": "South Bougainville", "tokenizers": {}, "node_i": "9569", "native_tokenizers": [], @@ -71,9 +85,11 @@ }, { "name": "Naasioi", + "depth": 2, "iso_1_code": null, "iso_3_code": "nas", "children": [], + "family": "South Bougainville", "tokenizers": {}, "node_i": "9570", "native_tokenizers": [], @@ -83,9 +99,11 @@ }, { "name": "Sibe", + "depth": 2, "iso_1_code": null, "iso_3_code": "nco", "children": [], + "family": "South Bougainville", "tokenizers": {}, "node_i": "9571", "native_tokenizers": [], @@ -93,9 +111,11 @@ }, { "name": "Oune", + "depth": 2, "iso_1_code": null, "iso_3_code": "oue", "children": [], + "family": "South Bougainville", "tokenizers": {}, "node_i": "9572", "native_tokenizers": [], @@ -103,21 +123,25 @@ }, { "name": "Simeku", + "depth": 2, "iso_1_code": null, "iso_3_code": "smz", "children": [], + "family": "South Bougainville", "tokenizers": {}, "node_i": "9573", "native_tokenizers": [], "scripts": [] } ], + "family": "South Bougainville", "tokenizers": {}, "node_i": "9567", "native_tokenizers": [], "scripts": [] } ], + "family": "South Bougainville", "tokenizers": {}, "node_i": "9562", "native_tokenizers": [], diff --git a/data/South-Central Papuan.json b/data/South-Central Papuan.json index 15e051ec84fd769a33aa59c38f74458820c39fab..2a4d70e1a463399ea053d8cf0a429032975f9638 100644 --- a/data/South-Central Papuan.json +++ b/data/South-Central Papuan.json @@ -1,23 +1,28 @@ { "name": "South-Central Papuan", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Morehead-Upper Maro", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nambu", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Namo", + "depth": 3, "iso_1_code": null, "iso_3_code": "mxw", "children": [], + "family": "South-Central Papuan", "tokenizers": {}, "node_i": "9535", "native_tokenizers": [], @@ -25,9 +30,11 @@ }, { "name": "Nambo", + "depth": 3, "iso_1_code": null, "iso_3_code": "ncm", "children": [], + "family": "South-Central Papuan", "tokenizers": {}, "node_i": "9536", "native_tokenizers": [], @@ -35,9 +42,11 @@ }, { "name": "Neme", + "depth": 3, "iso_1_code": null, "iso_3_code": "nex", "children": [], + "family": "South-Central Papuan", "tokenizers": {}, "node_i": "9537", "native_tokenizers": [], @@ -45,9 +54,11 @@ }, { "name": "Namat", + "depth": 3, "iso_1_code": null, "iso_3_code": "nkm", "children": [], + "family": "South-Central Papuan", "tokenizers": {}, "node_i": "9538", "native_tokenizers": [], @@ -55,9 +66,11 @@ }, { "name": "Nama", + "depth": 3, "iso_1_code": null, "iso_3_code": "nmx", "children": [], + "family": "South-Central Papuan", "tokenizers": {}, "node_i": "9539", "native_tokenizers": [], @@ -65,15 +78,18 @@ }, { "name": "Nen", + "depth": 3, "iso_1_code": null, "iso_3_code": "nqn", "children": [], + "family": "South-Central Papuan", "tokenizers": {}, "node_i": "9540", "native_tokenizers": [], "scripts": [] } ], + "family": "South-Central Papuan", "tokenizers": {}, "node_i": "9534", "native_tokenizers": [], @@ -81,14 +97,17 @@ }, { "name": "Tonda", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Blafe", + "depth": 3, "iso_1_code": null, "iso_3_code": "bfh", "children": [], + "family": "South-Central Papuan", "tokenizers": {}, "node_i": "9542", "native_tokenizers": [], @@ -96,9 +115,11 @@ }, { "name": "Rema", + "depth": 3, "iso_1_code": null, "iso_3_code": "bow", "children": [], + "family": "South-Central Papuan", "tokenizers": {}, "node_i": "9543", "native_tokenizers": [], @@ -106,9 +127,11 @@ }, { "name": "Wartha Thuntai", + "depth": 3, "iso_1_code": null, "iso_3_code": "gnt", "children": [], + "family": "South-Central Papuan", "tokenizers": {}, "node_i": "9544", "native_tokenizers": [], @@ -116,9 +139,11 @@ }, { "name": "Kanum, Ngk\u00e2lmpw", + "depth": 3, "iso_1_code": null, "iso_3_code": "kcd", "children": [], + "family": "South-Central Papuan", "tokenizers": {}, "node_i": "9545", "native_tokenizers": [], @@ -126,9 +151,11 @@ }, { "name": "Kanum, B\u00e4di", + "depth": 3, "iso_1_code": null, "iso_3_code": "khd", "children": [], + "family": "South-Central Papuan", "tokenizers": {}, "node_i": "9546", "native_tokenizers": [], @@ -136,9 +163,11 @@ }, { "name": "Kanum, Sota", + "depth": 3, "iso_1_code": null, "iso_3_code": "krz", "children": [], + "family": "South-Central Papuan", "tokenizers": {}, "node_i": "9547", "native_tokenizers": [], @@ -146,9 +175,11 @@ }, { "name": "Kanum, Sm\u00e4rky", + "depth": 3, "iso_1_code": null, "iso_3_code": "kxq", "children": [], + "family": "South-Central Papuan", "tokenizers": {}, "node_i": "9548", "native_tokenizers": [], @@ -156,9 +187,11 @@ }, { "name": "Kanja", + "depth": 3, "iso_1_code": null, "iso_3_code": "pep", "children": [], + "family": "South-Central Papuan", "tokenizers": {}, "node_i": "9549", "native_tokenizers": [], @@ -166,9 +199,11 @@ }, { "name": "Aramba", + "depth": 3, "iso_1_code": null, "iso_3_code": "stk", "children": [], + "family": "South-Central Papuan", "tokenizers": {}, "node_i": "9550", "native_tokenizers": [], @@ -176,15 +211,18 @@ }, { "name": "W\u00e1ra", + "depth": 3, "iso_1_code": null, "iso_3_code": "tci", "children": [], + "family": "South-Central Papuan", "tokenizers": {}, "node_i": "9551", "native_tokenizers": [], "scripts": [] } ], + "family": "South-Central Papuan", "tokenizers": {}, "node_i": "9541", "native_tokenizers": [], @@ -192,26 +230,31 @@ }, { "name": "Yey", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Yei", + "depth": 3, "iso_1_code": null, "iso_3_code": "jei", "children": [], + "family": "South-Central Papuan", "tokenizers": {}, "node_i": "9553", "native_tokenizers": [], "scripts": [] } ], + "family": "South-Central Papuan", "tokenizers": {}, "node_i": "9552", "native_tokenizers": [], "scripts": [] } ], + "family": "South-Central Papuan", "tokenizers": {}, "node_i": "9533", "native_tokenizers": [], @@ -219,14 +262,17 @@ }, { "name": "Pahoturi", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Idi", + "depth": 2, "iso_1_code": null, "iso_3_code": "idi", "children": [], + "family": "South-Central Papuan", "tokenizers": {}, "node_i": "9555", "native_tokenizers": [], @@ -234,15 +280,18 @@ }, { "name": "Agob", + "depth": 2, "iso_1_code": null, "iso_3_code": "kit", "children": [], + "family": "South-Central Papuan", "tokenizers": {}, "node_i": "9556", "native_tokenizers": [], "scripts": [] } ], + "family": "South-Central Papuan", "tokenizers": {}, "node_i": "9554", "native_tokenizers": [], @@ -250,14 +299,17 @@ }, { "name": "Waia", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tabo", + "depth": 2, "iso_1_code": null, "iso_3_code": "knv", "children": [], + "family": "South-Central Papuan", "tokenizers": {}, "node_i": "9558", "native_tokenizers": [], @@ -266,6 +318,7 @@ ] } ], + "family": "South-Central Papuan", "tokenizers": {}, "node_i": "9557", "native_tokenizers": [], @@ -273,14 +326,17 @@ }, { "name": "Yelmek-Maklew", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Yelmek", + "depth": 2, "iso_1_code": null, "iso_3_code": "jel", "children": [], + "family": "South-Central Papuan", "tokenizers": {}, "node_i": "9560", "native_tokenizers": [], @@ -288,21 +344,25 @@ }, { "name": "Maklew", + "depth": 2, "iso_1_code": null, "iso_3_code": "mgf", "children": [], + "family": "South-Central Papuan", "tokenizers": {}, "node_i": "9561", "native_tokenizers": [], "scripts": [] } ], + "family": "South-Central Papuan", "tokenizers": {}, "node_i": "9559", "native_tokenizers": [], "scripts": [] } ], + "family": "South-Central Papuan", "tokenizers": {}, "node_i": "9532", "native_tokenizers": [], diff --git "a/data/S\303\241livan.json" "b/data/S\303\241livan.json" index 297571a210df6196d1a85624ae3c63a5773550f4..8a34fc5ff9e4bcf8dcaf0dff7012314fef9b2ae0 100644 --- "a/data/S\303\241livan.json" +++ "b/data/S\303\241livan.json" @@ -1,13 +1,16 @@ { "name": "S\u00e1livan", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "S\u00e1liba", + "depth": 1, "iso_1_code": null, "iso_3_code": "slc", "children": [], + "family": "S\u00e1livan", "tokenizers": {}, "node_i": "9575", "native_tokenizers": [], @@ -15,14 +18,17 @@ }, { "name": "Piaroa-Maco", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Piaroa", + "depth": 2, "iso_1_code": null, "iso_3_code": "pid", "children": [], + "family": "S\u00e1livan", "tokenizers": {}, "node_i": "9577", "native_tokenizers": [], @@ -30,21 +36,25 @@ }, { "name": "Maco", + "depth": 2, "iso_1_code": null, "iso_3_code": "wpc", "children": [], + "family": "S\u00e1livan", "tokenizers": {}, "node_i": "9578", "native_tokenizers": [], "scripts": [] } ], + "family": "S\u00e1livan", "tokenizers": {}, "node_i": "9576", "native_tokenizers": [], "scripts": [] } ], + "family": "S\u00e1livan", "tokenizers": {}, "node_i": "9574", "native_tokenizers": [], diff --git a/data/Tacanan.json b/data/Tacanan.json index 4c5b68684ce4caf755a0d1d7bf1f0f8e1175a383..3f7aec5d338b7512b9cfb24c433bc14b0ec4d60f 100644 --- a/data/Tacanan.json +++ b/data/Tacanan.json @@ -1,13 +1,16 @@ { "name": "Tacanan", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Cavine\u00f1a", + "depth": 1, "iso_1_code": null, "iso_3_code": "cav", "children": [], + "family": "Tacanan", "tokenizers": {}, "node_i": "9580", "native_tokenizers": [], @@ -17,14 +20,17 @@ }, { "name": "Chama", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ese Ejja", + "depth": 2, "iso_1_code": null, "iso_3_code": "ese", "children": [], + "family": "Tacanan", "tokenizers": {}, "node_i": "9582", "native_tokenizers": [], @@ -34,15 +40,18 @@ }, { "name": "Toromono", + "depth": 2, "iso_1_code": null, "iso_3_code": "tno", "children": [], + "family": "Tacanan", "tokenizers": {}, "node_i": "9583", "native_tokenizers": [], "scripts": [] } ], + "family": "Tacanan", "tokenizers": {}, "node_i": "9581", "native_tokenizers": [], @@ -50,14 +59,17 @@ }, { "name": "Tacana", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Araona", + "depth": 2, "iso_1_code": null, "iso_3_code": "aro", "children": [], + "family": "Tacanan", "tokenizers": {}, "node_i": "9585", "native_tokenizers": [], @@ -65,9 +77,11 @@ }, { "name": "Reyesano", + "depth": 2, "iso_1_code": null, "iso_3_code": "rey", "children": [], + "family": "Tacanan", "tokenizers": {}, "node_i": "9586", "native_tokenizers": [], @@ -75,9 +89,11 @@ }, { "name": "Tacana", + "depth": 2, "iso_1_code": null, "iso_3_code": "tna", "children": [], + "family": "Tacanan", "tokenizers": {}, "node_i": "9587", "native_tokenizers": [], @@ -86,12 +102,14 @@ ] } ], + "family": "Tacanan", "tokenizers": {}, "node_i": "9584", "native_tokenizers": [], "scripts": [] } ], + "family": "Tacanan", "tokenizers": {}, "node_i": "9579", "native_tokenizers": [], diff --git a/data/Takelman.json b/data/Takelman.json index b9a17d4f676378e6ed4b124850071c8c3e1a551b..68b29efa66e298b0fa8ca22b53b52ebd9757383d 100644 --- a/data/Takelman.json +++ b/data/Takelman.json @@ -1,13 +1,16 @@ { "name": "Takelman", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kalapuya", + "depth": 1, "iso_1_code": null, "iso_3_code": "kyl", "children": [], + "family": "Takelman", "tokenizers": {}, "node_i": "9589", "native_tokenizers": [], @@ -15,9 +18,11 @@ }, { "name": "Northern Kalapuya", + "depth": 1, "iso_1_code": null, "iso_3_code": "nrt", "children": [], + "family": "Takelman", "tokenizers": {}, "node_i": "9590", "native_tokenizers": [], @@ -25,15 +30,18 @@ }, { "name": "Southern Kalapuya", + "depth": 1, "iso_1_code": null, "iso_3_code": "sxk", "children": [], + "family": "Takelman", "tokenizers": {}, "node_i": "9591", "native_tokenizers": [], "scripts": [] } ], + "family": "Takelman", "tokenizers": {}, "node_i": "9588", "native_tokenizers": [], diff --git a/data/Tarascan.json b/data/Tarascan.json index 1d357806e048fabf1a063ae478d5e3b8e0d934aa..4e73ee2b9b6ecf89be46c4d2792195d6c1079d4a 100644 --- a/data/Tarascan.json +++ b/data/Tarascan.json @@ -1,13 +1,16 @@ { "name": "Tarascan", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Purepecha, Western Highland", + "depth": 1, "iso_1_code": null, "iso_3_code": "pua", "children": [], + "family": "Tarascan", "tokenizers": {}, "node_i": "9593", "native_tokenizers": [], @@ -17,9 +20,11 @@ }, { "name": "Purepecha", + "depth": 1, "iso_1_code": null, "iso_3_code": "tsz", "children": [], + "family": "Tarascan", "tokenizers": {}, "node_i": "9594", "native_tokenizers": [], @@ -28,6 +33,7 @@ ] } ], + "family": "Tarascan", "tokenizers": {}, "node_i": "9592", "native_tokenizers": [], diff --git a/data/Tequistlatecan.json b/data/Tequistlatecan.json index e61244478a994dfbc4d24dfe16560e830ee9310d..b0bb8d6b77e212b408964bc75fe6233e36d94380 100644 --- a/data/Tequistlatecan.json +++ b/data/Tequistlatecan.json @@ -1,13 +1,16 @@ { "name": "Tequistlatecan", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chontal, Highland Oaxaca", + "depth": 1, "iso_1_code": null, "iso_3_code": "chd", "children": [], + "family": "Tequistlatecan", "tokenizers": {}, "node_i": "9596", "native_tokenizers": [], @@ -17,15 +20,18 @@ }, { "name": "Chontal, Lowland Oaxaca", + "depth": 1, "iso_1_code": null, "iso_3_code": "clo", "children": [], + "family": "Tequistlatecan", "tokenizers": {}, "node_i": "9597", "native_tokenizers": [], "scripts": [] } ], + "family": "Tequistlatecan", "tokenizers": {}, "node_i": "9595", "native_tokenizers": [], diff --git a/data/Tiniguan.json b/data/Tiniguan.json index 2867ef1f5748ec322af1023e242ff926522a62e8..6d4158e2fdeb9cd3868a34654f9a0ed3283e12b7 100644 --- a/data/Tiniguan.json +++ b/data/Tiniguan.json @@ -1,19 +1,23 @@ { "name": "Tiniguan", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tinigua", + "depth": 1, "iso_1_code": null, "iso_3_code": "tit", "children": [], + "family": "Tiniguan", "tokenizers": {}, "node_i": "9599", "native_tokenizers": [], "scripts": [] } ], + "family": "Tiniguan", "tokenizers": {}, "node_i": "9598", "native_tokenizers": [], diff --git a/data/Tor-Kwerba.json b/data/Tor-Kwerba.json index 30fee78cd50a97cf229dc7b55b32700e14894b97..ccc3d298e181272971bc4af013942951c749bf61 100644 --- a/data/Tor-Kwerba.json +++ b/data/Tor-Kwerba.json @@ -1,29 +1,35 @@ { "name": "Tor-Kwerba", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Greater Kwerba", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Isirawa", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Isirawa", + "depth": 3, "iso_1_code": null, "iso_3_code": "srl", "children": [], + "family": "Tor-Kwerba", "tokenizers": {}, "node_i": "9603", "native_tokenizers": [], "scripts": [] } ], + "family": "Tor-Kwerba", "tokenizers": {}, "node_i": "9602", "native_tokenizers": [], @@ -31,19 +37,23 @@ }, { "name": "Kwerba", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nuclear", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bagusa", + "depth": 4, "iso_1_code": null, "iso_3_code": "bqb", "children": [], + "family": "Tor-Kwerba", "tokenizers": {}, "node_i": "9606", "native_tokenizers": [], @@ -51,9 +61,11 @@ }, { "name": "Kwerba", + "depth": 4, "iso_1_code": null, "iso_3_code": "kwe", "children": [], + "family": "Tor-Kwerba", "tokenizers": {}, "node_i": "9607", "native_tokenizers": [], @@ -61,9 +73,11 @@ }, { "name": "Trimuris", + "depth": 4, "iso_1_code": null, "iso_3_code": "tip", "children": [], + "family": "Tor-Kwerba", "tokenizers": {}, "node_i": "9608", "native_tokenizers": [], @@ -71,9 +85,11 @@ }, { "name": "Kauwera", + "depth": 4, "iso_1_code": null, "iso_3_code": "xau", "children": [], + "family": "Tor-Kwerba", "tokenizers": {}, "node_i": "9609", "native_tokenizers": [], @@ -81,15 +97,18 @@ }, { "name": "Kwerba Mamberamo", + "depth": 4, "iso_1_code": null, "iso_3_code": "xwr", "children": [], + "family": "Tor-Kwerba", "tokenizers": {}, "node_i": "9610", "native_tokenizers": [], "scripts": [] } ], + "family": "Tor-Kwerba", "tokenizers": {}, "node_i": "9605", "native_tokenizers": [], @@ -97,14 +116,17 @@ }, { "name": "West Coast", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Airoran", + "depth": 4, "iso_1_code": null, "iso_3_code": "air", "children": [], + "family": "Tor-Kwerba", "tokenizers": {}, "node_i": "9612", "native_tokenizers": [], @@ -112,27 +134,32 @@ }, { "name": "Samarokena", + "depth": 4, "iso_1_code": null, "iso_3_code": "tmj", "children": [], + "family": "Tor-Kwerba", "tokenizers": {}, "node_i": "9613", "native_tokenizers": [], "scripts": [] } ], + "family": "Tor-Kwerba", "tokenizers": {}, "node_i": "9611", "native_tokenizers": [], "scripts": [] } ], + "family": "Tor-Kwerba", "tokenizers": {}, "node_i": "9604", "native_tokenizers": [], "scripts": [] } ], + "family": "Tor-Kwerba", "tokenizers": {}, "node_i": "9601", "native_tokenizers": [], @@ -140,19 +167,23 @@ }, { "name": "Orya-Tor", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Orya", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Orya", + "depth": 3, "iso_1_code": null, "iso_3_code": "ury", "children": [], + "family": "Tor-Kwerba", "tokenizers": {}, "node_i": "9616", "native_tokenizers": [], @@ -161,6 +192,7 @@ ] } ], + "family": "Tor-Kwerba", "tokenizers": {}, "node_i": "9615", "native_tokenizers": [], @@ -168,20 +200,24 @@ }, { "name": "Sause", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Sause", + "depth": 3, "iso_1_code": null, "iso_3_code": "sao", "children": [], + "family": "Tor-Kwerba", "tokenizers": {}, "node_i": "9618", "native_tokenizers": [], "scripts": [] } ], + "family": "Tor-Kwerba", "tokenizers": {}, "node_i": "9617", "native_tokenizers": [], @@ -189,14 +225,17 @@ }, { "name": "Tor", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Betaf", + "depth": 3, "iso_1_code": null, "iso_3_code": "bfe", "children": [], + "family": "Tor-Kwerba", "tokenizers": {}, "node_i": "9620", "native_tokenizers": [], @@ -204,9 +243,11 @@ }, { "name": "Berik", + "depth": 3, "iso_1_code": null, "iso_3_code": "bkl", "children": [], + "family": "Tor-Kwerba", "tokenizers": {}, "node_i": "9621", "native_tokenizers": [], @@ -216,9 +257,11 @@ }, { "name": "Beneraf", + "depth": 3, "iso_1_code": null, "iso_3_code": "bnv", "children": [], + "family": "Tor-Kwerba", "tokenizers": {}, "node_i": "9622", "native_tokenizers": [], @@ -226,9 +269,11 @@ }, { "name": "Dabe", + "depth": 3, "iso_1_code": null, "iso_3_code": "dbe", "children": [], + "family": "Tor-Kwerba", "tokenizers": {}, "node_i": "9623", "native_tokenizers": [], @@ -236,9 +281,11 @@ }, { "name": "Itik", + "depth": 3, "iso_1_code": null, "iso_3_code": "itx", "children": [], + "family": "Tor-Kwerba", "tokenizers": {}, "node_i": "9624", "native_tokenizers": [], @@ -246,9 +293,11 @@ }, { "name": "Jofotek-Bromnya", + "depth": 3, "iso_1_code": null, "iso_3_code": "jbr", "children": [], + "family": "Tor-Kwerba", "tokenizers": {}, "node_i": "9625", "native_tokenizers": [], @@ -256,9 +305,11 @@ }, { "name": "Keijar", + "depth": 3, "iso_1_code": null, "iso_3_code": "kdy", "children": [], + "family": "Tor-Kwerba", "tokenizers": {}, "node_i": "9626", "native_tokenizers": [], @@ -266,9 +317,11 @@ }, { "name": "Kwinsu", + "depth": 3, "iso_1_code": null, "iso_3_code": "kuc", "children": [], + "family": "Tor-Kwerba", "tokenizers": {}, "node_i": "9627", "native_tokenizers": [], @@ -276,9 +329,11 @@ }, { "name": "Kwesten", + "depth": 3, "iso_1_code": null, "iso_3_code": "kwt", "children": [], + "family": "Tor-Kwerba", "tokenizers": {}, "node_i": "9628", "native_tokenizers": [], @@ -286,9 +341,11 @@ }, { "name": "Mander", + "depth": 3, "iso_1_code": null, "iso_3_code": "mqr", "children": [], + "family": "Tor-Kwerba", "tokenizers": {}, "node_i": "9629", "native_tokenizers": [], @@ -296,9 +353,11 @@ }, { "name": "Dineor", + "depth": 3, "iso_1_code": null, "iso_3_code": "mrx", "children": [], + "family": "Tor-Kwerba", "tokenizers": {}, "node_i": "9630", "native_tokenizers": [], @@ -306,9 +365,11 @@ }, { "name": "Vitou", + "depth": 3, "iso_1_code": null, "iso_3_code": "vto", "children": [], + "family": "Tor-Kwerba", "tokenizers": {}, "node_i": "9631", "native_tokenizers": [], @@ -316,27 +377,32 @@ }, { "name": "Wares", + "depth": 3, "iso_1_code": null, "iso_3_code": "wai", "children": [], + "family": "Tor-Kwerba", "tokenizers": {}, "node_i": "9632", "native_tokenizers": [], "scripts": [] } ], + "family": "Tor-Kwerba", "tokenizers": {}, "node_i": "9619", "native_tokenizers": [], "scripts": [] } ], + "family": "Tor-Kwerba", "tokenizers": {}, "node_i": "9614", "native_tokenizers": [], "scripts": [] } ], + "family": "Tor-Kwerba", "tokenizers": {}, "node_i": "9600", "native_tokenizers": [], diff --git a/data/Torricelli.json b/data/Torricelli.json index a5b01cae65552f553824107779d711a70b863cd5..5cabccc8cd895dacf32a94a6d4216625c1442ea7 100644 --- a/data/Torricelli.json +++ b/data/Torricelli.json @@ -1,23 +1,28 @@ { "name": "Torricelli", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kombio-Arapesh", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Arapesh", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Abu\u2019", + "depth": 3, "iso_1_code": null, "iso_3_code": "aah", "children": [], + "family": "Torricelli", "tokenizers": {}, "node_i": "9636", "native_tokenizers": [], @@ -25,9 +30,11 @@ }, { "name": "Mufian", + "depth": 3, "iso_1_code": null, "iso_3_code": "aoj", "children": [], + "family": "Torricelli", "tokenizers": {}, "node_i": "9637", "native_tokenizers": [], @@ -37,9 +44,11 @@ }, { "name": "Weri", + "depth": 3, "iso_1_code": null, "iso_3_code": "aon", "children": [], + "family": "Torricelli", "tokenizers": {}, "node_i": "9638", "native_tokenizers": [], @@ -47,9 +56,11 @@ }, { "name": "Bukiyip", + "depth": 3, "iso_1_code": null, "iso_3_code": "ape", "children": [], + "family": "Torricelli", "tokenizers": {}, "node_i": "9639", "native_tokenizers": [], @@ -58,6 +69,7 @@ ] } ], + "family": "Torricelli", "tokenizers": {}, "node_i": "9635", "native_tokenizers": [], @@ -65,14 +77,17 @@ }, { "name": "Kombio", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Aruek", + "depth": 3, "iso_1_code": null, "iso_3_code": "aur", "children": [], + "family": "Torricelli", "tokenizers": {}, "node_i": "9641", "native_tokenizers": [], @@ -80,9 +95,11 @@ }, { "name": "Eitiep", + "depth": 3, "iso_1_code": null, "iso_3_code": "eit", "children": [], + "family": "Torricelli", "tokenizers": {}, "node_i": "9642", "native_tokenizers": [], @@ -90,9 +107,11 @@ }, { "name": "Aro", + "depth": 3, "iso_1_code": null, "iso_3_code": "tei", "children": [], + "family": "Torricelli", "tokenizers": {}, "node_i": "9643", "native_tokenizers": [], @@ -100,9 +119,11 @@ }, { "name": "Wom", + "depth": 3, "iso_1_code": null, "iso_3_code": "wmo", "children": [], + "family": "Torricelli", "tokenizers": {}, "node_i": "9644", "native_tokenizers": [], @@ -110,9 +131,11 @@ }, { "name": "Kombio", + "depth": 3, "iso_1_code": null, "iso_3_code": "xbi", "children": [], + "family": "Torricelli", "tokenizers": {}, "node_i": "9645", "native_tokenizers": [], @@ -122,21 +145,25 @@ }, { "name": "Yambes", + "depth": 3, "iso_1_code": null, "iso_3_code": "ymb", "children": [], + "family": "Torricelli", "tokenizers": {}, "node_i": "9646", "native_tokenizers": [], "scripts": [] } ], + "family": "Torricelli", "tokenizers": {}, "node_i": "9640", "native_tokenizers": [], "scripts": [] } ], + "family": "Torricelli", "tokenizers": {}, "node_i": "9634", "native_tokenizers": [], @@ -144,25 +171,30 @@ }, { "name": "Maimai", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Beli", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Beli", + "depth": 3, "iso_1_code": null, "iso_3_code": "bey", "children": [], + "family": "Torricelli", "tokenizers": {}, "node_i": "9649", "native_tokenizers": [], "scripts": [] } ], + "family": "Torricelli", "tokenizers": {}, "node_i": "9648", "native_tokenizers": [], @@ -170,20 +202,24 @@ }, { "name": "Laeko-Libuat", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Laeko-Libuat", + "depth": 3, "iso_1_code": null, "iso_3_code": "lkl", "children": [], + "family": "Torricelli", "tokenizers": {}, "node_i": "9651", "native_tokenizers": [], "scripts": [] } ], + "family": "Torricelli", "tokenizers": {}, "node_i": "9650", "native_tokenizers": [], @@ -191,14 +227,17 @@ }, { "name": "Maimai Proper", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Heiyoho", + "depth": 3, "iso_1_code": null, "iso_3_code": "auk", "children": [], + "family": "Torricelli", "tokenizers": {}, "node_i": "9653", "native_tokenizers": [], @@ -206,9 +245,11 @@ }, { "name": "Siliput", + "depth": 3, "iso_1_code": null, "iso_3_code": "mkc", "children": [], + "family": "Torricelli", "tokenizers": {}, "node_i": "9654", "native_tokenizers": [], @@ -216,15 +257,18 @@ }, { "name": "Yahang", + "depth": 3, "iso_1_code": null, "iso_3_code": "rhp", "children": [], + "family": "Torricelli", "tokenizers": {}, "node_i": "9655", "native_tokenizers": [], "scripts": [] } ], + "family": "Torricelli", "tokenizers": {}, "node_i": "9652", "native_tokenizers": [], @@ -232,26 +276,31 @@ }, { "name": "Wiaki", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Minidien", + "depth": 3, "iso_1_code": null, "iso_3_code": "wii", "children": [], + "family": "Torricelli", "tokenizers": {}, "node_i": "9657", "native_tokenizers": [], "scripts": [] } ], + "family": "Torricelli", "tokenizers": {}, "node_i": "9656", "native_tokenizers": [], "scripts": [] } ], + "family": "Torricelli", "tokenizers": {}, "node_i": "9647", "native_tokenizers": [], @@ -259,14 +308,17 @@ }, { "name": "Marienberg", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bungain", + "depth": 2, "iso_1_code": null, "iso_3_code": "but", "children": [], + "family": "Torricelli", "tokenizers": {}, "node_i": "9659", "native_tokenizers": [], @@ -274,9 +326,11 @@ }, { "name": "Buna", + "depth": 2, "iso_1_code": null, "iso_3_code": "bvn", "children": [], + "family": "Torricelli", "tokenizers": {}, "node_i": "9660", "native_tokenizers": [], @@ -284,9 +338,11 @@ }, { "name": "Elepi", + "depth": 2, "iso_1_code": null, "iso_3_code": "ele", "children": [], + "family": "Torricelli", "tokenizers": {}, "node_i": "9661", "native_tokenizers": [], @@ -294,9 +350,11 @@ }, { "name": "Kamasau", + "depth": 2, "iso_1_code": null, "iso_3_code": "kms", "children": [], + "family": "Torricelli", "tokenizers": {}, "node_i": "9662", "native_tokenizers": [], @@ -306,9 +364,11 @@ }, { "name": "Juwar", + "depth": 2, "iso_1_code": null, "iso_3_code": "mwb", "children": [], + "family": "Torricelli", "tokenizers": {}, "node_i": "9663", "native_tokenizers": [], @@ -316,9 +376,11 @@ }, { "name": "Wiarumus", + "depth": 2, "iso_1_code": null, "iso_3_code": "tua", "children": [], + "family": "Torricelli", "tokenizers": {}, "node_i": "9664", "native_tokenizers": [], @@ -326,15 +388,18 @@ }, { "name": "Urimo", + "depth": 2, "iso_1_code": null, "iso_3_code": "urx", "children": [], + "family": "Torricelli", "tokenizers": {}, "node_i": "9665", "native_tokenizers": [], "scripts": [] } ], + "family": "Torricelli", "tokenizers": {}, "node_i": "9658", "native_tokenizers": [], @@ -342,14 +407,17 @@ }, { "name": "Monumbo", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Lilau", + "depth": 2, "iso_1_code": null, "iso_3_code": "lll", "children": [], + "family": "Torricelli", "tokenizers": {}, "node_i": "9667", "native_tokenizers": [], @@ -357,15 +425,18 @@ }, { "name": "Monumbo", + "depth": 2, "iso_1_code": null, "iso_3_code": "mxk", "children": [], + "family": "Torricelli", "tokenizers": {}, "node_i": "9668", "native_tokenizers": [], "scripts": [] } ], + "family": "Torricelli", "tokenizers": {}, "node_i": "9666", "native_tokenizers": [], @@ -373,14 +444,17 @@ }, { "name": "Urim", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Urim", + "depth": 2, "iso_1_code": null, "iso_3_code": "uri", "children": [], + "family": "Torricelli", "tokenizers": {}, "node_i": "9670", "native_tokenizers": [], @@ -389,6 +463,7 @@ ] } ], + "family": "Torricelli", "tokenizers": {}, "node_i": "9669", "native_tokenizers": [], @@ -396,19 +471,23 @@ }, { "name": "Wapei-Palei", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Palei", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ambrak", + "depth": 3, "iso_1_code": null, "iso_3_code": "aag", "children": [], + "family": "Torricelli", "tokenizers": {}, "node_i": "9673", "native_tokenizers": [], @@ -416,9 +495,11 @@ }, { "name": "Agi", + "depth": 3, "iso_1_code": null, "iso_3_code": "aif", "children": [], + "family": "Torricelli", "tokenizers": {}, "node_i": "9674", "native_tokenizers": [], @@ -426,9 +507,11 @@ }, { "name": "Mol", + "depth": 3, "iso_1_code": null, "iso_3_code": "alx", "children": [], + "family": "Torricelli", "tokenizers": {}, "node_i": "9675", "native_tokenizers": [], @@ -436,9 +519,11 @@ }, { "name": "Bragat", + "depth": 3, "iso_1_code": null, "iso_3_code": "aof", "children": [], + "family": "Torricelli", "tokenizers": {}, "node_i": "9676", "native_tokenizers": [], @@ -446,9 +531,11 @@ }, { "name": "Aruop", + "depth": 3, "iso_1_code": null, "iso_3_code": "lsr", "children": [], + "family": "Torricelli", "tokenizers": {}, "node_i": "9677", "native_tokenizers": [], @@ -456,9 +543,11 @@ }, { "name": "Nabi", + "depth": 3, "iso_1_code": null, "iso_3_code": "mty", "children": [], + "family": "Torricelli", "tokenizers": {}, "node_i": "9678", "native_tokenizers": [], @@ -466,9 +555,11 @@ }, { "name": "Wanap", + "depth": 3, "iso_1_code": null, "iso_3_code": "wnp", "children": [], + "family": "Torricelli", "tokenizers": {}, "node_i": "9679", "native_tokenizers": [], @@ -476,9 +567,11 @@ }, { "name": "Yangum Dey", + "depth": 3, "iso_1_code": null, "iso_3_code": "yde", "children": [], + "family": "Torricelli", "tokenizers": {}, "node_i": "9680", "native_tokenizers": [], @@ -486,9 +579,11 @@ }, { "name": "Yangum Gel", + "depth": 3, "iso_1_code": null, "iso_3_code": "ygl", "children": [], + "family": "Torricelli", "tokenizers": {}, "node_i": "9681", "native_tokenizers": [], @@ -496,15 +591,18 @@ }, { "name": "Yangum Mon", + "depth": 3, "iso_1_code": null, "iso_3_code": "ymo", "children": [], + "family": "Torricelli", "tokenizers": {}, "node_i": "9682", "native_tokenizers": [], "scripts": [] } ], + "family": "Torricelli", "tokenizers": {}, "node_i": "9672", "native_tokenizers": [], @@ -512,14 +610,17 @@ }, { "name": "Urat", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Urat", + "depth": 3, "iso_1_code": null, "iso_3_code": "urt", "children": [], + "family": "Torricelli", "tokenizers": {}, "node_i": "9684", "native_tokenizers": [], @@ -528,6 +629,7 @@ ] } ], + "family": "Torricelli", "tokenizers": {}, "node_i": "9683", "native_tokenizers": [], @@ -535,14 +637,17 @@ }, { "name": "Wapei", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Au", + "depth": 3, "iso_1_code": null, "iso_3_code": "avt", "children": [], + "family": "Torricelli", "tokenizers": {}, "node_i": "9686", "native_tokenizers": [], @@ -552,9 +657,11 @@ }, { "name": "Dia", + "depth": 3, "iso_1_code": null, "iso_3_code": "dia", "children": [], + "family": "Torricelli", "tokenizers": {}, "node_i": "9687", "native_tokenizers": [], @@ -562,9 +669,11 @@ }, { "name": "Elkei", + "depth": 3, "iso_1_code": null, "iso_3_code": "elk", "children": [], + "family": "Torricelli", "tokenizers": {}, "node_i": "9688", "native_tokenizers": [], @@ -572,9 +681,11 @@ }, { "name": "Gnau", + "depth": 3, "iso_1_code": null, "iso_3_code": "gnu", "children": [], + "family": "Torricelli", "tokenizers": {}, "node_i": "9689", "native_tokenizers": [], @@ -582,9 +693,11 @@ }, { "name": "Ningil", + "depth": 3, "iso_1_code": null, "iso_3_code": "niz", "children": [], + "family": "Torricelli", "tokenizers": {}, "node_i": "9690", "native_tokenizers": [], @@ -592,9 +705,11 @@ }, { "name": "Olo", + "depth": 3, "iso_1_code": null, "iso_3_code": "ong", "children": [], + "family": "Torricelli", "tokenizers": {}, "node_i": "9691", "native_tokenizers": [], @@ -604,9 +719,11 @@ }, { "name": "Sinagen", + "depth": 3, "iso_1_code": null, "iso_3_code": "siu", "children": [], + "family": "Torricelli", "tokenizers": {}, "node_i": "9692", "native_tokenizers": [], @@ -614,9 +731,11 @@ }, { "name": "Walman", + "depth": 3, "iso_1_code": null, "iso_3_code": "van", "children": [], + "family": "Torricelli", "tokenizers": {}, "node_i": "9693", "native_tokenizers": [], @@ -624,9 +743,11 @@ }, { "name": "Yeri", + "depth": 3, "iso_1_code": null, "iso_3_code": "yev", "children": [], + "family": "Torricelli", "tokenizers": {}, "node_i": "9694", "native_tokenizers": [], @@ -634,9 +755,11 @@ }, { "name": "Yis", + "depth": 3, "iso_1_code": null, "iso_3_code": "yis", "children": [], + "family": "Torricelli", "tokenizers": {}, "node_i": "9695", "native_tokenizers": [], @@ -644,9 +767,11 @@ }, { "name": "Yil", + "depth": 3, "iso_1_code": null, "iso_3_code": "yll", "children": [], + "family": "Torricelli", "tokenizers": {}, "node_i": "9696", "native_tokenizers": [], @@ -654,21 +779,25 @@ }, { "name": "Yau", + "depth": 3, "iso_1_code": null, "iso_3_code": "yyu", "children": [], + "family": "Torricelli", "tokenizers": {}, "node_i": "9697", "native_tokenizers": [], "scripts": [] } ], + "family": "Torricelli", "tokenizers": {}, "node_i": "9685", "native_tokenizers": [], "scripts": [] } ], + "family": "Torricelli", "tokenizers": {}, "node_i": "9671", "native_tokenizers": [], @@ -676,14 +805,17 @@ }, { "name": "West Wapei", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Seti", + "depth": 2, "iso_1_code": null, "iso_3_code": "sbi", "children": [], + "family": "Torricelli", "tokenizers": {}, "node_i": "9699", "native_tokenizers": [], @@ -691,9 +823,11 @@ }, { "name": "Seta", + "depth": 2, "iso_1_code": null, "iso_3_code": "stf", "children": [], + "family": "Torricelli", "tokenizers": {}, "node_i": "9700", "native_tokenizers": [], @@ -701,14 +835,17 @@ }, { "name": "One", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "One, Molmo", + "depth": 3, "iso_1_code": null, "iso_3_code": "aun", "children": [], + "family": "Torricelli", "tokenizers": {}, "node_i": "9702", "native_tokenizers": [], @@ -716,9 +853,11 @@ }, { "name": "One, Inebu", + "depth": 3, "iso_1_code": null, "iso_3_code": "oin", "children": [], + "family": "Torricelli", "tokenizers": {}, "node_i": "9703", "native_tokenizers": [], @@ -726,9 +865,11 @@ }, { "name": "One, Kwamtim", + "depth": 3, "iso_1_code": null, "iso_3_code": "okk", "children": [], + "family": "Torricelli", "tokenizers": {}, "node_i": "9704", "native_tokenizers": [], @@ -736,9 +877,11 @@ }, { "name": "One, Kabore", + "depth": 3, "iso_1_code": null, "iso_3_code": "onk", "children": [], + "family": "Torricelli", "tokenizers": {}, "node_i": "9705", "native_tokenizers": [], @@ -746,9 +889,11 @@ }, { "name": "One, Northern", + "depth": 3, "iso_1_code": null, "iso_3_code": "onr", "children": [], + "family": "Torricelli", "tokenizers": {}, "node_i": "9706", "native_tokenizers": [], @@ -756,27 +901,32 @@ }, { "name": "One, Southern", + "depth": 3, "iso_1_code": null, "iso_3_code": "osu", "children": [], + "family": "Torricelli", "tokenizers": {}, "node_i": "9707", "native_tokenizers": [], "scripts": [] } ], + "family": "Torricelli", "tokenizers": {}, "node_i": "9701", "native_tokenizers": [], "scripts": [] } ], + "family": "Torricelli", "tokenizers": {}, "node_i": "9698", "native_tokenizers": [], "scripts": [] } ], + "family": "Torricelli", "tokenizers": {}, "node_i": "9633", "native_tokenizers": [], diff --git a/data/Totonacan.json b/data/Totonacan.json index e1b7bac0cba4c5242390d34737b893f261fca329..6a5a60232ab576c8d6806a11eb5d03a0eae74315 100644 --- a/data/Totonacan.json +++ b/data/Totonacan.json @@ -1,18 +1,22 @@ { "name": "Totonacan", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tepehua", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tepehua, Huehuetla", + "depth": 2, "iso_1_code": null, "iso_3_code": "tee", "children": [], + "family": "Totonacan", "tokenizers": {}, "node_i": "9710", "native_tokenizers": [], @@ -22,9 +26,11 @@ }, { "name": "Tepehua, Pisaflores", + "depth": 2, "iso_1_code": null, "iso_3_code": "tpp", "children": [], + "family": "Totonacan", "tokenizers": {}, "node_i": "9711", "native_tokenizers": [], @@ -34,9 +40,11 @@ }, { "name": "Tepehua, Tlachichilco", + "depth": 2, "iso_1_code": null, "iso_3_code": "tpt", "children": [], + "family": "Totonacan", "tokenizers": {}, "node_i": "9712", "native_tokenizers": [], @@ -45,6 +53,7 @@ ] } ], + "family": "Totonacan", "tokenizers": {}, "node_i": "9709", "native_tokenizers": [], @@ -52,14 +61,17 @@ }, { "name": "Totonac", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Totonac, Tecpatl\u00e1n", + "depth": 2, "iso_1_code": null, "iso_3_code": "tcw", "children": [], + "family": "Totonacan", "tokenizers": {}, "node_i": "9714", "native_tokenizers": [], @@ -67,9 +79,11 @@ }, { "name": "Totonac, Upper Necaxa", + "depth": 2, "iso_1_code": null, "iso_3_code": "tku", "children": [], + "family": "Totonacan", "tokenizers": {}, "node_i": "9715", "native_tokenizers": [], @@ -79,9 +93,11 @@ }, { "name": "Totonac, Yecuatla", + "depth": 2, "iso_1_code": null, "iso_3_code": "tlc", "children": [], + "family": "Totonacan", "tokenizers": {}, "node_i": "9716", "native_tokenizers": [], @@ -89,9 +105,11 @@ }, { "name": "Totonac, Filomena Mata-Coahuitl\u00e1n", + "depth": 2, "iso_1_code": null, "iso_3_code": "tlp", "children": [], + "family": "Totonacan", "tokenizers": {}, "node_i": "9717", "native_tokenizers": [], @@ -99,9 +117,11 @@ }, { "name": "Totonac, Coyutla", + "depth": 2, "iso_1_code": null, "iso_3_code": "toc", "children": [], + "family": "Totonacan", "tokenizers": {}, "node_i": "9718", "native_tokenizers": [], @@ -111,9 +131,11 @@ }, { "name": "Totonac, Xicotepec de Ju\u00e1rez", + "depth": 2, "iso_1_code": null, "iso_3_code": "too", "children": [], + "family": "Totonacan", "tokenizers": {}, "node_i": "9719", "native_tokenizers": [], @@ -123,9 +145,11 @@ }, { "name": "Totonac, Papantla", + "depth": 2, "iso_1_code": null, "iso_3_code": "top", "children": [], + "family": "Totonacan", "tokenizers": {}, "node_i": "9720", "native_tokenizers": [], @@ -135,9 +159,11 @@ }, { "name": "Totonac, Highland", + "depth": 2, "iso_1_code": null, "iso_3_code": "tos", "children": [], + "family": "Totonacan", "tokenizers": {}, "node_i": "9721", "native_tokenizers": [], @@ -147,21 +173,25 @@ }, { "name": "Totonaco del cerro Xinolat\u00e9petl", + "depth": 2, "iso_1_code": null, "iso_3_code": "tqt", "children": [], + "family": "Totonacan", "tokenizers": {}, "node_i": "9722", "native_tokenizers": [], "scripts": [] } ], + "family": "Totonacan", "tokenizers": {}, "node_i": "9713", "native_tokenizers": [], "scripts": [] } ], + "family": "Totonacan", "tokenizers": {}, "node_i": "9708", "native_tokenizers": [], diff --git a/data/Trans-New Guinea.json b/data/Trans-New Guinea.json index 5687a9cb940937fc517457fdb8b41a45ba77cda1..3962efa2ee729a01de27fb84c7766e2306e656a7 100644 --- a/data/Trans-New Guinea.json +++ b/data/Trans-New Guinea.json @@ -1,23 +1,28 @@ { "name": "Trans-New Guinea", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Angan", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Angaatiha", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Angaataha", + "depth": 3, "iso_1_code": null, "iso_3_code": "agm", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9726", "native_tokenizers": [], @@ -26,6 +31,7 @@ ] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9725", "native_tokenizers": [], @@ -33,14 +39,17 @@ }, { "name": "Nuclear Angan", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ankave", + "depth": 3, "iso_1_code": null, "iso_3_code": "aak", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9728", "native_tokenizers": [], @@ -50,9 +59,11 @@ }, { "name": "Tainae", + "depth": 3, "iso_1_code": null, "iso_3_code": "ago", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9729", "native_tokenizers": [], @@ -60,9 +71,11 @@ }, { "name": "Safeyoka", + "depth": 3, "iso_1_code": null, "iso_3_code": "apz", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9730", "native_tokenizers": [], @@ -72,9 +85,11 @@ }, { "name": "Yipma", + "depth": 3, "iso_1_code": null, "iso_3_code": "byr", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9731", "native_tokenizers": [], @@ -84,9 +99,11 @@ }, { "name": "Hamtai", + "depth": 3, "iso_1_code": null, "iso_3_code": "hmt", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9732", "native_tokenizers": [], @@ -94,9 +111,11 @@ }, { "name": "Kawacha", + "depth": 3, "iso_1_code": null, "iso_3_code": "kcb", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9733", "native_tokenizers": [], @@ -104,9 +123,11 @@ }, { "name": "Kamasa", + "depth": 3, "iso_1_code": null, "iso_3_code": "klp", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9734", "native_tokenizers": [], @@ -114,9 +135,11 @@ }, { "name": "Menya", + "depth": 3, "iso_1_code": null, "iso_3_code": "mcr", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9735", "native_tokenizers": [], @@ -124,9 +147,11 @@ }, { "name": "Akoye", + "depth": 3, "iso_1_code": null, "iso_3_code": "miw", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9736", "native_tokenizers": [], @@ -134,9 +159,11 @@ }, { "name": "Simbari", + "depth": 3, "iso_1_code": null, "iso_3_code": "smb", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9737", "native_tokenizers": [], @@ -144,9 +171,11 @@ }, { "name": "Susuami", + "depth": 3, "iso_1_code": null, "iso_3_code": "ssu", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9738", "native_tokenizers": [], @@ -154,21 +183,25 @@ }, { "name": "Yagwoia", + "depth": 3, "iso_1_code": null, "iso_3_code": "ygw", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9739", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9727", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9724", "native_tokenizers": [], @@ -176,19 +209,23 @@ }, { "name": "Asmat-Kamoro", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Asmat", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Asmat, Casuarina Coast", + "depth": 3, "iso_1_code": null, "iso_3_code": "asc", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9742", "native_tokenizers": [], @@ -196,9 +233,11 @@ }, { "name": "Asmat, Yaosakor", + "depth": 3, "iso_1_code": null, "iso_3_code": "asy", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9743", "native_tokenizers": [], @@ -206,9 +245,11 @@ }, { "name": "Asmat, Central", + "depth": 3, "iso_1_code": null, "iso_3_code": "cns", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9744", "native_tokenizers": [], @@ -216,9 +257,11 @@ }, { "name": "Asmat, North", + "depth": 3, "iso_1_code": null, "iso_3_code": "nks", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9745", "native_tokenizers": [], @@ -226,9 +269,11 @@ }, { "name": "Citak, Tamnim", + "depth": 3, "iso_1_code": null, "iso_3_code": "tml", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9746", "native_tokenizers": [], @@ -236,15 +281,18 @@ }, { "name": "Citak", + "depth": 3, "iso_1_code": null, "iso_3_code": "txt", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9747", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9741", "native_tokenizers": [], @@ -252,20 +300,24 @@ }, { "name": "Diuwe", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Diuwe", + "depth": 3, "iso_1_code": null, "iso_3_code": "diy", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9749", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9748", "native_tokenizers": [], @@ -273,20 +325,24 @@ }, { "name": "Kamoro", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kamoro", + "depth": 3, "iso_1_code": null, "iso_3_code": "kgq", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9751", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9750", "native_tokenizers": [], @@ -294,14 +350,17 @@ }, { "name": "Sabakor", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Buruwai", + "depth": 3, "iso_1_code": null, "iso_3_code": "asi", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9753", "native_tokenizers": [], @@ -309,15 +368,18 @@ }, { "name": "Kamberau", + "depth": 3, "iso_1_code": null, "iso_3_code": "irx", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9754", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9752", "native_tokenizers": [], @@ -325,26 +387,31 @@ }, { "name": "Sempan", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Sempan", + "depth": 3, "iso_1_code": null, "iso_3_code": "xse", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9756", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9755", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9740", "native_tokenizers": [], @@ -352,14 +419,17 @@ }, { "name": "Awin-Pare", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Aekyom", + "depth": 2, "iso_1_code": null, "iso_3_code": "awi", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9758", "native_tokenizers": [], @@ -369,15 +439,18 @@ }, { "name": "Pa", + "depth": 2, "iso_1_code": null, "iso_3_code": "ppt", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9759", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9757", "native_tokenizers": [], @@ -385,14 +458,17 @@ }, { "name": "Bosavi", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Eibela", + "depth": 2, "iso_1_code": null, "iso_3_code": "ail", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9761", "native_tokenizers": [], @@ -400,9 +476,11 @@ }, { "name": "Kaluli", + "depth": 2, "iso_1_code": null, "iso_3_code": "bco", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9762", "native_tokenizers": [], @@ -412,9 +490,11 @@ }, { "name": "Bedamuni", + "depth": 2, "iso_1_code": null, "iso_3_code": "beo", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9763", "native_tokenizers": [], @@ -422,9 +502,11 @@ }, { "name": "Dibiyaso", + "depth": 2, "iso_1_code": null, "iso_3_code": "dby", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9764", "native_tokenizers": [], @@ -432,9 +514,11 @@ }, { "name": "Edolo", + "depth": 2, "iso_1_code": null, "iso_3_code": "etr", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9765", "native_tokenizers": [], @@ -444,9 +528,11 @@ }, { "name": "Kasua", + "depth": 2, "iso_1_code": null, "iso_3_code": "khs", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9766", "native_tokenizers": [], @@ -456,9 +542,11 @@ }, { "name": "Onobasulu", + "depth": 2, "iso_1_code": null, "iso_3_code": "onn", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9767", "native_tokenizers": [], @@ -466,9 +554,11 @@ }, { "name": "Sonia", + "depth": 2, "iso_1_code": null, "iso_3_code": "siq", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9768", "native_tokenizers": [], @@ -476,15 +566,18 @@ }, { "name": "Turumsa", + "depth": 2, "iso_1_code": null, "iso_3_code": "tqm", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9769", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9760", "native_tokenizers": [], @@ -492,19 +585,23 @@ }, { "name": "Chimbu-Wahgi", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chimbu", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chuave", + "depth": 3, "iso_1_code": null, "iso_3_code": "cjv", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9772", "native_tokenizers": [], @@ -514,9 +611,11 @@ }, { "name": "Dom", + "depth": 3, "iso_1_code": null, "iso_3_code": "doa", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9773", "native_tokenizers": [], @@ -524,9 +623,11 @@ }, { "name": "Golin", + "depth": 3, "iso_1_code": null, "iso_3_code": "gvf", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9774", "native_tokenizers": [], @@ -536,9 +637,11 @@ }, { "name": "Kuman", + "depth": 3, "iso_1_code": null, "iso_3_code": "kue", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9775", "native_tokenizers": [], @@ -548,9 +651,11 @@ }, { "name": "Nomane", + "depth": 3, "iso_1_code": null, "iso_3_code": "nof", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9776", "native_tokenizers": [], @@ -558,9 +663,11 @@ }, { "name": "Yui", + "depth": 3, "iso_1_code": null, "iso_3_code": "sll", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9777", "native_tokenizers": [], @@ -570,15 +677,18 @@ }, { "name": "Sinasina", + "depth": 3, "iso_1_code": null, "iso_3_code": "sst", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9778", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9771", "native_tokenizers": [], @@ -586,19 +696,23 @@ }, { "name": "Hagen", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kaugel", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Imbongu", + "depth": 4, "iso_1_code": null, "iso_3_code": "imo", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9781", "native_tokenizers": [], @@ -608,9 +722,11 @@ }, { "name": "Bo-Ung", + "depth": 4, "iso_1_code": null, "iso_3_code": "mux", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9782", "native_tokenizers": [], @@ -620,9 +736,11 @@ }, { "name": "Umbu-Ungu", + "depth": 4, "iso_1_code": null, "iso_3_code": "ubu", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9783", "native_tokenizers": [], @@ -631,6 +749,7 @@ ] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9780", "native_tokenizers": [], @@ -638,14 +757,17 @@ }, { "name": "Melpa", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Melpa", + "depth": 4, "iso_1_code": null, "iso_3_code": "med", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9785", "native_tokenizers": [], @@ -654,12 +776,14 @@ ] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9784", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9779", "native_tokenizers": [], @@ -667,14 +791,17 @@ }, { "name": "Jimi", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kandawo", + "depth": 3, "iso_1_code": null, "iso_3_code": "gam", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9787", "native_tokenizers": [], @@ -684,9 +811,11 @@ }, { "name": "Maring", + "depth": 3, "iso_1_code": null, "iso_3_code": "mbw", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9788", "native_tokenizers": [], @@ -694,15 +823,18 @@ }, { "name": "Narak", + "depth": 3, "iso_1_code": null, "iso_3_code": "nac", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9789", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9786", "native_tokenizers": [], @@ -710,14 +842,17 @@ }, { "name": "Wahgi", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nii", + "depth": 3, "iso_1_code": null, "iso_3_code": "nii", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9791", "native_tokenizers": [], @@ -727,9 +862,11 @@ }, { "name": "Wahgi", + "depth": 3, "iso_1_code": null, "iso_3_code": "wgi", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9792", "native_tokenizers": [], @@ -737,9 +874,11 @@ }, { "name": "Yuwei", + "depth": 3, "iso_1_code": null, "iso_3_code": "whg", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9793", "native_tokenizers": [], @@ -748,12 +887,14 @@ ] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9790", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9770", "native_tokenizers": [], @@ -761,20 +902,24 @@ }, { "name": "Damal", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Damal", + "depth": 2, "iso_1_code": null, "iso_3_code": "uhn", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9795", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9794", "native_tokenizers": [], @@ -782,20 +927,24 @@ }, { "name": "Dem", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dem", + "depth": 2, "iso_1_code": null, "iso_3_code": "dem", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9797", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9796", "native_tokenizers": [], @@ -803,14 +952,17 @@ }, { "name": "Duna-Bogaya", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bogaya", + "depth": 2, "iso_1_code": null, "iso_3_code": "boq", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9799", "native_tokenizers": [], @@ -818,15 +970,18 @@ }, { "name": "Duna", + "depth": 2, "iso_1_code": null, "iso_3_code": "duc", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9800", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9798", "native_tokenizers": [], @@ -834,14 +989,17 @@ }, { "name": "East Kutubu", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Fiwaga", + "depth": 2, "iso_1_code": null, "iso_3_code": "fiw", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9802", "native_tokenizers": [], @@ -849,15 +1007,18 @@ }, { "name": "Foi", + "depth": 2, "iso_1_code": null, "iso_3_code": "foi", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9803", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9801", "native_tokenizers": [], @@ -865,14 +1026,17 @@ }, { "name": "East Strickland", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Fembe", + "depth": 2, "iso_1_code": null, "iso_3_code": "agl", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9805", "native_tokenizers": [], @@ -880,9 +1044,11 @@ }, { "name": "Gebusi", + "depth": 2, "iso_1_code": null, "iso_3_code": "goi", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9806", "native_tokenizers": [], @@ -890,9 +1056,11 @@ }, { "name": "Kubo", + "depth": 2, "iso_1_code": null, "iso_3_code": "jko", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9807", "native_tokenizers": [], @@ -900,9 +1068,11 @@ }, { "name": "Odoodee", + "depth": 2, "iso_1_code": null, "iso_3_code": "kkc", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9808", "native_tokenizers": [], @@ -912,9 +1082,11 @@ }, { "name": "Konai", + "depth": 2, "iso_1_code": null, "iso_3_code": "kxw", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9809", "native_tokenizers": [], @@ -924,15 +1096,18 @@ }, { "name": "Samo", + "depth": 2, "iso_1_code": null, "iso_3_code": "smq", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9810", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9804", "native_tokenizers": [], @@ -940,24 +1115,29 @@ }, { "name": "Eleman", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nuclear Eleman", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Eastern", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Toaripi", + "depth": 4, "iso_1_code": null, "iso_3_code": "tqo", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9814", "native_tokenizers": [], @@ -967,15 +1147,18 @@ }, { "name": "Tairuma", + "depth": 4, "iso_1_code": null, "iso_3_code": "uar", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9815", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9813", "native_tokenizers": [], @@ -983,14 +1166,17 @@ }, { "name": "Western", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Opao", + "depth": 4, "iso_1_code": null, "iso_3_code": "opo", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9817", "native_tokenizers": [], @@ -998,9 +1184,11 @@ }, { "name": "Orokolo", + "depth": 4, "iso_1_code": null, "iso_3_code": "oro", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9818", "native_tokenizers": [], @@ -1008,21 +1196,25 @@ }, { "name": "Keoru-Ahia", + "depth": 4, "iso_1_code": null, "iso_3_code": "xeu", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9819", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9816", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9812", "native_tokenizers": [], @@ -1030,20 +1222,24 @@ }, { "name": "Purari", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Purari", + "depth": 3, "iso_1_code": null, "iso_3_code": "iar", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9821", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9820", "native_tokenizers": [], @@ -1051,26 +1247,31 @@ }, { "name": "Tate", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kaki Ae", + "depth": 3, "iso_1_code": null, "iso_3_code": "tbd", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9823", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9822", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9811", "native_tokenizers": [], @@ -1078,19 +1279,23 @@ }, { "name": "Engan", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Angal-Kewa", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Angal", + "depth": 3, "iso_1_code": null, "iso_3_code": "age", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9826", "native_tokenizers": [], @@ -1098,9 +1303,11 @@ }, { "name": "Angal Heneng", + "depth": 3, "iso_1_code": null, "iso_3_code": "akh", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9827", "native_tokenizers": [], @@ -1110,9 +1317,11 @@ }, { "name": "Angal Enen", + "depth": 3, "iso_1_code": null, "iso_3_code": "aoe", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9828", "native_tokenizers": [], @@ -1120,9 +1329,11 @@ }, { "name": "Kewapi, West", + "depth": 3, "iso_1_code": null, "iso_3_code": "kew", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9829", "native_tokenizers": [], @@ -1132,9 +1343,11 @@ }, { "name": "Kewapi, East", + "depth": 3, "iso_1_code": null, "iso_3_code": "kjs", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9830", "native_tokenizers": [], @@ -1144,9 +1357,11 @@ }, { "name": "Pole", + "depth": 3, "iso_1_code": null, "iso_3_code": "kjy", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9831", "native_tokenizers": [], @@ -1154,9 +1369,11 @@ }, { "name": "Samberigi", + "depth": 3, "iso_1_code": null, "iso_3_code": "ssx", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9832", "native_tokenizers": [], @@ -1165,6 +1382,7 @@ ] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9825", "native_tokenizers": [], @@ -1172,14 +1390,17 @@ }, { "name": "Enga", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bisorio", + "depth": 3, "iso_1_code": null, "iso_3_code": "bir", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9834", "native_tokenizers": [], @@ -1187,9 +1408,11 @@ }, { "name": "Enga", + "depth": 3, "iso_1_code": null, "iso_3_code": "enq", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9835", "native_tokenizers": [], @@ -1199,9 +1422,11 @@ }, { "name": "Ipili", + "depth": 3, "iso_1_code": null, "iso_3_code": "ipi", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9836", "native_tokenizers": [], @@ -1211,9 +1436,11 @@ }, { "name": "Kyaka", + "depth": 3, "iso_1_code": null, "iso_3_code": "kyc", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9837", "native_tokenizers": [], @@ -1223,9 +1450,11 @@ }, { "name": "Lembena", + "depth": 3, "iso_1_code": null, "iso_3_code": "leq", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9838", "native_tokenizers": [], @@ -1233,15 +1462,18 @@ }, { "name": "Nete", + "depth": 3, "iso_1_code": null, "iso_3_code": "net", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9839", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9833", "native_tokenizers": [], @@ -1249,14 +1481,17 @@ }, { "name": "Huli", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Huli", + "depth": 3, "iso_1_code": null, "iso_3_code": "hui", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9841", "native_tokenizers": [], @@ -1265,12 +1500,14 @@ ] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9840", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9824", "native_tokenizers": [], @@ -1278,24 +1515,29 @@ }, { "name": "Finisterre-Huon", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Finisterre", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Erap", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Finongan", + "depth": 4, "iso_1_code": null, "iso_3_code": "fag", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9845", "native_tokenizers": [], @@ -1303,9 +1545,11 @@ }, { "name": "Nema", + "depth": 4, "iso_1_code": null, "iso_3_code": "gsn", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9846", "native_tokenizers": [], @@ -1313,9 +1557,11 @@ }, { "name": "Doloman", + "depth": 4, "iso_1_code": null, "iso_3_code": "mhf", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9847", "native_tokenizers": [], @@ -1323,9 +1569,11 @@ }, { "name": "Mungkip", + "depth": 4, "iso_1_code": null, "iso_3_code": "mpv", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9848", "native_tokenizers": [], @@ -1333,9 +1581,11 @@ }, { "name": "Nakame", + "depth": 4, "iso_1_code": null, "iso_3_code": "nib", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9849", "native_tokenizers": [], @@ -1343,9 +1593,11 @@ }, { "name": "Nek", + "depth": 4, "iso_1_code": null, "iso_3_code": "nif", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9850", "native_tokenizers": [], @@ -1355,9 +1607,11 @@ }, { "name": "Sama", + "depth": 4, "iso_1_code": null, "iso_3_code": "nis", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9851", "native_tokenizers": [], @@ -1365,9 +1619,11 @@ }, { "name": "Nuk", + "depth": 4, "iso_1_code": null, "iso_3_code": "noc", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9852", "native_tokenizers": [], @@ -1375,9 +1631,11 @@ }, { "name": "Numanggang", + "depth": 4, "iso_1_code": null, "iso_3_code": "nop", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9853", "native_tokenizers": [], @@ -1387,9 +1645,11 @@ }, { "name": "Ma Manda", + "depth": 4, "iso_1_code": null, "iso_3_code": "skc", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9854", "native_tokenizers": [], @@ -1397,9 +1657,11 @@ }, { "name": "Uri", + "depth": 4, "iso_1_code": null, "iso_3_code": "uvh", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9855", "native_tokenizers": [], @@ -1408,6 +1670,7 @@ ] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9844", "native_tokenizers": [], @@ -1415,14 +1678,17 @@ }, { "name": "Gusap-Mot", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Madi", + "depth": 4, "iso_1_code": null, "iso_3_code": "grg", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9857", "native_tokenizers": [], @@ -1430,9 +1696,11 @@ }, { "name": "Iyo", + "depth": 4, "iso_1_code": null, "iso_3_code": "nca", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9858", "native_tokenizers": [], @@ -1442,9 +1710,11 @@ }, { "name": "Neko", + "depth": 4, "iso_1_code": null, "iso_3_code": "nej", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9859", "native_tokenizers": [], @@ -1452,9 +1722,11 @@ }, { "name": "Nekgini", + "depth": 4, "iso_1_code": null, "iso_3_code": "nkg", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9860", "native_tokenizers": [], @@ -1462,9 +1734,11 @@ }, { "name": "Ngaing", + "depth": 4, "iso_1_code": null, "iso_3_code": "nnf", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9861", "native_tokenizers": [], @@ -1472,9 +1746,11 @@ }, { "name": "Rawa", + "depth": 4, "iso_1_code": null, "iso_3_code": "rwo", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9862", "native_tokenizers": [], @@ -1484,15 +1760,18 @@ }, { "name": "Ufim", + "depth": 4, "iso_1_code": null, "iso_3_code": "ufi", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9863", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9856", "native_tokenizers": [], @@ -1500,14 +1779,17 @@ }, { "name": "Uruwa", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Weliki", + "depth": 4, "iso_1_code": null, "iso_3_code": "klh", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9865", "native_tokenizers": [], @@ -1515,9 +1797,11 @@ }, { "name": "Nukna", + "depth": 4, "iso_1_code": null, "iso_3_code": "klt", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9866", "native_tokenizers": [], @@ -1527,9 +1811,11 @@ }, { "name": "Kutong", + "depth": 4, "iso_1_code": null, "iso_3_code": "skm", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9867", "native_tokenizers": [], @@ -1537,9 +1823,11 @@ }, { "name": "Tayatuk", + "depth": 4, "iso_1_code": null, "iso_3_code": "smc", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9868", "native_tokenizers": [], @@ -1547,9 +1835,11 @@ }, { "name": "Yau", + "depth": 4, "iso_1_code": null, "iso_3_code": "yuw", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9869", "native_tokenizers": [], @@ -1558,6 +1848,7 @@ ] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9864", "native_tokenizers": [], @@ -1565,14 +1856,17 @@ }, { "name": "Wantoat", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Awara", + "depth": 4, "iso_1_code": null, "iso_3_code": "awx", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9871", "native_tokenizers": [], @@ -1582,9 +1876,11 @@ }, { "name": "Tuma-Irumu", + "depth": 4, "iso_1_code": null, "iso_3_code": "iou", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9872", "native_tokenizers": [], @@ -1594,9 +1890,11 @@ }, { "name": "Wantoat", + "depth": 4, "iso_1_code": null, "iso_3_code": "wnc", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9873", "native_tokenizers": [], @@ -1605,6 +1903,7 @@ ] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9870", "native_tokenizers": [], @@ -1612,14 +1911,17 @@ }, { "name": "Warup", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Muratayak", + "depth": 4, "iso_1_code": null, "iso_3_code": "asx", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9875", "native_tokenizers": [], @@ -1627,9 +1929,11 @@ }, { "name": "Gamane", + "depth": 4, "iso_1_code": null, "iso_3_code": "bmp", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9876", "native_tokenizers": [], @@ -1637,9 +1941,11 @@ }, { "name": "Gwahatike", + "depth": 4, "iso_1_code": null, "iso_3_code": "dah", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9877", "native_tokenizers": [], @@ -1649,9 +1955,11 @@ }, { "name": "Degenang", + "depth": 4, "iso_1_code": null, "iso_3_code": "dge", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9878", "native_tokenizers": [], @@ -1659,9 +1967,11 @@ }, { "name": "Forak", + "depth": 4, "iso_1_code": null, "iso_3_code": "frq", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9879", "native_tokenizers": [], @@ -1669,9 +1979,11 @@ }, { "name": "Guya", + "depth": 4, "iso_1_code": null, "iso_3_code": "gka", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9880", "native_tokenizers": [], @@ -1679,9 +1991,11 @@ }, { "name": "Asaro\u2019o", + "depth": 4, "iso_1_code": null, "iso_3_code": "mtv", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9881", "native_tokenizers": [], @@ -1689,15 +2003,18 @@ }, { "name": "Tand\u0268", + "depth": 4, "iso_1_code": null, "iso_3_code": "ygm", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9882", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9874", "native_tokenizers": [], @@ -1705,14 +2022,17 @@ }, { "name": "Yupna", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bonkiman", + "depth": 4, "iso_1_code": null, "iso_3_code": "bop", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9884", "native_tokenizers": [], @@ -1720,9 +2040,11 @@ }, { "name": "Domung", + "depth": 4, "iso_1_code": null, "iso_3_code": "dev", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9885", "native_tokenizers": [], @@ -1730,9 +2052,11 @@ }, { "name": "Ma", + "depth": 4, "iso_1_code": null, "iso_3_code": "mjn", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9886", "native_tokenizers": [], @@ -1740,9 +2064,11 @@ }, { "name": "Nankina", + "depth": 4, "iso_1_code": null, "iso_3_code": "nnk", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9887", "native_tokenizers": [], @@ -1750,9 +2076,11 @@ }, { "name": "Yout Wam", + "depth": 4, "iso_1_code": null, "iso_3_code": "ytw", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9888", "native_tokenizers": [], @@ -1760,9 +2088,11 @@ }, { "name": "Yopno", + "depth": 4, "iso_1_code": null, "iso_3_code": "yut", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9889", "native_tokenizers": [], @@ -1771,12 +2101,14 @@ ] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9883", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9843", "native_tokenizers": [], @@ -1784,19 +2116,23 @@ }, { "name": "Huon", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Eastern", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dedua", + "depth": 4, "iso_1_code": null, "iso_3_code": "ded", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9892", "native_tokenizers": [], @@ -1806,9 +2142,11 @@ }, { "name": "Kube", + "depth": 4, "iso_1_code": null, "iso_3_code": "kgf", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9893", "native_tokenizers": [], @@ -1818,9 +2156,11 @@ }, { "name": "K\u00e2te", + "depth": 4, "iso_1_code": null, "iso_3_code": "kmg", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9894", "native_tokenizers": [], @@ -1830,9 +2170,11 @@ }, { "name": "Borong", + "depth": 4, "iso_1_code": null, "iso_3_code": "ksr", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9895", "native_tokenizers": [], @@ -1842,9 +2184,11 @@ }, { "name": "Mape", + "depth": 4, "iso_1_code": null, "iso_3_code": "mlh", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9896", "native_tokenizers": [], @@ -1854,9 +2198,11 @@ }, { "name": "Migabac", + "depth": 4, "iso_1_code": null, "iso_3_code": "mpp", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9897", "native_tokenizers": [], @@ -1866,9 +2212,11 @@ }, { "name": "Momare", + "depth": 4, "iso_1_code": null, "iso_3_code": "msz", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9898", "native_tokenizers": [], @@ -1876,15 +2224,18 @@ }, { "name": "Sene", + "depth": 4, "iso_1_code": null, "iso_3_code": "sej", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9899", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9891", "native_tokenizers": [], @@ -1892,20 +2243,24 @@ }, { "name": "Kovai", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kovai", + "depth": 4, "iso_1_code": null, "iso_3_code": "kqb", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9901", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9900", "native_tokenizers": [], @@ -1913,14 +2268,17 @@ }, { "name": "Western", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Somba-Siawari", + "depth": 4, "iso_1_code": null, "iso_3_code": "bmu", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9903", "native_tokenizers": [], @@ -1930,9 +2288,11 @@ }, { "name": "Kinalakna", + "depth": 4, "iso_1_code": null, "iso_3_code": "kco", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9904", "native_tokenizers": [], @@ -1940,9 +2300,11 @@ }, { "name": "Komba", + "depth": 4, "iso_1_code": null, "iso_3_code": "kpf", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9905", "native_tokenizers": [], @@ -1952,9 +2314,11 @@ }, { "name": "Kumukio", + "depth": 4, "iso_1_code": null, "iso_3_code": "kuo", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9906", "native_tokenizers": [], @@ -1962,9 +2326,11 @@ }, { "name": "Mesem", + "depth": 4, "iso_1_code": null, "iso_3_code": "mci", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9907", "native_tokenizers": [], @@ -1972,9 +2338,11 @@ }, { "name": "Nabak", + "depth": 4, "iso_1_code": null, "iso_3_code": "naf", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9908", "native_tokenizers": [], @@ -1984,9 +2352,11 @@ }, { "name": "Nomu", + "depth": 4, "iso_1_code": null, "iso_3_code": "noh", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9909", "native_tokenizers": [], @@ -1994,9 +2364,11 @@ }, { "name": "Ono", + "depth": 4, "iso_1_code": null, "iso_3_code": "ons", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9910", "native_tokenizers": [], @@ -2006,9 +2378,11 @@ }, { "name": "Sialum", + "depth": 4, "iso_1_code": null, "iso_3_code": "slw", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9911", "native_tokenizers": [], @@ -2016,9 +2390,11 @@ }, { "name": "Selepet", + "depth": 4, "iso_1_code": null, "iso_3_code": "spl", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9912", "native_tokenizers": [], @@ -2028,9 +2404,11 @@ }, { "name": "Tobo", + "depth": 4, "iso_1_code": null, "iso_3_code": "tbv", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9913", "native_tokenizers": [], @@ -2038,9 +2416,11 @@ }, { "name": "Timbe", + "depth": 4, "iso_1_code": null, "iso_3_code": "tim", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9914", "native_tokenizers": [], @@ -2049,18 +2429,21 @@ ] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9902", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9890", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9842", "native_tokenizers": [], @@ -2068,19 +2451,23 @@ }, { "name": "Gogodala-Suki", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Gogodala", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ari", + "depth": 3, "iso_1_code": null, "iso_3_code": "aac", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9917", "native_tokenizers": [], @@ -2088,9 +2475,11 @@ }, { "name": "Gogodala", + "depth": 3, "iso_1_code": null, "iso_3_code": "ggw", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9918", "native_tokenizers": [], @@ -2098,15 +2487,18 @@ }, { "name": "Waruna", + "depth": 3, "iso_1_code": null, "iso_3_code": "wrv", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9919", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9916", "native_tokenizers": [], @@ -2114,26 +2506,31 @@ }, { "name": "Suki", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Suki", + "depth": 3, "iso_1_code": null, "iso_3_code": "sui", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9921", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9920", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9915", "native_tokenizers": [], @@ -2141,24 +2538,29 @@ }, { "name": "Greater Binanderean", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Binanderean", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "North Binanderean", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Suena", + "depth": 4, "iso_1_code": null, "iso_3_code": "sue", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9925", "native_tokenizers": [], @@ -2168,9 +2570,11 @@ }, { "name": "Zia", + "depth": 4, "iso_1_code": null, "iso_3_code": "zia", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9926", "native_tokenizers": [], @@ -2179,6 +2583,7 @@ ] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9924", "native_tokenizers": [], @@ -2186,19 +2591,23 @@ }, { "name": "Nuclear Binanderean", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Binandere", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Binandere", + "depth": 5, "iso_1_code": null, "iso_3_code": "bhg", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9929", "native_tokenizers": [], @@ -2207,6 +2616,7 @@ ] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9928", "native_tokenizers": [], @@ -2214,24 +2624,29 @@ }, { "name": "South Binanderean", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Coastal Binanderean", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Baruga", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Baruga", + "depth": 7, "iso_1_code": null, "iso_3_code": "bjz", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9933", "native_tokenizers": [], @@ -2239,15 +2654,18 @@ }, { "name": "Doghoro", + "depth": 7, "iso_1_code": null, "iso_3_code": "dgx", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9934", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9932", "native_tokenizers": [], @@ -2255,14 +2673,17 @@ }, { "name": "Gaena-Korafe", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Gaina", + "depth": 7, "iso_1_code": null, "iso_3_code": "gcn", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9936", "native_tokenizers": [], @@ -2270,9 +2691,11 @@ }, { "name": "Korafe-Yegha", + "depth": 7, "iso_1_code": null, "iso_3_code": "kpr", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9937", "native_tokenizers": [], @@ -2281,6 +2704,7 @@ ] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9935", "native_tokenizers": [], @@ -2288,14 +2712,17 @@ }, { "name": "Notu", + "depth": 6, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ewage-Notu", + "depth": 7, "iso_1_code": null, "iso_3_code": "nou", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9939", "native_tokenizers": [], @@ -2304,12 +2731,14 @@ ] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9938", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9931", "native_tokenizers": [], @@ -2317,14 +2746,17 @@ }, { "name": "Orokaivan", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Aeka", + "depth": 6, "iso_1_code": null, "iso_3_code": "aez", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9941", "native_tokenizers": [], @@ -2332,9 +2764,11 @@ }, { "name": "Hunjara-Kaina Ke", + "depth": 6, "iso_1_code": null, "iso_3_code": "hkk", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9942", "native_tokenizers": [], @@ -2342,9 +2776,11 @@ }, { "name": "Orokaiva", + "depth": 6, "iso_1_code": null, "iso_3_code": "okv", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9943", "native_tokenizers": [], @@ -2353,18 +2789,21 @@ ] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9940", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9930", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9927", "native_tokenizers": [], @@ -2372,26 +2811,31 @@ }, { "name": "Yekora", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Yekora", + "depth": 4, "iso_1_code": null, "iso_3_code": "ykr", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9945", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9944", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9923", "native_tokenizers": [], @@ -2399,14 +2843,17 @@ }, { "name": "Guhu-Samane", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Guhu-Samane", + "depth": 3, "iso_1_code": null, "iso_3_code": "ghs", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9947", "native_tokenizers": [], @@ -2415,12 +2862,14 @@ ] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9946", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9922", "native_tokenizers": [], @@ -2428,25 +2877,30 @@ }, { "name": "Inland Gulf", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ipiko", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ipiko", + "depth": 3, "iso_1_code": null, "iso_3_code": "ipo", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9950", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9949", "native_tokenizers": [], @@ -2454,14 +2908,17 @@ }, { "name": "Minanibai", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Foia Foia", + "depth": 3, "iso_1_code": null, "iso_3_code": "ffi", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9952", "native_tokenizers": [], @@ -2469,9 +2926,11 @@ }, { "name": "Hoia Hoia", + "depth": 3, "iso_1_code": null, "iso_3_code": "hhi", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9953", "native_tokenizers": [], @@ -2479,9 +2938,11 @@ }, { "name": "Hoyahoya", + "depth": 3, "iso_1_code": null, "iso_3_code": "hhy", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9954", "native_tokenizers": [], @@ -2489,9 +2950,11 @@ }, { "name": "Minanibai", + "depth": 3, "iso_1_code": null, "iso_3_code": "mcv", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9955", "native_tokenizers": [], @@ -2499,9 +2962,11 @@ }, { "name": "Mubami", + "depth": 3, "iso_1_code": null, "iso_3_code": "tsx", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9956", "native_tokenizers": [], @@ -2509,21 +2974,25 @@ }, { "name": "Karami", + "depth": 3, "iso_1_code": null, "iso_3_code": "xar", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9957", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9951", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9948", "native_tokenizers": [], @@ -2531,24 +3000,29 @@ }, { "name": "Kainantu-Goroka", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Gorokan", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Fore", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Fore", + "depth": 4, "iso_1_code": null, "iso_3_code": "for", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9961", "native_tokenizers": [], @@ -2558,15 +3032,18 @@ }, { "name": "Gimi", + "depth": 4, "iso_1_code": null, "iso_3_code": "gim", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9962", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9960", "native_tokenizers": [], @@ -2574,14 +3051,17 @@ }, { "name": "Gahuku-Benabena", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dano", + "depth": 4, "iso_1_code": null, "iso_3_code": "aso", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9964", "native_tokenizers": [], @@ -2591,9 +3071,11 @@ }, { "name": "Benabena", + "depth": 4, "iso_1_code": null, "iso_3_code": "bef", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9965", "native_tokenizers": [], @@ -2603,9 +3085,11 @@ }, { "name": "Alekano", + "depth": 4, "iso_1_code": null, "iso_3_code": "gah", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9966", "native_tokenizers": [], @@ -2615,15 +3099,18 @@ }, { "name": "Tokano", + "depth": 4, "iso_1_code": null, "iso_3_code": "zuh", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9967", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9963", "native_tokenizers": [], @@ -2631,20 +3118,24 @@ }, { "name": "Gende", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Gende", + "depth": 4, "iso_1_code": null, "iso_3_code": "gaf", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9969", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9968", "native_tokenizers": [], @@ -2652,20 +3143,24 @@ }, { "name": "Isabi", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Isabi", + "depth": 4, "iso_1_code": null, "iso_3_code": "isa", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9971", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9970", "native_tokenizers": [], @@ -2673,14 +3168,17 @@ }, { "name": "Kamano-Yagaria", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Wagama", + "depth": 4, "iso_1_code": null, "iso_3_code": "abg", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9973", "native_tokenizers": [], @@ -2688,9 +3186,11 @@ }, { "name": "Inoke-Yate", + "depth": 4, "iso_1_code": null, "iso_3_code": "ino", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9974", "native_tokenizers": [], @@ -2700,9 +3200,11 @@ }, { "name": "Kamano", + "depth": 4, "iso_1_code": null, "iso_3_code": "kbq", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9975", "native_tokenizers": [], @@ -2712,9 +3214,11 @@ }, { "name": "Kanite", + "depth": 4, "iso_1_code": null, "iso_3_code": "kmu", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9976", "native_tokenizers": [], @@ -2724,9 +3228,11 @@ }, { "name": "Keyagana", + "depth": 4, "iso_1_code": null, "iso_3_code": "kyg", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9977", "native_tokenizers": [], @@ -2736,15 +3242,18 @@ }, { "name": "Yagaria", + "depth": 4, "iso_1_code": null, "iso_3_code": "ygr", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9978", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9972", "native_tokenizers": [], @@ -2752,14 +3261,17 @@ }, { "name": "Siane", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Siane", + "depth": 4, "iso_1_code": null, "iso_3_code": "snp", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9980", "native_tokenizers": [], @@ -2769,9 +3281,11 @@ }, { "name": "Yaweyuha", + "depth": 4, "iso_1_code": null, "iso_3_code": "yby", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9981", "native_tokenizers": [], @@ -2780,12 +3294,14 @@ ] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9979", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9959", "native_tokenizers": [], @@ -2793,14 +3309,17 @@ }, { "name": "Kainantu", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Aziana", + "depth": 3, "iso_1_code": null, "iso_3_code": "gat", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9983", "native_tokenizers": [], @@ -2808,14 +3327,17 @@ }, { "name": "Gadsup-Auyana-Awa", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Agarabi", + "depth": 4, "iso_1_code": null, "iso_3_code": "agd", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9985", "native_tokenizers": [], @@ -2825,9 +3347,11 @@ }, { "name": "Awiyaana", + "depth": 4, "iso_1_code": null, "iso_3_code": "auy", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9986", "native_tokenizers": [], @@ -2837,9 +3361,11 @@ }, { "name": "Awa", + "depth": 4, "iso_1_code": null, "iso_3_code": "awb", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9987", "native_tokenizers": [], @@ -2849,9 +3375,11 @@ }, { "name": "Gadsup", + "depth": 4, "iso_1_code": null, "iso_3_code": "gaj", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9988", "native_tokenizers": [], @@ -2859,9 +3387,11 @@ }, { "name": "Kosena", + "depth": 4, "iso_1_code": null, "iso_3_code": "kze", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9989", "native_tokenizers": [], @@ -2871,9 +3401,11 @@ }, { "name": "Ontenu", + "depth": 4, "iso_1_code": null, "iso_3_code": "ont", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9990", "native_tokenizers": [], @@ -2881,9 +3413,11 @@ }, { "name": "Usarufa", + "depth": 4, "iso_1_code": null, "iso_3_code": "usa", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9991", "native_tokenizers": [], @@ -2892,6 +3426,7 @@ ] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9984", "native_tokenizers": [], @@ -2899,20 +3434,24 @@ }, { "name": "Kambaira", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Asa\u2019a", + "depth": 4, "iso_1_code": null, "iso_3_code": "kyy", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9993", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9992", "native_tokenizers": [], @@ -2920,20 +3459,24 @@ }, { "name": "Owenia", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Owenia", + "depth": 4, "iso_1_code": null, "iso_3_code": "wsr", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9995", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9994", "native_tokenizers": [], @@ -2941,14 +3484,17 @@ }, { "name": "Tairora", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Binumarien", + "depth": 4, "iso_1_code": null, "iso_3_code": "bjr", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9997", "native_tokenizers": [], @@ -2958,9 +3504,11 @@ }, { "name": "Tairora, South", + "depth": 4, "iso_1_code": null, "iso_3_code": "omw", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9998", "native_tokenizers": [], @@ -2970,9 +3518,11 @@ }, { "name": "Tairora, North", + "depth": 4, "iso_1_code": null, "iso_3_code": "tbg", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9999", "native_tokenizers": [], @@ -2982,9 +3532,11 @@ }, { "name": "Waffa", + "depth": 4, "iso_1_code": null, "iso_3_code": "waj", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10000", "native_tokenizers": [], @@ -2993,18 +3545,21 @@ ] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9996", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9982", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9958", "native_tokenizers": [], @@ -3012,14 +3567,17 @@ }, { "name": "Kamula", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kamula", + "depth": 2, "iso_1_code": null, "iso_3_code": "xla", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10002", "native_tokenizers": [], @@ -3028,6 +3586,7 @@ ] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10001", "native_tokenizers": [], @@ -3035,14 +3594,17 @@ }, { "name": "Kayagar", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Atohwaim", + "depth": 2, "iso_1_code": null, "iso_3_code": "aqm", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10004", "native_tokenizers": [], @@ -3050,9 +3612,11 @@ }, { "name": "Kayagar", + "depth": 2, "iso_1_code": null, "iso_3_code": "kyt", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10005", "native_tokenizers": [], @@ -3060,15 +3624,18 @@ }, { "name": "Tamagario", + "depth": 2, "iso_1_code": null, "iso_3_code": "tcg", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10006", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10003", "native_tokenizers": [], @@ -3076,14 +3643,17 @@ }, { "name": "Kiwaian", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bamu", + "depth": 2, "iso_1_code": null, "iso_3_code": "bcf", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10008", "native_tokenizers": [], @@ -3091,9 +3661,11 @@ }, { "name": "Kiwai, Northeast", + "depth": 2, "iso_1_code": null, "iso_3_code": "kiw", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10009", "native_tokenizers": [], @@ -3101,9 +3673,11 @@ }, { "name": "Kiwai, Southern", + "depth": 2, "iso_1_code": null, "iso_3_code": "kjd", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10010", "native_tokenizers": [], @@ -3111,9 +3685,11 @@ }, { "name": "Waboda", + "depth": 2, "iso_1_code": null, "iso_3_code": "kmx", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10011", "native_tokenizers": [], @@ -3121,9 +3697,11 @@ }, { "name": "Kerewo", + "depth": 2, "iso_1_code": null, "iso_3_code": "kxz", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10012", "native_tokenizers": [], @@ -3131,9 +3709,11 @@ }, { "name": "Morigi", + "depth": 2, "iso_1_code": null, "iso_3_code": "mdb", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10013", "native_tokenizers": [], @@ -3141,15 +3721,18 @@ }, { "name": "Kibiri", + "depth": 2, "iso_1_code": null, "iso_3_code": "prm", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10014", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10007", "native_tokenizers": [], @@ -3157,14 +3740,17 @@ }, { "name": "Kolopom", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kimaghima", + "depth": 2, "iso_1_code": null, "iso_3_code": "kig", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10016", "native_tokenizers": [], @@ -3172,9 +3758,11 @@ }, { "name": "Ndom", + "depth": 2, "iso_1_code": null, "iso_3_code": "nqm", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10017", "native_tokenizers": [], @@ -3182,15 +3770,18 @@ }, { "name": "Riantana", + "depth": 2, "iso_1_code": null, "iso_3_code": "ran", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10018", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10015", "native_tokenizers": [], @@ -3198,19 +3789,23 @@ }, { "name": "Madang", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Croisilles", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Amaimon", + "depth": 3, "iso_1_code": null, "iso_3_code": "ali", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10021", "native_tokenizers": [], @@ -3218,20 +3813,24 @@ }, { "name": "Kare", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kare", + "depth": 4, "iso_1_code": null, "iso_3_code": "kmf", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10023", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10022", "native_tokenizers": [], @@ -3239,14 +3838,17 @@ }, { "name": "Kokon", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Girawa", + "depth": 4, "iso_1_code": null, "iso_3_code": "bbr", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10025", "native_tokenizers": [], @@ -3256,9 +3858,11 @@ }, { "name": "Kein", + "depth": 4, "iso_1_code": null, "iso_3_code": "bmh", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10026", "native_tokenizers": [], @@ -3268,15 +3872,18 @@ }, { "name": "Munit", + "depth": 4, "iso_1_code": null, "iso_3_code": "mtc", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10027", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10024", "native_tokenizers": [], @@ -3284,14 +3891,17 @@ }, { "name": "Kowan", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Amako", + "depth": 4, "iso_1_code": null, "iso_3_code": "koz", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10029", "native_tokenizers": [], @@ -3299,9 +3909,11 @@ }, { "name": "Waskia", + "depth": 4, "iso_1_code": null, "iso_3_code": "wsk", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10030", "native_tokenizers": [], @@ -3310,6 +3922,7 @@ ] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10028", "native_tokenizers": [], @@ -3317,19 +3930,23 @@ }, { "name": "Mabuso", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Gum", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Amele", + "depth": 5, "iso_1_code": null, "iso_3_code": "aey", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10033", "native_tokenizers": [], @@ -3339,9 +3956,11 @@ }, { "name": "Fulumu", + "depth": 5, "iso_1_code": null, "iso_3_code": "bbd", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10034", "native_tokenizers": [], @@ -3349,9 +3968,11 @@ }, { "name": "Gumalu", + "depth": 5, "iso_1_code": null, "iso_3_code": "gmu", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10035", "native_tokenizers": [], @@ -3359,9 +3980,11 @@ }, { "name": "Sihan", + "depth": 5, "iso_1_code": null, "iso_3_code": "snr", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10036", "native_tokenizers": [], @@ -3369,14 +3992,17 @@ }, { "name": "Panim-Isebe", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Isebe", + "depth": 6, "iso_1_code": null, "iso_3_code": "igo", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10038", "native_tokenizers": [], @@ -3384,21 +4010,25 @@ }, { "name": "Panim", + "depth": 6, "iso_1_code": null, "iso_3_code": "pnr", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10039", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10037", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10032", "native_tokenizers": [], @@ -3406,14 +4036,17 @@ }, { "name": "Hanseman", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Baimak", + "depth": 5, "iso_1_code": null, "iso_3_code": "bmx", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10041", "native_tokenizers": [], @@ -3421,9 +4054,11 @@ }, { "name": "Bagupi", + "depth": 5, "iso_1_code": null, "iso_3_code": "bpi", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10042", "native_tokenizers": [], @@ -3431,9 +4066,11 @@ }, { "name": "Wagi", + "depth": 5, "iso_1_code": null, "iso_3_code": "fad", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10043", "native_tokenizers": [], @@ -3443,9 +4080,11 @@ }, { "name": "Gal", + "depth": 5, "iso_1_code": null, "iso_3_code": "gap", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10044", "native_tokenizers": [], @@ -3453,9 +4092,11 @@ }, { "name": "Nobonob", + "depth": 5, "iso_1_code": null, "iso_3_code": "gaw", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10045", "native_tokenizers": [], @@ -3465,9 +4106,11 @@ }, { "name": "Garus", + "depth": 5, "iso_1_code": null, "iso_3_code": "gyb", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10046", "native_tokenizers": [], @@ -3475,9 +4118,11 @@ }, { "name": "Mawan", + "depth": 5, "iso_1_code": null, "iso_3_code": "mcz", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10047", "native_tokenizers": [], @@ -3485,9 +4130,11 @@ }, { "name": "Matepi", + "depth": 5, "iso_1_code": null, "iso_3_code": "mqe", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10048", "native_tokenizers": [], @@ -3495,9 +4142,11 @@ }, { "name": "Nake", + "depth": 5, "iso_1_code": null, "iso_3_code": "nbk", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10049", "native_tokenizers": [], @@ -3505,9 +4154,11 @@ }, { "name": "Rempi", + "depth": 5, "iso_1_code": null, "iso_3_code": "rmp", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10050", "native_tokenizers": [], @@ -3515,9 +4166,11 @@ }, { "name": "Rapting", + "depth": 5, "iso_1_code": null, "iso_3_code": "rpt", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10051", "native_tokenizers": [], @@ -3525,9 +4178,11 @@ }, { "name": "Saruga", + "depth": 5, "iso_1_code": null, "iso_3_code": "sra", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10052", "native_tokenizers": [], @@ -3535,9 +4190,11 @@ }, { "name": "Yoidik", + "depth": 5, "iso_1_code": null, "iso_3_code": "ydk", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10053", "native_tokenizers": [], @@ -3545,14 +4202,17 @@ }, { "name": "Silopi-Utu", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Utu", + "depth": 6, "iso_1_code": null, "iso_3_code": "utu", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10055", "native_tokenizers": [], @@ -3560,15 +4220,18 @@ }, { "name": "Silopi", + "depth": 6, "iso_1_code": null, "iso_3_code": "xsp", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10056", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10054", "native_tokenizers": [], @@ -3576,14 +4239,17 @@ }, { "name": "Wamas-Samosa-Murupi-Mosimo", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mosimo", + "depth": 6, "iso_1_code": null, "iso_3_code": "mqv", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10058", "native_tokenizers": [], @@ -3591,9 +4257,11 @@ }, { "name": "Murupi", + "depth": 6, "iso_1_code": null, "iso_3_code": "mqw", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10059", "native_tokenizers": [], @@ -3601,9 +4269,11 @@ }, { "name": "Samosa", + "depth": 6, "iso_1_code": null, "iso_3_code": "swm", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10060", "native_tokenizers": [], @@ -3611,27 +4281,32 @@ }, { "name": "Wamas", + "depth": 6, "iso_1_code": null, "iso_3_code": "wmc", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10061", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10057", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10040", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10031", "native_tokenizers": [], @@ -3639,14 +4314,17 @@ }, { "name": "Mugil", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bargam", + "depth": 4, "iso_1_code": null, "iso_3_code": "mlp", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10063", "native_tokenizers": [], @@ -3655,6 +4333,7 @@ ] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10062", "native_tokenizers": [], @@ -3662,14 +4341,17 @@ }, { "name": "Northern Adelbert", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Gavak", + "depth": 4, "iso_1_code": null, "iso_3_code": "dmc", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10065", "native_tokenizers": [], @@ -3677,14 +4359,17 @@ }, { "name": "Kaukombar", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mala", + "depth": 5, "iso_1_code": null, "iso_3_code": "ped", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10067", "native_tokenizers": [], @@ -3692,9 +4377,11 @@ }, { "name": "Miani", + "depth": 5, "iso_1_code": null, "iso_3_code": "pla", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10068", "native_tokenizers": [], @@ -3702,9 +4389,11 @@ }, { "name": "Maia", + "depth": 5, "iso_1_code": null, "iso_3_code": "sks", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10069", "native_tokenizers": [], @@ -3712,15 +4401,18 @@ }, { "name": "Maiani", + "depth": 5, "iso_1_code": null, "iso_3_code": "tnh", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10070", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10066", "native_tokenizers": [], @@ -3728,19 +4420,23 @@ }, { "name": "Kumil-Tibor", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kumil", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bepour", + "depth": 6, "iso_1_code": null, "iso_3_code": "bie", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10073", "native_tokenizers": [], @@ -3748,9 +4444,11 @@ }, { "name": "Mauwake", + "depth": 6, "iso_1_code": null, "iso_3_code": "mhl", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10074", "native_tokenizers": [], @@ -3760,15 +4458,18 @@ }, { "name": "Moere", + "depth": 6, "iso_1_code": null, "iso_3_code": "mvq", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10075", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10072", "native_tokenizers": [], @@ -3776,14 +4477,17 @@ }, { "name": "Tibor", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Pamosu", + "depth": 6, "iso_1_code": null, "iso_3_code": "hih", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10077", "native_tokenizers": [], @@ -3791,9 +4495,11 @@ }, { "name": "Mawak", + "depth": 6, "iso_1_code": null, "iso_3_code": "mjj", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10078", "native_tokenizers": [], @@ -3801,9 +4507,11 @@ }, { "name": "Hember Avu", + "depth": 6, "iso_1_code": null, "iso_3_code": "mmi", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10079", "native_tokenizers": [], @@ -3811,9 +4519,11 @@ }, { "name": "Mokati", + "depth": 6, "iso_1_code": null, "iso_3_code": "wnb", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10080", "native_tokenizers": [], @@ -3821,21 +4531,25 @@ }, { "name": "Kowaki", + "depth": 6, "iso_1_code": null, "iso_3_code": "xow", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10081", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10076", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10071", "native_tokenizers": [], @@ -3843,14 +4557,17 @@ }, { "name": "Manep-Barem", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Brem", + "depth": 5, "iso_1_code": null, "iso_3_code": "buq", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10083", "native_tokenizers": [], @@ -3858,15 +4575,18 @@ }, { "name": "Manep", + "depth": 5, "iso_1_code": null, "iso_3_code": "mkr", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10084", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10082", "native_tokenizers": [], @@ -3874,19 +4594,23 @@ }, { "name": "Numugen", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Karian-Usan-Yaban", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Karian", + "depth": 6, "iso_1_code": null, "iso_3_code": "bql", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10087", "native_tokenizers": [], @@ -3894,9 +4618,11 @@ }, { "name": "Usan", + "depth": 6, "iso_1_code": null, "iso_3_code": "wnu", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10088", "native_tokenizers": [], @@ -3906,15 +4632,18 @@ }, { "name": "Yaben", + "depth": 6, "iso_1_code": null, "iso_3_code": "ybm", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10089", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10086", "native_tokenizers": [], @@ -3922,14 +4651,17 @@ }, { "name": "Yarawata-Parawen-Ukuriguma", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Parawen", + "depth": 6, "iso_1_code": null, "iso_3_code": "prw", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10091", "native_tokenizers": [], @@ -3937,9 +4669,11 @@ }, { "name": "Ukuriguma", + "depth": 6, "iso_1_code": null, "iso_3_code": "ukg", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10092", "native_tokenizers": [], @@ -3947,27 +4681,32 @@ }, { "name": "Yarawata", + "depth": 6, "iso_1_code": null, "iso_3_code": "yrw", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10093", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10090", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10085", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10064", "native_tokenizers": [], @@ -3975,14 +4714,17 @@ }, { "name": "Omosan", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Pal", + "depth": 4, "iso_1_code": null, "iso_3_code": "abw", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10095", "native_tokenizers": [], @@ -3990,21 +4732,25 @@ }, { "name": "Kovol", + "depth": 4, "iso_1_code": null, "iso_3_code": "kgu", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10096", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10094", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10020", "native_tokenizers": [], @@ -4012,14 +4758,17 @@ }, { "name": "Kalam-Kobon", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kalam", + "depth": 3, "iso_1_code": null, "iso_3_code": "kmh", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10098", "native_tokenizers": [], @@ -4029,9 +4778,11 @@ }, { "name": "Kobon", + "depth": 3, "iso_1_code": null, "iso_3_code": "kpw", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10099", "native_tokenizers": [], @@ -4041,9 +4792,11 @@ }, { "name": "Tay", + "depth": 3, "iso_1_code": null, "iso_3_code": "taw", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10100", "native_tokenizers": [], @@ -4052,6 +4805,7 @@ ] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10097", "native_tokenizers": [], @@ -4059,14 +4813,17 @@ }, { "name": "Rai Coast", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Wasembo", + "depth": 3, "iso_1_code": null, "iso_3_code": "gsp", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10102", "native_tokenizers": [], @@ -4074,14 +4831,17 @@ }, { "name": "Biyom-Tauya", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Biyom", + "depth": 4, "iso_1_code": null, "iso_3_code": "bpm", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10104", "native_tokenizers": [], @@ -4089,15 +4849,18 @@ }, { "name": "Tauya", + "depth": 4, "iso_1_code": null, "iso_3_code": "tya", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10105", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10103", "native_tokenizers": [], @@ -4105,14 +4868,17 @@ }, { "name": "Evapia", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kou", + "depth": 4, "iso_1_code": null, "iso_3_code": "snz", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10107", "native_tokenizers": [], @@ -4120,9 +4886,11 @@ }, { "name": "Wia", + "depth": 4, "iso_1_code": null, "iso_3_code": "ssj", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10108", "native_tokenizers": [], @@ -4130,9 +4898,11 @@ }, { "name": "Watiwa", + "depth": 4, "iso_1_code": null, "iso_3_code": "wtf", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10109", "native_tokenizers": [], @@ -4140,15 +4910,18 @@ }, { "name": "Koromu", + "depth": 4, "iso_1_code": null, "iso_3_code": "xes", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10110", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10106", "native_tokenizers": [], @@ -4156,14 +4929,17 @@ }, { "name": "Kabenau", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Taupi", + "depth": 4, "iso_1_code": null, "iso_3_code": "awm", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10112", "native_tokenizers": [], @@ -4171,9 +4947,11 @@ }, { "name": "Migum", + "depth": 4, "iso_1_code": null, "iso_3_code": "klm", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10113", "native_tokenizers": [], @@ -4181,9 +4959,11 @@ }, { "name": "Lemio", + "depth": 4, "iso_1_code": null, "iso_3_code": "lei", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10114", "native_tokenizers": [], @@ -4191,9 +4971,11 @@ }, { "name": "Pulabu", + "depth": 4, "iso_1_code": null, "iso_3_code": "pup", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10115", "native_tokenizers": [], @@ -4201,9 +4983,11 @@ }, { "name": "Siroi", + "depth": 4, "iso_1_code": null, "iso_3_code": "ssd", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10116", "native_tokenizers": [], @@ -4212,6 +4996,7 @@ ] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10111", "native_tokenizers": [], @@ -4219,14 +5004,17 @@ }, { "name": "Mindjim", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Anjam", + "depth": 4, "iso_1_code": null, "iso_3_code": "boj", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10118", "native_tokenizers": [], @@ -4236,9 +5024,11 @@ }, { "name": "Bongu", + "depth": 4, "iso_1_code": null, "iso_3_code": "bpu", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10119", "native_tokenizers": [], @@ -4246,9 +5036,11 @@ }, { "name": "Soq", + "depth": 4, "iso_1_code": null, "iso_3_code": "mdc", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10120", "native_tokenizers": [], @@ -4256,15 +5048,18 @@ }, { "name": "Sam", + "depth": 4, "iso_1_code": null, "iso_3_code": "snx", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10121", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10117", "native_tokenizers": [], @@ -4272,14 +5067,17 @@ }, { "name": "Nuru", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Uyajitaya", + "depth": 4, "iso_1_code": null, "iso_3_code": "duk", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10123", "native_tokenizers": [], @@ -4287,9 +5085,11 @@ }, { "name": "Ogea", + "depth": 4, "iso_1_code": null, "iso_3_code": "eri", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10124", "native_tokenizers": [], @@ -4299,9 +5099,11 @@ }, { "name": "Jilim", + "depth": 4, "iso_1_code": null, "iso_3_code": "jil", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10125", "native_tokenizers": [], @@ -4309,9 +5111,11 @@ }, { "name": "Waube", + "depth": 4, "iso_1_code": null, "iso_3_code": "kop", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10126", "native_tokenizers": [], @@ -4319,9 +5123,11 @@ }, { "name": "Rerau", + "depth": 4, "iso_1_code": null, "iso_3_code": "rea", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10127", "native_tokenizers": [], @@ -4329,9 +5135,11 @@ }, { "name": "Uya", + "depth": 4, "iso_1_code": null, "iso_3_code": "usu", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10128", "native_tokenizers": [], @@ -4339,15 +5147,18 @@ }, { "name": "Dubuporo", + "depth": 4, "iso_1_code": null, "iso_3_code": "ynl", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10129", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10122", "native_tokenizers": [], @@ -4355,14 +5166,17 @@ }, { "name": "Peka", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Danaru", + "depth": 4, "iso_1_code": null, "iso_3_code": "dnr", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10131", "native_tokenizers": [], @@ -4370,9 +5184,11 @@ }, { "name": "Sumau", + "depth": 4, "iso_1_code": null, "iso_3_code": "six", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10132", "native_tokenizers": [], @@ -4380,9 +5196,11 @@ }, { "name": "Kobuka", + "depth": 4, "iso_1_code": null, "iso_3_code": "urg", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10133", "native_tokenizers": [], @@ -4390,9 +5208,11 @@ }, { "name": "Sob", + "depth": 4, "iso_1_code": null, "iso_3_code": "urw", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10134", "native_tokenizers": [], @@ -4401,6 +5221,7 @@ ] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10130", "native_tokenizers": [], @@ -4408,14 +5229,17 @@ }, { "name": "Yaganon", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dumun", + "depth": 4, "iso_1_code": null, "iso_3_code": "dui", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10136", "native_tokenizers": [], @@ -4423,9 +5247,11 @@ }, { "name": "Ganglau", + "depth": 4, "iso_1_code": null, "iso_3_code": "ggl", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10137", "native_tokenizers": [], @@ -4433,9 +5259,11 @@ }, { "name": "Saep", + "depth": 4, "iso_1_code": null, "iso_3_code": "spd", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10138", "native_tokenizers": [], @@ -4443,21 +5271,25 @@ }, { "name": "Yabong", + "depth": 4, "iso_1_code": null, "iso_3_code": "ybo", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10139", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10135", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10101", "native_tokenizers": [], @@ -4465,30 +5297,36 @@ }, { "name": "South Adelbert", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Josephstaal", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Osum", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Utarmbung", + "depth": 5, "iso_1_code": null, "iso_3_code": "omo", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10143", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10142", "native_tokenizers": [], @@ -4496,14 +5334,17 @@ }, { "name": "Pomoikan", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Anamuxra", + "depth": 5, "iso_1_code": null, "iso_3_code": "imi", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10145", "native_tokenizers": [], @@ -4511,9 +5352,11 @@ }, { "name": "Moresada", + "depth": 5, "iso_1_code": null, "iso_3_code": "msx", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10146", "native_tokenizers": [], @@ -4521,15 +5364,18 @@ }, { "name": "Anam", + "depth": 5, "iso_1_code": null, "iso_3_code": "pda", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10147", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10144", "native_tokenizers": [], @@ -4537,26 +5383,31 @@ }, { "name": "Wadaginam", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Wadaginam", + "depth": 5, "iso_1_code": null, "iso_3_code": "wdg", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10149", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10148", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10141", "native_tokenizers": [], @@ -4564,19 +5415,23 @@ }, { "name": "Sogeram", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Central Sogeram", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Apal", + "depth": 5, "iso_1_code": null, "iso_3_code": "ena", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10152", "native_tokenizers": [], @@ -4584,9 +5439,11 @@ }, { "name": "Magiyi", + "depth": 5, "iso_1_code": null, "iso_3_code": "gmg", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10153", "native_tokenizers": [], @@ -4594,9 +5451,11 @@ }, { "name": "Manat", + "depth": 5, "iso_1_code": null, "iso_3_code": "pmr", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10154", "native_tokenizers": [], @@ -4604,14 +5463,17 @@ }, { "name": "North Central Sogeram", + "depth": 5, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mum", + "depth": 6, "iso_1_code": null, "iso_3_code": "kqa", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10156", "native_tokenizers": [], @@ -4621,21 +5483,25 @@ }, { "name": "Sirva", + "depth": 6, "iso_1_code": null, "iso_3_code": "sbq", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10157", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10155", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10151", "native_tokenizers": [], @@ -4643,14 +5509,17 @@ }, { "name": "East Sogeram", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kursav", + "depth": 5, "iso_1_code": null, "iso_3_code": "faj", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10159", "native_tokenizers": [], @@ -4658,9 +5527,11 @@ }, { "name": "Gants", + "depth": 5, "iso_1_code": null, "iso_3_code": "gao", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10160", "native_tokenizers": [], @@ -4668,9 +5539,11 @@ }, { "name": "Mag\u0268", + "depth": 5, "iso_1_code": null, "iso_3_code": "gkd", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10161", "native_tokenizers": [], @@ -4678,15 +5551,18 @@ }, { "name": "Aisi", + "depth": 5, "iso_1_code": null, "iso_3_code": "mmq", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10162", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10158", "native_tokenizers": [], @@ -4694,14 +5570,17 @@ }, { "name": "West Sogeram", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nend", + "depth": 5, "iso_1_code": null, "iso_3_code": "anh", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10164", "native_tokenizers": [], @@ -4709,33 +5588,39 @@ }, { "name": "Mand", + "depth": 5, "iso_1_code": null, "iso_3_code": "ate", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10165", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10163", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10150", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10140", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10019", "native_tokenizers": [], @@ -4743,19 +5628,23 @@ }, { "name": "Marind", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Boazi", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kuni-Boazi", + "depth": 3, "iso_1_code": null, "iso_3_code": "kvg", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10168", "native_tokenizers": [], @@ -4765,15 +5654,18 @@ }, { "name": "Zimakani", + "depth": 3, "iso_1_code": null, "iso_3_code": "zik", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10169", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10167", "native_tokenizers": [], @@ -4781,14 +5673,17 @@ }, { "name": "Nuclear Marind", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Marind, Bian", + "depth": 3, "iso_1_code": null, "iso_3_code": "bpv", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10171", "native_tokenizers": [], @@ -4796,15 +5691,18 @@ }, { "name": "Marind", + "depth": 3, "iso_1_code": null, "iso_3_code": "mrz", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10172", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10170", "native_tokenizers": [], @@ -4812,14 +5710,17 @@ }, { "name": "Yaqay", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Warkay-Bipim", + "depth": 3, "iso_1_code": null, "iso_3_code": "bgv", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10174", "native_tokenizers": [], @@ -4827,21 +5728,25 @@ }, { "name": "Yaqay", + "depth": 3, "iso_1_code": null, "iso_3_code": "jaq", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10175", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10173", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10166", "native_tokenizers": [], @@ -4849,19 +5754,23 @@ }, { "name": "Mek", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Eastern", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Lik", + "depth": 3, "iso_1_code": null, "iso_3_code": "eip", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10178", "native_tokenizers": [], @@ -4869,9 +5778,11 @@ }, { "name": "Yale, Kosarek", + "depth": 3, "iso_1_code": null, "iso_3_code": "kkl", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10179", "native_tokenizers": [], @@ -4881,9 +5792,11 @@ }, { "name": "Korupun-Sela", + "depth": 3, "iso_1_code": null, "iso_3_code": "kpq", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10180", "native_tokenizers": [], @@ -4893,9 +5806,11 @@ }, { "name": "Una", + "depth": 3, "iso_1_code": null, "iso_3_code": "mtg", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10181", "native_tokenizers": [], @@ -4905,9 +5820,11 @@ }, { "name": "Nalca", + "depth": 3, "iso_1_code": null, "iso_3_code": "nlc", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10182", "native_tokenizers": [], @@ -4917,15 +5834,18 @@ }, { "name": "Nipsan", + "depth": 3, "iso_1_code": null, "iso_3_code": "nps", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10183", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10177", "native_tokenizers": [], @@ -4933,26 +5853,31 @@ }, { "name": "Western", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ketengban", + "depth": 3, "iso_1_code": null, "iso_3_code": "xte", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10185", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10184", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10176", "native_tokenizers": [], @@ -4960,14 +5885,17 @@ }, { "name": "Mombum", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Koneraw", + "depth": 2, "iso_1_code": null, "iso_3_code": "kdw", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10187", "native_tokenizers": [], @@ -4975,15 +5903,18 @@ }, { "name": "Mombum", + "depth": 2, "iso_1_code": null, "iso_3_code": "mso", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10188", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10186", "native_tokenizers": [], @@ -4991,20 +5922,24 @@ }, { "name": "Mor", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mor", + "depth": 2, "iso_1_code": null, "iso_3_code": "moq", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10190", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10189", "native_tokenizers": [], @@ -5012,20 +5947,24 @@ }, { "name": "Moraori", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Morori", + "depth": 2, "iso_1_code": null, "iso_3_code": "mok", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10192", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10191", "native_tokenizers": [], @@ -5033,24 +5972,29 @@ }, { "name": "Ok-Awyu", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Awyu-Dumut", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Awyu", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Aghu", + "depth": 4, "iso_1_code": null, "iso_3_code": "ahh", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10196", "native_tokenizers": [], @@ -5058,9 +6002,11 @@ }, { "name": "Awyu, South", + "depth": 4, "iso_1_code": null, "iso_3_code": "aws", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10197", "native_tokenizers": [], @@ -5068,9 +6014,11 @@ }, { "name": "Awyu, Central", + "depth": 4, "iso_1_code": null, "iso_3_code": "awu", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10198", "native_tokenizers": [], @@ -5078,9 +6026,11 @@ }, { "name": "Awyu, Jair", + "depth": 4, "iso_1_code": null, "iso_3_code": "awv", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10199", "native_tokenizers": [], @@ -5088,9 +6038,11 @@ }, { "name": "Awyu, Edera", + "depth": 4, "iso_1_code": null, "iso_3_code": "awy", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10200", "native_tokenizers": [], @@ -5098,9 +6050,11 @@ }, { "name": "Awyu, Asue", + "depth": 4, "iso_1_code": null, "iso_3_code": "psa", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10201", "native_tokenizers": [], @@ -5108,15 +6062,18 @@ }, { "name": "Awyu, North", + "depth": 4, "iso_1_code": null, "iso_3_code": "yir", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10202", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10195", "native_tokenizers": [], @@ -5124,14 +6081,17 @@ }, { "name": "Dumut", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mandobo Atas", + "depth": 4, "iso_1_code": null, "iso_3_code": "aax", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10204", "native_tokenizers": [], @@ -5139,9 +6099,11 @@ }, { "name": "Mandobo Bawah", + "depth": 4, "iso_1_code": null, "iso_3_code": "bwp", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10205", "native_tokenizers": [], @@ -5149,9 +6111,11 @@ }, { "name": "Ketum", + "depth": 4, "iso_1_code": null, "iso_3_code": "ktt", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10206", "native_tokenizers": [], @@ -5159,9 +6123,11 @@ }, { "name": "Kombai", + "depth": 4, "iso_1_code": null, "iso_3_code": "tyn", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10207", "native_tokenizers": [], @@ -5169,9 +6135,11 @@ }, { "name": "Wambon", + "depth": 4, "iso_1_code": null, "iso_3_code": "wms", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10208", "native_tokenizers": [], @@ -5179,15 +6147,18 @@ }, { "name": "Wanggom", + "depth": 4, "iso_1_code": null, "iso_3_code": "wng", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10209", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10203", "native_tokenizers": [], @@ -5195,20 +6166,24 @@ }, { "name": "Korowai", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Korowai", + "depth": 4, "iso_1_code": null, "iso_3_code": "khe", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10211", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10210", "native_tokenizers": [], @@ -5216,26 +6191,31 @@ }, { "name": "Sawi", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Sawi", + "depth": 4, "iso_1_code": null, "iso_3_code": "saw", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10213", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10212", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10194", "native_tokenizers": [], @@ -5243,19 +6223,23 @@ }, { "name": "Ok", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Lowland", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Morop", + "depth": 4, "iso_1_code": null, "iso_3_code": "iwo", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10216", "native_tokenizers": [], @@ -5263,9 +6247,11 @@ }, { "name": "Muyu, North", + "depth": 4, "iso_1_code": null, "iso_3_code": "kti", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10217", "native_tokenizers": [], @@ -5273,9 +6259,11 @@ }, { "name": "Muyu, South", + "depth": 4, "iso_1_code": null, "iso_3_code": "kts", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10218", "native_tokenizers": [], @@ -5283,9 +6271,11 @@ }, { "name": "Ninggerum", + "depth": 4, "iso_1_code": null, "iso_3_code": "nxr", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10219", "native_tokenizers": [], @@ -5293,9 +6283,11 @@ }, { "name": "Yongkom", + "depth": 4, "iso_1_code": null, "iso_3_code": "yon", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10220", "native_tokenizers": [], @@ -5304,6 +6296,7 @@ ] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10215", "native_tokenizers": [], @@ -5311,14 +6304,17 @@ }, { "name": "Mountain", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bimin", + "depth": 4, "iso_1_code": null, "iso_3_code": "bhl", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10222", "native_tokenizers": [], @@ -5328,9 +6324,11 @@ }, { "name": "Faiwol", + "depth": 4, "iso_1_code": null, "iso_3_code": "fai", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10223", "native_tokenizers": [], @@ -5340,9 +6338,11 @@ }, { "name": "Mian", + "depth": 4, "iso_1_code": null, "iso_3_code": "mpt", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10224", "native_tokenizers": [], @@ -5352,9 +6352,11 @@ }, { "name": "Nakai", + "depth": 4, "iso_1_code": null, "iso_3_code": "nkj", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10225", "native_tokenizers": [], @@ -5362,9 +6364,11 @@ }, { "name": "Setaman", + "depth": 4, "iso_1_code": null, "iso_3_code": "stm", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10226", "native_tokenizers": [], @@ -5372,9 +6376,11 @@ }, { "name": "Suganga", + "depth": 4, "iso_1_code": null, "iso_3_code": "sug", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10227", "native_tokenizers": [], @@ -5382,9 +6388,11 @@ }, { "name": "Tifal", + "depth": 4, "iso_1_code": null, "iso_3_code": "tif", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10228", "native_tokenizers": [], @@ -5394,9 +6402,11 @@ }, { "name": "Telefol", + "depth": 4, "iso_1_code": null, "iso_3_code": "tlf", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10229", "native_tokenizers": [], @@ -5406,15 +6416,18 @@ }, { "name": "Urapmin", + "depth": 4, "iso_1_code": null, "iso_3_code": "urm", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10230", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10221", "native_tokenizers": [], @@ -5422,14 +6435,17 @@ }, { "name": "Ngalum", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tsaukambo", + "depth": 4, "iso_1_code": null, "iso_3_code": "kvz", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10232", "native_tokenizers": [], @@ -5437,9 +6453,11 @@ }, { "name": "Komyandaret", + "depth": 4, "iso_1_code": null, "iso_3_code": "kzv", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10233", "native_tokenizers": [], @@ -5447,9 +6465,11 @@ }, { "name": "Ngalum", + "depth": 4, "iso_1_code": null, "iso_3_code": "szb", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10234", "native_tokenizers": [], @@ -5458,6 +6478,7 @@ ] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10231", "native_tokenizers": [], @@ -5465,20 +6486,24 @@ }, { "name": "Tangko", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tangko", + "depth": 4, "iso_1_code": null, "iso_3_code": "tkx", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10236", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10235", "native_tokenizers": [], @@ -5486,14 +6511,17 @@ }, { "name": "Western", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Burumakok", + "depth": 4, "iso_1_code": null, "iso_3_code": "aip", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10238", "native_tokenizers": [], @@ -5501,9 +6529,11 @@ }, { "name": "Kwer", + "depth": 4, "iso_1_code": null, "iso_3_code": "kwr", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10239", "native_tokenizers": [], @@ -5511,27 +6541,32 @@ }, { "name": "Kopkaka", + "depth": 4, "iso_1_code": null, "iso_3_code": "opk", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10240", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10237", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10214", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10193", "native_tokenizers": [], @@ -5539,14 +6574,17 @@ }, { "name": "Oksapmin", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Oksapmin", + "depth": 2, "iso_1_code": null, "iso_3_code": "opm", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10242", "native_tokenizers": [], @@ -5555,6 +6593,7 @@ ] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10241", "native_tokenizers": [], @@ -5562,20 +6601,24 @@ }, { "name": "Pawaian", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Pawaia", + "depth": 2, "iso_1_code": null, "iso_3_code": "pwa", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10244", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10243", "native_tokenizers": [], @@ -5583,19 +6626,23 @@ }, { "name": "South Bird\u2019s Head", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Inanwatan", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Duriankere", + "depth": 3, "iso_1_code": null, "iso_3_code": "dbn", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10247", "native_tokenizers": [], @@ -5603,15 +6650,18 @@ }, { "name": "Suabo", + "depth": 3, "iso_1_code": null, "iso_3_code": "szp", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10248", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10246", "native_tokenizers": [], @@ -5619,14 +6669,17 @@ }, { "name": "Konda-Yahadian", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Konda", + "depth": 3, "iso_1_code": null, "iso_3_code": "knd", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10250", "native_tokenizers": [], @@ -5634,15 +6687,18 @@ }, { "name": "Yahadian", + "depth": 3, "iso_1_code": null, "iso_3_code": "ner", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10251", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10249", "native_tokenizers": [], @@ -5650,25 +6706,30 @@ }, { "name": "South Bird\u2019s Head Proper", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Central", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kokoda", + "depth": 4, "iso_1_code": null, "iso_3_code": "xod", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10254", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10253", "native_tokenizers": [], @@ -5676,14 +6737,17 @@ }, { "name": "Eastern", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kemberano", + "depth": 4, "iso_1_code": null, "iso_3_code": "bzp", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10256", "native_tokenizers": [], @@ -5691,15 +6755,18 @@ }, { "name": "Arandai", + "depth": 4, "iso_1_code": null, "iso_3_code": "jbj", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10257", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10255", "native_tokenizers": [], @@ -5707,14 +6774,17 @@ }, { "name": "Western", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kais", + "depth": 4, "iso_1_code": null, "iso_3_code": "kzm", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10259", "native_tokenizers": [], @@ -5722,9 +6792,11 @@ }, { "name": "Puragi", + "depth": 4, "iso_1_code": null, "iso_3_code": "pru", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10260", "native_tokenizers": [], @@ -5732,27 +6804,32 @@ }, { "name": "Kaburi", + "depth": 4, "iso_1_code": null, "iso_3_code": "uka", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10261", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10258", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10252", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10245", "native_tokenizers": [], @@ -5760,19 +6837,23 @@ }, { "name": "Southeast Papuan", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dagan", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Daga", + "depth": 3, "iso_1_code": null, "iso_3_code": "dgz", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10264", "native_tokenizers": [], @@ -5782,9 +6863,11 @@ }, { "name": "Umanakaina", + "depth": 3, "iso_1_code": null, "iso_3_code": "gdn", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10265", "native_tokenizers": [], @@ -5794,9 +6877,11 @@ }, { "name": "Ginuman", + "depth": 3, "iso_1_code": null, "iso_3_code": "gnm", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10266", "native_tokenizers": [], @@ -5804,9 +6889,11 @@ }, { "name": "Dima", + "depth": 3, "iso_1_code": null, "iso_3_code": "jma", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10267", "native_tokenizers": [], @@ -5814,9 +6901,11 @@ }, { "name": "Mapena", + "depth": 3, "iso_1_code": null, "iso_3_code": "mnm", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10268", "native_tokenizers": [], @@ -5824,9 +6913,11 @@ }, { "name": "Maiwa", + "depth": 3, "iso_1_code": null, "iso_3_code": "mti", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10269", "native_tokenizers": [], @@ -5836,9 +6927,11 @@ }, { "name": "Onjob", + "depth": 3, "iso_1_code": null, "iso_3_code": "onj", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10270", "native_tokenizers": [], @@ -5846,9 +6939,11 @@ }, { "name": "Kanasi", + "depth": 3, "iso_1_code": null, "iso_3_code": "soq", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10271", "native_tokenizers": [], @@ -5858,15 +6953,18 @@ }, { "name": "Turaka", + "depth": 3, "iso_1_code": null, "iso_3_code": "trh", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10272", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10263", "native_tokenizers": [], @@ -5874,25 +6972,30 @@ }, { "name": "Goilalan", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Fuyug", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Fuyug", + "depth": 4, "iso_1_code": null, "iso_3_code": "fuy", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10275", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10274", "native_tokenizers": [], @@ -5900,14 +7003,17 @@ }, { "name": "Kunimaipa", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Biangai", + "depth": 4, "iso_1_code": null, "iso_3_code": "big", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10277", "native_tokenizers": [], @@ -5917,9 +7023,11 @@ }, { "name": "Kunimaipa", + "depth": 4, "iso_1_code": null, "iso_3_code": "kup", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10278", "native_tokenizers": [], @@ -5929,9 +7037,11 @@ }, { "name": "Tauade", + "depth": 4, "iso_1_code": null, "iso_3_code": "ttd", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10279", "native_tokenizers": [], @@ -5939,9 +7049,11 @@ }, { "name": "Amam", + "depth": 4, "iso_1_code": null, "iso_3_code": "wer", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10280", "native_tokenizers": [], @@ -5950,12 +7062,14 @@ ] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10276", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10273", "native_tokenizers": [], @@ -5963,19 +7077,23 @@ }, { "name": "Koiarian", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Baraic", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "\u00d6mie", + "depth": 4, "iso_1_code": null, "iso_3_code": "aom", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10283", "native_tokenizers": [], @@ -5985,9 +7103,11 @@ }, { "name": "Barai", + "depth": 4, "iso_1_code": null, "iso_3_code": "bbb", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10284", "native_tokenizers": [], @@ -5997,9 +7117,11 @@ }, { "name": "Ese", + "depth": 4, "iso_1_code": null, "iso_3_code": "mcq", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10285", "native_tokenizers": [], @@ -6009,9 +7131,11 @@ }, { "name": "Namiae", + "depth": 4, "iso_1_code": null, "iso_3_code": "nvm", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10286", "native_tokenizers": [], @@ -6020,6 +7144,7 @@ ] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10282", "native_tokenizers": [], @@ -6027,14 +7152,17 @@ }, { "name": "Koiaric", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Biage", + "depth": 4, "iso_1_code": null, "iso_3_code": "bdf", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10288", "native_tokenizers": [], @@ -6042,9 +7170,11 @@ }, { "name": "Koiari", + "depth": 4, "iso_1_code": null, "iso_3_code": "kbk", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10289", "native_tokenizers": [], @@ -6052,9 +7182,11 @@ }, { "name": "Koiali, Mountain", + "depth": 4, "iso_1_code": null, "iso_3_code": "kpx", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10290", "native_tokenizers": [], @@ -6064,21 +7196,25 @@ }, { "name": "Koita", + "depth": 4, "iso_1_code": null, "iso_3_code": "kqi", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10291", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10287", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10281", "native_tokenizers": [], @@ -6086,14 +7222,17 @@ }, { "name": "Kwalean", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Humene", + "depth": 3, "iso_1_code": null, "iso_3_code": "huf", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10293", "native_tokenizers": [], @@ -6101,9 +7240,11 @@ }, { "name": "Uare", + "depth": 3, "iso_1_code": null, "iso_3_code": "ksj", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10294", "native_tokenizers": [], @@ -6113,15 +7254,18 @@ }, { "name": "Mulaha", + "depth": 3, "iso_1_code": null, "iso_3_code": "mfw", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10295", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10292", "native_tokenizers": [], @@ -6129,14 +7273,17 @@ }, { "name": "Mailuan", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bauwaki", + "depth": 3, "iso_1_code": null, "iso_3_code": "bwk", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10297", "native_tokenizers": [], @@ -6144,9 +7291,11 @@ }, { "name": "Binahari", + "depth": 3, "iso_1_code": null, "iso_3_code": "bxz", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10298", "native_tokenizers": [], @@ -6154,9 +7303,11 @@ }, { "name": "Domu", + "depth": 3, "iso_1_code": null, "iso_3_code": "dof", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10299", "native_tokenizers": [], @@ -6164,9 +7315,11 @@ }, { "name": "Laua", + "depth": 3, "iso_1_code": null, "iso_3_code": "luf", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10300", "native_tokenizers": [], @@ -6174,9 +7327,11 @@ }, { "name": "Magi", + "depth": 3, "iso_1_code": null, "iso_3_code": "mgu", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10301", "native_tokenizers": [], @@ -6184,15 +7339,18 @@ }, { "name": "Morawa", + "depth": 3, "iso_1_code": null, "iso_3_code": "mze", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10302", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10296", "native_tokenizers": [], @@ -6200,14 +7358,17 @@ }, { "name": "Manubaran", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Doromu-Koki", + "depth": 3, "iso_1_code": null, "iso_3_code": "kqc", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10304", "native_tokenizers": [], @@ -6217,15 +7378,18 @@ }, { "name": "Maria", + "depth": 3, "iso_1_code": null, "iso_3_code": "mds", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10305", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10303", "native_tokenizers": [], @@ -6233,14 +7397,17 @@ }, { "name": "Yareban", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Aneme Wake", + "depth": 3, "iso_1_code": null, "iso_3_code": "aby", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10307", "native_tokenizers": [], @@ -6250,9 +7417,11 @@ }, { "name": "Bariji", + "depth": 3, "iso_1_code": null, "iso_3_code": "bjc", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10308", "native_tokenizers": [], @@ -6260,9 +7429,11 @@ }, { "name": "Moikodi", + "depth": 3, "iso_1_code": null, "iso_3_code": "mkp", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10309", "native_tokenizers": [], @@ -6270,9 +7441,11 @@ }, { "name": "Nawaru", + "depth": 3, "iso_1_code": null, "iso_3_code": "nwr", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10310", "native_tokenizers": [], @@ -6280,9 +7453,11 @@ }, { "name": "Yareba", + "depth": 3, "iso_1_code": null, "iso_3_code": "yrb", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10311", "native_tokenizers": [], @@ -6291,12 +7466,14 @@ ] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10306", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10262", "native_tokenizers": [], @@ -6304,20 +7481,24 @@ }, { "name": "Tanah Merah", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tanahmerah", + "depth": 2, "iso_1_code": null, "iso_3_code": "tcm", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10313", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10312", "native_tokenizers": [], @@ -6325,14 +7506,17 @@ }, { "name": "Teberan", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dadibi", + "depth": 2, "iso_1_code": null, "iso_3_code": "mps", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10315", "native_tokenizers": [], @@ -6342,9 +7526,11 @@ }, { "name": "Folopa", + "depth": 2, "iso_1_code": null, "iso_3_code": "ppo", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10316", "native_tokenizers": [], @@ -6353,6 +7539,7 @@ ] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10314", "native_tokenizers": [], @@ -6360,14 +7547,17 @@ }, { "name": "Tirio", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Abom", + "depth": 2, "iso_1_code": null, "iso_3_code": "aob", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10318", "native_tokenizers": [], @@ -6375,9 +7565,11 @@ }, { "name": "Makayam", + "depth": 2, "iso_1_code": null, "iso_3_code": "aup", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10319", "native_tokenizers": [], @@ -6385,9 +7577,11 @@ }, { "name": "Baramu", + "depth": 2, "iso_1_code": null, "iso_3_code": "bmz", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10320", "native_tokenizers": [], @@ -6395,9 +7589,11 @@ }, { "name": "Bitur", + "depth": 2, "iso_1_code": null, "iso_3_code": "mcc", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10321", "native_tokenizers": [], @@ -6405,15 +7601,18 @@ }, { "name": "Kiunum", + "depth": 2, "iso_1_code": null, "iso_3_code": "wei", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10322", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10317", "native_tokenizers": [], @@ -6421,25 +7620,30 @@ }, { "name": "Turama-Kikorian", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kairi", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Rumu", + "depth": 3, "iso_1_code": null, "iso_3_code": "klq", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10325", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10324", "native_tokenizers": [], @@ -6447,14 +7651,17 @@ }, { "name": "Kaser", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Barikewa", + "depth": 3, "iso_1_code": null, "iso_3_code": "jbk", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10327", "native_tokenizers": [], @@ -6462,9 +7669,11 @@ }, { "name": "Mouwase", + "depth": 3, "iso_1_code": null, "iso_3_code": "jmw", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10328", "native_tokenizers": [], @@ -6472,21 +7681,25 @@ }, { "name": "Ikobi", + "depth": 3, "iso_1_code": null, "iso_3_code": "meb", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10329", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10326", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10323", "native_tokenizers": [], @@ -6494,24 +7707,29 @@ }, { "name": "West", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dani", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dani Proper", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Dani, Upper Grand Valley", + "depth": 4, "iso_1_code": null, "iso_3_code": "dna", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10333", "native_tokenizers": [], @@ -6519,9 +7737,11 @@ }, { "name": "Dani, Lower Grand Valley", + "depth": 4, "iso_1_code": null, "iso_3_code": "dni", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10334", "native_tokenizers": [], @@ -6529,9 +7749,11 @@ }, { "name": "Dani, Mid Grand Valley", + "depth": 4, "iso_1_code": null, "iso_3_code": "dnt", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10335", "native_tokenizers": [], @@ -6539,9 +7761,11 @@ }, { "name": "Dani, Western", + "depth": 4, "iso_1_code": null, "iso_3_code": "dnw", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10336", "native_tokenizers": [], @@ -6551,9 +7775,11 @@ }, { "name": "Hupla", + "depth": 4, "iso_1_code": null, "iso_3_code": "hap", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10337", "native_tokenizers": [], @@ -6561,9 +7787,11 @@ }, { "name": "Nggem", + "depth": 4, "iso_1_code": null, "iso_3_code": "nbq", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10338", "native_tokenizers": [], @@ -6573,15 +7801,18 @@ }, { "name": "Walak", + "depth": 4, "iso_1_code": null, "iso_3_code": "wlw", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10339", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10332", "native_tokenizers": [], @@ -6589,14 +7820,17 @@ }, { "name": "Ngalik", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nduga", + "depth": 4, "iso_1_code": null, "iso_3_code": "ndx", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10341", "native_tokenizers": [], @@ -6604,9 +7838,11 @@ }, { "name": "Yali, Ninia", + "depth": 4, "iso_1_code": null, "iso_3_code": "nlk", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10342", "native_tokenizers": [], @@ -6614,9 +7850,11 @@ }, { "name": "Silimo", + "depth": 4, "iso_1_code": null, "iso_3_code": "wul", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10343", "native_tokenizers": [], @@ -6624,9 +7862,11 @@ }, { "name": "Yali, Pass Valley", + "depth": 4, "iso_1_code": null, "iso_3_code": "yac", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10344", "native_tokenizers": [], @@ -6634,9 +7874,11 @@ }, { "name": "Yali, Angguruk", + "depth": 4, "iso_1_code": null, "iso_3_code": "yli", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10345", "native_tokenizers": [], @@ -6645,6 +7887,7 @@ ] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10340", "native_tokenizers": [], @@ -6652,26 +7895,31 @@ }, { "name": "Wano", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Wano", + "depth": 4, "iso_1_code": null, "iso_3_code": "wno", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10347", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10346", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10331", "native_tokenizers": [], @@ -6679,14 +7927,17 @@ }, { "name": "Timor-Alor-Pantar", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Wersing", + "depth": 3, "iso_1_code": null, "iso_3_code": "kvw", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10349", "native_tokenizers": [], @@ -6694,9 +7945,11 @@ }, { "name": "Oirata", + "depth": 3, "iso_1_code": null, "iso_3_code": "oia", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10350", "native_tokenizers": [], @@ -6704,19 +7957,23 @@ }, { "name": "Alor-Pantar", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Alor", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Abui", + "depth": 5, "iso_1_code": null, "iso_3_code": "abz", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10353", "native_tokenizers": [], @@ -6726,9 +7983,11 @@ }, { "name": "Adang", + "depth": 5, "iso_1_code": null, "iso_3_code": "adn", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10354", "native_tokenizers": [], @@ -6736,9 +7995,11 @@ }, { "name": "Hamap", + "depth": 5, "iso_1_code": null, "iso_3_code": "hmu", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10355", "native_tokenizers": [], @@ -6746,9 +8007,11 @@ }, { "name": "Kabola", + "depth": 5, "iso_1_code": null, "iso_3_code": "klz", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10356", "native_tokenizers": [], @@ -6756,9 +8019,11 @@ }, { "name": "Kafoa", + "depth": 5, "iso_1_code": null, "iso_3_code": "kpu", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10357", "native_tokenizers": [], @@ -6766,9 +8031,11 @@ }, { "name": "Kui", + "depth": 5, "iso_1_code": null, "iso_3_code": "kvd", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10358", "native_tokenizers": [], @@ -6776,9 +8043,11 @@ }, { "name": "Klon", + "depth": 5, "iso_1_code": null, "iso_3_code": "kyo", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10359", "native_tokenizers": [], @@ -6786,15 +8055,18 @@ }, { "name": "Kamang", + "depth": 5, "iso_1_code": null, "iso_3_code": "woi", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10360", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10352", "native_tokenizers": [], @@ -6802,14 +8074,17 @@ }, { "name": "Pantar", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Blagar", + "depth": 5, "iso_1_code": null, "iso_3_code": "beu", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10362", "native_tokenizers": [], @@ -6817,9 +8092,11 @@ }, { "name": "Kaera", + "depth": 5, "iso_1_code": null, "iso_3_code": "jka", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10363", "native_tokenizers": [], @@ -6827,9 +8104,11 @@ }, { "name": "Pantar, Western", + "depth": 5, "iso_1_code": null, "iso_3_code": "lev", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10364", "native_tokenizers": [], @@ -6837,9 +8116,11 @@ }, { "name": "Nedebang", + "depth": 5, "iso_1_code": null, "iso_3_code": "nec", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10365", "native_tokenizers": [], @@ -6847,9 +8128,11 @@ }, { "name": "Reta", + "depth": 5, "iso_1_code": null, "iso_3_code": "ret", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10366", "native_tokenizers": [], @@ -6857,9 +8140,11 @@ }, { "name": "Teiwa", + "depth": 5, "iso_1_code": null, "iso_3_code": "twe", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10367", "native_tokenizers": [], @@ -6867,21 +8152,25 @@ }, { "name": "Tereweng", + "depth": 5, "iso_1_code": null, "iso_3_code": "twg", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10368", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10361", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10351", "native_tokenizers": [], @@ -6889,14 +8178,17 @@ }, { "name": "Tanglapui", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Sawila", + "depth": 4, "iso_1_code": null, "iso_3_code": "swt", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10370", "native_tokenizers": [], @@ -6904,15 +8196,18 @@ }, { "name": "Kula", + "depth": 4, "iso_1_code": null, "iso_3_code": "tpg", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10371", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10369", "native_tokenizers": [], @@ -6920,14 +8215,17 @@ }, { "name": "Timor", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bunak", + "depth": 4, "iso_1_code": null, "iso_3_code": "bfn", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10373", "native_tokenizers": [], @@ -6935,9 +8233,11 @@ }, { "name": "Fataluku", + "depth": 4, "iso_1_code": null, "iso_3_code": "ddg", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10374", "native_tokenizers": [], @@ -6947,9 +8247,11 @@ }, { "name": "Makalero", + "depth": 4, "iso_1_code": null, "iso_3_code": "mjb", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10375", "native_tokenizers": [], @@ -6957,9 +8259,11 @@ }, { "name": "Makasae", + "depth": 4, "iso_1_code": null, "iso_3_code": "mkz", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10376", "native_tokenizers": [], @@ -6968,12 +8272,14 @@ ] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10372", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10348", "native_tokenizers": [], @@ -6981,25 +8287,30 @@ }, { "name": "West Bomberai", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Karas", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Karas", + "depth": 4, "iso_1_code": null, "iso_3_code": "kgv", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10379", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10378", "native_tokenizers": [], @@ -7007,14 +8318,17 @@ }, { "name": "West Bomberai Proper", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Baham", + "depth": 4, "iso_1_code": null, "iso_3_code": "bdw", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10381", "native_tokenizers": [], @@ -7022,21 +8336,25 @@ }, { "name": "Iha", + "depth": 4, "iso_1_code": null, "iso_3_code": "ihp", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10382", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10380", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10377", "native_tokenizers": [], @@ -7044,14 +8362,17 @@ }, { "name": "Wissel Lakes", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Auye", + "depth": 3, "iso_1_code": null, "iso_3_code": "auu", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10384", "native_tokenizers": [], @@ -7059,9 +8380,11 @@ }, { "name": "Moi", + "depth": 3, "iso_1_code": null, "iso_3_code": "daz", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10385", "native_tokenizers": [], @@ -7069,9 +8392,11 @@ }, { "name": "Ekari", + "depth": 3, "iso_1_code": null, "iso_3_code": "ekg", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10386", "native_tokenizers": [], @@ -7079,9 +8404,11 @@ }, { "name": "Moni", + "depth": 3, "iso_1_code": null, "iso_3_code": "mnz", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10387", "native_tokenizers": [], @@ -7089,21 +8416,25 @@ }, { "name": "Wolani", + "depth": 3, "iso_1_code": null, "iso_3_code": "wod", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10388", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10383", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10330", "native_tokenizers": [], @@ -7111,14 +8442,17 @@ }, { "name": "West Kutubu", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Fasu", + "depth": 2, "iso_1_code": null, "iso_3_code": "faa", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10390", "native_tokenizers": [], @@ -7127,6 +8461,7 @@ ] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10389", "native_tokenizers": [], @@ -7134,14 +8469,17 @@ }, { "name": "Wiru", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Witu", + "depth": 2, "iso_1_code": null, "iso_3_code": "wiu", "children": [], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10392", "native_tokenizers": [], @@ -7150,12 +8488,14 @@ ] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "10391", "native_tokenizers": [], "scripts": [] } ], + "family": "Trans-New Guinea", "tokenizers": {}, "node_i": "9723", "native_tokenizers": [], diff --git a/data/Tsimshian.json b/data/Tsimshian.json index 44a75bd0a85c9f946ad22f268fff27aaee4c9b59..f2392b9369cfa6b6393ade12bf6fb4334e7b5eaa 100644 --- a/data/Tsimshian.json +++ b/data/Tsimshian.json @@ -1,13 +1,16 @@ { "name": "Tsimshian", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tsimshian", + "depth": 1, "iso_1_code": null, "iso_3_code": "tsi", "children": [], + "family": "Tsimshian", "tokenizers": {}, "node_i": "10394", "native_tokenizers": [], @@ -15,14 +18,17 @@ }, { "name": "Nass-Gitksan", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Gitxsan", + "depth": 2, "iso_1_code": null, "iso_3_code": "git", "children": [], + "family": "Tsimshian", "tokenizers": {}, "node_i": "10396", "native_tokenizers": [], @@ -30,21 +36,25 @@ }, { "name": "Nisga\u2019a", + "depth": 2, "iso_1_code": null, "iso_3_code": "ncg", "children": [], + "family": "Tsimshian", "tokenizers": {}, "node_i": "10397", "native_tokenizers": [], "scripts": [] } ], + "family": "Tsimshian", "tokenizers": {}, "node_i": "10395", "native_tokenizers": [], "scripts": [] } ], + "family": "Tsimshian", "tokenizers": {}, "node_i": "10393", "native_tokenizers": [], diff --git a/data/Tucanoan.json b/data/Tucanoan.json index 5498716387250e76b8f22052084bc9889e7afd27..faa3f6d72a095fdbb0fd38c9ebb624095b9af4d6 100644 --- a/data/Tucanoan.json +++ b/data/Tucanoan.json @@ -1,13 +1,16 @@ { "name": "Tucanoan", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Miriti", + "depth": 1, "iso_1_code": null, "iso_3_code": "mmv", "children": [], + "family": "Tucanoan", "tokenizers": {}, "node_i": "10399", "native_tokenizers": [], @@ -15,14 +18,17 @@ }, { "name": "Central Tucanoan", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Cubeo", + "depth": 2, "iso_1_code": null, "iso_3_code": "cub", "children": [], + "family": "Tucanoan", "tokenizers": {}, "node_i": "10401", "native_tokenizers": [], @@ -31,6 +37,7 @@ ] } ], + "family": "Tucanoan", "tokenizers": {}, "node_i": "10400", "native_tokenizers": [], @@ -38,14 +45,17 @@ }, { "name": "Eastern Tucanoan", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Arapaso", + "depth": 2, "iso_1_code": null, "iso_3_code": "arj", "children": [], + "family": "Tucanoan", "tokenizers": {}, "node_i": "10403", "native_tokenizers": [], @@ -53,9 +63,11 @@ }, { "name": "Wanano", + "depth": 2, "iso_1_code": null, "iso_3_code": "gvc", "children": [], + "family": "Tucanoan", "tokenizers": {}, "node_i": "10404", "native_tokenizers": [], @@ -65,9 +77,11 @@ }, { "name": "Macuna", + "depth": 2, "iso_1_code": null, "iso_3_code": "myy", "children": [], + "family": "Tucanoan", "tokenizers": {}, "node_i": "10405", "native_tokenizers": [], @@ -77,9 +91,11 @@ }, { "name": "Piratapuyo", + "depth": 2, "iso_1_code": null, "iso_3_code": "pir", "children": [], + "family": "Tucanoan", "tokenizers": {}, "node_i": "10406", "native_tokenizers": [], @@ -89,14 +105,17 @@ }, { "name": "Bar\u00e1-Tuyuka", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Waimaha", + "depth": 3, "iso_1_code": null, "iso_3_code": "bao", "children": [], + "family": "Tucanoan", "tokenizers": {}, "node_i": "10408", "native_tokenizers": [], @@ -106,9 +125,11 @@ }, { "name": "Barasana-Eduria", + "depth": 3, "iso_1_code": null, "iso_3_code": "bsn", "children": [], + "family": "Tucanoan", "tokenizers": {}, "node_i": "10409", "native_tokenizers": [], @@ -118,9 +139,11 @@ }, { "name": "Pokang\u00e1", + "depth": 3, "iso_1_code": null, "iso_3_code": "pok", "children": [], + "family": "Tucanoan", "tokenizers": {}, "node_i": "10410", "native_tokenizers": [], @@ -128,9 +151,11 @@ }, { "name": "Tuyuca", + "depth": 3, "iso_1_code": null, "iso_3_code": "tue", "children": [], + "family": "Tucanoan", "tokenizers": {}, "node_i": "10411", "native_tokenizers": [], @@ -139,6 +164,7 @@ ] } ], + "family": "Tucanoan", "tokenizers": {}, "node_i": "10407", "native_tokenizers": [], @@ -146,14 +172,17 @@ }, { "name": "Carapano", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Carapana", + "depth": 3, "iso_1_code": null, "iso_3_code": "cbc", "children": [], + "family": "Tucanoan", "tokenizers": {}, "node_i": "10413", "native_tokenizers": [], @@ -163,9 +192,11 @@ }, { "name": "Tatuyo", + "depth": 3, "iso_1_code": null, "iso_3_code": "tav", "children": [], + "family": "Tucanoan", "tokenizers": {}, "node_i": "10414", "native_tokenizers": [], @@ -174,6 +205,7 @@ ] } ], + "family": "Tucanoan", "tokenizers": {}, "node_i": "10412", "native_tokenizers": [], @@ -181,14 +213,17 @@ }, { "name": "Desano-Siriano", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Desano", + "depth": 3, "iso_1_code": null, "iso_3_code": "des", "children": [], + "family": "Tucanoan", "tokenizers": {}, "node_i": "10416", "native_tokenizers": [], @@ -198,9 +233,11 @@ }, { "name": "Siriano", + "depth": 3, "iso_1_code": null, "iso_3_code": "sri", "children": [], + "family": "Tucanoan", "tokenizers": {}, "node_i": "10417", "native_tokenizers": [], @@ -209,6 +246,7 @@ ] } ], + "family": "Tucanoan", "tokenizers": {}, "node_i": "10415", "native_tokenizers": [], @@ -216,14 +254,17 @@ }, { "name": "Tucano", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tucano", + "depth": 3, "iso_1_code": null, "iso_3_code": "tuo", "children": [], + "family": "Tucanoan", "tokenizers": {}, "node_i": "10419", "native_tokenizers": [], @@ -233,21 +274,25 @@ }, { "name": "Wajiara", + "depth": 3, "iso_1_code": null, "iso_3_code": "yui", "children": [], + "family": "Tucanoan", "tokenizers": {}, "node_i": "10420", "native_tokenizers": [], "scripts": [] } ], + "family": "Tucanoan", "tokenizers": {}, "node_i": "10418", "native_tokenizers": [], "scripts": [] } ], + "family": "Tucanoan", "tokenizers": {}, "node_i": "10402", "native_tokenizers": [], @@ -255,14 +300,17 @@ }, { "name": "Western Tucanoan", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Koreguaje", + "depth": 2, "iso_1_code": null, "iso_3_code": "coe", "children": [], + "family": "Tucanoan", "tokenizers": {}, "node_i": "10422", "native_tokenizers": [], @@ -272,9 +320,11 @@ }, { "name": "Maijuna", + "depth": 2, "iso_1_code": null, "iso_3_code": "ore", "children": [], + "family": "Tucanoan", "tokenizers": {}, "node_i": "10423", "native_tokenizers": [], @@ -282,9 +332,11 @@ }, { "name": "Tetete", + "depth": 2, "iso_1_code": null, "iso_3_code": "teb", "children": [], + "family": "Tucanoan", "tokenizers": {}, "node_i": "10424", "native_tokenizers": [], @@ -292,9 +344,11 @@ }, { "name": "Tama", + "depth": 2, "iso_1_code": null, "iso_3_code": "ten", "children": [], + "family": "Tucanoan", "tokenizers": {}, "node_i": "10425", "native_tokenizers": [], @@ -302,9 +356,11 @@ }, { "name": "Tanimuca-Letuama", + "depth": 2, "iso_1_code": null, "iso_3_code": "tnc", "children": [], + "family": "Tucanoan", "tokenizers": {}, "node_i": "10426", "native_tokenizers": [], @@ -314,9 +370,11 @@ }, { "name": "Yahuna", + "depth": 2, "iso_1_code": null, "iso_3_code": "ynu", "children": [], + "family": "Tucanoan", "tokenizers": {}, "node_i": "10427", "native_tokenizers": [], @@ -324,14 +382,17 @@ }, { "name": "Macaguaje", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Macaguaje", + "depth": 3, "iso_1_code": null, "iso_3_code": "mcl", "children": [], + "family": "Tucanoan", "tokenizers": {}, "node_i": "10429", "native_tokenizers": [], @@ -339,9 +400,11 @@ }, { "name": "Paicoca", + "depth": 3, "iso_1_code": null, "iso_3_code": "sey", "children": [], + "family": "Tucanoan", "tokenizers": {}, "node_i": "10430", "native_tokenizers": [], @@ -351,9 +414,11 @@ }, { "name": "Siona", + "depth": 3, "iso_1_code": null, "iso_3_code": "snn", "children": [], + "family": "Tucanoan", "tokenizers": {}, "node_i": "10431", "native_tokenizers": [], @@ -362,18 +427,21 @@ ] } ], + "family": "Tucanoan", "tokenizers": {}, "node_i": "10428", "native_tokenizers": [], "scripts": [] } ], + "family": "Tucanoan", "tokenizers": {}, "node_i": "10421", "native_tokenizers": [], "scripts": [] } ], + "family": "Tucanoan", "tokenizers": {}, "node_i": "10398", "native_tokenizers": [], diff --git a/data/Tungusic.json b/data/Tungusic.json index ab0246c3200239aaabbbcbce526a0b336d1eb27d..da38edfd012fc065b9741a489bd0ba4e8d00254d 100644 --- a/data/Tungusic.json +++ b/data/Tungusic.json @@ -1,23 +1,28 @@ { "name": "Tungusic", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Northern", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Even", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Even", + "depth": 3, "iso_1_code": null, "iso_3_code": "eve", "children": [], + "family": "Tungusic", "tokenizers": {}, "node_i": "10435", "native_tokenizers": [], @@ -26,6 +31,7 @@ ] } ], + "family": "Tungusic", "tokenizers": {}, "node_i": "10434", "native_tokenizers": [], @@ -33,14 +39,17 @@ }, { "name": "Evenki", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Evenki", + "depth": 3, "iso_1_code": null, "iso_3_code": "evn", "children": [], + "family": "Tungusic", "tokenizers": {}, "node_i": "10437", "native_tokenizers": [], @@ -48,15 +57,18 @@ }, { "name": "Oroqen", + "depth": 3, "iso_1_code": null, "iso_3_code": "orh", "children": [], + "family": "Tungusic", "tokenizers": {}, "node_i": "10438", "native_tokenizers": [], "scripts": [] } ], + "family": "Tungusic", "tokenizers": {}, "node_i": "10436", "native_tokenizers": [], @@ -64,26 +76,31 @@ }, { "name": "Negidal", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Negidal", + "depth": 3, "iso_1_code": null, "iso_3_code": "neg", "children": [], + "family": "Tungusic", "tokenizers": {}, "node_i": "10440", "native_tokenizers": [], "scripts": [] } ], + "family": "Tungusic", "tokenizers": {}, "node_i": "10439", "native_tokenizers": [], "scripts": [] } ], + "family": "Tungusic", "tokenizers": {}, "node_i": "10433", "native_tokenizers": [], @@ -91,24 +108,29 @@ }, { "name": "Southern", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Southeast", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nanaj", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nanai", + "depth": 4, "iso_1_code": null, "iso_3_code": "gld", "children": [], + "family": "Tungusic", "tokenizers": {}, "node_i": "10444", "native_tokenizers": [], @@ -116,9 +138,11 @@ }, { "name": "Orok", + "depth": 4, "iso_1_code": null, "iso_3_code": "oaa", "children": [], + "family": "Tungusic", "tokenizers": {}, "node_i": "10445", "native_tokenizers": [], @@ -126,15 +150,18 @@ }, { "name": "Ulch", + "depth": 4, "iso_1_code": null, "iso_3_code": "ulc", "children": [], + "family": "Tungusic", "tokenizers": {}, "node_i": "10446", "native_tokenizers": [], "scripts": [] } ], + "family": "Tungusic", "tokenizers": {}, "node_i": "10443", "native_tokenizers": [], @@ -142,14 +169,17 @@ }, { "name": "Udihe", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Oroch", + "depth": 4, "iso_1_code": null, "iso_3_code": "oac", "children": [], + "family": "Tungusic", "tokenizers": {}, "node_i": "10448", "native_tokenizers": [], @@ -157,21 +187,25 @@ }, { "name": "Udihe", + "depth": 4, "iso_1_code": null, "iso_3_code": "ude", "children": [], + "family": "Tungusic", "tokenizers": {}, "node_i": "10449", "native_tokenizers": [], "scripts": [] } ], + "family": "Tungusic", "tokenizers": {}, "node_i": "10447", "native_tokenizers": [], "scripts": [] } ], + "family": "Tungusic", "tokenizers": {}, "node_i": "10442", "native_tokenizers": [], @@ -179,14 +213,17 @@ }, { "name": "Southwest", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Jurchen", + "depth": 3, "iso_1_code": null, "iso_3_code": "juc", "children": [], + "family": "Tungusic", "tokenizers": {}, "node_i": "10451", "native_tokenizers": [], @@ -194,9 +231,11 @@ }, { "name": "Manchu", + "depth": 3, "iso_1_code": null, "iso_3_code": "mnc", "children": [], + "family": "Tungusic", "tokenizers": {}, "node_i": "10452", "native_tokenizers": [], @@ -204,9 +243,11 @@ }, { "name": "Xibe", + "depth": 3, "iso_1_code": null, "iso_3_code": "sjo", "children": [], + "family": "Tungusic", "tokenizers": {}, "node_i": "10453", "native_tokenizers": [], @@ -215,18 +256,21 @@ ] } ], + "family": "Tungusic", "tokenizers": {}, "node_i": "10450", "native_tokenizers": [], "scripts": [] } ], + "family": "Tungusic", "tokenizers": {}, "node_i": "10441", "native_tokenizers": [], "scripts": [] } ], + "family": "Tungusic", "tokenizers": {}, "node_i": "10432", "native_tokenizers": [], diff --git a/data/Tupian.json b/data/Tupian.json index 312e15f6b78a86bcc32c973f6a4bd8cd9271d161..d87762b408c850823e3575526b656dd82863312e 100644 --- a/data/Tupian.json +++ b/data/Tupian.json @@ -1,13 +1,16 @@ { "name": "Tupian", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Awet\u00ed", + "depth": 1, "iso_1_code": null, "iso_3_code": "awe", "children": [], + "family": "Tupian", "tokenizers": {}, "node_i": "10455", "native_tokenizers": [], @@ -15,9 +18,11 @@ }, { "name": "Kamayur\u00e1", + "depth": 1, "iso_1_code": null, "iso_3_code": "kay", "children": [], + "family": "Tupian", "tokenizers": {}, "node_i": "10456", "native_tokenizers": [], @@ -25,9 +30,11 @@ }, { "name": "Sater\u00e9-Maw\u00e9", + "depth": 1, "iso_1_code": null, "iso_3_code": "mav", "children": [], + "family": "Tupian", "tokenizers": {}, "node_i": "10457", "native_tokenizers": [], @@ -37,9 +44,11 @@ }, { "name": "Zo\u2019\u00e9", + "depth": 1, "iso_1_code": null, "iso_3_code": "pto", "children": [], + "family": "Tupian", "tokenizers": {}, "node_i": "10458", "native_tokenizers": [], @@ -47,9 +56,11 @@ }, { "name": "Purubor\u00e1", + "depth": 1, "iso_1_code": null, "iso_3_code": "pur", "children": [], + "family": "Tupian", "tokenizers": {}, "node_i": "10459", "native_tokenizers": [], @@ -57,14 +68,17 @@ }, { "name": "Arikem", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Arikem", + "depth": 2, "iso_1_code": null, "iso_3_code": "ait", "children": [], + "family": "Tupian", "tokenizers": {}, "node_i": "10461", "native_tokenizers": [], @@ -72,15 +86,18 @@ }, { "name": "Kariti\u00e2na", + "depth": 2, "iso_1_code": null, "iso_3_code": "ktn", "children": [], + "family": "Tupian", "tokenizers": {}, "node_i": "10462", "native_tokenizers": [], "scripts": [] } ], + "family": "Tupian", "tokenizers": {}, "node_i": "10460", "native_tokenizers": [], @@ -88,14 +105,17 @@ }, { "name": "Juruna", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Jur\u00fana", + "depth": 2, "iso_1_code": null, "iso_3_code": "jur", "children": [], + "family": "Tupian", "tokenizers": {}, "node_i": "10464", "native_tokenizers": [], @@ -103,9 +123,11 @@ }, { "name": "Maritsau\u00e1", + "depth": 2, "iso_1_code": null, "iso_3_code": "msp", "children": [], + "family": "Tupian", "tokenizers": {}, "node_i": "10465", "native_tokenizers": [], @@ -113,15 +135,18 @@ }, { "name": "Xipaya", + "depth": 2, "iso_1_code": null, "iso_3_code": "xiy", "children": [], + "family": "Tupian", "tokenizers": {}, "node_i": "10466", "native_tokenizers": [], "scripts": [] } ], + "family": "Tupian", "tokenizers": {}, "node_i": "10463", "native_tokenizers": [], @@ -129,14 +154,17 @@ }, { "name": "Mond\u00e9", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mond\u00e9", + "depth": 2, "iso_1_code": null, "iso_3_code": "mnd", "children": [], + "family": "Tupian", "tokenizers": {}, "node_i": "10468", "native_tokenizers": [], @@ -144,9 +172,11 @@ }, { "name": "Suru\u00ed", + "depth": 2, "iso_1_code": null, "iso_3_code": "sru", "children": [], + "family": "Tupian", "tokenizers": {}, "node_i": "10469", "native_tokenizers": [], @@ -154,14 +184,17 @@ }, { "name": "Aru\u00e1", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Aru\u00e1", + "depth": 3, "iso_1_code": null, "iso_3_code": "arx", "children": [], + "family": "Tupian", "tokenizers": {}, "node_i": "10471", "native_tokenizers": [], @@ -169,9 +202,11 @@ }, { "name": "Cinta Larga", + "depth": 3, "iso_1_code": null, "iso_3_code": "cin", "children": [], + "family": "Tupian", "tokenizers": {}, "node_i": "10472", "native_tokenizers": [], @@ -179,21 +214,25 @@ }, { "name": "Gavi\u00e3o do Jiparan\u00e1", + "depth": 3, "iso_1_code": null, "iso_3_code": "gvo", "children": [], + "family": "Tupian", "tokenizers": {}, "node_i": "10473", "native_tokenizers": [], "scripts": [] } ], + "family": "Tupian", "tokenizers": {}, "node_i": "10470", "native_tokenizers": [], "scripts": [] } ], + "family": "Tupian", "tokenizers": {}, "node_i": "10467", "native_tokenizers": [], @@ -201,14 +240,17 @@ }, { "name": "Munduruk\u00fa", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kuru\u00e1ya", + "depth": 2, "iso_1_code": null, "iso_3_code": "kyr", "children": [], + "family": "Tupian", "tokenizers": {}, "node_i": "10475", "native_tokenizers": [], @@ -216,9 +258,11 @@ }, { "name": "Munduruk\u00fa", + "depth": 2, "iso_1_code": null, "iso_3_code": "myu", "children": [], + "family": "Tupian", "tokenizers": {}, "node_i": "10476", "native_tokenizers": [], @@ -227,6 +271,7 @@ ] } ], + "family": "Tupian", "tokenizers": {}, "node_i": "10474", "native_tokenizers": [], @@ -234,14 +279,17 @@ }, { "name": "Ramarama", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Karo", + "depth": 2, "iso_1_code": null, "iso_3_code": "arr", "children": [], + "family": "Tupian", "tokenizers": {}, "node_i": "10478", "native_tokenizers": [], @@ -251,15 +299,18 @@ }, { "name": "Urumi", + "depth": 2, "iso_1_code": null, "iso_3_code": "uru", "children": [], + "family": "Tupian", "tokenizers": {}, "node_i": "10479", "native_tokenizers": [], "scripts": [] } ], + "family": "Tupian", "tokenizers": {}, "node_i": "10477", "native_tokenizers": [], @@ -267,14 +318,17 @@ }, { "name": "Tupar\u00ed", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Akuntsu", + "depth": 2, "iso_1_code": null, "iso_3_code": "aqz", "children": [], + "family": "Tupian", "tokenizers": {}, "node_i": "10481", "native_tokenizers": [], @@ -284,9 +338,11 @@ }, { "name": "Kepkiriw\u00e1t", + "depth": 2, "iso_1_code": null, "iso_3_code": "kpn", "children": [], + "family": "Tupian", "tokenizers": {}, "node_i": "10482", "native_tokenizers": [], @@ -294,9 +350,11 @@ }, { "name": "Makur\u00e1p", + "depth": 2, "iso_1_code": null, "iso_3_code": "mpu", "children": [], + "family": "Tupian", "tokenizers": {}, "node_i": "10483", "native_tokenizers": [], @@ -304,9 +362,11 @@ }, { "name": "Sakirabi\u00e1", + "depth": 2, "iso_1_code": null, "iso_3_code": "skf", "children": [], + "family": "Tupian", "tokenizers": {}, "node_i": "10484", "native_tokenizers": [], @@ -314,9 +374,11 @@ }, { "name": "Tupar\u00ed", + "depth": 2, "iso_1_code": null, "iso_3_code": "tpr", "children": [], + "family": "Tupian", "tokenizers": {}, "node_i": "10485", "native_tokenizers": [], @@ -324,15 +386,18 @@ }, { "name": "Wayor\u00f3", + "depth": 2, "iso_1_code": null, "iso_3_code": "wyr", "children": [], + "family": "Tupian", "tokenizers": {}, "node_i": "10486", "native_tokenizers": [], "scripts": [] } ], + "family": "Tupian", "tokenizers": {}, "node_i": "10480", "native_tokenizers": [], @@ -340,14 +405,17 @@ }, { "name": "Tup\u00ed-Guaran\u00ed", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Arawet\u00e9", + "depth": 2, "iso_1_code": null, "iso_3_code": "awt", "children": [], + "family": "Tupian", "tokenizers": {}, "node_i": "10488", "native_tokenizers": [], @@ -355,14 +423,17 @@ }, { "name": "Guaran\u00ed", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ach\u00e9", + "depth": 3, "iso_1_code": null, "iso_3_code": "guq", "children": [], + "family": "Tupian", "tokenizers": {}, "node_i": "10490", "native_tokenizers": [], @@ -372,9 +443,11 @@ }, { "name": "Xet\u00e1", + "depth": 3, "iso_1_code": null, "iso_3_code": "xet", "children": [], + "family": "Tupian", "tokenizers": {}, "node_i": "10491", "native_tokenizers": [], @@ -382,14 +455,17 @@ }, { "name": "Guaran\u00ed", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Guaran\u00ed, Paraguayan", + "depth": 4, "iso_1_code": "gn", "iso_3_code": "gug", "children": [], + "family": "Tupian", "tokenizers": {}, "node_i": "10493", "native_tokenizers": [], @@ -399,9 +475,11 @@ }, { "name": "Guaran\u00ed, Mby\u00e1", + "depth": 4, "iso_1_code": "gn", "iso_3_code": "gun", "children": [], + "family": "Tupian", "tokenizers": {}, "node_i": "10494", "native_tokenizers": [], @@ -411,9 +489,11 @@ }, { "name": "Kaiw\u00e1", + "depth": 4, "iso_1_code": null, "iso_3_code": "kgk", "children": [], + "family": "Tupian", "tokenizers": {}, "node_i": "10495", "native_tokenizers": [], @@ -423,9 +503,11 @@ }, { "name": "Guaran\u00ed, Ava", + "depth": 4, "iso_1_code": "gn", "iso_3_code": "nhd", "children": [], + "family": "Tupian", "tokenizers": {}, "node_i": "10496", "native_tokenizers": [], @@ -435,9 +517,11 @@ }, { "name": "Pai Tavytera", + "depth": 4, "iso_1_code": null, "iso_3_code": "pta", "children": [], + "family": "Tupian", "tokenizers": {}, "node_i": "10497", "native_tokenizers": [], @@ -445,9 +529,11 @@ }, { "name": "\u00d1andeva", + "depth": 4, "iso_1_code": null, "iso_3_code": "tpj", "children": [], + "family": "Tupian", "tokenizers": {}, "node_i": "10498", "native_tokenizers": [], @@ -455,14 +541,17 @@ }, { "name": "Bolivian Guaran\u00ed", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Guaran\u00ed, Western Bolivian", + "depth": 5, "iso_1_code": "gn", "iso_3_code": "gnw", "children": [], + "family": "Tupian", "tokenizers": {}, "node_i": "10500", "native_tokenizers": [], @@ -472,9 +561,11 @@ }, { "name": "Guaran\u00ed, Eastern Bolivian", + "depth": 5, "iso_1_code": "gn", "iso_3_code": "gui", "children": [], + "family": "Tupian", "tokenizers": {}, "node_i": "10501", "native_tokenizers": [], @@ -483,18 +574,21 @@ ] } ], + "family": "Tupian", "tokenizers": {}, "node_i": "10499", "native_tokenizers": [], "scripts": [] } ], + "family": "Tupian", "tokenizers": {}, "node_i": "10492", "native_tokenizers": [], "scripts": [] } ], + "family": "Tupian", "tokenizers": {}, "node_i": "10489", "native_tokenizers": [], @@ -502,14 +596,17 @@ }, { "name": "Guaray\u00fa", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Guarayu", + "depth": 3, "iso_1_code": null, "iso_3_code": "gyr", "children": [], + "family": "Tupian", "tokenizers": {}, "node_i": "10503", "native_tokenizers": [], @@ -519,9 +616,11 @@ }, { "name": "Pauserna", + "depth": 3, "iso_1_code": null, "iso_3_code": "psm", "children": [], + "family": "Tupian", "tokenizers": {}, "node_i": "10504", "native_tokenizers": [], @@ -529,14 +628,17 @@ }, { "name": "Sirion\u00f3", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Jor\u00e1", + "depth": 4, "iso_1_code": null, "iso_3_code": "jor", "children": [], + "family": "Tupian", "tokenizers": {}, "node_i": "10506", "native_tokenizers": [], @@ -544,9 +646,11 @@ }, { "name": "Sirion\u00f3", + "depth": 4, "iso_1_code": null, "iso_3_code": "srq", "children": [], + "family": "Tupian", "tokenizers": {}, "node_i": "10507", "native_tokenizers": [], @@ -556,21 +660,25 @@ }, { "name": "Yuqui", + "depth": 4, "iso_1_code": null, "iso_3_code": "yuq", "children": [], + "family": "Tupian", "tokenizers": {}, "node_i": "10508", "native_tokenizers": [], "scripts": [] } ], + "family": "Tupian", "tokenizers": {}, "node_i": "10505", "native_tokenizers": [], "scripts": [] } ], + "family": "Tupian", "tokenizers": {}, "node_i": "10502", "native_tokenizers": [], @@ -578,14 +686,17 @@ }, { "name": "Kawahib", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Apiak\u00e1", + "depth": 3, "iso_1_code": null, "iso_3_code": "api", "children": [], + "family": "Tupian", "tokenizers": {}, "node_i": "10510", "native_tokenizers": [], @@ -593,9 +704,11 @@ }, { "name": "Uru-Pa-In", + "depth": 3, "iso_1_code": null, "iso_3_code": "urp", "children": [], + "family": "Tupian", "tokenizers": {}, "node_i": "10511", "native_tokenizers": [], @@ -603,9 +716,11 @@ }, { "name": "Uru-Eu-Wau-Wau", + "depth": 3, "iso_1_code": null, "iso_3_code": "urz", "children": [], + "family": "Tupian", "tokenizers": {}, "node_i": "10512", "native_tokenizers": [], @@ -613,14 +728,17 @@ }, { "name": "Parintintin", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Amundava", + "depth": 4, "iso_1_code": null, "iso_3_code": "adw", "children": [], + "family": "Tupian", "tokenizers": {}, "node_i": "10514", "native_tokenizers": [], @@ -628,9 +746,11 @@ }, { "name": "J\u00fama", + "depth": 4, "iso_1_code": null, "iso_3_code": "jua", "children": [], + "family": "Tupian", "tokenizers": {}, "node_i": "10515", "native_tokenizers": [], @@ -638,9 +758,11 @@ }, { "name": "Karipuna", + "depth": 4, "iso_1_code": null, "iso_3_code": "kuq", "children": [], + "family": "Tupian", "tokenizers": {}, "node_i": "10516", "native_tokenizers": [], @@ -648,9 +770,11 @@ }, { "name": "Paranaw\u00e1t", + "depth": 4, "iso_1_code": null, "iso_3_code": "paf", "children": [], + "family": "Tupian", "tokenizers": {}, "node_i": "10517", "native_tokenizers": [], @@ -658,9 +782,11 @@ }, { "name": "Tenharim", + "depth": 4, "iso_1_code": null, "iso_3_code": "pah", "children": [], + "family": "Tupian", "tokenizers": {}, "node_i": "10518", "native_tokenizers": [], @@ -670,9 +796,11 @@ }, { "name": "Tukumanf\u00e9d", + "depth": 4, "iso_1_code": null, "iso_3_code": "tkf", "children": [], + "family": "Tupian", "tokenizers": {}, "node_i": "10519", "native_tokenizers": [], @@ -680,9 +808,11 @@ }, { "name": "Wiraf\u00e9d", + "depth": 4, "iso_1_code": null, "iso_3_code": "wir", "children": [], + "family": "Tupian", "tokenizers": {}, "node_i": "10520", "native_tokenizers": [], @@ -690,21 +820,25 @@ }, { "name": "Morerebi", + "depth": 4, "iso_1_code": null, "iso_3_code": "xmo", "children": [], + "family": "Tupian", "tokenizers": {}, "node_i": "10521", "native_tokenizers": [], "scripts": [] } ], + "family": "Tupian", "tokenizers": {}, "node_i": "10513", "native_tokenizers": [], "scripts": [] } ], + "family": "Tupian", "tokenizers": {}, "node_i": "10509", "native_tokenizers": [], @@ -712,14 +846,17 @@ }, { "name": "Kayab\u00ed", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Asurini of Xing\u00fa", + "depth": 3, "iso_1_code": null, "iso_3_code": "asn", "children": [], + "family": "Tupian", "tokenizers": {}, "node_i": "10523", "native_tokenizers": [], @@ -727,9 +864,11 @@ }, { "name": "Kayab\u00ed", + "depth": 3, "iso_1_code": null, "iso_3_code": "kyz", "children": [], + "family": "Tupian", "tokenizers": {}, "node_i": "10524", "native_tokenizers": [], @@ -738,6 +877,7 @@ ] } ], + "family": "Tupian", "tokenizers": {}, "node_i": "10522", "native_tokenizers": [], @@ -745,14 +885,17 @@ }, { "name": "Tenetehara", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Av\u00e1-Canoeiro", + "depth": 3, "iso_1_code": null, "iso_3_code": "avv", "children": [], + "family": "Tupian", "tokenizers": {}, "node_i": "10526", "native_tokenizers": [], @@ -760,9 +903,11 @@ }, { "name": "Tapirap\u00e9", + "depth": 3, "iso_1_code": null, "iso_3_code": "taf", "children": [], + "family": "Tupian", "tokenizers": {}, "node_i": "10527", "native_tokenizers": [], @@ -770,14 +915,17 @@ }, { "name": "Akwawa", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Asurini, Tocantins", + "depth": 4, "iso_1_code": null, "iso_3_code": "asu", "children": [], + "family": "Tupian", "tokenizers": {}, "node_i": "10529", "native_tokenizers": [], @@ -785,9 +933,11 @@ }, { "name": "Suru\u00ed do Par\u00e1", + "depth": 4, "iso_1_code": null, "iso_3_code": "mdz", "children": [], + "family": "Tupian", "tokenizers": {}, "node_i": "10530", "native_tokenizers": [], @@ -795,15 +945,18 @@ }, { "name": "Parakan\u00e3", + "depth": 4, "iso_1_code": null, "iso_3_code": "pak", "children": [], + "family": "Tupian", "tokenizers": {}, "node_i": "10531", "native_tokenizers": [], "scripts": [] } ], + "family": "Tupian", "tokenizers": {}, "node_i": "10528", "native_tokenizers": [], @@ -811,14 +964,17 @@ }, { "name": "Tenetehara", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Guajaj\u00e1ra", + "depth": 4, "iso_1_code": null, "iso_3_code": "gub", "children": [], + "family": "Tupian", "tokenizers": {}, "node_i": "10533", "native_tokenizers": [], @@ -828,21 +984,25 @@ }, { "name": "Temb\u00e9", + "depth": 4, "iso_1_code": null, "iso_3_code": "tqb", "children": [], + "family": "Tupian", "tokenizers": {}, "node_i": "10534", "native_tokenizers": [], "scripts": [] } ], + "family": "Tupian", "tokenizers": {}, "node_i": "10532", "native_tokenizers": [], "scripts": [] } ], + "family": "Tupian", "tokenizers": {}, "node_i": "10525", "native_tokenizers": [], @@ -850,19 +1010,23 @@ }, { "name": "Tup\u00ed", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Cocama", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Kukama-Kukamiria", + "depth": 4, "iso_1_code": null, "iso_3_code": "cod", "children": [], + "family": "Tupian", "tokenizers": {}, "node_i": "10537", "native_tokenizers": [], @@ -870,15 +1034,18 @@ }, { "name": "Omagua", + "depth": 4, "iso_1_code": null, "iso_3_code": "omg", "children": [], + "family": "Tupian", "tokenizers": {}, "node_i": "10538", "native_tokenizers": [], "scripts": [] } ], + "family": "Tupian", "tokenizers": {}, "node_i": "10536", "native_tokenizers": [], @@ -886,14 +1053,17 @@ }, { "name": "Tup\u00ed", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Potigu\u00e1ra", + "depth": 4, "iso_1_code": null, "iso_3_code": "pog", "children": [], + "family": "Tupian", "tokenizers": {}, "node_i": "10540", "native_tokenizers": [], @@ -901,9 +1071,11 @@ }, { "name": "Tupinikin", + "depth": 4, "iso_1_code": null, "iso_3_code": "tpk", "children": [], + "family": "Tupian", "tokenizers": {}, "node_i": "10541", "native_tokenizers": [], @@ -911,9 +1083,11 @@ }, { "name": "Tupinamb\u00e1", + "depth": 4, "iso_1_code": null, "iso_3_code": "tpn", "children": [], + "family": "Tupian", "tokenizers": {}, "node_i": "10542", "native_tokenizers": [], @@ -923,9 +1097,11 @@ }, { "name": "Nhengatu", + "depth": 4, "iso_1_code": null, "iso_3_code": "yrl", "children": [], + "family": "Tupian", "tokenizers": {}, "node_i": "10543", "native_tokenizers": [], @@ -934,12 +1110,14 @@ ] } ], + "family": "Tupian", "tokenizers": {}, "node_i": "10539", "native_tokenizers": [], "scripts": [] } ], + "family": "Tupian", "tokenizers": {}, "node_i": "10535", "native_tokenizers": [], @@ -947,14 +1125,17 @@ }, { "name": "Wayamp\u00ed", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Aur\u00e1", + "depth": 3, "iso_1_code": null, "iso_3_code": "aux", "children": [], + "family": "Tupian", "tokenizers": {}, "node_i": "10545", "native_tokenizers": [], @@ -962,14 +1143,17 @@ }, { "name": "Amanay\u00e9", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Anamb\u00e9", + "depth": 4, "iso_1_code": null, "iso_3_code": "aan", "children": [], + "family": "Tupian", "tokenizers": {}, "node_i": "10547", "native_tokenizers": [], @@ -977,9 +1161,11 @@ }, { "name": "Amanay\u00e9", + "depth": 4, "iso_1_code": null, "iso_3_code": "ama", "children": [], + "family": "Tupian", "tokenizers": {}, "node_i": "10548", "native_tokenizers": [], @@ -987,9 +1173,11 @@ }, { "name": "Guaj\u00e1", + "depth": 4, "iso_1_code": null, "iso_3_code": "gvj", "children": [], + "family": "Tupian", "tokenizers": {}, "node_i": "10549", "native_tokenizers": [], @@ -997,9 +1185,11 @@ }, { "name": "Turiw\u00e1ra", + "depth": 4, "iso_1_code": null, "iso_3_code": "twt", "children": [], + "family": "Tupian", "tokenizers": {}, "node_i": "10550", "native_tokenizers": [], @@ -1007,9 +1197,11 @@ }, { "name": "Kaapor", + "depth": 4, "iso_1_code": null, "iso_3_code": "urb", "children": [], + "family": "Tupian", "tokenizers": {}, "node_i": "10551", "native_tokenizers": [], @@ -1019,15 +1211,18 @@ }, { "name": "Ararandew\u00e1ra", + "depth": 4, "iso_1_code": null, "iso_3_code": "xaj", "children": [], + "family": "Tupian", "tokenizers": {}, "node_i": "10552", "native_tokenizers": [], "scripts": [] } ], + "family": "Tupian", "tokenizers": {}, "node_i": "10546", "native_tokenizers": [], @@ -1035,14 +1230,17 @@ }, { "name": "Wayamp\u00ed", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tek\u00f3", + "depth": 4, "iso_1_code": null, "iso_3_code": "eme", "children": [], + "family": "Tupian", "tokenizers": {}, "node_i": "10554", "native_tokenizers": [], @@ -1052,9 +1250,11 @@ }, { "name": "Wayampi", + "depth": 4, "iso_1_code": null, "iso_3_code": "oym", "children": [], + "family": "Tupian", "tokenizers": {}, "node_i": "10555", "native_tokenizers": [], @@ -1063,24 +1263,28 @@ ] } ], + "family": "Tupian", "tokenizers": {}, "node_i": "10553", "native_tokenizers": [], "scripts": [] } ], + "family": "Tupian", "tokenizers": {}, "node_i": "10544", "native_tokenizers": [], "scripts": [] } ], + "family": "Tupian", "tokenizers": {}, "node_i": "10487", "native_tokenizers": [], "scripts": [] } ], + "family": "Tupian", "tokenizers": {}, "node_i": "10454", "native_tokenizers": [], diff --git a/data/Turkic.json b/data/Turkic.json index 60427db9f55b15e824b25c0215eddc58a79618cc..a60a48b0dd7e069e543997920b9412ce72cc6dfc 100644 --- a/data/Turkic.json +++ b/data/Turkic.json @@ -1,13 +1,16 @@ { "name": "Turkic", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Urum", + "depth": 1, "iso_1_code": null, "iso_3_code": "uum", "children": [], + "family": "Turkic", "tokenizers": {}, "node_i": "10557", "native_tokenizers": [], @@ -15,23 +18,18 @@ }, { "name": "Bolgar", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Chuvash", + "depth": 2, "iso_1_code": "cv", "iso_3_code": "chv", "children": [], - "tokenizers": { - "Cyrl": { - "full_object": "StanzaTokenizer(\"kk\")", - "original_lang_name": "kazakh", - "original_lang_code": "kaz", - "script": "Cyrl", - "class_name": "StanzaTokenizer" - } - }, + "family": "Turkic", + "tokenizers": {}, "node_i": "10559", "native_tokenizers": [], "scripts": [ @@ -39,29 +37,25 @@ ] } ], - "tokenizers": { - "Cyrl": { - "full_object": "StanzaTokenizer(\"kk\")", - "original_lang_name": "kazakh", - "original_lang_code": "kaz", - "script": "Cyrl", - "class_name": "StanzaTokenizer" - } - }, + "family": "Turkic", + "tokenizers": {}, "node_i": "10558", "native_tokenizers": [], "scripts": [] }, { "name": "Eastern", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ainu", + "depth": 2, "iso_1_code": null, "iso_3_code": "aib", "children": [], + "family": "Turkic", "tokenizers": {}, "node_i": "10561", "native_tokenizers": [], @@ -69,9 +63,11 @@ }, { "name": "Chagatai", + "depth": 2, "iso_1_code": null, "iso_3_code": "chg", "children": [], + "family": "Turkic", "tokenizers": {}, "node_i": "10562", "native_tokenizers": [], @@ -79,9 +75,11 @@ }, { "name": "Ili Turki", + "depth": 2, "iso_1_code": null, "iso_3_code": "ili", "children": [], + "family": "Turkic", "tokenizers": {}, "node_i": "10563", "native_tokenizers": [], @@ -89,9 +87,11 @@ }, { "name": "Uyghur", + "depth": 2, "iso_1_code": "ug", "iso_3_code": "uig", "children": [], + "family": "Turkic", "tokenizers": { "Arab": { "full_object": "StanzaTokenizer(\"ug\")", @@ -99,20 +99,6 @@ "original_lang_code": "uig", "script": "Arab", "class_name": "StanzaTokenizer" - }, - "Latn": { - "full_object": "SpaCyTokenizer(\"tr\")", - "original_lang_name": "turkish", - "original_lang_code": "tur", - "script": "Latn", - "class_name": "SpaCyTokenizer" - }, - "Cyrl": { - "full_object": "StanzaTokenizer(\"kk\")", - "original_lang_name": "kazakh", - "original_lang_code": "kaz", - "script": "Cyrl", - "class_name": "StanzaTokenizer" } }, "node_i": "10564", @@ -127,25 +113,12 @@ }, { "name": "Uzbek, Northern", + "depth": 2, "iso_1_code": "uz", "iso_3_code": "uzn", "children": [], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tr\")", - "original_lang_name": "turkish", - "original_lang_code": "tur", - "script": "Latn", - "class_name": "SpaCyTokenizer" - }, - "Cyrl": { - "full_object": "StanzaTokenizer(\"kk\")", - "original_lang_name": "kazakh", - "original_lang_code": "kaz", - "script": "Cyrl", - "class_name": "StanzaTokenizer" - } - }, + "family": "Turkic", + "tokenizers": {}, "node_i": "10565", "native_tokenizers": [], "scripts": [ @@ -155,9 +128,11 @@ }, { "name": "Uzbek, Southern", + "depth": 2, "iso_1_code": "uz", "iso_3_code": "uzs", "children": [], + "family": "Turkic", "tokenizers": { "Arab": { "full_object": "StanzaTokenizer(\"ug\")", @@ -175,15 +150,18 @@ }, { "name": "Yugur, West", + "depth": 2, "iso_1_code": null, "iso_3_code": "ybe", "children": [], + "family": "Turkic", "tokenizers": {}, "node_i": "10567", "native_tokenizers": [], "scripts": [] } ], + "family": "Turkic", "tokenizers": { "Arab": { "full_object": "StanzaTokenizer(\"ug\")", @@ -191,20 +169,6 @@ "original_lang_code": "uig", "script": "Arab", "class_name": "StanzaTokenizer" - }, - "Latn": { - "full_object": "SpaCyTokenizer(\"tr\")", - "original_lang_name": "turkish", - "original_lang_code": "tur", - "script": "Latn", - "class_name": "SpaCyTokenizer" - }, - "Cyrl": { - "full_object": "StanzaTokenizer(\"kk\")", - "original_lang_name": "kazakh", - "original_lang_code": "kaz", - "script": "Cyrl", - "class_name": "StanzaTokenizer" } }, "node_i": "10560", @@ -213,23 +177,18 @@ }, { "name": "Northern", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Altai, Southern", + "depth": 2, "iso_1_code": null, "iso_3_code": "alt", "children": [], - "tokenizers": { - "Cyrl": { - "full_object": "StanzaTokenizer(\"kk\")", - "original_lang_name": "kazakh", - "original_lang_code": "kaz", - "script": "Cyrl", - "class_name": "StanzaTokenizer" - } - }, + "family": "Turkic", + "tokenizers": {}, "node_i": "10569", "native_tokenizers": [], "scripts": [ @@ -238,9 +197,11 @@ }, { "name": "Altai, Northern", + "depth": 2, "iso_1_code": null, "iso_3_code": "atv", "children": [], + "family": "Turkic", "tokenizers": {}, "node_i": "10570", "native_tokenizers": [], @@ -248,18 +209,12 @@ }, { "name": "Shor", + "depth": 2, "iso_1_code": null, "iso_3_code": "cjs", "children": [], - "tokenizers": { - "Cyrl": { - "full_object": "StanzaTokenizer(\"kk\")", - "original_lang_name": "kazakh", - "original_lang_code": "kaz", - "script": "Cyrl", - "class_name": "StanzaTokenizer" - } - }, + "family": "Turkic", + "tokenizers": {}, "node_i": "10571", "native_tokenizers": [], "scripts": [ @@ -268,9 +223,11 @@ }, { "name": "Dolgan", + "depth": 2, "iso_1_code": null, "iso_3_code": "dlg", "children": [], + "family": "Turkic", "tokenizers": {}, "node_i": "10572", "native_tokenizers": [], @@ -278,9 +235,11 @@ }, { "name": "Karagas", + "depth": 2, "iso_1_code": null, "iso_3_code": "kim", "children": [], + "family": "Turkic", "tokenizers": {}, "node_i": "10573", "native_tokenizers": [], @@ -288,18 +247,12 @@ }, { "name": "Khakas", + "depth": 2, "iso_1_code": null, "iso_3_code": "kjh", "children": [], - "tokenizers": { - "Cyrl": { - "full_object": "StanzaTokenizer(\"kk\")", - "original_lang_name": "kazakh", - "original_lang_code": "kaz", - "script": "Cyrl", - "class_name": "StanzaTokenizer" - } - }, + "family": "Turkic", + "tokenizers": {}, "node_i": "10574", "native_tokenizers": [], "scripts": [ @@ -308,18 +261,12 @@ }, { "name": "Yakut", + "depth": 2, "iso_1_code": null, "iso_3_code": "sah", "children": [], - "tokenizers": { - "Cyrl": { - "full_object": "StanzaTokenizer(\"kk\")", - "original_lang_name": "kazakh", - "original_lang_code": "kaz", - "script": "Cyrl", - "class_name": "StanzaTokenizer" - } - }, + "family": "Turkic", + "tokenizers": {}, "node_i": "10575", "native_tokenizers": [], "scripts": [ @@ -328,18 +275,12 @@ }, { "name": "Tuvan", + "depth": 2, "iso_1_code": null, "iso_3_code": "tyv", "children": [], - "tokenizers": { - "Cyrl": { - "full_object": "StanzaTokenizer(\"kk\")", - "original_lang_name": "kazakh", - "original_lang_code": "kaz", - "script": "Cyrl", - "class_name": "StanzaTokenizer" - } - }, + "family": "Turkic", + "tokenizers": {}, "node_i": "10576", "native_tokenizers": [], "scripts": [ @@ -347,29 +288,25 @@ ] } ], - "tokenizers": { - "Cyrl": { - "full_object": "StanzaTokenizer(\"kk\")", - "original_lang_name": "kazakh", - "original_lang_code": "kaz", - "script": "Cyrl", - "class_name": "StanzaTokenizer" - } - }, + "family": "Turkic", + "tokenizers": {}, "node_i": "10568", "native_tokenizers": [], "scripts": [] }, { "name": "Southern", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Crimean Tatar", + "depth": 2, "iso_1_code": null, "iso_3_code": "crh", "children": [], + "family": "Turkic", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tr\")", @@ -377,13 +314,6 @@ "original_lang_code": "tur", "script": "Latn", "class_name": "SpaCyTokenizer" - }, - "Cyrl": { - "full_object": "StanzaTokenizer(\"kk\")", - "original_lang_name": "kazakh", - "original_lang_code": "kaz", - "script": "Cyrl", - "class_name": "StanzaTokenizer" } }, "node_i": "10578", @@ -395,9 +325,11 @@ }, { "name": "Khalaj", + "depth": 2, "iso_1_code": null, "iso_3_code": "klj", "children": [], + "family": "Turkic", "tokenizers": {}, "node_i": "10579", "native_tokenizers": [], @@ -405,9 +337,11 @@ }, { "name": "Kashkay", + "depth": 2, "iso_1_code": null, "iso_3_code": "qxq", "children": [], + "family": "Turkic", "tokenizers": {}, "node_i": "10580", "native_tokenizers": [], @@ -415,9 +349,11 @@ }, { "name": "Salar", + "depth": 2, "iso_1_code": null, "iso_3_code": "slr", "children": [], + "family": "Turkic", "tokenizers": {}, "node_i": "10581", "native_tokenizers": [], @@ -425,23 +361,18 @@ }, { "name": "Azerbaijani", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Azerbaijani, South", + "depth": 3, "iso_1_code": "az", "iso_3_code": "azb", "children": [], - "tokenizers": { - "Arab": { - "full_object": "StanzaTokenizer(\"ug\")", - "original_lang_name": "uyghur", - "original_lang_code": "uig", - "script": "Arab", - "class_name": "StanzaTokenizer" - } - }, + "family": "Turkic", + "tokenizers": {}, "node_i": "10583", "native_tokenizers": [], "scripts": [ @@ -450,9 +381,11 @@ }, { "name": "Azerbaijani, North", + "depth": 3, "iso_1_code": "az", "iso_3_code": "azj", "children": [], + "family": "Turkic", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"az\")", @@ -460,13 +393,6 @@ "original_lang_code": "aze", "script": "Latn", "class_name": "SpaCyTokenizer" - }, - "Cyrl": { - "full_object": "StanzaTokenizer(\"kk\")", - "original_lang_name": "kazakh", - "original_lang_code": "kaz", - "script": "Cyrl", - "class_name": "StanzaTokenizer" } }, "node_i": "10584", @@ -479,6 +405,7 @@ ] } ], + "family": "Turkic", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"az\")", @@ -486,20 +413,6 @@ "original_lang_code": "aze", "script": "Latn", "class_name": "SpaCyTokenizer" - }, - "Arab": { - "full_object": "StanzaTokenizer(\"ug\")", - "original_lang_name": "uyghur", - "original_lang_code": "uig", - "script": "Arab", - "class_name": "StanzaTokenizer" - }, - "Cyrl": { - "full_object": "StanzaTokenizer(\"kk\")", - "original_lang_name": "kazakh", - "original_lang_code": "kaz", - "script": "Cyrl", - "class_name": "StanzaTokenizer" } }, "node_i": "10582", @@ -508,14 +421,17 @@ }, { "name": "Turkish", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Balkan Gagauz Turkish", + "depth": 3, "iso_1_code": null, "iso_3_code": "bgx", "children": [], + "family": "Turkic", "tokenizers": {}, "node_i": "10586", "native_tokenizers": [], @@ -523,9 +439,11 @@ }, { "name": "Gagauz", + "depth": 3, "iso_1_code": null, "iso_3_code": "gag", "children": [], + "family": "Turkic", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tr\")", @@ -533,13 +451,6 @@ "original_lang_code": "tur", "script": "Latn", "class_name": "SpaCyTokenizer" - }, - "Cyrl": { - "full_object": "StanzaTokenizer(\"kk\")", - "original_lang_name": "kazakh", - "original_lang_code": "kaz", - "script": "Cyrl", - "class_name": "StanzaTokenizer" } }, "node_i": "10587", @@ -551,9 +462,11 @@ }, { "name": "Khorasani Turkish", + "depth": 3, "iso_1_code": null, "iso_3_code": "kmz", "children": [], + "family": "Turkic", "tokenizers": {}, "node_i": "10588", "native_tokenizers": [], @@ -561,9 +474,11 @@ }, { "name": "Turkish", + "depth": 3, "iso_1_code": "tr", "iso_3_code": "tur", "children": [], + "family": "Turkic", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tr\")", @@ -582,6 +497,7 @@ ] } ], + "family": "Turkic", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tr\")", @@ -589,13 +505,6 @@ "original_lang_code": "tur", "script": "Latn", "class_name": "SpaCyTokenizer" - }, - "Cyrl": { - "full_object": "StanzaTokenizer(\"kk\")", - "original_lang_name": "kazakh", - "original_lang_code": "kaz", - "script": "Cyrl", - "class_name": "StanzaTokenizer" } }, "node_i": "10585", @@ -604,14 +513,17 @@ }, { "name": "Turkmenian", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Turkmen", + "depth": 3, "iso_1_code": "tk", "iso_3_code": "tuk", "children": [], + "family": "Turkic", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tr\")", @@ -619,20 +531,6 @@ "original_lang_code": "tur", "script": "Latn", "class_name": "SpaCyTokenizer" - }, - "Arab": { - "full_object": "StanzaTokenizer(\"ug\")", - "original_lang_name": "uyghur", - "original_lang_code": "uig", - "script": "Arab", - "class_name": "StanzaTokenizer" - }, - "Cyrl": { - "full_object": "StanzaTokenizer(\"kk\")", - "original_lang_name": "kazakh", - "original_lang_code": "kaz", - "script": "Cyrl", - "class_name": "StanzaTokenizer" } }, "node_i": "10591", @@ -644,6 +542,7 @@ ] } ], + "family": "Turkic", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tr\")", @@ -651,20 +550,6 @@ "original_lang_code": "tur", "script": "Latn", "class_name": "SpaCyTokenizer" - }, - "Arab": { - "full_object": "StanzaTokenizer(\"ug\")", - "original_lang_name": "uyghur", - "original_lang_code": "uig", - "script": "Arab", - "class_name": "StanzaTokenizer" - }, - "Cyrl": { - "full_object": "StanzaTokenizer(\"kk\")", - "original_lang_name": "kazakh", - "original_lang_code": "kaz", - "script": "Cyrl", - "class_name": "StanzaTokenizer" } }, "node_i": "10590", @@ -672,6 +557,7 @@ "scripts": [] } ], + "family": "Turkic", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"tr\")", @@ -679,20 +565,6 @@ "original_lang_code": "tur", "script": "Latn", "class_name": "SpaCyTokenizer" - }, - "Arab": { - "full_object": "StanzaTokenizer(\"ug\")", - "original_lang_name": "uyghur", - "original_lang_code": "uig", - "script": "Arab", - "class_name": "StanzaTokenizer" - }, - "Cyrl": { - "full_object": "StanzaTokenizer(\"kk\")", - "original_lang_name": "kazakh", - "original_lang_code": "kaz", - "script": "Cyrl", - "class_name": "StanzaTokenizer" } }, "node_i": "10577", @@ -701,19 +573,23 @@ }, { "name": "Western", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Aralo-Caspian", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Karakalpak", + "depth": 3, "iso_1_code": null, "iso_3_code": "kaa", "children": [], + "family": "Turkic", "tokenizers": { "Cyrl": { "full_object": "StanzaTokenizer(\"kk\")", @@ -721,13 +597,6 @@ "original_lang_code": "kaz", "script": "Cyrl", "class_name": "StanzaTokenizer" - }, - "Latn": { - "full_object": "SpaCyTokenizer(\"tr\")", - "original_lang_name": "turkish", - "original_lang_code": "tur", - "script": "Latn", - "class_name": "SpaCyTokenizer" } }, "node_i": "10594", @@ -739,9 +608,11 @@ }, { "name": "Kazakh", + "depth": 3, "iso_1_code": "kk", "iso_3_code": "kaz", "children": [], + "family": "Turkic", "tokenizers": { "Cyrl": { "full_object": "StanzaTokenizer(\"kk\")", @@ -761,9 +632,11 @@ }, { "name": "Kyrgyz", + "depth": 3, "iso_1_code": "ky", "iso_3_code": "kir", "children": [], + "family": "Turkic", "tokenizers": { "Cyrl": { "full_object": "SpaCyTokenizer(\"ky\")", @@ -783,9 +656,11 @@ }, { "name": "Nogai", + "depth": 3, "iso_1_code": null, "iso_3_code": "nog", "children": [], + "family": "Turkic", "tokenizers": { "Cyrl": { "full_object": "StanzaTokenizer(\"kk\")", @@ -803,15 +678,18 @@ }, { "name": "Kuman", + "depth": 3, "iso_1_code": null, "iso_3_code": "qwm", "children": [], + "family": "Turkic", "tokenizers": {}, "node_i": "10598", "native_tokenizers": [], "scripts": [] } ], + "family": "Turkic", "tokenizers": { "Cyrl": { "full_object": "StanzaTokenizer(\"kk\")", @@ -819,13 +697,6 @@ "original_lang_code": "kaz", "script": "Cyrl", "class_name": "StanzaTokenizer" - }, - "Latn": { - "full_object": "SpaCyTokenizer(\"tr\")", - "original_lang_name": "turkish", - "original_lang_code": "tur", - "script": "Latn", - "class_name": "SpaCyTokenizer" } }, "node_i": "10593", @@ -834,14 +705,17 @@ }, { "name": "Ponto-Caspian", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Krimchak", + "depth": 3, "iso_1_code": null, "iso_3_code": "jct", "children": [], + "family": "Turkic", "tokenizers": {}, "node_i": "10600", "native_tokenizers": [], @@ -849,18 +723,12 @@ }, { "name": "Karaim", + "depth": 3, "iso_1_code": null, "iso_3_code": "kdr", "children": [], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"tr\")", - "original_lang_name": "turkish", - "original_lang_code": "tur", - "script": "Latn", - "class_name": "SpaCyTokenizer" - } - }, + "family": "Turkic", + "tokenizers": {}, "node_i": "10601", "native_tokenizers": [], "scripts": [ @@ -869,9 +737,11 @@ }, { "name": "Karachay-Balkar", + "depth": 3, "iso_1_code": null, "iso_3_code": "krc", "children": [], + "family": "Turkic", "tokenizers": { "Cyrl": { "full_object": "StanzaTokenizer(\"kk\")", @@ -889,9 +759,11 @@ }, { "name": "Kumyk", + "depth": 3, "iso_1_code": null, "iso_3_code": "kum", "children": [], + "family": "Turkic", "tokenizers": { "Cyrl": { "full_object": "StanzaTokenizer(\"kk\")", @@ -908,6 +780,7 @@ ] } ], + "family": "Turkic", "tokenizers": { "Cyrl": { "full_object": "StanzaTokenizer(\"kk\")", @@ -915,13 +788,6 @@ "original_lang_code": "kaz", "script": "Cyrl", "class_name": "StanzaTokenizer" - }, - "Latn": { - "full_object": "SpaCyTokenizer(\"tr\")", - "original_lang_name": "turkish", - "original_lang_code": "tur", - "script": "Latn", - "class_name": "SpaCyTokenizer" } }, "node_i": "10599", @@ -930,14 +796,17 @@ }, { "name": "Uralian", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bashkort", + "depth": 3, "iso_1_code": "ba", "iso_3_code": "bak", "children": [], + "family": "Turkic", "tokenizers": { "Cyrl": { "full_object": "SpaCyTokenizer(\"tt\")", @@ -955,9 +824,11 @@ }, { "name": "Chulym", + "depth": 3, "iso_1_code": null, "iso_3_code": "clw", "children": [], + "family": "Turkic", "tokenizers": {}, "node_i": "10606", "native_tokenizers": [], @@ -965,9 +836,11 @@ }, { "name": "Siberian Tatar", + "depth": 3, "iso_1_code": null, "iso_3_code": "sty", "children": [], + "family": "Turkic", "tokenizers": {}, "node_i": "10607", "native_tokenizers": [], @@ -975,9 +848,11 @@ }, { "name": "Tatar", + "depth": 3, "iso_1_code": "tt", "iso_3_code": "tat", "children": [], + "family": "Turkic", "tokenizers": { "Cyrl": { "full_object": "SpaCyTokenizer(\"tt\")", @@ -985,13 +860,6 @@ "original_lang_code": "tat", "script": "Cyrl", "class_name": "SpaCyTokenizer" - }, - "Latn": { - "full_object": "SpaCyTokenizer(\"tr\")", - "original_lang_name": "turkish", - "original_lang_code": "tur", - "script": "Latn", - "class_name": "SpaCyTokenizer" } }, "node_i": "10608", @@ -1004,6 +872,7 @@ ] } ], + "family": "Turkic", "tokenizers": { "Cyrl": { "full_object": "SpaCyTokenizer(\"tt\")", @@ -1011,13 +880,6 @@ "original_lang_code": "tat", "script": "Cyrl", "class_name": "SpaCyTokenizer" - }, - "Latn": { - "full_object": "SpaCyTokenizer(\"tr\")", - "original_lang_name": "turkish", - "original_lang_code": "tur", - "script": "Latn", - "class_name": "SpaCyTokenizer" } }, "node_i": "10604", @@ -1025,6 +887,7 @@ "scripts": [] } ], + "family": "Turkic", "tokenizers": { "Cyrl": { "full_object": "StanzaTokenizer(\"kk\")", @@ -1032,13 +895,6 @@ "original_lang_code": "kaz", "script": "Cyrl", "class_name": "StanzaTokenizer" - }, - "Latn": { - "full_object": "SpaCyTokenizer(\"tr\")", - "original_lang_name": "turkish", - "original_lang_code": "tur", - "script": "Latn", - "class_name": "SpaCyTokenizer" } }, "node_i": "10592", @@ -1046,29 +902,8 @@ "scripts": [] } ], - "tokenizers": { - "Arab": { - "full_object": "StanzaTokenizer(\"ug\")", - "original_lang_name": "uyghur", - "original_lang_code": "uig", - "script": "Arab", - "class_name": "StanzaTokenizer" - }, - "Latn": { - "full_object": "SpaCyTokenizer(\"tr\")", - "original_lang_name": "turkish", - "original_lang_code": "tur", - "script": "Latn", - "class_name": "SpaCyTokenizer" - }, - "Cyrl": { - "full_object": "StanzaTokenizer(\"kk\")", - "original_lang_name": "kazakh", - "original_lang_code": "kaz", - "script": "Cyrl", - "class_name": "StanzaTokenizer" - } - }, + "family": "Turkic", + "tokenizers": {}, "node_i": "10556", "native_tokenizers": [], "scripts": [] diff --git a/data/Tuu.json b/data/Tuu.json index 90e587f119dbec61e7eb7b8dabb530ba47f57a45..8c12b15c6b766bf3c056816ce83fac547197df31 100644 --- a/data/Tuu.json +++ b/data/Tuu.json @@ -1,18 +1,22 @@ { "name": "Tuu", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "!Ui", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "\u2021Ungkue", + "depth": 2, "iso_1_code": null, "iso_3_code": "gku", "children": [], + "family": "Tuu", "tokenizers": {}, "node_i": "10611", "native_tokenizers": [], @@ -20,9 +24,11 @@ }, { "name": "Seroa", + "depth": 2, "iso_1_code": null, "iso_3_code": "kqu", "children": [], + "family": "Tuu", "tokenizers": {}, "node_i": "10612", "native_tokenizers": [], @@ -30,9 +36,11 @@ }, { "name": "N\u01c1ng", + "depth": 2, "iso_1_code": null, "iso_3_code": "ngh", "children": [], + "family": "Tuu", "tokenizers": {}, "node_i": "10613", "native_tokenizers": [], @@ -40,9 +48,11 @@ }, { "name": "\u01c0Xam", + "depth": 2, "iso_1_code": null, "iso_3_code": "xam", "children": [], + "family": "Tuu", "tokenizers": {}, "node_i": "10614", "native_tokenizers": [], @@ -50,15 +60,18 @@ }, { "name": "\u01c1Xegwi", + "depth": 2, "iso_1_code": null, "iso_3_code": "xeg", "children": [], + "family": "Tuu", "tokenizers": {}, "node_i": "10615", "native_tokenizers": [], "scripts": [] } ], + "family": "Tuu", "tokenizers": {}, "node_i": "10610", "native_tokenizers": [], @@ -66,14 +79,17 @@ }, { "name": "Taa-Lower Nossob", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Taa", + "depth": 2, "iso_1_code": null, "iso_3_code": "nmn", "children": [], + "family": "Tuu", "tokenizers": {}, "node_i": "10617", "native_tokenizers": [], @@ -81,21 +97,25 @@ }, { "name": "Lower Nossob", + "depth": 2, "iso_1_code": null, "iso_3_code": "nsb", "children": [], + "family": "Tuu", "tokenizers": {}, "node_i": "10618", "native_tokenizers": [], "scripts": [] } ], + "family": "Tuu", "tokenizers": {}, "node_i": "10616", "native_tokenizers": [], "scripts": [] } ], + "family": "Tuu", "tokenizers": {}, "node_i": "10609", "native_tokenizers": [], diff --git a/data/Unclassified.json b/data/Unclassified.json index 0f646144a0ed18dfdff786398c0b0f9fd6497834..9662c15b274e85e6dc5b727ed6bf8f5628014cba 100644 --- a/data/Unclassified.json +++ b/data/Unclassified.json @@ -1,13 +1,16 @@ { "name": "Unclassified", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Alsea", + "depth": 1, "iso_1_code": null, "iso_3_code": "aes", "children": [], + "family": "Unclassified", "tokenizers": {}, "node_i": "10620", "native_tokenizers": [], @@ -15,9 +18,11 @@ }, { "name": "Aguano", + "depth": 1, "iso_1_code": null, "iso_3_code": "aga", "children": [], + "family": "Unclassified", "tokenizers": {}, "node_i": "10621", "native_tokenizers": [], @@ -25,9 +30,11 @@ }, { "name": "Awishira", + "depth": 1, "iso_1_code": null, "iso_3_code": "ash", "children": [], + "family": "Unclassified", "tokenizers": {}, "node_i": "10622", "native_tokenizers": [], @@ -35,9 +42,11 @@ }, { "name": "Agavotaguerra", + "depth": 1, "iso_1_code": null, "iso_3_code": "avo", "children": [], + "family": "Unclassified", "tokenizers": {}, "node_i": "10623", "native_tokenizers": [], @@ -45,9 +54,11 @@ }, { "name": "Ar\u00e1ra, Mato Grosso", + "depth": 1, "iso_1_code": null, "iso_3_code": "axg", "children": [], + "family": "Unclassified", "tokenizers": {}, "node_i": "10624", "native_tokenizers": [], @@ -55,9 +66,11 @@ }, { "name": "Bung", + "depth": 1, "iso_1_code": null, "iso_3_code": "bqd", "children": [], + "family": "Unclassified", "tokenizers": {}, "node_i": "10625", "native_tokenizers": [], @@ -65,9 +78,11 @@ }, { "name": "Beothuk", + "depth": 1, "iso_1_code": null, "iso_3_code": "bue", "children": [], + "family": "Unclassified", "tokenizers": {}, "node_i": "10626", "native_tokenizers": [], @@ -75,9 +90,11 @@ }, { "name": "Carabayo", + "depth": 1, "iso_1_code": null, "iso_3_code": "cby", "children": [], + "family": "Unclassified", "tokenizers": {}, "node_i": "10627", "native_tokenizers": [], @@ -85,9 +102,11 @@ }, { "name": "Doso", + "depth": 1, "iso_1_code": null, "iso_3_code": "dol", "children": [], + "family": "Unclassified", "tokenizers": {}, "node_i": "10628", "native_tokenizers": [], @@ -95,9 +114,11 @@ }, { "name": "Gail", + "depth": 1, "iso_1_code": null, "iso_3_code": "gic", "children": [], + "family": "Unclassified", "tokenizers": {}, "node_i": "10629", "native_tokenizers": [], @@ -105,9 +126,11 @@ }, { "name": "Himarim\u00e3", + "depth": 1, "iso_1_code": null, "iso_3_code": "hir", "children": [], + "family": "Unclassified", "tokenizers": {}, "node_i": "10630", "native_tokenizers": [], @@ -115,9 +138,11 @@ }, { "name": "Haitian Vodoun Culture Language", + "depth": 1, "iso_1_code": null, "iso_3_code": "hvc", "children": [], + "family": "Unclassified", "tokenizers": {}, "node_i": "10631", "native_tokenizers": [], @@ -125,9 +150,11 @@ }, { "name": "Kara", + "depth": 1, "iso_1_code": null, "iso_3_code": "kah", "children": [], + "family": "Unclassified", "tokenizers": {}, "node_i": "10632", "native_tokenizers": [], @@ -135,9 +162,11 @@ }, { "name": "Lufu", + "depth": 1, "iso_1_code": null, "iso_3_code": "ldq", "children": [], + "family": "Unclassified", "tokenizers": {}, "node_i": "10633", "native_tokenizers": [], @@ -145,9 +174,11 @@ }, { "name": "Lepki", + "depth": 1, "iso_1_code": null, "iso_3_code": "lpe", "children": [], + "family": "Unclassified", "tokenizers": {}, "node_i": "10634", "native_tokenizers": [], @@ -155,9 +186,11 @@ }, { "name": "Kasabe", + "depth": 1, "iso_1_code": null, "iso_3_code": "luw", "children": [], + "family": "Unclassified", "tokenizers": {}, "node_i": "10635", "native_tokenizers": [], @@ -165,9 +198,11 @@ }, { "name": "Majhwar", + "depth": 1, "iso_1_code": null, "iso_3_code": "mmj", "children": [], + "family": "Unclassified", "tokenizers": {}, "node_i": "10636", "native_tokenizers": [], @@ -175,9 +210,11 @@ }, { "name": "Mangue", + "depth": 1, "iso_1_code": null, "iso_3_code": "mom", "children": [], + "family": "Unclassified", "tokenizers": {}, "node_i": "10637", "native_tokenizers": [], @@ -185,9 +222,11 @@ }, { "name": "Molof", + "depth": 1, "iso_1_code": null, "iso_3_code": "msl", "children": [], + "family": "Unclassified", "tokenizers": {}, "node_i": "10638", "native_tokenizers": [], @@ -195,9 +234,11 @@ }, { "name": "Namla", + "depth": 1, "iso_1_code": null, "iso_3_code": "naa", "children": [], + "family": "Unclassified", "tokenizers": {}, "node_i": "10639", "native_tokenizers": [], @@ -205,9 +246,11 @@ }, { "name": "Pankarar\u00e9", + "depth": 1, "iso_1_code": null, "iso_3_code": "pax", "children": [], + "family": "Unclassified", "tokenizers": {}, "node_i": "10640", "native_tokenizers": [], @@ -215,9 +258,11 @@ }, { "name": "Pijao", + "depth": 1, "iso_1_code": null, "iso_3_code": "pij", "children": [], + "family": "Unclassified", "tokenizers": {}, "node_i": "10641", "native_tokenizers": [], @@ -225,9 +270,11 @@ }, { "name": "Polari", + "depth": 1, "iso_1_code": null, "iso_3_code": "pld", "children": [], + "family": "Unclassified", "tokenizers": {}, "node_i": "10642", "native_tokenizers": [], @@ -235,9 +282,11 @@ }, { "name": "Mercheros", + "depth": 1, "iso_1_code": null, "iso_3_code": "quq", "children": [], + "family": "Unclassified", "tokenizers": {}, "node_i": "10643", "native_tokenizers": [], @@ -245,9 +294,11 @@ }, { "name": "Rer Bare", + "depth": 1, "iso_1_code": null, "iso_3_code": "rer", "children": [], + "family": "Unclassified", "tokenizers": {}, "node_i": "10644", "native_tokenizers": [], @@ -255,9 +306,11 @@ }, { "name": "Murkim", + "depth": 1, "iso_1_code": null, "iso_3_code": "rmh", "children": [], + "family": "Unclassified", "tokenizers": {}, "node_i": "10645", "native_tokenizers": [], @@ -265,9 +318,11 @@ }, { "name": "Shabo", + "depth": 1, "iso_1_code": null, "iso_3_code": "sbf", "children": [], + "family": "Unclassified", "tokenizers": {}, "node_i": "10646", "native_tokenizers": [], @@ -275,9 +330,11 @@ }, { "name": "Kimki", + "depth": 1, "iso_1_code": null, "iso_3_code": "sbt", "children": [], + "family": "Unclassified", "tokenizers": {}, "node_i": "10647", "native_tokenizers": [], @@ -285,9 +342,11 @@ }, { "name": "Shanenawa", + "depth": 1, "iso_1_code": null, "iso_3_code": "swo", "children": [], + "family": "Unclassified", "tokenizers": {}, "node_i": "10648", "native_tokenizers": [], @@ -295,9 +354,11 @@ }, { "name": "Tingui-Boto", + "depth": 1, "iso_1_code": null, "iso_3_code": "tgv", "children": [], + "family": "Unclassified", "tokenizers": {}, "node_i": "10649", "native_tokenizers": [], @@ -305,9 +366,11 @@ }, { "name": "Truk\u00e1", + "depth": 1, "iso_1_code": null, "iso_3_code": "tka", "children": [], + "family": "Unclassified", "tokenizers": {}, "node_i": "10650", "native_tokenizers": [], @@ -315,9 +378,11 @@ }, { "name": "Takelma", + "depth": 1, "iso_1_code": null, "iso_3_code": "tkm", "children": [], + "family": "Unclassified", "tokenizers": {}, "node_i": "10651", "native_tokenizers": [], @@ -325,9 +390,11 @@ }, { "name": "Tofanma", + "depth": 1, "iso_1_code": null, "iso_3_code": "tlg", "children": [], + "family": "Unclassified", "tokenizers": {}, "node_i": "10652", "native_tokenizers": [], @@ -335,9 +402,11 @@ }, { "name": "Trememb\u00e9", + "depth": 1, "iso_1_code": null, "iso_3_code": "tme", "children": [], + "family": "Unclassified", "tokenizers": {}, "node_i": "10653", "native_tokenizers": [], @@ -345,9 +414,11 @@ }, { "name": "Traveller Scottish", + "depth": 1, "iso_1_code": null, "iso_3_code": "trl", "children": [], + "family": "Unclassified", "tokenizers": {}, "node_i": "10654", "native_tokenizers": [], @@ -355,9 +426,11 @@ }, { "name": "Lule", + "depth": 1, "iso_1_code": null, "iso_3_code": "ule", "children": [], + "family": "Unclassified", "tokenizers": {}, "node_i": "10655", "native_tokenizers": [], @@ -365,9 +438,11 @@ }, { "name": "Usku", + "depth": 1, "iso_1_code": null, "iso_3_code": "ulf", "children": [], + "family": "Unclassified", "tokenizers": {}, "node_i": "10656", "native_tokenizers": [], @@ -375,9 +450,11 @@ }, { "name": "Kujarge", + "depth": 1, "iso_1_code": null, "iso_3_code": "vkj", "children": [], + "family": "Unclassified", "tokenizers": {}, "node_i": "10657", "native_tokenizers": [], @@ -385,9 +462,11 @@ }, { "name": "Wakon\u00e1", + "depth": 1, "iso_1_code": null, "iso_3_code": "waf", "children": [], + "family": "Unclassified", "tokenizers": {}, "node_i": "10658", "native_tokenizers": [], @@ -395,9 +474,11 @@ }, { "name": "Weyto", + "depth": 1, "iso_1_code": null, "iso_3_code": "woy", "children": [], + "family": "Unclassified", "tokenizers": {}, "node_i": "10659", "native_tokenizers": [], @@ -405,9 +486,11 @@ }, { "name": "Wasu", + "depth": 1, "iso_1_code": null, "iso_3_code": "wsu", "children": [], + "family": "Unclassified", "tokenizers": {}, "node_i": "10660", "native_tokenizers": [], @@ -415,9 +498,11 @@ }, { "name": "Waxianghua", + "depth": 1, "iso_1_code": null, "iso_3_code": "wxa", "children": [], + "family": "Unclassified", "tokenizers": {}, "node_i": "10661", "native_tokenizers": [], @@ -425,9 +510,11 @@ }, { "name": "Adai", + "depth": 1, "iso_1_code": null, "iso_3_code": "xad", "children": [], + "family": "Unclassified", "tokenizers": {}, "node_i": "10662", "native_tokenizers": [], @@ -435,9 +522,11 @@ }, { "name": "Kaimb\u00e9", + "depth": 1, "iso_1_code": null, "iso_3_code": "xai", "children": [], + "family": "Unclassified", "tokenizers": {}, "node_i": "10663", "native_tokenizers": [], @@ -445,9 +534,11 @@ }, { "name": "Kenaboi", + "depth": 1, "iso_1_code": null, "iso_3_code": "xbn", "children": [], + "family": "Unclassified", "tokenizers": {}, "node_i": "10664", "native_tokenizers": [], @@ -455,9 +546,11 @@ }, { "name": "Kambiw\u00e1", + "depth": 1, "iso_1_code": null, "iso_3_code": "xbw", "children": [], + "family": "Unclassified", "tokenizers": {}, "node_i": "10665", "native_tokenizers": [], @@ -465,9 +558,11 @@ }, { "name": "Kembra", + "depth": 1, "iso_1_code": null, "iso_3_code": "xkw", "children": [], + "family": "Unclassified", "tokenizers": {}, "node_i": "10666", "native_tokenizers": [], @@ -475,9 +570,11 @@ }, { "name": "Kapinaw\u00e1", + "depth": 1, "iso_1_code": null, "iso_3_code": "xpn", "children": [], + "family": "Unclassified", "tokenizers": {}, "node_i": "10667", "native_tokenizers": [], @@ -485,9 +582,11 @@ }, { "name": "Aranama-Tamique", + "depth": 1, "iso_1_code": null, "iso_3_code": "xrt", "children": [], + "family": "Unclassified", "tokenizers": {}, "node_i": "10668", "native_tokenizers": [], @@ -495,9 +594,11 @@ }, { "name": "Solano", + "depth": 1, "iso_1_code": null, "iso_3_code": "xso", "children": [], + "family": "Unclassified", "tokenizers": {}, "node_i": "10669", "native_tokenizers": [], @@ -505,9 +606,11 @@ }, { "name": "Yitha Yitha", + "depth": 1, "iso_1_code": null, "iso_3_code": "xth", "children": [], + "family": "Unclassified", "tokenizers": {}, "node_i": "10670", "native_tokenizers": [], @@ -515,9 +618,11 @@ }, { "name": "Tambora", + "depth": 1, "iso_1_code": null, "iso_3_code": "xxt", "children": [], + "family": "Unclassified", "tokenizers": {}, "node_i": "10671", "native_tokenizers": [], @@ -525,9 +630,11 @@ }, { "name": "Pum\u00e9", + "depth": 1, "iso_1_code": null, "iso_3_code": "yae", "children": [], + "family": "Unclassified", "tokenizers": {}, "node_i": "10672", "native_tokenizers": [], @@ -535,9 +642,11 @@ }, { "name": "Yeni", + "depth": 1, "iso_1_code": null, "iso_3_code": "yei", "children": [], + "family": "Unclassified", "tokenizers": {}, "node_i": "10673", "native_tokenizers": [], @@ -545,15 +654,18 @@ }, { "name": "Yetfa", + "depth": 1, "iso_1_code": null, "iso_3_code": "yet", "children": [], + "family": "Unclassified", "tokenizers": {}, "node_i": "10674", "native_tokenizers": [], "scripts": [] } ], + "family": "Unclassified", "tokenizers": {}, "node_i": "10619", "native_tokenizers": [], diff --git a/data/Uralic.json b/data/Uralic.json index 8cbe443fef5b748015446586ae7943cb8dc38d47..05773fca469d2f76304a05eab1e7e2f6195fe219 100644 --- a/data/Uralic.json +++ b/data/Uralic.json @@ -1,13 +1,16 @@ { "name": "Uralic", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Hungarian", + "depth": 1, "iso_1_code": "hu", "iso_3_code": "hun", "children": [], + "family": "Uralic", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"hu\")", @@ -27,18 +30,12 @@ }, { "name": "Khanty", + "depth": 1, "iso_1_code": null, "iso_3_code": "kca", "children": [], - "tokenizers": { - "Cyrl": { - "full_object": "StanzaTokenizer(\"myv\")", - "original_lang_name": "erzya", - "original_lang_code": "myv", - "script": "Cyrl", - "class_name": "StanzaTokenizer" - } - }, + "family": "Uralic", + "tokenizers": {}, "node_i": "10677", "native_tokenizers": [], "scripts": [ @@ -47,18 +44,12 @@ }, { "name": "Mansi", + "depth": 1, "iso_1_code": null, "iso_3_code": "mns", "children": [], - "tokenizers": { - "Cyrl": { - "full_object": "StanzaTokenizer(\"myv\")", - "original_lang_name": "erzya", - "original_lang_code": "myv", - "script": "Cyrl", - "class_name": "StanzaTokenizer" - } - }, + "family": "Uralic", + "tokenizers": {}, "node_i": "10678", "native_tokenizers": [], "scripts": [ @@ -67,14 +58,17 @@ }, { "name": "Finnic", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Estonian, Standard", + "depth": 2, "iso_1_code": "et", "iso_3_code": "ekk", "children": [], + "family": "Uralic", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"et\")", @@ -94,9 +88,11 @@ }, { "name": "Finnish", + "depth": 2, "iso_1_code": "fi", "iso_3_code": "fin", "children": [], + "family": "Uralic", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"fi\")", @@ -116,9 +112,11 @@ }, { "name": "Me\u00e4nkieli", + "depth": 2, "iso_1_code": null, "iso_3_code": "fit", "children": [], + "family": "Uralic", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"fi\")", @@ -136,9 +134,11 @@ }, { "name": "Finnish, Kven", + "depth": 2, "iso_1_code": null, "iso_3_code": "fkv", "children": [], + "family": "Uralic", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"fi\")", @@ -156,9 +156,11 @@ }, { "name": "Ingrian", + "depth": 2, "iso_1_code": null, "iso_3_code": "izh", "children": [], + "family": "Uralic", "tokenizers": {}, "node_i": "10684", "native_tokenizers": [], @@ -166,9 +168,11 @@ }, { "name": "Karelian", + "depth": 2, "iso_1_code": null, "iso_3_code": "krl", "children": [], + "family": "Uralic", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"fi\")", @@ -186,9 +190,11 @@ }, { "name": "Liv", + "depth": 2, "iso_1_code": null, "iso_3_code": "liv", "children": [], + "family": "Uralic", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"fi\")", @@ -206,9 +212,11 @@ }, { "name": "Ludian", + "depth": 2, "iso_1_code": null, "iso_3_code": "lud", "children": [], + "family": "Uralic", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"fi\")", @@ -226,9 +234,11 @@ }, { "name": "Livvi-Karelian", + "depth": 2, "iso_1_code": null, "iso_3_code": "olo", "children": [], + "family": "Uralic", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"fi\")", @@ -246,9 +256,11 @@ }, { "name": "Veps", + "depth": 2, "iso_1_code": null, "iso_3_code": "vep", "children": [], + "family": "Uralic", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"fi\")", @@ -266,9 +278,11 @@ }, { "name": "Vod", + "depth": 2, "iso_1_code": null, "iso_3_code": "vot", "children": [], + "family": "Uralic", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"fi\")", @@ -286,9 +300,11 @@ }, { "name": "V\u00f5ro", + "depth": 2, "iso_1_code": "et", "iso_3_code": "vro", "children": [], + "family": "Uralic", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"et\")", @@ -308,15 +324,18 @@ }, { "name": "Krevinian", + "depth": 2, "iso_1_code": null, "iso_3_code": "zkv", "children": [], + "family": "Uralic", "tokenizers": {}, "node_i": "10692", "native_tokenizers": [], "scripts": [] } ], + "family": "Uralic", "tokenizers": { "Latn": { "full_object": "SpaCyTokenizer(\"fi\")", @@ -332,23 +351,18 @@ }, { "name": "Mari", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mari, Meadow", + "depth": 2, "iso_1_code": null, "iso_3_code": "mhr", "children": [], - "tokenizers": { - "Cyrl": { - "full_object": "StanzaTokenizer(\"myv\")", - "original_lang_name": "erzya", - "original_lang_code": "myv", - "script": "Cyrl", - "class_name": "StanzaTokenizer" - } - }, + "family": "Uralic", + "tokenizers": {}, "node_i": "10694", "native_tokenizers": [], "scripts": [ @@ -357,18 +371,12 @@ }, { "name": "Mari, Hill", + "depth": 2, "iso_1_code": null, "iso_3_code": "mrj", "children": [], - "tokenizers": { - "Cyrl": { - "full_object": "StanzaTokenizer(\"myv\")", - "original_lang_name": "erzya", - "original_lang_code": "myv", - "script": "Cyrl", - "class_name": "StanzaTokenizer" - } - }, + "family": "Uralic", + "tokenizers": {}, "node_i": "10695", "native_tokenizers": [], "scripts": [ @@ -376,29 +384,25 @@ ] } ], - "tokenizers": { - "Cyrl": { - "full_object": "StanzaTokenizer(\"myv\")", - "original_lang_name": "erzya", - "original_lang_code": "myv", - "script": "Cyrl", - "class_name": "StanzaTokenizer" - } - }, + "family": "Uralic", + "tokenizers": {}, "node_i": "10693", "native_tokenizers": [], "scripts": [] }, { "name": "Mordvin", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Moksha", + "depth": 2, "iso_1_code": null, "iso_3_code": "mdf", "children": [], + "family": "Uralic", "tokenizers": { "Cyrl": { "full_object": "StanzaTokenizer(\"myv\")", @@ -416,9 +420,11 @@ }, { "name": "Erzya", + "depth": 2, "iso_1_code": null, "iso_3_code": "myv", "children": [], + "family": "Uralic", "tokenizers": { "Cyrl": { "full_object": "StanzaTokenizer(\"myv\")", @@ -437,6 +443,7 @@ ] } ], + "family": "Uralic", "tokenizers": { "Cyrl": { "full_object": "StanzaTokenizer(\"myv\")", @@ -452,23 +459,18 @@ }, { "name": "Permian", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Udmurt", + "depth": 2, "iso_1_code": null, "iso_3_code": "udm", "children": [], - "tokenizers": { - "Cyrl": { - "full_object": "StanzaTokenizer(\"myv\")", - "original_lang_name": "erzya", - "original_lang_code": "myv", - "script": "Cyrl", - "class_name": "StanzaTokenizer" - } - }, + "family": "Uralic", + "tokenizers": {}, "node_i": "10700", "native_tokenizers": [], "scripts": [ @@ -477,23 +479,18 @@ }, { "name": "Komi", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Komi-Permyak", + "depth": 3, "iso_1_code": "kv", "iso_3_code": "koi", "children": [], - "tokenizers": { - "Cyrl": { - "full_object": "StanzaTokenizer(\"myv\")", - "original_lang_name": "erzya", - "original_lang_code": "myv", - "script": "Cyrl", - "class_name": "StanzaTokenizer" - } - }, + "family": "Uralic", + "tokenizers": {}, "node_i": "10702", "native_tokenizers": [], "scripts": [ @@ -502,18 +499,12 @@ }, { "name": "Komi-Zyrian", + "depth": 3, "iso_1_code": "kv", "iso_3_code": "kpv", "children": [], - "tokenizers": { - "Cyrl": { - "full_object": "StanzaTokenizer(\"myv\")", - "original_lang_name": "erzya", - "original_lang_code": "myv", - "script": "Cyrl", - "class_name": "StanzaTokenizer" - } - }, + "family": "Uralic", + "tokenizers": {}, "node_i": "10703", "native_tokenizers": [], "scripts": [ @@ -521,48 +512,38 @@ ] } ], - "tokenizers": { - "Cyrl": { - "full_object": "StanzaTokenizer(\"myv\")", - "original_lang_name": "erzya", - "original_lang_code": "myv", - "script": "Cyrl", - "class_name": "StanzaTokenizer" - } - }, + "family": "Uralic", + "tokenizers": {}, "node_i": "10701", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Cyrl": { - "full_object": "StanzaTokenizer(\"myv\")", - "original_lang_name": "erzya", - "original_lang_code": "myv", - "script": "Cyrl", - "class_name": "StanzaTokenizer" - } - }, + "family": "Uralic", + "tokenizers": {}, "node_i": "10699", "native_tokenizers": [], "scripts": [] }, { "name": "Sami", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Eastern", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Saami, Akkala", + "depth": 3, "iso_1_code": null, "iso_3_code": "sia", "children": [], + "family": "Uralic", "tokenizers": {}, "node_i": "10706", "native_tokenizers": [], @@ -570,9 +551,11 @@ }, { "name": "Saami, Kildin", + "depth": 3, "iso_1_code": null, "iso_3_code": "sjd", "children": [], + "family": "Uralic", "tokenizers": {}, "node_i": "10707", "native_tokenizers": [], @@ -580,9 +563,11 @@ }, { "name": "Saami, Kemi", + "depth": 3, "iso_1_code": null, "iso_3_code": "sjk", "children": [], + "family": "Uralic", "tokenizers": {}, "node_i": "10708", "native_tokenizers": [], @@ -590,9 +575,11 @@ }, { "name": "Saami, Ter", + "depth": 3, "iso_1_code": null, "iso_3_code": "sjt", "children": [], + "family": "Uralic", "tokenizers": {}, "node_i": "10709", "native_tokenizers": [], @@ -600,9 +587,11 @@ }, { "name": "Saami, Inari", + "depth": 3, "iso_1_code": null, "iso_3_code": "smn", "children": [], + "family": "Uralic", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"se\")", @@ -620,9 +609,11 @@ }, { "name": "Saami, Skolt", + "depth": 3, "iso_1_code": null, "iso_3_code": "sms", "children": [], + "family": "Uralic", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"se\")", @@ -639,6 +630,7 @@ ] } ], + "family": "Uralic", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"se\")", @@ -654,14 +646,17 @@ }, { "name": "Southern", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Saami, Ume", + "depth": 3, "iso_1_code": null, "iso_3_code": "sju", "children": [], + "family": "Uralic", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"se\")", @@ -678,6 +673,7 @@ ] } ], + "family": "Uralic", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"se\")", @@ -693,19 +689,23 @@ }, { "name": "Western", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Northern", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Saami, Pite", + "depth": 4, "iso_1_code": null, "iso_3_code": "sje", "children": [], + "family": "Uralic", "tokenizers": {}, "node_i": "10716", "native_tokenizers": [], @@ -713,9 +713,11 @@ }, { "name": "Saami, North", + "depth": 4, "iso_1_code": "se", "iso_3_code": "sme", "children": [], + "family": "Uralic", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"se\")", @@ -735,9 +737,11 @@ }, { "name": "Saami, Lule", + "depth": 4, "iso_1_code": null, "iso_3_code": "smj", "children": [], + "family": "Uralic", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"se\")", @@ -754,6 +758,7 @@ ] } ], + "family": "Uralic", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"se\")", @@ -769,14 +774,17 @@ }, { "name": "Southern", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Saami, South", + "depth": 4, "iso_1_code": null, "iso_3_code": "sma", "children": [], + "family": "Uralic", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"se\")", @@ -793,6 +801,7 @@ ] } ], + "family": "Uralic", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"se\")", @@ -807,6 +816,7 @@ "scripts": [] } ], + "family": "Uralic", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"se\")", @@ -821,6 +831,7 @@ "scripts": [] } ], + "family": "Uralic", "tokenizers": { "Latn": { "full_object": "StanzaTokenizer(\"se\")", @@ -836,14 +847,17 @@ }, { "name": "Samoyed", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mator", + "depth": 2, "iso_1_code": null, "iso_3_code": "mtm", "children": [], + "family": "Uralic", "tokenizers": {}, "node_i": "10722", "native_tokenizers": [], @@ -851,23 +865,18 @@ }, { "name": "Northern Samoyed", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nganasan", + "depth": 3, "iso_1_code": null, "iso_3_code": "nio", "children": [], - "tokenizers": { - "Cyrl": { - "full_object": "StanzaTokenizer(\"myv\")", - "original_lang_name": "erzya", - "original_lang_code": "myv", - "script": "Cyrl", - "class_name": "StanzaTokenizer" - } - }, + "family": "Uralic", + "tokenizers": {}, "node_i": "10724", "native_tokenizers": [], "scripts": [ @@ -876,18 +885,12 @@ }, { "name": "Nenets", + "depth": 3, "iso_1_code": null, "iso_3_code": "yrk", "children": [], - "tokenizers": { - "Cyrl": { - "full_object": "StanzaTokenizer(\"myv\")", - "original_lang_name": "erzya", - "original_lang_code": "myv", - "script": "Cyrl", - "class_name": "StanzaTokenizer" - } - }, + "family": "Uralic", + "tokenizers": {}, "node_i": "10725", "native_tokenizers": [], "scripts": [ @@ -896,14 +899,17 @@ }, { "name": "Enets", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Enets, Forest", + "depth": 4, "iso_1_code": null, "iso_3_code": "enf", "children": [], + "family": "Uralic", "tokenizers": {}, "node_i": "10727", "native_tokenizers": [], @@ -911,9 +917,11 @@ }, { "name": "Enets, Tundra", + "depth": 4, "iso_1_code": null, "iso_3_code": "enh", "children": [], + "family": "Uralic", "tokenizers": {}, "node_i": "10728", "native_tokenizers": [], @@ -921,53 +929,44 @@ }, { "name": "Yurats", + "depth": 4, "iso_1_code": null, "iso_3_code": "rts", "children": [], + "family": "Uralic", "tokenizers": {}, "node_i": "10729", "native_tokenizers": [], "scripts": [] } ], + "family": "Uralic", "tokenizers": {}, "node_i": "10726", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Cyrl": { - "full_object": "StanzaTokenizer(\"myv\")", - "original_lang_name": "erzya", - "original_lang_code": "myv", - "script": "Cyrl", - "class_name": "StanzaTokenizer" - } - }, + "family": "Uralic", + "tokenizers": {}, "node_i": "10723", "native_tokenizers": [], "scripts": [] }, { "name": "Southern Samoyed", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Selkup", + "depth": 3, "iso_1_code": null, "iso_3_code": "sel", "children": [], - "tokenizers": { - "Cyrl": { - "full_object": "StanzaTokenizer(\"myv\")", - "original_lang_name": "erzya", - "original_lang_code": "myv", - "script": "Cyrl", - "class_name": "StanzaTokenizer" - } - }, + "family": "Uralic", + "tokenizers": {}, "node_i": "10731", "native_tokenizers": [], "scripts": [ @@ -976,59 +975,33 @@ }, { "name": "Kamas", + "depth": 3, "iso_1_code": null, "iso_3_code": "xas", "children": [], + "family": "Uralic", "tokenizers": {}, "node_i": "10732", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Cyrl": { - "full_object": "StanzaTokenizer(\"myv\")", - "original_lang_name": "erzya", - "original_lang_code": "myv", - "script": "Cyrl", - "class_name": "StanzaTokenizer" - } - }, + "family": "Uralic", + "tokenizers": {}, "node_i": "10730", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Cyrl": { - "full_object": "StanzaTokenizer(\"myv\")", - "original_lang_name": "erzya", - "original_lang_code": "myv", - "script": "Cyrl", - "class_name": "StanzaTokenizer" - } - }, + "family": "Uralic", + "tokenizers": {}, "node_i": "10721", "native_tokenizers": [], "scripts": [] } ], - "tokenizers": { - "Latn": { - "full_object": "SpaCyTokenizer(\"hu\")", - "original_lang_name": "hungarian", - "original_lang_code": "hun", - "script": "Latn", - "class_name": "SpaCyTokenizer" - }, - "Cyrl": { - "full_object": "StanzaTokenizer(\"myv\")", - "original_lang_name": "erzya", - "original_lang_code": "myv", - "script": "Cyrl", - "class_name": "StanzaTokenizer" - } - }, + "family": "Uralic", + "tokenizers": {}, "node_i": "10675", "native_tokenizers": [], "scripts": [] diff --git a/data/Uto-Aztecan.json b/data/Uto-Aztecan.json index 4be899c9ee0c53ad713751ccc12b256f975a318b..ebe511b5fc40458d082dd991b7420edaca91858e 100644 --- a/data/Uto-Aztecan.json +++ b/data/Uto-Aztecan.json @@ -1,18 +1,22 @@ { "name": "Uto-Aztecan", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Northern Uto-Aztecan", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Hopi", + "depth": 2, "iso_1_code": null, "iso_3_code": "hop", "children": [], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10735", "native_tokenizers": [], @@ -22,9 +26,11 @@ }, { "name": "T\u00fcbatulabal", + "depth": 2, "iso_1_code": null, "iso_3_code": "tub", "children": [], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10736", "native_tokenizers": [], @@ -32,19 +38,23 @@ }, { "name": "Numic", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Central", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Comanche", + "depth": 4, "iso_1_code": null, "iso_3_code": "com", "children": [], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10739", "native_tokenizers": [], @@ -52,9 +62,11 @@ }, { "name": "Timbisha", + "depth": 4, "iso_1_code": null, "iso_3_code": "par", "children": [], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10740", "native_tokenizers": [], @@ -62,15 +74,18 @@ }, { "name": "Shoshoni", + "depth": 4, "iso_1_code": null, "iso_3_code": "shh", "children": [], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10741", "native_tokenizers": [], "scripts": [] } ], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10738", "native_tokenizers": [], @@ -78,14 +93,17 @@ }, { "name": "Southern", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ute-Southern Paiute", + "depth": 4, "iso_1_code": null, "iso_3_code": "ute", "children": [], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10743", "native_tokenizers": [], @@ -93,15 +111,18 @@ }, { "name": "Kawaiisu", + "depth": 4, "iso_1_code": null, "iso_3_code": "xaw", "children": [], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10744", "native_tokenizers": [], "scripts": [] } ], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10742", "native_tokenizers": [], @@ -109,14 +130,17 @@ }, { "name": "Western", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mono", + "depth": 4, "iso_1_code": null, "iso_3_code": "mnr", "children": [], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10746", "native_tokenizers": [], @@ -124,9 +148,11 @@ }, { "name": "Paiute, Northern", + "depth": 4, "iso_1_code": null, "iso_3_code": "pao", "children": [], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10747", "native_tokenizers": [], @@ -135,12 +161,14 @@ ] } ], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10745", "native_tokenizers": [], "scripts": [] } ], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10737", "native_tokenizers": [], @@ -148,14 +176,17 @@ }, { "name": "Takic", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Luise\u00f1o", + "depth": 3, "iso_1_code": null, "iso_3_code": "lui", "children": [], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10749", "native_tokenizers": [], @@ -163,9 +194,11 @@ }, { "name": "Serrano", + "depth": 3, "iso_1_code": null, "iso_3_code": "ser", "children": [], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10750", "native_tokenizers": [], @@ -173,9 +206,11 @@ }, { "name": "Gabrielino-Fernande\u00f1o", + "depth": 3, "iso_1_code": null, "iso_3_code": "xgf", "children": [], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10751", "native_tokenizers": [], @@ -183,14 +218,17 @@ }, { "name": "Cahuilla", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Cahuilla", + "depth": 4, "iso_1_code": null, "iso_3_code": "chl", "children": [], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10753", "native_tokenizers": [], @@ -198,27 +236,32 @@ }, { "name": "Cupe\u00f1o", + "depth": 4, "iso_1_code": null, "iso_3_code": "cup", "children": [], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10754", "native_tokenizers": [], "scripts": [] } ], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10752", "native_tokenizers": [], "scripts": [] } ], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10748", "native_tokenizers": [], "scripts": [] } ], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10734", "native_tokenizers": [], @@ -226,19 +269,23 @@ }, { "name": "Southern Uto-Aztecan", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Corachol-Aztecan", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Pochutec", + "depth": 3, "iso_1_code": null, "iso_3_code": "xpo", "children": [], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10757", "native_tokenizers": [], @@ -246,14 +293,17 @@ }, { "name": "Cora-Huichol", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Huichol", + "depth": 4, "iso_1_code": null, "iso_3_code": "hch", "children": [], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10759", "native_tokenizers": [], @@ -263,14 +313,17 @@ }, { "name": "Cora", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Cora, Santa Teresa", + "depth": 5, "iso_1_code": null, "iso_3_code": "cok", "children": [], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10761", "native_tokenizers": [], @@ -280,9 +333,11 @@ }, { "name": "Cora, El Nayar", + "depth": 5, "iso_1_code": null, "iso_3_code": "crn", "children": [], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10762", "native_tokenizers": [], @@ -291,12 +346,14 @@ ] } ], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10760", "native_tokenizers": [], "scripts": [] } ], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10758", "native_tokenizers": [], @@ -304,14 +361,17 @@ }, { "name": "Core Nahua", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nahuat", + "depth": 4, "iso_1_code": null, "iso_3_code": "ppl", "children": [], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10764", "native_tokenizers": [], @@ -319,14 +379,17 @@ }, { "name": "Nahuatl", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nahuatl, Eastern Durango", + "depth": 5, "iso_1_code": null, "iso_3_code": "azd", "children": [], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10766", "native_tokenizers": [], @@ -334,9 +397,11 @@ }, { "name": "Nahuatl, Western Durango", + "depth": 5, "iso_1_code": null, "iso_3_code": "azn", "children": [], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10767", "native_tokenizers": [], @@ -344,9 +409,11 @@ }, { "name": "Nahuatl, Highland Puebla", + "depth": 5, "iso_1_code": null, "iso_3_code": "azz", "children": [], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10768", "native_tokenizers": [], @@ -356,9 +423,11 @@ }, { "name": "Nahuatl, Coatepec", + "depth": 5, "iso_1_code": null, "iso_3_code": "naz", "children": [], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10769", "native_tokenizers": [], @@ -366,9 +435,11 @@ }, { "name": "Nahuatl, Central Huasteca", + "depth": 5, "iso_1_code": null, "iso_3_code": "nch", "children": [], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10770", "native_tokenizers": [], @@ -378,9 +449,11 @@ }, { "name": "Nahuatl, Northern Puebla", + "depth": 5, "iso_1_code": null, "iso_3_code": "ncj", "children": [], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10771", "native_tokenizers": [], @@ -390,9 +463,11 @@ }, { "name": "Nahuatl, Michoac\u00e1n", + "depth": 5, "iso_1_code": null, "iso_3_code": "ncl", "children": [], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10772", "native_tokenizers": [], @@ -402,9 +477,11 @@ }, { "name": "Nahuatl, Central Puebla", + "depth": 5, "iso_1_code": null, "iso_3_code": "ncx", "children": [], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10773", "native_tokenizers": [], @@ -414,9 +491,11 @@ }, { "name": "Nahuatl, Guerrero", + "depth": 5, "iso_1_code": null, "iso_3_code": "ngu", "children": [], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10774", "native_tokenizers": [], @@ -426,9 +505,11 @@ }, { "name": "Nahuatl, Tabasco", + "depth": 5, "iso_1_code": null, "iso_3_code": "nhc", "children": [], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10775", "native_tokenizers": [], @@ -436,9 +517,11 @@ }, { "name": "Nahuatl, Eastern Huasteca", + "depth": 5, "iso_1_code": null, "iso_3_code": "nhe", "children": [], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10776", "native_tokenizers": [], @@ -448,9 +531,11 @@ }, { "name": "Nahuatl, Tetelcingo", + "depth": 5, "iso_1_code": null, "iso_3_code": "nhg", "children": [], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10777", "native_tokenizers": [], @@ -460,9 +545,11 @@ }, { "name": "Nahuatl, Zacatl\u00e1n-Ahuacatl\u00e1n-Tepetzintla", + "depth": 5, "iso_1_code": null, "iso_3_code": "nhi", "children": [], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10778", "native_tokenizers": [], @@ -472,9 +559,11 @@ }, { "name": "Nahuatl, Isthmus-Cosoleacaque", + "depth": 5, "iso_1_code": null, "iso_3_code": "nhk", "children": [], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10779", "native_tokenizers": [], @@ -484,9 +573,11 @@ }, { "name": "Nahuatl, Morelos", + "depth": 5, "iso_1_code": null, "iso_3_code": "nhm", "children": [], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10780", "native_tokenizers": [], @@ -494,9 +585,11 @@ }, { "name": "Nahuatl, Central", + "depth": 5, "iso_1_code": null, "iso_3_code": "nhn", "children": [], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10781", "native_tokenizers": [], @@ -504,9 +597,11 @@ }, { "name": "Nahuatl, Isthmus-Pajapan", + "depth": 5, "iso_1_code": null, "iso_3_code": "nhp", "children": [], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10782", "native_tokenizers": [], @@ -514,9 +609,11 @@ }, { "name": "Nahuatl, Huaxcaleca", + "depth": 5, "iso_1_code": null, "iso_3_code": "nhq", "children": [], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10783", "native_tokenizers": [], @@ -524,9 +621,11 @@ }, { "name": "Nahuatl, Ometepec", + "depth": 5, "iso_1_code": null, "iso_3_code": "nht", "children": [], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10784", "native_tokenizers": [], @@ -534,9 +633,11 @@ }, { "name": "Nahuatl, Temascaltepec", + "depth": 5, "iso_1_code": null, "iso_3_code": "nhv", "children": [], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10785", "native_tokenizers": [], @@ -544,9 +645,11 @@ }, { "name": "Nahuatl, Western Huasteca", + "depth": 5, "iso_1_code": null, "iso_3_code": "nhw", "children": [], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10786", "native_tokenizers": [], @@ -556,9 +659,11 @@ }, { "name": "Nahuatl, Isthmus-Mecayapan", + "depth": 5, "iso_1_code": null, "iso_3_code": "nhx", "children": [], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10787", "native_tokenizers": [], @@ -568,9 +673,11 @@ }, { "name": "Nahuatl, Northern Oaxaca", + "depth": 5, "iso_1_code": null, "iso_3_code": "nhy", "children": [], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10788", "native_tokenizers": [], @@ -580,9 +687,11 @@ }, { "name": "Nahuatl, Santa Mar\u00eda la Alta", + "depth": 5, "iso_1_code": null, "iso_3_code": "nhz", "children": [], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10789", "native_tokenizers": [], @@ -590,9 +699,11 @@ }, { "name": "Nahuatl, Orizaba", + "depth": 5, "iso_1_code": null, "iso_3_code": "nlv", "children": [], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10790", "native_tokenizers": [], @@ -600,9 +711,11 @@ }, { "name": "Nahuatl, Southeastern Puebla", + "depth": 5, "iso_1_code": null, "iso_3_code": "npl", "children": [], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10791", "native_tokenizers": [], @@ -612,9 +725,11 @@ }, { "name": "Nahuatl, Sierra Negra", + "depth": 5, "iso_1_code": null, "iso_3_code": "nsu", "children": [], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10792", "native_tokenizers": [], @@ -624,9 +739,11 @@ }, { "name": "Nahuatl, Tlamacazapa", + "depth": 5, "iso_1_code": null, "iso_3_code": "nuz", "children": [], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10793", "native_tokenizers": [], @@ -635,18 +752,21 @@ ] } ], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10765", "native_tokenizers": [], "scripts": [] } ], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10763", "native_tokenizers": [], "scripts": [] } ], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10756", "native_tokenizers": [], @@ -654,14 +774,17 @@ }, { "name": "Pimic", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tohono O\u2019odham", + "depth": 3, "iso_1_code": null, "iso_3_code": "ood", "children": [], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10795", "native_tokenizers": [], @@ -671,9 +794,11 @@ }, { "name": "Pima Bajo", + "depth": 3, "iso_1_code": null, "iso_3_code": "pia", "children": [], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10796", "native_tokenizers": [], @@ -681,9 +806,11 @@ }, { "name": "Tepecano", + "depth": 3, "iso_1_code": null, "iso_3_code": "tep", "children": [], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10797", "native_tokenizers": [], @@ -691,14 +818,17 @@ }, { "name": "Tepehuan", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tepehuan, Northern", + "depth": 4, "iso_1_code": null, "iso_3_code": "ntp", "children": [], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10799", "native_tokenizers": [], @@ -708,9 +838,11 @@ }, { "name": "Tepehuan, Southeastern", + "depth": 4, "iso_1_code": null, "iso_3_code": "stp", "children": [], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10800", "native_tokenizers": [], @@ -720,21 +852,25 @@ }, { "name": "Tepehuan, Southwestern", + "depth": 4, "iso_1_code": null, "iso_3_code": "tla", "children": [], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10801", "native_tokenizers": [], "scripts": [] } ], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10798", "native_tokenizers": [], "scripts": [] } ], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10794", "native_tokenizers": [], @@ -742,14 +878,17 @@ }, { "name": "Taracahitic", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tubar", + "depth": 3, "iso_1_code": null, "iso_3_code": "tbu", "children": [], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10803", "native_tokenizers": [], @@ -757,14 +896,17 @@ }, { "name": "Cahitan", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Mayo", + "depth": 4, "iso_1_code": null, "iso_3_code": "mfy", "children": [], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10805", "native_tokenizers": [], @@ -774,9 +916,11 @@ }, { "name": "Yaqui", + "depth": 4, "iso_1_code": null, "iso_3_code": "yaq", "children": [], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10806", "native_tokenizers": [], @@ -785,6 +929,7 @@ ] } ], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10804", "native_tokenizers": [], @@ -792,14 +937,17 @@ }, { "name": "Opatan", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Eudeve", + "depth": 4, "iso_1_code": null, "iso_3_code": "eud", "children": [], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10808", "native_tokenizers": [], @@ -807,15 +955,18 @@ }, { "name": "Opata", + "depth": 4, "iso_1_code": null, "iso_3_code": "opt", "children": [], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10809", "native_tokenizers": [], "scripts": [] } ], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10807", "native_tokenizers": [], @@ -823,14 +974,17 @@ }, { "name": "Tarahumaran", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Huarij\u00edo", + "depth": 4, "iso_1_code": null, "iso_3_code": "var", "children": [], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10811", "native_tokenizers": [], @@ -840,14 +994,17 @@ }, { "name": "Tarahumara", + "depth": 4, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tarahumara, Western", + "depth": 5, "iso_1_code": null, "iso_3_code": "tac", "children": [], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10813", "native_tokenizers": [], @@ -857,9 +1014,11 @@ }, { "name": "Tarahumara, Central", + "depth": 5, "iso_1_code": null, "iso_3_code": "tar", "children": [], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10814", "native_tokenizers": [], @@ -869,9 +1028,11 @@ }, { "name": "Tarahumara, Southeastern", + "depth": 5, "iso_1_code": null, "iso_3_code": "tcu", "children": [], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10815", "native_tokenizers": [], @@ -879,9 +1040,11 @@ }, { "name": "Tarahumara, Northern", + "depth": 5, "iso_1_code": null, "iso_3_code": "thh", "children": [], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10816", "native_tokenizers": [], @@ -889,39 +1052,46 @@ }, { "name": "Tarahumara, Southwestern", + "depth": 5, "iso_1_code": null, "iso_3_code": "twr", "children": [], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10817", "native_tokenizers": [], "scripts": [] } ], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10812", "native_tokenizers": [], "scripts": [] } ], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10810", "native_tokenizers": [], "scripts": [] } ], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10802", "native_tokenizers": [], "scripts": [] } ], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10755", "native_tokenizers": [], "scripts": [] } ], + "family": "Uto-Aztecan", "tokenizers": {}, "node_i": "10733", "native_tokenizers": [], diff --git a/data/Wakashan.json b/data/Wakashan.json index e1d3bda8d1c656430d9dad73db77d2d0765e0339..2404c193b69b6d5ce211caa4e9df57565ec2b1eb 100644 --- a/data/Wakashan.json +++ b/data/Wakashan.json @@ -1,18 +1,22 @@ { "name": "Wakashan", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Northern Wakashan", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Haisla", + "depth": 2, "iso_1_code": null, "iso_3_code": "has", "children": [], + "family": "Wakashan", "tokenizers": {}, "node_i": "10820", "native_tokenizers": [], @@ -20,14 +24,17 @@ }, { "name": "Kwakiutlan", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Heiltsuk", + "depth": 3, "iso_1_code": null, "iso_3_code": "hei", "children": [], + "family": "Wakashan", "tokenizers": {}, "node_i": "10822", "native_tokenizers": [], @@ -35,21 +42,25 @@ }, { "name": "Kwakwala", + "depth": 3, "iso_1_code": null, "iso_3_code": "kwk", "children": [], + "family": "Wakashan", "tokenizers": {}, "node_i": "10823", "native_tokenizers": [], "scripts": [] } ], + "family": "Wakashan", "tokenizers": {}, "node_i": "10821", "native_tokenizers": [], "scripts": [] } ], + "family": "Wakashan", "tokenizers": {}, "node_i": "10819", "native_tokenizers": [], @@ -57,14 +68,17 @@ }, { "name": "Southern Wakashan", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ditidaht", + "depth": 2, "iso_1_code": null, "iso_3_code": "dtd", "children": [], + "family": "Wakashan", "tokenizers": {}, "node_i": "10825", "native_tokenizers": [], @@ -72,9 +86,11 @@ }, { "name": "Makah", + "depth": 2, "iso_1_code": null, "iso_3_code": "myh", "children": [], + "family": "Wakashan", "tokenizers": {}, "node_i": "10826", "native_tokenizers": [], @@ -82,21 +98,25 @@ }, { "name": "Nuu-chah-nulth", + "depth": 2, "iso_1_code": null, "iso_3_code": "nuk", "children": [], + "family": "Wakashan", "tokenizers": {}, "node_i": "10827", "native_tokenizers": [], "scripts": [] } ], + "family": "Wakashan", "tokenizers": {}, "node_i": "10824", "native_tokenizers": [], "scripts": [] } ], + "family": "Wakashan", "tokenizers": {}, "node_i": "10818", "native_tokenizers": [], diff --git a/data/West Papuan.json b/data/West Papuan.json index 0907d8f75c42c3b1aceafdf463fe9f11e24716d6..58e3eca9b835de92c0915cdacdddca13cdf4fd77 100644 --- a/data/West Papuan.json +++ b/data/West Papuan.json @@ -1,23 +1,28 @@ { "name": "West Papuan", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "North Halmahera", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Galela-Loloda", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Galela", + "depth": 3, "iso_1_code": null, "iso_3_code": "gbi", "children": [], + "family": "West Papuan", "tokenizers": {}, "node_i": "10831", "native_tokenizers": [], @@ -27,9 +32,11 @@ }, { "name": "Laba", + "depth": 3, "iso_1_code": null, "iso_3_code": "lau", "children": [], + "family": "West Papuan", "tokenizers": {}, "node_i": "10832", "native_tokenizers": [], @@ -37,9 +44,11 @@ }, { "name": "Loloda", + "depth": 3, "iso_1_code": null, "iso_3_code": "loa", "children": [], + "family": "West Papuan", "tokenizers": {}, "node_i": "10833", "native_tokenizers": [], @@ -47,9 +56,11 @@ }, { "name": "Modole", + "depth": 3, "iso_1_code": null, "iso_3_code": "mqo", "children": [], + "family": "West Papuan", "tokenizers": {}, "node_i": "10834", "native_tokenizers": [], @@ -57,9 +68,11 @@ }, { "name": "Pagu", + "depth": 3, "iso_1_code": null, "iso_3_code": "pgu", "children": [], + "family": "West Papuan", "tokenizers": {}, "node_i": "10835", "native_tokenizers": [], @@ -67,9 +80,11 @@ }, { "name": "Tabaru", + "depth": 3, "iso_1_code": null, "iso_3_code": "tby", "children": [], + "family": "West Papuan", "tokenizers": {}, "node_i": "10836", "native_tokenizers": [], @@ -79,9 +94,11 @@ }, { "name": "Tobelo", + "depth": 3, "iso_1_code": null, "iso_3_code": "tlb", "children": [], + "family": "West Papuan", "tokenizers": {}, "node_i": "10837", "native_tokenizers": [], @@ -91,15 +108,18 @@ }, { "name": "Tugutil", + "depth": 3, "iso_1_code": null, "iso_3_code": "tuj", "children": [], + "family": "West Papuan", "tokenizers": {}, "node_i": "10838", "native_tokenizers": [], "scripts": [] } ], + "family": "West Papuan", "tokenizers": {}, "node_i": "10830", "native_tokenizers": [], @@ -107,14 +127,17 @@ }, { "name": "Sahu", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Gamkonora", + "depth": 3, "iso_1_code": null, "iso_3_code": "gak", "children": [], + "family": "West Papuan", "tokenizers": {}, "node_i": "10840", "native_tokenizers": [], @@ -122,9 +145,11 @@ }, { "name": "Ibu", + "depth": 3, "iso_1_code": null, "iso_3_code": "ibu", "children": [], + "family": "West Papuan", "tokenizers": {}, "node_i": "10841", "native_tokenizers": [], @@ -132,9 +157,11 @@ }, { "name": "Kao", + "depth": 3, "iso_1_code": null, "iso_3_code": "kax", "children": [], + "family": "West Papuan", "tokenizers": {}, "node_i": "10842", "native_tokenizers": [], @@ -142,9 +169,11 @@ }, { "name": "Sahu", + "depth": 3, "iso_1_code": null, "iso_3_code": "saj", "children": [], + "family": "West Papuan", "tokenizers": {}, "node_i": "10843", "native_tokenizers": [], @@ -154,15 +183,18 @@ }, { "name": "Waioli", + "depth": 3, "iso_1_code": null, "iso_3_code": "wli", "children": [], + "family": "West Papuan", "tokenizers": {}, "node_i": "10844", "native_tokenizers": [], "scripts": [] } ], + "family": "West Papuan", "tokenizers": {}, "node_i": "10839", "native_tokenizers": [], @@ -170,14 +202,17 @@ }, { "name": "Ternate-Tidore", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ternate", + "depth": 3, "iso_1_code": null, "iso_3_code": "tft", "children": [], + "family": "West Papuan", "tokenizers": {}, "node_i": "10846", "native_tokenizers": [], @@ -185,15 +220,18 @@ }, { "name": "Tidore", + "depth": 3, "iso_1_code": null, "iso_3_code": "tvo", "children": [], + "family": "West Papuan", "tokenizers": {}, "node_i": "10847", "native_tokenizers": [], "scripts": [] } ], + "family": "West Papuan", "tokenizers": {}, "node_i": "10845", "native_tokenizers": [], @@ -201,26 +239,31 @@ }, { "name": "West Makian", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Makian, West", + "depth": 3, "iso_1_code": null, "iso_3_code": "mqs", "children": [], + "family": "West Papuan", "tokenizers": {}, "node_i": "10849", "native_tokenizers": [], "scripts": [] } ], + "family": "West Papuan", "tokenizers": {}, "node_i": "10848", "native_tokenizers": [], "scripts": [] } ], + "family": "West Papuan", "tokenizers": {}, "node_i": "10829", "native_tokenizers": [], @@ -228,14 +271,17 @@ }, { "name": "West Bird\u2019s Head", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Tehit", + "depth": 2, "iso_1_code": null, "iso_3_code": "kps", "children": [], + "family": "West Papuan", "tokenizers": {}, "node_i": "10851", "native_tokenizers": [], @@ -243,9 +289,11 @@ }, { "name": "Kalabra", + "depth": 2, "iso_1_code": null, "iso_3_code": "kzz", "children": [], + "family": "West Papuan", "tokenizers": {}, "node_i": "10852", "native_tokenizers": [], @@ -253,9 +301,11 @@ }, { "name": "Moraid", + "depth": 2, "iso_1_code": null, "iso_3_code": "msg", "children": [], + "family": "West Papuan", "tokenizers": {}, "node_i": "10853", "native_tokenizers": [], @@ -263,9 +313,11 @@ }, { "name": "Moi Kelim", + "depth": 2, "iso_1_code": null, "iso_3_code": "mxn", "children": [], + "family": "West Papuan", "tokenizers": {}, "node_i": "10854", "native_tokenizers": [], @@ -273,15 +325,18 @@ }, { "name": "Moi Lemas", + "depth": 2, "iso_1_code": null, "iso_3_code": "sbg", "children": [], + "family": "West Papuan", "tokenizers": {}, "node_i": "10855", "native_tokenizers": [], "scripts": [] } ], + "family": "West Papuan", "tokenizers": {}, "node_i": "10850", "native_tokenizers": [], @@ -289,14 +344,17 @@ }, { "name": "Yapen", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Saweru", + "depth": 2, "iso_1_code": null, "iso_3_code": "swr", "children": [], + "family": "West Papuan", "tokenizers": {}, "node_i": "10857", "native_tokenizers": [], @@ -304,9 +362,11 @@ }, { "name": "Yawa", + "depth": 2, "iso_1_code": null, "iso_3_code": "yva", "children": [], + "family": "West Papuan", "tokenizers": {}, "node_i": "10858", "native_tokenizers": [], @@ -315,12 +375,14 @@ ] } ], + "family": "West Papuan", "tokenizers": {}, "node_i": "10856", "native_tokenizers": [], "scripts": [] } ], + "family": "West Papuan", "tokenizers": {}, "node_i": "10828", "native_tokenizers": [], diff --git a/data/Wintuan.json b/data/Wintuan.json index 5bcfe5b8d2c5dda343325d821b8393c83750ecb2..38fe1e446516bf8b6279219fdc393b1404388bfb 100644 --- a/data/Wintuan.json +++ b/data/Wintuan.json @@ -1,13 +1,16 @@ { "name": "Wintuan", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nomlaki", + "depth": 1, "iso_1_code": null, "iso_3_code": "nol", "children": [], + "family": "Wintuan", "tokenizers": {}, "node_i": "10860", "native_tokenizers": [], @@ -15,9 +18,11 @@ }, { "name": "Patwin", + "depth": 1, "iso_1_code": null, "iso_3_code": "pwi", "children": [], + "family": "Wintuan", "tokenizers": {}, "node_i": "10861", "native_tokenizers": [], @@ -25,15 +30,18 @@ }, { "name": "Wintu", + "depth": 1, "iso_1_code": null, "iso_3_code": "wnw", "children": [], + "family": "Wintuan", "tokenizers": {}, "node_i": "10862", "native_tokenizers": [], "scripts": [] } ], + "family": "Wintuan", "tokenizers": {}, "node_i": "10859", "native_tokenizers": [], diff --git a/data/Witotoan.json b/data/Witotoan.json index 1cadf8b55db5457e2e6846ec5f8ed3562889117a..c9a171a103391b77cc6777a18ee6359cdbffb5d7 100644 --- a/data/Witotoan.json +++ b/data/Witotoan.json @@ -1,13 +1,16 @@ { "name": "Witotoan", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Nonuya", + "depth": 1, "iso_1_code": null, "iso_3_code": "noj", "children": [], + "family": "Witotoan", "tokenizers": {}, "node_i": "10864", "native_tokenizers": [], @@ -15,14 +18,17 @@ }, { "name": "Proto-Bora-Muinane", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Muinane", + "depth": 2, "iso_1_code": null, "iso_3_code": "bmr", "children": [], + "family": "Witotoan", "tokenizers": {}, "node_i": "10866", "native_tokenizers": [], @@ -32,9 +38,11 @@ }, { "name": "Bora", + "depth": 2, "iso_1_code": null, "iso_3_code": "boa", "children": [], + "family": "Witotoan", "tokenizers": {}, "node_i": "10867", "native_tokenizers": [], @@ -43,6 +51,7 @@ ] } ], + "family": "Witotoan", "tokenizers": {}, "node_i": "10865", "native_tokenizers": [], @@ -50,14 +59,17 @@ }, { "name": "Proto-Huitoto-Ocaina", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ocaina", + "depth": 2, "iso_1_code": null, "iso_3_code": "oca", "children": [], + "family": "Witotoan", "tokenizers": {}, "node_i": "10869", "native_tokenizers": [], @@ -65,14 +77,17 @@ }, { "name": "Early Huitoto", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Witoto, Nipode", + "depth": 3, "iso_1_code": null, "iso_3_code": "hux", "children": [], + "family": "Witotoan", "tokenizers": {}, "node_i": "10871", "native_tokenizers": [], @@ -80,14 +95,17 @@ }, { "name": "Proto-Minica-Murui", + "depth": 3, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Witoto, Minika", + "depth": 4, "iso_1_code": null, "iso_3_code": "hto", "children": [], + "family": "Witotoan", "tokenizers": {}, "node_i": "10873", "native_tokenizers": [], @@ -97,9 +115,11 @@ }, { "name": "Witoto, Murui", + "depth": 4, "iso_1_code": null, "iso_3_code": "huu", "children": [], + "family": "Witotoan", "tokenizers": {}, "node_i": "10874", "native_tokenizers": [], @@ -108,24 +128,28 @@ ] } ], + "family": "Witotoan", "tokenizers": {}, "node_i": "10872", "native_tokenizers": [], "scripts": [] } ], + "family": "Witotoan", "tokenizers": {}, "node_i": "10870", "native_tokenizers": [], "scripts": [] } ], + "family": "Witotoan", "tokenizers": {}, "node_i": "10868", "native_tokenizers": [], "scripts": [] } ], + "family": "Witotoan", "tokenizers": {}, "node_i": "10863", "native_tokenizers": [], diff --git a/data/Yaguan.json b/data/Yaguan.json index 7b7154803a9254f6c54099a863bb8082f161e980..4099bc5c747f32a4c25bdea23ff89fcc3bf9f049 100644 --- a/data/Yaguan.json +++ b/data/Yaguan.json @@ -1,13 +1,16 @@ { "name": "Yaguan", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Yagua", + "depth": 1, "iso_1_code": null, "iso_3_code": "yad", "children": [], + "family": "Yaguan", "tokenizers": {}, "node_i": "10876", "native_tokenizers": [], @@ -17,15 +20,18 @@ }, { "name": "Yameo", + "depth": 1, "iso_1_code": null, "iso_3_code": "yme", "children": [], + "family": "Yaguan", "tokenizers": {}, "node_i": "10877", "native_tokenizers": [], "scripts": [] } ], + "family": "Yaguan", "tokenizers": {}, "node_i": "10875", "native_tokenizers": [], diff --git a/data/Yanomaman.json b/data/Yanomaman.json index a7c9d68592f8073aea510e2cfe5c73c840f33263..7fa35e4005f2a88b5fe8ec86761d139196d5c518 100644 --- a/data/Yanomaman.json +++ b/data/Yanomaman.json @@ -1,13 +1,16 @@ { "name": "Yanomaman", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Yanomam\u00f6", + "depth": 1, "iso_1_code": null, "iso_3_code": "guu", "children": [], + "family": "Yanomaman", "tokenizers": {}, "node_i": "10879", "native_tokenizers": [], @@ -17,9 +20,11 @@ }, { "name": "Ninam", + "depth": 1, "iso_1_code": null, "iso_3_code": "shb", "children": [], + "family": "Yanomaman", "tokenizers": {}, "node_i": "10880", "native_tokenizers": [], @@ -27,9 +32,11 @@ }, { "name": "Yanom\u00e1mi", + "depth": 1, "iso_1_code": null, "iso_3_code": "wca", "children": [], + "family": "Yanomaman", "tokenizers": {}, "node_i": "10881", "native_tokenizers": [], @@ -37,9 +44,11 @@ }, { "name": "Sanum\u00e1", + "depth": 1, "iso_1_code": null, "iso_3_code": "xsu", "children": [], + "family": "Yanomaman", "tokenizers": {}, "node_i": "10882", "native_tokenizers": [], @@ -49,15 +58,18 @@ }, { "name": "Yaroam\u00eb", + "depth": 1, "iso_1_code": null, "iso_3_code": "yro", "children": [], + "family": "Yanomaman", "tokenizers": {}, "node_i": "10883", "native_tokenizers": [], "scripts": [] } ], + "family": "Yanomaman", "tokenizers": {}, "node_i": "10878", "native_tokenizers": [], diff --git a/data/Yele-West New Britain.json b/data/Yele-West New Britain.json index 21dc8cdc7faeb56ad11428f0e337f891481176fb..1b94a577dc5dbc5a2e71d2bad2b02af4054a37fe 100644 --- a/data/Yele-West New Britain.json +++ b/data/Yele-West New Britain.json @@ -1,18 +1,22 @@ { "name": "Yele-West New Britain", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "West New Britain", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Anem", + "depth": 2, "iso_1_code": null, "iso_3_code": "anz", "children": [], + "family": "Yele-West New Britain", "tokenizers": {}, "node_i": "10886", "native_tokenizers": [], @@ -20,9 +24,11 @@ }, { "name": "Pele-Ata", + "depth": 2, "iso_1_code": null, "iso_3_code": "ata", "children": [], + "family": "Yele-West New Britain", "tokenizers": {}, "node_i": "10887", "native_tokenizers": [], @@ -31,6 +37,7 @@ ] } ], + "family": "Yele-West New Britain", "tokenizers": {}, "node_i": "10885", "native_tokenizers": [], @@ -38,14 +45,17 @@ }, { "name": "Yele", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Y\u00e9l\u00ee Dnye", + "depth": 2, "iso_1_code": null, "iso_3_code": "yle", "children": [], + "family": "Yele-West New Britain", "tokenizers": {}, "node_i": "10889", "native_tokenizers": [], @@ -54,12 +64,14 @@ ] } ], + "family": "Yele-West New Britain", "tokenizers": {}, "node_i": "10888", "native_tokenizers": [], "scripts": [] } ], + "family": "Yele-West New Britain", "tokenizers": {}, "node_i": "10884", "native_tokenizers": [], diff --git a/data/Yeniseian.json b/data/Yeniseian.json index f3c5e191d1122e17a7a5c500b952c27acda58aa5..3e7e4b701a76782520d777137a8e393da6e5a12b 100644 --- a/data/Yeniseian.json +++ b/data/Yeniseian.json @@ -1,13 +1,16 @@ { "name": "Yeniseian", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ket", + "depth": 1, "iso_1_code": null, "iso_3_code": "ket", "children": [], + "family": "Yeniseian", "tokenizers": {}, "node_i": "10891", "native_tokenizers": [], @@ -15,9 +18,11 @@ }, { "name": "Pumpokol", + "depth": 1, "iso_1_code": null, "iso_3_code": "xpm", "children": [], + "family": "Yeniseian", "tokenizers": {}, "node_i": "10892", "native_tokenizers": [], @@ -25,9 +30,11 @@ }, { "name": "Arin", + "depth": 1, "iso_1_code": null, "iso_3_code": "xrn", "children": [], + "family": "Yeniseian", "tokenizers": {}, "node_i": "10893", "native_tokenizers": [], @@ -35,9 +42,11 @@ }, { "name": "Yug", + "depth": 1, "iso_1_code": null, "iso_3_code": "yug", "children": [], + "family": "Yeniseian", "tokenizers": {}, "node_i": "10894", "native_tokenizers": [], @@ -45,15 +54,18 @@ }, { "name": "Kott", + "depth": 1, "iso_1_code": null, "iso_3_code": "zko", "children": [], + "family": "Yeniseian", "tokenizers": {}, "node_i": "10895", "native_tokenizers": [], "scripts": [] } ], + "family": "Yeniseian", "tokenizers": {}, "node_i": "10890", "native_tokenizers": [], diff --git a/data/Yokutsan.json b/data/Yokutsan.json index 9f6da8f723efecd96a2dc11dd2111c5d44483d1d..53cb6273c1ca5bb58338ba80549f88ceab3112e2 100644 --- a/data/Yokutsan.json +++ b/data/Yokutsan.json @@ -1,19 +1,23 @@ { "name": "Yokutsan", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Yokuts", + "depth": 1, "iso_1_code": null, "iso_3_code": "yok", "children": [], + "family": "Yokutsan", "tokenizers": {}, "node_i": "10897", "native_tokenizers": [], "scripts": [] } ], + "family": "Yokutsan", "tokenizers": {}, "node_i": "10896", "native_tokenizers": [], diff --git a/data/Yuat.json b/data/Yuat.json index c95e6e4d2766319b9c00b2e80089dd38d5f0f19e..75316de26b42094020485604485245d59c7bb35a 100644 --- a/data/Yuat.json +++ b/data/Yuat.json @@ -1,13 +1,16 @@ { "name": "Yuat", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Bun", + "depth": 1, "iso_1_code": null, "iso_3_code": "buv", "children": [], + "family": "Yuat", "tokenizers": {}, "node_i": "10899", "native_tokenizers": [], @@ -15,9 +18,11 @@ }, { "name": "Biwat", + "depth": 1, "iso_1_code": null, "iso_3_code": "bwm", "children": [], + "family": "Yuat", "tokenizers": {}, "node_i": "10900", "native_tokenizers": [], @@ -25,9 +30,11 @@ }, { "name": "Changriwa", + "depth": 1, "iso_1_code": null, "iso_3_code": "cga", "children": [], + "family": "Yuat", "tokenizers": {}, "node_i": "10901", "native_tokenizers": [], @@ -35,9 +42,11 @@ }, { "name": "Kyenele", + "depth": 1, "iso_1_code": null, "iso_3_code": "kql", "children": [], + "family": "Yuat", "tokenizers": {}, "node_i": "10902", "native_tokenizers": [], @@ -47,15 +56,18 @@ }, { "name": "Mekmek", + "depth": 1, "iso_1_code": null, "iso_3_code": "mvk", "children": [], + "family": "Yuat", "tokenizers": {}, "node_i": "10903", "native_tokenizers": [], "scripts": [] } ], + "family": "Yuat", "tokenizers": {}, "node_i": "10898", "native_tokenizers": [], diff --git a/data/Yukaghir.json b/data/Yukaghir.json index a5667a4924fe8d083116b7b6da3162cc65b8d4d7..cea4872f46811f334bad09a5d1e88f473b55de5d 100644 --- a/data/Yukaghir.json +++ b/data/Yukaghir.json @@ -1,13 +1,16 @@ { "name": "Yukaghir", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Omok", + "depth": 1, "iso_1_code": null, "iso_3_code": "omk", "children": [], + "family": "Yukaghir", "tokenizers": {}, "node_i": "10905", "native_tokenizers": [], @@ -15,9 +18,11 @@ }, { "name": "Chuvantsy", + "depth": 1, "iso_1_code": null, "iso_3_code": "xcv", "children": [], + "family": "Yukaghir", "tokenizers": {}, "node_i": "10906", "native_tokenizers": [], @@ -25,9 +30,11 @@ }, { "name": "Yukaghir, Northern", + "depth": 1, "iso_1_code": null, "iso_3_code": "ykg", "children": [], + "family": "Yukaghir", "tokenizers": {}, "node_i": "10907", "native_tokenizers": [], @@ -35,15 +42,18 @@ }, { "name": "Yukaghir, Southern", + "depth": 1, "iso_1_code": null, "iso_3_code": "yux", "children": [], + "family": "Yukaghir", "tokenizers": {}, "node_i": "10908", "native_tokenizers": [], "scripts": [] } ], + "family": "Yukaghir", "tokenizers": {}, "node_i": "10904", "native_tokenizers": [], diff --git a/data/Yukian.json b/data/Yukian.json index 1a1eda57e90d3c096bec58dd47adb33ae9aaec59..3ecc35457ed7d506fbc3d89a9bb488134892804d 100644 --- a/data/Yukian.json +++ b/data/Yukian.json @@ -1,13 +1,16 @@ { "name": "Yukian", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Wappo", + "depth": 1, "iso_1_code": null, "iso_3_code": "wao", "children": [], + "family": "Yukian", "tokenizers": {}, "node_i": "10910", "native_tokenizers": [], @@ -15,26 +18,31 @@ }, { "name": "Core Yukian", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Yuki", + "depth": 2, "iso_1_code": null, "iso_3_code": "yuk", "children": [], + "family": "Yukian", "tokenizers": {}, "node_i": "10912", "native_tokenizers": [], "scripts": [] } ], + "family": "Yukian", "tokenizers": {}, "node_i": "10911", "native_tokenizers": [], "scripts": [] } ], + "family": "Yukian", "tokenizers": {}, "node_i": "10909", "native_tokenizers": [], diff --git a/data/Zamucoan.json b/data/Zamucoan.json index a0171f602a791ea3d51f9cb8d1920b505fb52594..67128a56d35de7846908f01756cd99d49e3c927a 100644 --- a/data/Zamucoan.json +++ b/data/Zamucoan.json @@ -1,13 +1,16 @@ { "name": "Zamucoan", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Ayoreo", + "depth": 1, "iso_1_code": null, "iso_3_code": "ayo", "children": [], + "family": "Zamucoan", "tokenizers": {}, "node_i": "10914", "native_tokenizers": [], @@ -17,9 +20,11 @@ }, { "name": "Chamacoco", + "depth": 1, "iso_1_code": null, "iso_3_code": "ceg", "children": [], + "family": "Zamucoan", "tokenizers": {}, "node_i": "10915", "native_tokenizers": [], @@ -28,6 +33,7 @@ ] } ], + "family": "Zamucoan", "tokenizers": {}, "node_i": "10913", "native_tokenizers": [], diff --git a/data/Zaparoan.json b/data/Zaparoan.json index 7d9cfa74bff69b207ad2697052100b5588de55bd..983c05967014b2a52d901df7d97377da6697525d 100644 --- a/data/Zaparoan.json +++ b/data/Zaparoan.json @@ -1,18 +1,22 @@ { "name": "Zaparoan", + "depth": 0, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Iquito-Cahuarano", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Cahuarano", + "depth": 2, "iso_1_code": null, "iso_3_code": "cah", "children": [], + "family": "Zaparoan", "tokenizers": {}, "node_i": "10918", "native_tokenizers": [], @@ -20,15 +24,18 @@ }, { "name": "Iquitu", + "depth": 2, "iso_1_code": null, "iso_3_code": "iqu", "children": [], + "family": "Zaparoan", "tokenizers": {}, "node_i": "10919", "native_tokenizers": [], "scripts": [] } ], + "family": "Zaparoan", "tokenizers": {}, "node_i": "10917", "native_tokenizers": [], @@ -36,14 +43,17 @@ }, { "name": "Z\u00e1paro", + "depth": 1, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Z\u00e1paro", + "depth": 2, "iso_1_code": null, "iso_3_code": "zro", "children": [], + "family": "Zaparoan", "tokenizers": {}, "node_i": "10921", "native_tokenizers": [], @@ -51,14 +61,17 @@ }, { "name": "Arabela-Andoa", + "depth": 2, "iso_1_code": null, "iso_3_code": null, "children": [ { "name": "Andoa", + "depth": 3, "iso_1_code": null, "iso_3_code": "anb", "children": [], + "family": "Zaparoan", "tokenizers": {}, "node_i": "10923", "native_tokenizers": [], @@ -66,9 +79,11 @@ }, { "name": "Arabela", + "depth": 3, "iso_1_code": null, "iso_3_code": "arl", "children": [], + "family": "Zaparoan", "tokenizers": {}, "node_i": "10924", "native_tokenizers": [], @@ -77,18 +92,21 @@ ] } ], + "family": "Zaparoan", "tokenizers": {}, "node_i": "10922", "native_tokenizers": [], "scripts": [] } ], + "family": "Zaparoan", "tokenizers": {}, "node_i": "10920", "native_tokenizers": [], "scripts": [] } ], + "family": "Zaparoan", "tokenizers": {}, "node_i": "10916", "native_tokenizers": [],