lang-word-tokenizers / data /Hmong-Mien.json
guipenedo's picture
guipenedo HF staff
do not propagate to the root
49dc1e7 unverified
{
"name": "Hmong-Mien",
"depth": 0,
"iso_1_code": null,
"iso_3_code": null,
"children": [
{
"name": "Hmongic",
"depth": 1,
"iso_1_code": null,
"iso_3_code": null,
"children": [
{
"name": "Bunu",
"depth": 2,
"iso_1_code": null,
"iso_3_code": null,
"children": [
{
"name": "Bunu, Younuo",
"depth": 3,
"iso_1_code": null,
"iso_3_code": "buh",
"children": [],
"family": "Hmong-Mien",
"tokenizers": {},
"node_i": "3866",
"native_tokenizers": [],
"scripts": []
},
{
"name": "Bunu, Wunai",
"depth": 3,
"iso_1_code": null,
"iso_3_code": "bwn",
"children": [],
"family": "Hmong-Mien",
"tokenizers": {},
"node_i": "3867",
"native_tokenizers": [],
"scripts": []
},
{
"name": "Bunu, Bu-Nao",
"depth": 3,
"iso_1_code": null,
"iso_3_code": "bwx",
"children": [],
"family": "Hmong-Mien",
"tokenizers": {},
"node_i": "3868",
"native_tokenizers": [],
"scripts": []
},
{
"name": "Bunu, Jiongnai",
"depth": 3,
"iso_1_code": null,
"iso_3_code": "pnu",
"children": [],
"family": "Hmong-Mien",
"tokenizers": {},
"node_i": "3869",
"native_tokenizers": [],
"scripts": []
}
],
"family": "Hmong-Mien",
"tokenizers": {},
"node_i": "3865",
"native_tokenizers": [],
"scripts": []
},
{
"name": "Chuanqiandian",
"depth": 2,
"iso_1_code": null,
"iso_3_code": null,
"children": [
{
"name": "Miao, Chuanqiandian Cluster",
"depth": 3,
"iso_1_code": null,
"iso_3_code": "cqd",
"children": [],
"family": "Hmong-Mien",
"tokenizers": {},
"node_i": "3871",
"native_tokenizers": [],
"scripts": []
},
{
"name": "Miao, Southern Mashan",
"depth": 3,
"iso_1_code": null,
"iso_3_code": "hma",
"children": [],
"family": "Hmong-Mien",
"tokenizers": {},
"node_i": "3872",
"native_tokenizers": [],
"scripts": []
},
{
"name": "Miao, Central Huishui",
"depth": 3,
"iso_1_code": null,
"iso_3_code": "hmc",
"children": [],
"family": "Hmong-Mien",
"tokenizers": {},
"node_i": "3873",
"native_tokenizers": [],
"scripts": []
},
{
"name": "Miao, Large Flowery",
"depth": 3,
"iso_1_code": null,
"iso_3_code": "hmd",
"children": [],
"family": "Hmong-Mien",
"tokenizers": {},
"node_i": "3874",
"native_tokenizers": [],
"scripts": []
},
{
"name": "Miao, Eastern Huishui",
"depth": 3,
"iso_1_code": null,
"iso_3_code": "hme",
"children": [],
"family": "Hmong-Mien",
"tokenizers": {},
"node_i": "3875",
"native_tokenizers": [],
"scripts": []
},
{
"name": "Hmong Don",
"depth": 3,
"iso_1_code": null,
"iso_3_code": "hmf",
"children": [],
"family": "Hmong-Mien",
"tokenizers": {},
"node_i": "3876",
"native_tokenizers": [],
"scripts": []
},
{
"name": "Miao, Southwestern Guiyang",
"depth": 3,
"iso_1_code": null,
"iso_3_code": "hmg",
"children": [],
"family": "Hmong-Mien",
"tokenizers": {},
"node_i": "3877",
"native_tokenizers": [],
"scripts": []
},
{
"name": "Miao, Southwestern Huishui",
"depth": 3,
"iso_1_code": null,
"iso_3_code": "hmh",
"children": [],
"family": "Hmong-Mien",
"tokenizers": {},
"node_i": "3878",
"native_tokenizers": [],
"scripts": []
},
{
"name": "Miao, Northern Huishui",
"depth": 3,
"iso_1_code": null,
"iso_3_code": "hmi",
"children": [],
"family": "Hmong-Mien",
"tokenizers": {},
"node_i": "3879",
"native_tokenizers": [],
"scripts": []
},
{
"name": "Ge",
"depth": 3,
"iso_1_code": null,
"iso_3_code": "hmj",
"children": [],
"family": "Hmong-Mien",
"tokenizers": {},
"node_i": "3880",
"native_tokenizers": [],
"scripts": []
},
{
"name": "Miao, Luopohe",
"depth": 3,
"iso_1_code": null,
"iso_3_code": "hml",
"children": [],
"family": "Hmong-Mien",
"tokenizers": {},
"node_i": "3881",
"native_tokenizers": [],
"scripts": []
},
{
"name": "Miao, Central Mashan",
"depth": 3,
"iso_1_code": null,
"iso_3_code": "hmm",
"children": [],
"family": "Hmong-Mien",
"tokenizers": {},
"node_i": "3882",
"native_tokenizers": [],
"scripts": []
},
{
"name": "Miao, Northern Mashan",
"depth": 3,
"iso_1_code": null,
"iso_3_code": "hmp",
"children": [],
"family": "Hmong-Mien",
"tokenizers": {},
"node_i": "3883",
"native_tokenizers": [],
"scripts": []
},
{
"name": "Hmong D\u00f4",
"depth": 3,
"iso_1_code": null,
"iso_3_code": "hmv",
"children": [],
"family": "Hmong-Mien",
"tokenizers": {},
"node_i": "3884",
"native_tokenizers": [],
"scripts": []
},
{
"name": "Miao, Western Mashan",
"depth": 3,
"iso_1_code": null,
"iso_3_code": "hmw",
"children": [],
"family": "Hmong-Mien",
"tokenizers": {},
"node_i": "3885",
"native_tokenizers": [],
"scripts": []
},
{
"name": "Miao, Southern Guiyang",
"depth": 3,
"iso_1_code": null,
"iso_3_code": "hmy",
"children": [],
"family": "Hmong-Mien",
"tokenizers": {},
"node_i": "3886",
"native_tokenizers": [],
"scripts": []
},
{
"name": "Sinicized Miao",
"depth": 3,
"iso_1_code": null,
"iso_3_code": "hmz",
"children": [],
"family": "Hmong-Mien",
"tokenizers": {},
"node_i": "3887",
"native_tokenizers": [],
"scripts": []
},
{
"name": "Hmong Njua",
"depth": 3,
"iso_1_code": null,
"iso_3_code": "hnj",
"children": [],
"family": "Hmong-Mien",
"tokenizers": {},
"node_i": "3888",
"native_tokenizers": [],
"scripts": [
"Latn"
]
},
{
"name": "Miao, Horned",
"depth": 3,
"iso_1_code": null,
"iso_3_code": "hrm",
"children": [],
"family": "Hmong-Mien",
"tokenizers": {},
"node_i": "3889",
"native_tokenizers": [],
"scripts": []
},
{
"name": "Miao, Northern Guiyang",
"depth": 3,
"iso_1_code": null,
"iso_3_code": "huj",
"children": [],
"family": "Hmong-Mien",
"tokenizers": {},
"node_i": "3890",
"native_tokenizers": [],
"scripts": []
},
{
"name": "Hmong Daw",
"depth": 3,
"iso_1_code": null,
"iso_3_code": "mww",
"children": [],
"family": "Hmong-Mien",
"tokenizers": {},
"node_i": "3891",
"native_tokenizers": [],
"scripts": [
"Latn"
]
},
{
"name": "Miao, Small Flowery",
"depth": 3,
"iso_1_code": null,
"iso_3_code": "sfm",
"children": [],
"family": "Hmong-Mien",
"tokenizers": {},
"node_i": "3892",
"native_tokenizers": [],
"scripts": []
}
],
"family": "Hmong-Mien",
"tokenizers": {},
"node_i": "3870",
"native_tokenizers": [],
"scripts": []
},
{
"name": "Pa-hng",
"depth": 2,
"iso_1_code": null,
"iso_3_code": null,
"children": [
{
"name": "Pa-Hng",
"depth": 3,
"iso_1_code": null,
"iso_3_code": "pha",
"children": [],
"family": "Hmong-Mien",
"tokenizers": {},
"node_i": "3894",
"native_tokenizers": [],
"scripts": []
}
],
"family": "Hmong-Mien",
"tokenizers": {},
"node_i": "3893",
"native_tokenizers": [],
"scripts": []
},
{
"name": "Qiandong",
"depth": 2,
"iso_1_code": null,
"iso_3_code": null,
"children": [
{
"name": "Miao, Northern Qiandong",
"depth": 3,
"iso_1_code": null,
"iso_3_code": "hea",
"children": [],
"family": "Hmong-Mien",
"tokenizers": {},
"node_i": "3896",
"native_tokenizers": [],
"scripts": []
},
{
"name": "Miao, Eastern Qiandong",
"depth": 3,
"iso_1_code": null,
"iso_3_code": "hmq",
"children": [],
"family": "Hmong-Mien",
"tokenizers": {},
"node_i": "3897",
"native_tokenizers": [],
"scripts": []
},
{
"name": "Miao, Southern Qiandong",
"depth": 3,
"iso_1_code": null,
"iso_3_code": "hms",
"children": [],
"family": "Hmong-Mien",
"tokenizers": {},
"node_i": "3898",
"native_tokenizers": [],
"scripts": []
},
{
"name": "N\u00e1-Meo",
"depth": 3,
"iso_1_code": null,
"iso_3_code": "neo",
"children": [],
"family": "Hmong-Mien",
"tokenizers": {},
"node_i": "3899",
"native_tokenizers": [],
"scripts": []
}
],
"family": "Hmong-Mien",
"tokenizers": {},
"node_i": "3895",
"native_tokenizers": [],
"scripts": []
},
{
"name": "Xiangxi",
"depth": 2,
"iso_1_code": null,
"iso_3_code": null,
"children": [
{
"name": "Miao, Western Xiangxi",
"depth": 3,
"iso_1_code": null,
"iso_3_code": "mmr",
"children": [],
"family": "Hmong-Mien",
"tokenizers": {},
"node_i": "3901",
"native_tokenizers": [],
"scripts": []
},
{
"name": "Miao, Eastern Xiangxi",
"depth": 3,
"iso_1_code": null,
"iso_3_code": "muq",
"children": [],
"family": "Hmong-Mien",
"tokenizers": {},
"node_i": "3902",
"native_tokenizers": [],
"scripts": []
}
],
"family": "Hmong-Mien",
"tokenizers": {},
"node_i": "3900",
"native_tokenizers": [],
"scripts": []
}
],
"family": "Hmong-Mien",
"tokenizers": {},
"node_i": "3864",
"native_tokenizers": [],
"scripts": []
},
{
"name": "Ho Nte",
"depth": 1,
"iso_1_code": null,
"iso_3_code": null,
"children": [
{
"name": "She",
"depth": 2,
"iso_1_code": null,
"iso_3_code": "shx",
"children": [],
"family": "Hmong-Mien",
"tokenizers": {},
"node_i": "3904",
"native_tokenizers": [],
"scripts": []
}
],
"family": "Hmong-Mien",
"tokenizers": {},
"node_i": "3903",
"native_tokenizers": [],
"scripts": []
},
{
"name": "Mienic",
"depth": 1,
"iso_1_code": null,
"iso_3_code": null,
"children": [
{
"name": "Biao-Jiao",
"depth": 2,
"iso_1_code": null,
"iso_3_code": null,
"children": [
{
"name": "Biao-Jiao Mien",
"depth": 3,
"iso_1_code": null,
"iso_3_code": "bje",
"children": [],
"family": "Hmong-Mien",
"tokenizers": {},
"node_i": "3907",
"native_tokenizers": [],
"scripts": []
}
],
"family": "Hmong-Mien",
"tokenizers": {},
"node_i": "3906",
"native_tokenizers": [],
"scripts": []
},
{
"name": "Mian-Jin",
"depth": 2,
"iso_1_code": null,
"iso_3_code": null,
"children": [
{
"name": "Biao Mon",
"depth": 3,
"iso_1_code": null,
"iso_3_code": "bmt",
"children": [],
"family": "Hmong-Mien",
"tokenizers": {},
"node_i": "3909",
"native_tokenizers": [],
"scripts": []
},
{
"name": "Iu Mien",
"depth": 3,
"iso_1_code": null,
"iso_3_code": "ium",
"children": [],
"family": "Hmong-Mien",
"tokenizers": {},
"node_i": "3910",
"native_tokenizers": [],
"scripts": [
"Latn"
]
},
{
"name": "Kim Mun",
"depth": 3,
"iso_1_code": null,
"iso_3_code": "mji",
"children": [],
"family": "Hmong-Mien",
"tokenizers": {},
"node_i": "3911",
"native_tokenizers": [],
"scripts": []
}
],
"family": "Hmong-Mien",
"tokenizers": {},
"node_i": "3908",
"native_tokenizers": [],
"scripts": []
},
{
"name": "Zaomin",
"depth": 2,
"iso_1_code": null,
"iso_3_code": null,
"children": [
{
"name": "Dzao Min",
"depth": 3,
"iso_1_code": null,
"iso_3_code": "bpn",
"children": [],
"family": "Hmong-Mien",
"tokenizers": {},
"node_i": "3913",
"native_tokenizers": [],
"scripts": []
}
],
"family": "Hmong-Mien",
"tokenizers": {},
"node_i": "3912",
"native_tokenizers": [],
"scripts": []
}
],
"family": "Hmong-Mien",
"tokenizers": {},
"node_i": "3905",
"native_tokenizers": [],
"scripts": []
}
],
"family": "Hmong-Mien",
"tokenizers": {},
"node_i": "3863",
"native_tokenizers": [],
"scripts": []
}