မဝ်ဂျူ:languages/data2

နူ ဝိက်ရှေန်နရဳ
အ​ညွှန်း​သို့ ခုန်ကူးရန် ရှာဖွေရန် ခုန်ကူးမည်

Documentation for this module may be created at မဝ်ဂျူ:languages/data2/doc

local u = mw.ustring.char

-- UTF-8 encoded strings for some commonly-used diacritics
local GRAVE     = u(0x0300)
local ACUTE     = u(0x0301)
local CIRC      = u(0x0302)
local TILDE     = u(0x0303)
local MACRON    = u(0x0304)
local BREVE     = u(0x0306)
local DOTABOVE  = u(0x0307)
local DIAER     = u(0x0308)
local CARON     = u(0x030C)
local DGRAVE    = u(0x030F)
local INVBREVE  = u(0x0311)
local DOTBELOW  = u(0x0323)
local RINGBELOW = u(0x0325)
local CEDILLA   = u(0x0327)
local OGONEK    = u(0x0328)

-- Puncuation to be used for standardChars field
local PUNCTUATION = ' \!\#\$\%\&\*\+\,\-\.\/\:\;\<\=\>\?\@\^\_\`\|\~\'\(\)'

local m = {}

m["aa"] = {
	canonicalName = "အဖှာင်",
	otherNames = {"Qafar"},
	scripts = {"Latn"},
	family = "cus",
}

m["ab"] = {
	canonicalName = "အဘ်ခါဇဳရာ",
	otherNames = {"Abkhaz", "Abkhazian", "Abxazo"},
	scripts = {"Cyrl", "Geor", "Latn"},
	family = "cau-abz",
	translit_module = "ab-translit",
	override_translit = true,
	entry_name = {
		from = {GRAVE, ACUTE},
		to   = {}} ,
}

m["ae"] = {
	"အဗါတ်သတေန်",
	29572,
	"ira-cen",
	{"Avst", "Gujr"},
	translit_module = "Avst-translit",
	wikipedia_article = "Avestan",
}

m["af"] = {
	canonicalName = "အေက်ဖရိကာန်",
	scripts = {"Latn", "Arab"},
	family = "gmw",
	ancestors = {"nl"},
	sort_key = {
		from = {"[äáâà]", "[ëéêè]", "[ïíîì]", "[öóôò]", "[üúûù]", "[ÿýŷỳ]", "^-", "'"},
		to   = {"a"	 , "e"	, "i"	, "o"	, "u"  , "y" }} ,
	wikipedia_article = "Afrikaans",
}

m["ak"] = {
	canonicalName = "အကာန်",
	otherNames = {"Akan", "Twi-Fante", "Twi", "Fante", "Fanti", "Asante", "Akuapem"},
	scripts = {"Latn"},
	family = "alv-kwa",
}

m["am"] = {
	canonicalName = "အာန်ဟာရိစ်",
	otherNames = {"Amharic"},
	scripts = {"Ethi"},
	family = "sem-eth",
	translit_module = "Ethi-translit",
	wikipedia_article = "Amharic",
}

m["an"] = {
	canonicalName = "အာဒါဂေန်",
	otherNames = {"Aragonese"},
	scripts = {"Latn"},
	family = "roa",
	ancestors = {"roa-oan"},
}

m["ar"] = {
	canonicalName = "အာရဗဳ",
	otherNames = {"Modern Standard Arabic", "Standard Arabic", "Literary Arabic", "Classical Arabic", "Arabic", "အာရက်လ်"},
	scripts = {"Arab", "Brai"},
	family = "sem-arb",
	translit_module = "ar-translit",
	wikipedia_article = "Arabic",
}

m["as"] = {
	canonicalName = "အိသ်ဇြာံမဳ",
	otherNames ={"Assamese"},
	scripts = {"Beng"},
	family = "inc",
	ancestors = {"inc-mgd"},
	translit_module = "as-translit",
}

m["av"] = {
	canonicalName = "အာဗာ",
	otherNames = {"Avar", "Avaric", "အာဗာရစ်ဇ်"},
	scripts = {"Cyrl"},
	family = "cau-nec",
	ancestors = {"oav"},
	translit_module = "av-translit",
	override_translit = true,
	entry_name = {
		from = {GRAVE, ACUTE},
		to   = {}} ,
	wikipedia_article = "Avestan",
}

m["ay"] = {
	canonicalName = "အိုင်မာရ",
	otherNames = {"Aymara", "Southern Aymara", "Central Aymara"},
	scripts = {"Latn"},
	family = "sai-aym",
}

m["az"] = {
	"အာက်သေတ်ဗါဲဇြေနဳ",
	9292,
	"trk-ogz",
	{"Latn", "Cyrl", "fa-Arab"},
	ancestors = {"trk-oat"},
	dotted_dotless_i = true,
}

m["ba"] = {
	canonicalName = "ဘက်ရှ်ကာ",
	otherNames = {"Bashkir"},
	scripts = {"Cyrl"},
	family = "trk-kip",
	translit_module = "ba-translit",
	override_translit = true,
}

m["be"] = {
	canonicalName = "ဗါလာရုဇ်",
	otherNames = {"Belarusian", "Belorussian", "Belarusan", "Bielorussian", "Byelorussian", "Belarussian", "White Russian"},
	scripts = {"Cyrl"},
	family = "zle",
	ancestors = {"orv"},
	translit_module = "be-translit",
	sort_key = {
		from = {"Ё", "ё"},
		to   = {"Е" , "е"}},
	entry_name = {
		from = {"Ѐ", "ѐ", GRAVE, ACUTE},
		to   = {"Е", "е"}},
}

m["bg"] = {
	canonicalName = "ဗူလ်ဂရဳယာန်",
	otherNames = {"Bulgarian"},
	scripts = {"Cyrl"},
	family = "zls",
	translit_module = "bg-translit",
	entry_name = {
		from = {"Ѐ", "ѐ", "Ѝ", "ѝ", GRAVE, ACUTE},
		to   = {"Е", "е", "И", "и"}},
}

m["bh"] = {
	canonicalName = "ဘဳဟာရဳ",
	otherNames = {"Bihari"},
	scripts = {"Deva"},
	family = "inc",
	ancestors = {"inc-mgd"},
	wikipedia_article = "ဘာသာဘဳဟာရဳ",
}

m["bi"] = {
	canonicalName = "ဘစ်စ်လာမာ",
	otherNames = {"Bislama"},
	scripts = {"Latn"},
	family = "crp",
	ancestors = {"en"},
	wikipedia_article = "Bislama",
}

m["bm"] = {
	canonicalName = "Bambara",
	otherNames = {"Bamanankan"},
	scripts = {"Latn"},
	family = "dmn",
}

m["bn"] = {
	canonicalName = "ဘင်္ဂါလဳ",
	otherNames = {"Bangla", "Bengali"},
	scripts = {"Beng"},
	family = "inc",
	ancestors = {"inc-mgd"},
	translit_module = "bn-translit",
}

m["bo"] = {
	canonicalName = "တဳဗဝ်",
	otherNames = {"Tibetan", "Ü", "Dbus", "Lhasa", "Lhasa Tibetan", "Amdo Tibetan", "Amdo", "Panang", "Khams", "Khams Tibetan", "Khamba", "Tseku", "Dolpo", "Humla", "Limi", "Lhomi", "Shing Saapa", "Mugom", "Mugu", "Nubri", "Walungge", "Gola", "Thudam", "Lowa", "Loke", "Mustang", "Tichurong", "တိဗက်"},
	scripts = {"Tibt"},
	family = "tbq",
	ancestors = {"xct"},
	translit_module = "bo-translit",
	override_translit = true,
	wikipedia_article = "Standard Tibetan",		-- may need verification
}

m["br"] = {
	canonicalName = "ဗရဳတေန်",
	otherNames = {"Breton"},
	scripts = {"Latn"},
	family = "cel-bry",
	ancestors = {"xbm"},
}

m["ca"] = {
	canonicalName = "ကတလာန်",
	otherNames = {"Valencian", "Catalan"},
	scripts = {"Latn"},
	family = "roa",
	ancestors = {"roa-oca"},
	sort_key = {
		from = {"à", "[èé]", "[íï]", "[òó]", "[úü]", "ç", "l·l"},
		to   = {"a", "e"   , "i"   , "o"   , "u"   , "c", "ll" }} ,
}

m["ce"] = {
	canonicalName = "ချက်ခ်ချေင်",
	otherNames = {"Chechen"},
	scripts = {"Cyrl"},
	family = "cau-nkh",
	translit_module = "ce-translit",
	override_translit = true,
	entry_name = {
		from = {MACRON},
		to   = {}},
}

m["ch"] = {
	canonicalName = "ချာမဝ်ရဝ်",
	otherNames = {"Chamorro", "Chamoru"},
	scripts = {"Latn"},
	family = "poz-sus",
}

m["co"] = {
	canonicalName = "ခဝ်သဳကာန်",
	otherNames = {"Corsican", "Corsu"},
	scripts = {"Latn"},
	family = "roa",
}

m["cr"] = {
	canonicalName = "ခရေဝ်",
	scripts = {"Cree", "Cans", "Latn"},
	family = "alg",
	translit_module = "cr-translit",
}

m["cs"] = {
	canonicalName = "ချက်ခ်",
	otherNames = {"Czech"},
	scripts = {"Latn"},
	family = "zlw",
	ancestors = {"zlw-ocs"},
	sort_key = {
		from = {"á", "é", "í", "ó", "[úů]", "ý"},
		to   = {"a", "e", "i", "o", "u"   , "y"}} ,
}

m["cu"] = {
	canonicalName = "ခရေတ်သလာဗဝ်နေတ်တြေံ",
	otherNames = {"Old Church Slavic"},
	scripts = {"Cyrs", "Glag"},
	family = "zls",
	translit_module = "Cyrs-Glag-translit",
	entry_name = {
		from = {u(0x0484)}, -- kamora
		to   = {}},
	sort_key = {
		from = {"оу", "є"},
		to   = {"у" , "е"}} ,
	wikipedia_article = "Old Church Slavonic",
}

m["cv"] = {
	canonicalName = "ချူဗက်ရှ်",
	otherNames ={"Chuvash"},
	scripts = {"Cyrl"},
	family = "trk-ogr",
	translit_module = "cv-translit",
	override_translit = true,
}

m["cy"] = {
	canonicalName = "ဝေလ",
	otherNames ={"Welsh"},
	scripts = {"Latn"},
	family = "cel-bry",
	ancestors = {"wlm"},
	sort_key = {
		from = {"[âáàä]", "[êéèë]", "[îíìï]", "[ôóòö]", "[ûúùü]", "[ŵẃẁẅ]", "[ŷýỳÿ]", "'"},
		to   = {"a"	 , "e"	 , "i"	 , "o"	 , "u"	 , "w"	 , "y"	 }} ,
}

m["da"] = {
	canonicalName = "ဒိန်နေတ်",
	otherNames ={"Danish"},
	scripts = {"Latn"},
	family = "gmq",
	ancestors = {"gmq-oda"},
}

m["de"] = {
	canonicalName = "ဂျာမာန်",
	otherNames = {"High German", "New High German", "Deutsch", "German", "ဂျာမနဳ"},
	scripts = {"Latn", "Latf"},
	family = "gmw",
	ancestors = {"gmh"},
	sort_key = {
		from = {"[äàáâå]", "[ëèéê]", "[ïìíî]", "[öòóô]", "[üùúû]", "ß" },
		to   = {"a"	  , "e"	 , "i"	 , "o"	 , "u"	 , "ss"}} ,
}

m["dv"] = {
	canonicalName = "ဒိဝေဟဳ",
	otherNames = {"Dhivehi", "Divehi", "Mahal", "Mahl", "Maldivian"},
	scripts = {"Thaa"},
	family = "inc",
	ancestors = {"pmh"},	-- or Helu?
	translit_module = "dv-translit",
	override_translit = true,
	wikipedia_article = "ဘာသာမောဝ်ဒိုက်",
}

m["dz"] = {
	canonicalName = "သောင်ခါ",
	otherNames = {"Dzongkha"},
	scripts = {"Tibt"},
	family = "tbq",
	ancestors = {"xct"},
	translit_module = "bo-translit",
	override_translit = true,
	wikipedia_article = "Dzongkha",
}

m["ee"] = {
	canonicalName = "အဳဝါ",
	otherNames = {"Ewe"},
	scripts = {"Latn"},
	family = "alv-von",
}

m["el"] = {
	canonicalName = "ဂရေတ်",
	otherNames = {"Greek", "Modern Greek", "Neo-Hellenic"},
	scripts = {"Grek", "Brai"},
	family = "grk",
	ancestors = {"grc"},
	translit_module = "el-translit",
	override_translit = true,
	sort_key = {  -- Keep this synchronized with grc, cpg, pnt
		from = {"[ᾳάᾴὰᾲᾶᾷἀᾀἄᾄἂᾂἆᾆἁᾁἅᾅἃᾃἇᾇ]", "[έὲἐἔἒἑἕἓ]", "[ῃήῄὴῂῆῇἠᾐἤᾔἢᾒἦᾖἡᾑἥᾕἣᾓἧᾗ]", "[ίὶῖἰἴἲἶἱἵἳἷϊΐῒῗ]", "[όὸὀὄὂὁὅὃ]", "[ύὺῦὐὔὒὖὑὕὓὗϋΰῢῧ]", "[ῳώῴὼῲῶῷὠᾠὤᾤὢᾢὦᾦὡᾡὥᾥὣᾣὧᾧ]", "ῥ", "ς"},
		to   = {"α"						, "ε"		 , "η"						, "ι"				, "ο"		 , "υ"				, "ω"						, "ρ", "σ"}} ,
	standardChars = "ͺ;΄-ώϜϝ" .. PUNCTUATION .. "ἀ-῾"
}

m["en"] = {
	canonicalName = "အင်္ဂလိက်",
	otherNames = {"English", "Modern English", "New English", "Hawaiian Creole English", "Hawai'ian Creole English", "Hawaiian Creole", "Hawai'ian Creole", "Polari", "Yinglish"}, -- all but the first three are names of subsumed dialects which once had codes
	scripts = {"Latn", "Brai", "Shaw", "Dsrt"}, -- entries in Shaw or Dsrt might require prior discussion
	family = "gmw",
	ancestors = {"enm"},
	wikipedia_article = "ဘာသာအင်္ဂလိက်",
	sort_key = {
		from = {"[äàáâåā]", "[ëèéêē]", "[ïìíîī]", "[öòóôō]", "[üùúûū]", "æ" , "œ" , "[çč]", "ñ", "'"},
		to   = {"a"       , "e"      , "i"      , "o"      , "u"      , "ae", "oe", "c"   , "n"}},
	wikimedia_codes = {"en", "simple"},
	standardChars = "A-Za-z0-9" .. PUNCTUATION .. u(0x2800) .. "-" .. u(0x28FF)
}

m["eo"] = {
	canonicalName = "အေက်သပရေန်တဝ်",
	otherNames = {"Esperanto"},
	scripts = {"Latn"},
	family = "art",
	sort_key = {
		from = {"[áà]", "[éè]", "[íì]", "[óò]", "[úù]", "[ĉ]", "[ĝ]", "[ĥ]", "[ĵ]", "[ŝ]", "[ŭ]"},
		to   = {"a"	   , "e"  , "i"  , "o"  , "u", "cĉ", "gĉ", "hĉ", "jĉ", "sĉ", "uĉ"}} ,
	wikipedia_article = "Esperanto",
}

m["es"] = {
	canonicalName = "သပုင်",
	otherNames = {"Spanish", "Castilian", "Amazonian Spanish", "Amazonic Spanish", "Loreto-Ucayali Spanish"},
	scripts = {"Latn", "Brai"},
	family = "roa",
	ancestors = {"osp"},
	sort_key = {
		from = {"á", "é", "í", "ó", "[úü]", "ç", "ñ"},
		to   = {"a", "e", "i", "o", "u"   , "c", "n"}},
	standardChars = "A-VXYZa-vxyz0-9ÁáÉéÍíÓóÚúÑñ¿¡" .. PUNCTUATION
}

m["et"] = {
	canonicalName = "အေက်သတဝ်နဳယာန်",
	otherNames = {"Estonian"},
	scripts = {"Latn"},
	family = "fiu-fin",
}

m["eu"] = {
	canonicalName = "ဗက်ခ်",
	otherNames = {"Basque", "Euskara"},
	scripts = {"Latn"},
	family = "euq",
}

m["fa"] = {
	canonicalName = "ပါရှေန်",
	otherNames = {"ပါရှာ", "ဖာသဳ", "ဖာစဳ", "Persian", "Farsi", "New Persian", "Modern Persian", "Western Persian", "Iranian Persian", "Eastern Persian", "Dari", "Aimaq", "Aimak", "Aymaq", "Eimak"},
	scripts = {"fa-Arab"},
	family = "ira-wes",
	ancestors = {"pal"}, -- "ira-mid"
	entry_name = {
		from = {u(0x064E), u(0x064F), u(0x0650), u(0x0651), u(0x0652)},
		to   = {}} ,
}

m["ff"] = {
	canonicalName = "ဖှောတ်လာ",
	otherNames = {"Fula", "Adamawa Fulfulde", "Bagirmi Fulfulde", "Borgu Fulfulde", "Central-Eastern Niger Fulfulde", "Fulani", "Fulfulde", "Maasina Fulfulde", "Nigerian Fulfulde", "Pular", "Pulaar", "Western Niger Fulfulde"}, -- Maasina, etc are dialects, subsumed into this code
	scripts = {"Latn"},
	family = "alv-sng",
}

m["fi"] = {
	canonicalName = "ဖေန်လာန်",
	otherNames = {"Finnish", "Suomi", "Botnian"},
	scripts = {"Latn"},
	family = "fiu-fin",
	entry_name = {
		from = {"ˣ"},  -- Used to indicate gemination of the next consonant
		to   = {}},
	sort_key = {
		from = {"[áàâã]", "[éèêẽ]", "[íìîĩ]", "[óòôõ]", "[úùûũ]", "[ýỳŷüű]", "[øõő]", "æ" , "œ" , "[čç]", "š", "ž", "ß" , "[':]"},
		to   = {"a"	 , "e"	 , "i"	 , "o"	 , "u"	 ,  "y"	 , "ö"	, "ae", "oe", "c"   , "s", "z", "ss"}} ,
}

m["fj"] = {
	canonicalName = "ဖရဳဂျိ",
	otherNames = {"Fijian"},
	scripts = {"Latn"},
	family = "poz-occ",
}

m["fo"] = {
	canonicalName = "ဖာရဝ်သဳ",
	otherNames = {"Faroese"},
	scripts = {"Latn"},
	family = "gmq",
	ancestors = {"non"},
}

m["fr"] = {
	canonicalName = "ပြင်သေတ်",
	otherNames = {"French", "Modern French"},
	scripts = {"Latn", "Brai"},
	family = "roa-oil",
	ancestors = {"frm"},
	sort_key = {
		from = {"[áàâä]", "[éèêë]", "[íìîï]", "[óòôö]", "[úùûü]", "[ýỳŷÿ]", "ç", "æ" , "œ" , "'"},
		to   = {"a"	 , "e"	 , "i"	 , "o"	 , "u"	 , "y"	 , "c", "ae", "oe"}},
	standardChars = "A-Za-z0-9ÀÂÇÉÈÊËÎÏÔŒÛÙÜàâçéèêëîïôœûùü«»" .. PUNCTUATION
}

m["fy"] = {
	canonicalName = "ဖရေဝ်သဳယာန်လက္ကရဴ",
	otherNames = {"West Frisian", "Western Frisian", "Frisian"},
	scripts = {"Latn"},
	family = "gmw-fri",
	ancestors = {"ofs"},
}

m["ga"] = {
	canonicalName = "အာဲယျာလာန်",
	otherNames = {"Irish", "Irish Gaelic", "အိုင်ရစ်ရှ်"},
	scripts = {"Latn"},
	family = "cel-gae",
	ancestors = {"mga"},
	sort_key = {
		from = {"á", "é", "í", "ó", "ú", "ý", "ḃ" , "ċ" , "ḋ" , "ḟ" , "ġ" , "ṁ" , "ṗ" , "ṡ" , "ṫ" },
		to   = {"a", "e", "i", "o", "u", "y", "bh", "ch", "dh", "fh", "gh", "mh", "ph", "sh", "th"}} ,
}

m["gd"] = {
	canonicalName = "သကတ်ဂဴလိစ်",
	otherNames = {"Scottish Gaelic", "Gàidhlig", "Highland Gaelic", "Scots Gaelic", "Scottish"},
	scripts = {"Latn"},
	family = "cel-gae",
	ancestors = {"mga"},
	sort_key = {
		from = {"[áà]", "[éè]", "[íì]", "[óò]", "[úù]", "[ýỳ]"},
		to   = {"a"   , "e"   , "i"   , "o"   , "u"   , "y"   }} ,
	wikipedia_article = "Scottish Gaelic",
}

m["gl"] = {
	canonicalName = "ဂလဳသဳယာန်",
	otherNames = {"Galician"},
	scripts = {"Latn"},
	family = "roa",
	ancestors = {"roa-opt"},
	sort_key = {
		from = {"á", "é", "í", "ó", "ú"},
		to   = {"a", "e", "i", "o", "u"}} ,
}

m["gn"] = {
	canonicalName = "ဂူအာရာနဳ",
	otherNames = {"Guaraní"},
	scripts = {"Latn"},
	family = "tup-gua",
	wikipedia_article = "ဘာသာဂူအာရာနဳ",
}

m["gu"] = {
	canonicalName = "ဂုဂျာရတဳ",
	otherNames = {"Gujarati"},
	scripts = {"Gujr"},
	family = "inc",
	ancestors = {"inc-ogu"},
	translit_module = "gu-translit",
}

m["gv"] = {
	canonicalName = "မာက်",
	otherNames = {"Manx", "Manx Gaelic"},
	scripts = {"Latn"},
	family = "cel-gae",
	ancestors = {"mga"},
	sort_key = {
		from = {"ç", "-"},
		to   = {"c"}} ,
}

m["ha"] = {
	canonicalName = "ဟဴသာ",
	otherNames = {"Hausa"},
	scripts = {"Latn", "Arab"},
	family = "cdc-wst",
    sort_key = {
		from = {"ɓ",   "ɗ",   "ƙ",  "'y", "ƴ",  "'" },
		to   = {"b~" , "d~"	, "k~", "y~", "y~", ""  }},
    entry_name = {
		from = {"R̃", "r̃", "À", "à", "È", "è", "Ì", "ì", "Ò", "ò", "Ù", "ù", "Â", "â", "Ê", "ê", "Î", "î", "Ô", "ô", "Û", "û", "Ā", "ā", "Ē", "ē", "Ī", "ī", "Ō", "ō", "Ū", "ū", "Á", "á", "É", "é", "Í", "í", "Ó", "ó", "Ú", "ú", "Ā̀", "ā̀", "Ḕ", "ḕ", "Ī̀", "ī̀", "Ṑ", "ṑ", "Ū̀", "ū̀", GRAVE, ACUTE},
		to   = {"R", "r", "A", "a", "E", "e", "I", "i", "O", "o", "U", "u", "A", "a", "E", "e", "I", "i", "O", "o", "U", "u", "A", "a", "E", "e", "I", "i", "O", "o", "U", "u", "A", "a", "E", "e", "I", "i", "O", "o", "U", "u", "A", "a", "E", "e", "I", "i", "O", "o", "U", "u"}},
}

m["he"] = {
	canonicalName = "ဟဳဘရဝ်",
	otherNames = {"Hebrew", "Ivrit"},
	scripts = {"Hebr", "Phnx", "Brai"},
	family = "sem-can",
	translit_module = "he-translit",
	entry_name = {
		from = {"[" .. u(0x0591) .. "-" .. u(0x05BD) .. u(0x05BF) .. "-" .. u(0x05C5) .. u(0x05C7) .. "]"},
		to   = {}} ,
}

m["hi"] = {
	canonicalName = "ဟိန္ဒဳ",
	otherNames = {"ဟိန္ဒဳ", "Hindi", "Braj", "Brij Bhasha", "Braj Bhasha", "Braj Bhāshā", "Braj Bhakha", "Dehaati Zabaan"},
	scripts = {"Deva", "Guru"}, -- Guru for the subsumed variety Braj
	family = "inc",
	ancestors = {"inc-ohi"},
	translit_module = "hi-translit",
	wikipedia_article = "Hindi",
}

m["ho"] = {
	canonicalName = "ဟဳရဳမိုတု",
	otherNames = {"Hiri Motu", "Pidgin Motu", "Police Motu"},
	scripts = {"Latn"},
	family = "crp",
	ancestors = {"meu"},
	wikipedia_article = "Hiri Motu",
}

m["ht"] = {
	"ဟေဲယှေန် ခရေဝ်အဝ်လ်",
	33491,
	"crp",
	Latn,
	ancestors = {"fr"},
}

m["hu"] = {
	canonicalName = "ဟာန်ဂါရေဝ်",
	otherNames = {"Hungarian", "Magyar"},
	scripts = {"Latn", "Hung"},
	family = "urj-ugr",
	ancestors = {"ohu"},
	sort_key = {
		from = {"á", "é", "í", "ó", "ú", "ő", "ű"},
		to   = {"a", "e", "i", "o", "u", "ö", "ü"}} ,
}

m["hy"] = {
	canonicalName = "အာမေနဳယျာ",
	otherNames = {"Armenian", "Modern Armenian", "Eastern Armenian", "Western Armenian", "အမေရိကာန်ဗၟံက်", "အမေရိကာန်ပလိုတ်", "အမေရိကာန်အခေတ်တၟိ"},
	scripts = {"Armn", "Brai"},
	family = "hyx",
	ancestors = {"axm"},
	translit_module = "Armn-translit",
	override_translit = true,
	sort_key = {
		from = {"ու", "և", "եւ"},
		to   = {"ւ", "եվ", "եվ"}},
	entry_name = {
		from = {"՞", "՜", "՛", "՟", "և", "<sup>յ</sup>", "<sup>ի</sup>"},
		to   = {"", "", "", "", "եւ", "յ", "ի"}} ,
}

m["hz"] = {
	canonicalName = "ဟဳရဲရို",
	otherNames = {"Herero"},
	scripts = {"Latn"},
	family = "bnt",
}

m["ia"] = {
	canonicalName = "အေန်တာလိင်ဂဝ်",
	otherNames = {"Interlingua"},
	scripts = {"Latn"},
	family = "art",
	wikipedia_article = "Interlingua",
}

m["id"] = {
	canonicalName = "အိန်ဒဝ်နဳသဳယျာ",
	otherNames = {"Indonesian"},
	scripts = {"Latn"},
	family = "poz-mly",
	ancestors = {"ms"},
}

m["ie"] = {
	canonicalName = "အေန်တာလိင်ဂဝေ",
	otherNames = {"Interlingue", "Occidental"},
	scripts = {"Latn"},
	family = "art",
	wikipedia_article = "Occidental language",
}

m["ig"] = {
	canonicalName = "အစ်ဂဘို",
	otherNames = {"Igbo", "အစ္ဂဘို"},
	scripts = {"Latn"},
	family = "nic-bco",
}

m["ii"] = {
	canonicalName = "သေဲဆိုန်ယဳ",
	otherNames = {"Sichuan Yi", "Nuosu", "Nosu", "Northern Yi", "Liangshan Yi"},
	scripts = {"Yiii"},
	family = "tbq-lol",
	wikipedia_article = "Nuosu language",
	translit_module = "ii-translit",
	override_translit = true,
}

m["ik"] = {
	canonicalName = "အဳနုဗဳယာတ်",
	otherNames = {"Inupiak", "Inupiaq", "Iñupiaq", "Inupiatun"},
	scripts = {"Latn"},
	family = "esx-inu",
	wikipedia_article = "Inupiaq",
}

m["io"] = {
	canonicalName = "ဣဒဝ်",
	otherNames = {"Ido"},
	scripts = {"Latn"},
	family = "art",
}

m["is"] = {
	canonicalName = "အာက်သလာန်",
	otherNames = {"Icelandic", "အာက်သလာန်"},
	scripts = {"Latn"},
	family = "gmq",
	ancestors = {"non"},
}

m["it"] = {
	canonicalName = "အဳတခ်လဳ",
	otherNames = {"Italian"},
	scripts = {"Latn"},
	family = "roa",
	sort_key = {
		from = {"[àáâäå]", "[èéêë]", "[ìíîï]", "[òóôö]", "[ùúûü]"},
		to   = {"a"	  , "e"	 , "i"	 , "o"	 , "u"	 }} ,
}

m["iu"] = {
	canonicalName = "ဣနုက်တိတုတ်",
	otherNames = {"Inuktitut", "Eastern Canadian Inuktitut", "Eastern Canadian Inuit", "Western Canadian Inuktitut", "Western Canadian Inuit", "Western Canadian Inuktun", "Inuinnaq", "Inuinnaqtun", "Inuvialuk", "Inuvialuktun", "Nunavimmiutit", "Nunatsiavummiut", "Aivilimmiut", "Natsilingmiut", "Kivallirmiut", "Siglit", "Siglitun"},
	scripts = {"Cans", "Latn"},
	family = "esx-inu",
	translit_module = "iu-translit",
	override_translit = true,
	wikipedia_article = "Inuktitut",
}

m["ja"] = {
	canonicalName = "ဂျပါန်",
	otherNames = {"Japanese", "Modern Japanese", "Nipponese", "Nihongo"},
	scripts = {"Jpan", "Latn", "Hira", "Brai"},
	family = "jpx",
	ancestors = {"ojp"},
	--[[
	sort_key = {
		from = {"[ぁァア]", "[ぃィイ]", "[ぅゔゥウヴ]", "[ぇェエ]", "[ぉォオ]", "[がゕカガヵ]", "[ぎキギ]", "[ぐクグㇰ]", "[げゖケゲヶ]", "[ごコゴ]", "[ざサザ]", "[じシジㇱ]", "[ずスズㇲ]", "[ぜセゼ]", "[ぞソゾ]", "[だタダ]", "[ぢチヂ]", "[っづッツヅ]", "[でテデ]", "[どトドㇳ]", "ナ", "ニ", "[ヌㇴ]", "ネ", "ノ", "[ばぱハバパㇵ]", "[びぴヒビピㇶ]", "[ぶぷフブプㇷ]", "[べぺヘベペㇸ]", "[ぼぽホボポㇹ]", "マ", "ミ", "[ムㇺ]", "メ", "モ", "[ゃャヤ]", "[ゅュユ]", "[ょョヨ]", "[ラㇻ]", "[リㇼ]", "[ルㇽ]", "[レㇾ]", "[ロㇿ]", "[ゎヮワヷ]", "[ヰヸ]", "[ヱヹ]", "[ヲヺ]", "ン", "[゙゚゛゜ゝゞ・ヽヾ]", "𛀀"},
		to   = {"あ", "い", "う", "え", "お", "か", "き", "く", "け", "こ", "さ", "し", "す", "せ", "そ", "た", "ち", "つ", "て", "と", "な", "に", "ぬ", "ね", "の", "は", "ひ", "ふ", "へ", "ほ", "ま", "み", "む", "め", "も", "や", "ゆ", "よ", "ら", "り", "る", "れ", "ろ", "わ", "ゐ", "ゑ", "を", "ん", "", "え"}},
	]]
}

m["jv"] = {
	canonicalName = "ဂျာဗာ",
	otherNames = {"Javanese"},
	scripts = {"Latn", "Java"},
	family = "poz-sus",
	translit_module = "jv-translit",
	ancestors = {"kaw"},
	link_tr = true,
}

m["ka"] = {
	canonicalName = "ဂျဝ်ဂျဳယျာ",
	otherNames = {"Georgian", "Kartvelian", "Judeo-Georgian", "Kivruli", "Gruzinic"},
	scripts = {"Geor", "Geok", "Hebr"}, -- Hebr is used to write Judeo-Georgian
	family = "ccs-gzn",
	ancestors = {"oge"},
	translit_module = "Geor-translit",
	override_translit = true,
	entry_name = {
		from = {"̂"},
		to   = {""}},
}

m["kg"] = {
	canonicalName = "ကောန်ဂေါ",
	otherNames = {"Kongo", "Kikongo", "Koongo", "Laari", "San Salvador Kongo", "Yombe"},
	scripts = {"Latn"},
	family = "bnt",
}

m["ki"] = {
	canonicalName = "ခဳခူယူ",
	otherNames = {"Kikuyu", "Gikuyu", "Gĩkũyũ"},
	scripts = {"Latn"},
	family = "bnt",
}

m["kj"] = {
	canonicalName = "ကောန်ယာမာ",
	otherNames = {"Kwanyama", "Kuanyama", "Oshikwanyama"},
	scripts = {"Latn"},
	family = "bnt",
	wikipedia_article = "Kwanyama dialect",
}

m["kk"] = {
	canonicalName = "ကဇက်",
	scripts = {"Kazakh", "Cyrl", "Latn", "Arab", "kk-Arab"},
	family = "trk-kip",
	translit_module = "kk-translit",
	override_translit = true,
}

m["kl"] = {
	canonicalName = "ဂရိန်လာန်",
	otherNames = {"Greenlandic", "Kalaallisut"},
	scripts = {"Latn"},
	family = "esx-inu",
}

m["km"] = {
	canonicalName = "ခမေန်",
	otherNames = {"Khmer", "Cambodian"},
	scripts = {"Khmr"},
	family = "mkh",
	ancestors = {"mkh-mkm"},
	translit_module = "km-translit",
}

m["kn"] = {
	canonicalName = "ကာန်နဒါ",
	otherNames = {"Kannada", "ကန္နာဒါ"},
	scripts = {"Knda"},
	family = "dra",
	translit_module = "kn-translit",
	wikipedia_article = "Kannada",
}

m["ko"] = {
	canonicalName = "ကိုဝ်ရဳယျာ",
	otherNames = {"Korean", "Modern Korean"},
	scripts = {"Kore", "Brai"},
	family = "qfa-kor",
	ancestors = {"okm"},
	translit_module = "ko-translit",
}

m["kr"] = {
	canonicalName = "ကနူရဳ",
	otherNames = {"Kanuri", "Kanembu", "Bilma Kanuri", "Central Kanuri", "Manga Kanuri", "Tumari Kanuri"},
	scripts = {"Latn", "Arab"},
	family = "ssa-sah",
	sort_key = {
		from = {"ny", "ǝ", "sh"},
		to   = {"n~", "e~", "s~"}} , -- the sortkey and entry_name are only for standard Kanuri; when dialectal entries get added, someone will have to work out how the dialects should be represented orthographically
	entry_name = {
		from = {"À", "à", "È", "è", "Ǝ̀", "ǝ̀", "Ì", "ì", "Ò", "ò", "Ù", "ù", "Â", "â", "Ê", "ê", "Ǝ̂", "ǝ̂", "Î", "î", "Ô", "ô", "Û", "û", "Ă", "ă", "Ĕ", "ĕ", "Ǝ̆", "ǝ̆", "Ĭ", "ĭ", "Ŏ", "ŏ", "Ŭ", "ŭ", "Á", "á", "É", "é", "Ǝ́", "ǝ́", "Í", "í", "Ó", "ó", "Ú", "ú", GRAVE, ACUTE},
		to   = {"A", "a", "E", "e", "Ǝ", "ǝ", "I", "i", "O", "o", "U", "u", "A", "a", "E", "e", "Ǝ", "ǝ", "I", "i", "O", "o", "U", "u", "A", "a", "E", "e", "Ǝ", "ǝ", "I", "i", "O", "o", "U", "u", "A", "a", "E", "e", "Ǝ", "ǝ", "I", "i", "O", "o", "U", "u"}},
}

m["ks"] = {
	"ကာဒ်ရ်ှမဳယျာ",
	33552,
	"inc-dar",
	{"ks-Arab", "Deva", "Shrd", "Latn"},
	translit_module = "translit-redirect",
	ancestors = {"sa"},
}

m["ku"] = {
	canonicalName = "ကာဒဳ",
	otherNames = {"Kurdish"},
	scripts = {"Latn", "ku-Arab", "Armn", "Cyrl"},
	family = "ira-wes",
	wikipedia_article = "Kurdish languages",
}

-- "kv" IS TREATED AS "koi", "kpv", SEE WT:LT

m["kw"] = {
	canonicalName = "ခမ်နေတ်",
	otherNames = {"Cornish"},
	scripts = {"Latn"},
	family = "cel-bry",
	ancestors = {"cnx"},
}

m["ky"] = {
	canonicalName = "ကာဇေတ်",
	otherNames = {"Kyrgyz", "Kirghiz", "Kirgiz"},
	scripts = {"Cyrl", "Latn", "Arab"},
	family = "trk-kip",
	translit_module = "ky-translit",
	override_translit = true,
}

m["la"] = {
	canonicalName = "လပ်တေန်",
	otherNames = {"Latin"},
	scripts = {"Latn"},
	family = "itc",
	ancestors = {"itc-ola"},
	entry_name = {
		from = {"[ĀĂ]", "[āă]", "[ĒĔ]", "[ēĕë]", "[ĪĬÏ]", "[īĭï]", "[ŌŎ]", "[ōŏ]", "[ŪŬÜ]", "[ūŭü]", "Ȳ", "ȳ", MACRON, BREVE, DIAER},
		to   = {"A", "a", "E", "e", "I", "i", "O", "o", "U", "u", "Y", "y"}},
	wikipedia_article = "Latin",
	standardChars = "A-Za-zÆ挜Ā-ăĒ-ĕĪ-ĭŌ-ŏŪ-ŭȲȳ" .. MACRON .. BREVE .. PUNCTUATION
}

m["lb"] = {
	canonicalName = "လူဇေန်ဘာဂျ်",
	otherNames = {"Luxembourgish"},
	scripts = {"Latn"},
	family = "gmw",
	ancestors = {"gmh"},
	wikipedia_article = "Luxembourgish",
}

m["lg"] = {
	canonicalName = "လုဂန်ဒါ",
	otherNames = {"ဂန်ဒါ", "Luganda", "Ganda", "Oluganda"},
	scripts = {"Latn"},
	family = "bnt",
	entry_name = {
		from = {"á", "Á", "é", "É", "í", "Í", "ó", "Ó", "ú", "Ú", "ń", "Ń", "ḿ", "Ḿ", "â", "Â", "ê", "Ê", "î", "Î", "ô", "Ô", "û", "Û" },
		to   = {"a", "A", "e", "E", "i", "I", "o", "O", "u", "U", "n", "N", "m", "M", "a", "A", "e", "E", "i", "I", "o", "O", "u", "U",}},
	sort_key = {
		from = {"ŋ"},
		to   = {"n"}} ,
	wikipedia_article = "Luganda",
}

m["li"] = {
	canonicalName = "လိမ်ဗူရ်ဂိသ်",
	otherNames = {"Limburgish", "Limburgan", "Limburgian", "Limburgic"},
	scripts = {"Latn"},
	family = "gmw",
	ancestors = {"dum"},
}

m["ln"] = {
	canonicalName = "လေန်ဂါလာ",
	otherNames = {"Lingala", "Ngala"},
	scripts = {"Latn"},
	family = "bnt",
	wikipedia_article = "Lingala",
}

m["lo"] = {
	canonicalName = "သေံလဴ",
	otherNames = {"သေံလဴ", "Lao", "Laotian"},
	scripts = {"Laoo"},
	family = "tai-swe",
	translit_module = "lo-translit",
	sort_key = {
		from = {"ຼ", "ຽ", "ໜ", "ໝ", "([ເແໂໃໄ])([ກ-ຮ])"},
		to   = {"ລ", "ຍ", "ຫນ", "ຫມ", "%2%1"}},
}

m["lt"] = {
	canonicalName = "လေတ်တူယဵုနဳယျာ",
	otherNames = {"Lithuanian", "လေတ်တူယဵုနဳယျာ"},
	scripts = {"Latn"},
	family = "bat",
	ancestors = {"olt"},
	entry_name = {
		from = {"[áãà]", "[ÁÃÀ]", "[éẽè]", "[ÉẼÈ]", "[íĩì]", "[ÍĨÌ]", "[ýỹ]", "[ÝỸ]", "ñ", "[óõò]", "[ÓÕÒ]", "[úũù]", "[ÚŨÙ]", ACUTE, GRAVE, TILDE},
		to   = {"a",       "A",     "e",     "E",     "i",     "I",     "y",   "Y",   "n",   "o",    "O",     "u",      "U"}} ,
}

m["lu"] = {
	canonicalName = "ဠူဘ-ကာတေန်ဂါ",
	scripts = {"Latn"},
	family = "bnt",
}

m["lv"] = {
	canonicalName = "လပ်ဗဳယာ",
	otherNames = {"Latvian", "Lettish", "Lett"},
	scripts = {"Latn"},
	family = "bat",
	entry_name = {
		-- This attempts to convert vowels with tone marks to vowels either with
		-- or without macrons. Specifically, there should be no macrons if the
		-- vowel is part of a diphthong (including resonant diphthongs such
		-- pìrksts -> pirksts not #pīrksts). What we do is first convert the
		-- vowel + tone mark to a vowel + tilde in a decomposed fashion,
		-- then remove the tilde in diphthongs, then convert the remaining
		-- vowel + tilde sequences to macroned vowels, then delete any other
		-- tilde. We leave already-macroned vowels alone: Both e.g. ar and ār
		-- occur before consonants. FIXME: This still might not be sufficient.
		from = {"Ȩ", "ȩ", "[ÂÃÀ]", "[âãà]", "[ÊẼÈ]", "[êẽè]", "[ÎĨÌ]", "[îĩì]", "[ÔÕÒ]", "[ôõò]", "[ÛŨÙ]", "[ûũù]", "[ÑǸ]", "[ñǹ]", "[" .. CIRC .. TILDE ..GRAVE .."]", "([aAeEiIoOuU])" .. TILDE .."?([lrnmuiLRNMUI])" .. TILDE .. "?([^aAeEiIoOuUāĀēĒīĪūŪ])", "([aAeEiIoOuU])" .. TILDE .."?([lrnmuiLRNMUI])" .. TILDE .."?$", "([iI])" .. TILDE .. "?([eE])" .. TILDE .. "?", "A" .. TILDE, "a" .. TILDE, "E" .. TILDE, "e" .. TILDE, "I" .. TILDE, "i" .. TILDE, "U" .. TILDE, "u" .. TILDE, TILDE},
		to   = {"E", "e", "A" .. TILDE, "a" .. TILDE, "E" .. TILDE, "e" .. TILDE, "I" .. TILDE, "i" .. TILDE, "O", "o", "U" .. TILDE, "u" .. TILDE, "N", "n", TILDE, "%1%2%3", "%1%2", "%1%2", "Ā", "ā", "Ē", "ē", "Ī", "ī", "Ū", "ū", ""}},
}

m["mg"] = {
	canonicalName = "မာလဂတ်စဳ",
	otherNames = {"Malagasy", "Betsimisaraka Malagasy", "Betsimisaraka", "Northern Betsimisaraka Malagasy", "Northern Betsimisaraka", "Southern Betsimisaraka Malagasy", "Southern Betsimisaraka", "Bara Malagasy", "Bara", "Masikoro Malagasy", "Masikoro", "Antankarana", "Antankarana Malagasy", "Plateau Malagasy", "Sakalava", "Tandroy Malagasy", "Tandroy", "Tanosy", "Tanosy Malagasy", "Tesaka", "Tsimihety", "Tsimihety Malagasy", "Bushi", "Shibushi", "Kibushi", "Sakalava"},
	scripts = {"Latn"},
	family = "poz-bre",
}

m["mh"] = {
	canonicalName = "မာချဲလဳ",
	otherNames = {"Marshallese"},
	scripts = {"Latn"},
	family = "poz-mic",
	sort_key = {
		from = {"ā" , "ļ" , "m̧" , "ņ" , "n̄"  , "o̧" , "ō"  , "ū" },
		to   = {"a~", "l~", "m~", "n~", "n~~", "o~", "o~~", "u~"}} ,
}

m["mi"] = {
	canonicalName = "မဝ်ရဳ",
	otherNames = {"Maori", "Māori"},
	scripts = {"Latn"},
	family = "poz-pol",
	wikipedia_article = "Māori language",
}

m["mk"] = {
	canonicalName = "မက်သဳဒဝ်နဳယျာ",
	otherNames = {"Macedonian"},
	scripts = {"Cyrl"},
	family = "zls",
	translit_module = "mk-translit",
	entry_name = {
		from = {ACUTE},
		to   = {}},
}

m["ml"] = {
	canonicalName = "မလေဝ်ယျလာမ်",
	otherNames = {"Malayalam"},
	scripts = {"Mlym"},
	family = "dra",
	translit_module = "ml-translit",
	override_translit = true,
	wikipedia_article = "Malayalam",
}

m["mn"] = {
	canonicalName = "မန်ဂဝ်လဳယျာ",
	otherNames = {"မန်ဂဝ်လဳယျာ", "ခန်ခါ မန်ဂဝ်လဳယျာ"},
	scripts = {"Cyrl", "Mong", "Soyo", "Zanb"}, -- entries in Soyo or Zanb might require prior discussion
	family = "xgn",
	ancestors = {"cmg"},
	translit_module = "mn-translit",
	override_translit = true,
}

-- "mo" IS TREATED AS "ro", SEE WT:LT

m["mr"] = {
	canonicalName = "မာရဒဳ",
	otherNames = {"Marathi"},
	scripts = {"Deva", "Modi"},
	family = "inc",
	ancestors = {"omr"},
	translit_module = "hi-translit",
}

m["ms"] = {
	canonicalName = "မလေဝ်",
	otherNames = {"Malay", "Malaysian", "Standard Malay", "Orang Seletar", "Orang Kanaq", "Jakun", "Temuan"},
	scripts = {"Latn", "ms-Arab"},
	family = "poz-mly",
}

m["mt"] = {
	canonicalName = "မာလ်တဳ",
	otherNames = {"Maltese"},
	scripts = {"Latn"},
	family = "sem-arb",
	ancestors = {"sqr"},
}

m["my"] = {
	canonicalName = "ဗၟာ",
	otherNames = {"Burmese", "Myanmar", "ဗၟာ"},
	scripts = {"Mymr"},
	family = "tbq-brm",
	ancestors = {"obr"},
	wikipedia_article = "ဘာသာဗၟာ",
	translit_module = "my-translit",
	override_translit = true,
}

m["na"] = {
	canonicalName = "နောရူ",
	otherNames = {"Nauruan","Nauru"},
	scripts = {"Latn"},
	family = "poz-mic",
}

m["nb"] = {
	canonicalName = "နဝ်ဝေ ဗော်ခ်မဝ်",
	otherNames = {"Norwegian Bokmål", "Bokmål"},
	scripts = {"Latn"},
	family = "gmq",
	ancestors = {"gmq-mno"},
	wikimedia_codes = {"no"},
	wikipedia_article = "Bokmål",
}

m["nd"] = {
	canonicalName = "Northern Ndebele",
	otherNames = {"North Ndebele"},
	scripts = {"Latn"},
	family = "bnt-ngu",
	entry_name = {
		from = {"[āàáâǎ]", "[ēèéêě]", "[īìíîǐ]", "[ōòóôǒ]", "[ūùúûǔ]", "ḿ", "[ǹńň]", MACRON, ACUTE, GRAVE, CIRC, CARON},
		to   = {"a"      , "e"      , "i"      , "o"      , "u"      , "m", "n"    }},
}

m["ne"] = {
	"နဳပဝ်",
	33823,
	"inc-pah",
	{"Deva", "Newa"},
	translit_module = "ne-translit",
}

m["ng"] = {
	canonicalName = "အွန်ဒွန်ဂါ",
	otherNames = {"Ndonga"},
	scripts = {"Latn"},
	family = "bnt",
	wikipedia_article = "Ndonga dialect",
}

m["nl"] = {
	canonicalName = "ဒါတ်",
	otherNames = {"Dutch", "Netherlandic", "Flemish"},
	scripts = {"Latn"},
	family = "gmw",
	ancestors = {"dum"},
	sort_key = {
		from = {"[äáâå]", "[ëéê]", "[ïíî]", "[öóô]", "[üúû]", "ç", "ñ", "^-"},
		to   = {"a"	 , "e"	, "i"	, "o"	, "u"	, "c", "n"}} ,
	standardChars = "A-Za-z0-9" .. PUNCTUATION .. u(0x2800) .. "-" .. u(0x28FF),
}

m["nn"] = {
	canonicalName = "နဝ်ဝေ နဳနိုတ်",
	otherNames = {"Norwegian Nynorsk", "New Norwegian", "Nynorsk"},
	scripts = {"Latn"},
	family = "gmq",
	ancestors = {"gmq-mno"},
	wikipedia_article = "Nynorsk",
}

m["no"] = {
	canonicalName = "နဝ်ဝေ",
	otherNames = {"Norwegian"},
	scripts = {"Latn"},
	family = "gmq",
	ancestors = {"gmq-mno"},
}

m["nr"] = {
	canonicalName = "Southern Ndebele",
	otherNames = {"South Ndebele"},
	scripts = {"Latn"},
	family = "bnt-ngu",
	entry_name = {
		from = {"[āàáâǎ]", "[ēèéêě]", "[īìíîǐ]", "[ōòóôǒ]", "[ūùúûǔ]", "ḿ", "[ǹńň]", MACRON, ACUTE, GRAVE, CIRC, CARON},
		to   = {"a"      , "e"      , "i"      , "o"      , "u"      , "m", "n"    }},
}

m["nv"] = {
	"နာဝါဟဝ်",
	13310,
	"apa",
	Latn,
	sort_key = {
		from = {"[áą]", "[éę]", "[íį]", "[óǫ]", "ń", "^n([djlt])", "ł" , "[ʼ’']", ACUTE},
		to   = {"a"   , "e"   , "i"   , "o"   , "n", "ni%1"	  , "l~"}}, -- the tilde is used to guarantee that ł will always be sorted after all other words with l
}

m["ny"] = {
	canonicalName = "ချဳဝါ",
	otherNames = {"နရန်ဂျာ", "Chichewa", "Chicheŵa", "Chinyanja", "Nyanja", "Chewa", "Cicewa", "Cewa", "Cinyanja"},
	scripts = {"Latn"},
	family = "bnt",
	entry_name = {
		from = {"ŵ", "Ŵ", "á", "Á", "é", "É", "í", "Í", "ó", "Ó", "ú", "Ú", "ń", "Ń", "ḿ", "Ḿ" },
		to   = {"w", "W", "a", "A", "e", "E", "i", "I", "o", "O", "u", "U", "n", "N", "m", "M"}},
	sort_key = {
		from = {"ng'"},
		to   = {"ng"}} ,
	wikipedia_article = "Chewa language",
}

m["oc"] = {
	canonicalName = "အောက်စဳတာန်",
	otherNames = {"Occitan", "Provençal", "Auvergnat", "Auvernhat", "Gascon", "Languedocien", "Lengadocian", "Shuadit", "Chouhadite", "Chouhadit", "Chouadite", "Chouadit", "Shuhadit", "Judeo-Provençal", "Judeo-Provencal", "Judeo-Comtadin"},
	scripts = {"Latn", "Hebr"},
	family = "roa",
	ancestors = {"pro"},
	sort_key = {
		from = {"[àá]", "[èé]", "[íï]", "[òó]", "[úü]", "ç", "([lns])·h"},
		to   = {"a"   , "e"   , "i"   , "o"   , "u"   , "c", "%1h"	  }} ,
}

m["oj"] = {
	canonicalName = "အဵုဂျဳဘွဲ",
	otherNames = {"Ojibwe", "Chippewa", "Ojibway", "Ojibwemowin", "Southwestern Ojibwa"},
	scripts = {"Cans", "Latn"},
	family = "alg",
}

m["om"] = {
	canonicalName = "သြရောမော",
	otherNames = {"Oromo", "Orma", "Borana-Arsi-Guji Oromo", "West Central Oromo"},
	scripts = {"Latn", "Ethi"},
	family = "cus",
}

m["or"] = {
	canonicalName = "အဝ်ရေဝ်ယာ",
	otherNames = {"Oriya", "Odia", "Oorya"},
	scripts = {"Orya"},
	family = "inc",
	ancestors = {"inc-mgd"},
	translit_module = "or-translit",
	wikipedia_article = "Odia language",
}

m["os"] = {
	canonicalName = "အဝ်ဇြဳယာန်",
	otherNames = {"Ossetian", "Ossete", "Ossetic", "Digor", "Iron"},
	scripts = {"Cyrl", "Geor", "Latn"},
	family = "ira",
	ancestors = {"oos"},
	translit_module = "os-translit",
	override_translit = true,
	entry_name = {
		from = {GRAVE, ACUTE},
		to   = {}} ,
}

m["pa"] = {
	canonicalName = "ပါန်ချာပဳ",
	otherNames = {"Punjabi", "Panjabi"},
	scripts = {"Guru", "pa-Arab"},
	family = "inc-opa",
	ancestors = {"psu"},
	translit_module = "translit-redirect",
	entry_name = {
		from = {u(0x064B), u(0x064C), u(0x064D), u(0x064E), u(0x064F), u(0x0650), u(0x0651), u(0x0652), u(0x0658), u(0x08C7), u(0x0768)},
		to   = {"", "", "", "", "", "", "", "", "", "ل", "ن"}} ,
}

m["pi"] = {
	"ပါဠိ",
	"Q36727",
	"pra",
	scripts = {"Latn", "Brah", "Deva", "Beng", "Sinh", "Mymr", "Thai", "Lana", "Laoo", "Khmr"},
	ancestors = {"sa"},
	translit_module = "pi-translit",
	sort_key = {
		from = {"ā", "ī", "ū", "ḍ", "ḷ", "[ṁṃ]", "ṅ", "ñ", "ṇ", "ṭ", "([เโ])([ก-ฮ])", "([ເໂ])([ກ-ຮ])", "ᩔ", "ᩕ", "ᩖ", "ᩘ", "([ᨭ-ᨱ])ᩛ", "([ᨷ-ᨾ])ᩛ", "ᩤ", u(0xFE00), u(0x200D)},
		to   = {"a~", "i~", "u~", "d~", "l~", "m~", "n~", "n~~", "n~~~", "t~", "%2%1", "%2%1", "ᩈ᩠ᩈ", "᩠ᩁ", "᩠ᩃ", "ᨦ᩠", "%1᩠ᨮ", "%1᩠ᨻ", "ᩣ"}} ,
	entry_name = {
		from = {u(0xFE00)},
		to   = {}},
}


m["pl"] = {
	canonicalName = "ပဝ်လာန်",
	otherNames = {"Polish"},
	scripts = {"Latn"},
	family = "zlw",
	ancestors = {"zlw-opl"},
	sort_key = {
		from = {"[Ąą]", "[Ćć]", "[Ęę]", "[Łł]", "[Ńń]", "[Óó]", "[Śś]", "[Żż]", "[Źź]"},
		to   = {
			"a" .. u(0x10FFFF),
			"c" .. u(0x10FFFF),
			"e" .. u(0x10FFFF),
			"l" .. u(0x10FFFF),
			"n" .. u(0x10FFFF),
			"o" .. u(0x10FFFF),
			"s" .. u(0x10FFFF),
			"z" .. u(0x10FFFF),
			"z" .. u(0x10FFFE)}} ,
}

m["ps"] = {
	"ပါသတုန်",
	58680,
	"ira-pat",
	{"ps-Arab"},
	ancestors = {"ira-pat-pro"},
}

m["pt"] = {
	canonicalName = "ပဝ်တူဂြဳ",
	otherNames = {"Portuguese", "Modern Portuguese"},
	scripts = {"Latn", "Brai"},
	family = "roa",
	ancestors = {"roa-opt"},
	sort_key = {
		from = {"[àãáâä]", "[èẽéêë]", "[ìĩíï]", "[òóôõö]", "[üúùũ]", "ç", "ñ"},
		to   = {"a"	  , "e"	  , "i"	 , "o"	  , "u"	 , "c", "n"}} ,
}

m["qu"] = {
	canonicalName = "ခေန်ချူဝါ",
	scripts = {"Latn"},
	family = "qwe",
	wikipedia_article = "ဘာသာခေန်ချူဝါ",
}

m["rm"] = {
	canonicalName = "ရဝ်မာန်",
	otherNames = {"Romansch","Romansh", "Rumantsch", "Romanche"},
	scripts = {"Latn"},
	family = "roa",
	wikipedia_article = "Romansh language",
}

m["ro"] = {
	canonicalName = "ရဝ်မေနဳယျာ",
	otherNames = {"Romanian", "Daco-Romanian", "Roumanian", "Rumanian"},
	scripts = {"Latn", "Cyrl"},
	family = "roa",
	sort_key = {
        from = {"ă" , "â"  , "î" , "ș" , "ț" },
        to   = {"a~", "a~~", "i~", "s~", "t~"}},
}

m["ru"] = {
	canonicalName = "ရုရှာ",
	otherNames = {"Russian"},
	scripts = {"Cyrl", "Brai"},
	family = "zle",
	translit_module = "ru-translit",
	sort_key = {
		from = {"ё"},
		to   = {"е" .. mw.ustring.char(0x10FFFF)}},
	entry_name = {
		from = {"Ѐ", "ѐ", "Ѝ", "ѝ", GRAVE, ACUTE},
		to   = {"Е", "е", "И", "и"}},
	standardChars = "ЁІА-яёі0-9—" .. PUNCTUATION,
}

m["rw"] = {
	canonicalName = "ရဝမ်ဒါ ရမ်ဒဳ",
	otherNames = {"Rwanda-Rundi", "Rwanda", "Kinyarwanda", "Rundi", "Kirundi", "Ha", "Giha", "Hangaza", "Vinza", "Shubi", "Subi"},
	scripts = {"Latn"},
	family = "bnt",
	wikipedia_article = "Rwanda-Rundi",
}

m["sa"] = {
	canonicalName = "သံသကြိုတ်",
	otherNames = {"Sanskrit"},
	scripts = {"Deva", "Beng", "Brah", "Gran", "Gujr", "Guru", "Khar", "Knda", "Mlym", "Mymr", "Orya", "Shrd", "Sinh", "Taml", "Telu", "Thai", "Tibt"},
	family = "inc",
	translit_module = "sa-translit",
	wikipedia_article = "ဘာသာသံသကြိုက်",
}

m["sc"] = {
	canonicalName = "သာဒဳနဳယာန်",
	otherNames = {"Sardinian", "Campidanese", "Campidanese Sardinian", "Logudorese", "Logudorese Sardinian", "Nuorese", "Nuorese Sardinian"},
	scripts = {"Latn"},
	family = "roa",
}

m["sd"] = {
	"သိန္ဓိ",
	33997,
	"inc-snd",
	{"sd-Arab", "Deva", "Sind", "Khoj"},
	entry_name = {
		from = {u(0x0671), u(0x064B), u(0x064C), u(0x064D), u(0x064E), u(0x064F), u(0x0650), u(0x0651), u(0x0652), u(0x0670), u(0x0640)},
		to   = {u(0x0627)}},
	ancestors = {"inc-vra"},
	translit_module = "translit-redirect",
}

m["se"] = {
	canonicalName = "သာမိ သၟဝ်ကျာ",
	otherNames = {"Northern Sami", "North Sami", "Northern Saami", "North Saami"},
	scripts = {"Latn"},
	family = "smi",
	entry_name = {
		from = {"([đflmnŋrsšŧv])'%1"},
		to   = {"%1%1"} },
	wikipedia_article = "Northern Sami",
}

m["sg"] = {
	canonicalName = "သင်ဂဝ်",
	otherNames = {"Sango"},
	scripts = {"Latn"},
	family = "crp",
}

m["sh"] = {
	canonicalName = "သာဗ်ခြဝ်ဨရှဳယာန်",
	otherNames = {"Serbo-Croatian", "BCS", "Croato-Serbian", "Serbocroatian", "Bosnian", "Croatian", "Montenegrin", "Serbian"},
	scripts = {"Latn", "Cyrl"},
	family = "zls",
	entry_name = {
		from = {"[ȀÀȂÁĀÃ]", "[ȁàȃáāã]", "[ȄÈȆÉĒẼ]", "[ȅèȇéēẽ]", "[ȈÌȊÍĪĨ]", "[ȉìȋíīĩ]", "[ȌÒȎÓŌÕ]", "[ȍòȏóōõ]", "[ȐȒŔ]", "[ȑȓŕ]", "[ȔÙȖÚŪŨ]", "[ȕùȗúūũ]", "Ѐ", "ѐ", "[ӢЍ]", "[ӣѝ]", "[Ӯ]", "[ӯ]", GRAVE, ACUTE, DGRAVE, INVBREVE, MACRON, TILDE},
		to   = {"A"	  , "a"	  , "E"	  , "e"	  , "I"	  , "i"	  , "O"	  , "o"	  , "R"	, "r"	, "U"	  , "u"	  , "Е", "е", "И"   , "и", "У", "у"   }},
	wikimedia_codes = {"sh", "bs", "hr", "sr"},
	wikipedia_article = "Serbo-Croatian",
}

m["si"] = {
	canonicalName = "သိၚ်္ဃဵုရ်",
	otherNames = {"Sinhalese", "Singhalese", "Sinhala"},
	scripts = {"Sinh"},
	family = "inc",
	ancestors = {"elu-prk"},
	translit_module = "si-translit",
	override_translit = true,
}

m["sk"] = {
	canonicalName = "သလဝ်ဝေန်နဳယျာ",
	otherNames = {"Slovak"},
	scripts = {"Latn"},
	family = "zlw",
	sort_key = {
		from = {"[áä]", "é", "í", "[óô]", "ú", "ý", "ŕ", "ĺ", "[" .. DIAER .. ACUTE .. CIRC .. "]"},
		to   = {"a"   , "e", "i", "o"   , "u", "y", "r", "l", ""}} ,
}

m["sl"] = {
	canonicalName = "သၠဝ်ဝေနဳ",
	otherNames = {"Slovene", "Slovenian"},
	scripts = {"Latn"},
	family = "zls",
	entry_name = {
		from = {"[ÁÀÂȂȀ]", "[áàâȃȁ]", "[ÉÈÊȆȄỆẸ]", "[éèêȇȅệẹə]", "[ÍÌÎȊȈ]", "[íìîȋȉ]", "[ÓÒÔȎȌỘỌ]", "[óòôȏȍộọ]", "[ŔȒȐ]", "[ŕȓȑ]", "[ÚÙÛȖȔ]", "[úùûȗȕ]", "ł", GRAVE, ACUTE, DGRAVE, INVBREVE, CIRC, DOTBELOW},
		to   = {"A"	  , "a"	  , "E"		, "e"		 , "I"	  , "i"	  , "O"		, "o"		, "R"	, "r"	, "U"	  , "u"	  , "l"}} ,
}

m["sm"] = {
	canonicalName = "သမဝ်အာ",
	otherNames = {"Samoan"},
	scripts = {"Latn"},
	family = "poz-pol",
}

m["sn"] = {
	canonicalName = "ရှိုနာ",
	otherNames = {"Shona"},
	scripts = {"Latn"},
	family = "bnt",
}

m["so"] = {
	canonicalName = "ဆဝ်မာလဳ",
	otherNames = {"Somali"},
	scripts = {"Latn", "Arab", "Osma"},
	family = "cus",
	entry_name = {
		from = {"[ÁÀÂ]", "[áàâ]", "[ÉÈÊ]", "[éèê]", "[ÍÌÎ]", "[íìî]", "[ÓÒÔ]", "[óòô]", "[ÚÙÛ]", "[úùû]", "[ÝỲ]", "[ýỳ]"},
		to   = {"A"	  , "a"	  , "E"	, "e" , "I"	  , "i"	  , "O"	, "o"	, "U"  , "u", "Y", "y"}} ,
}

m["sq"] = {
	canonicalName = "အလ်ဗနဳယာန်",
	otherNames = {"Albanian"},
	scripts = {"Latn", "Elba"},
	family = "sqj",
	sort_key = {
		from = { '[âãä]', '[ÂÃÄ]', '[êẽë]', '[ÊẼË]', 'ĩ', 'Ĩ', 'õ', 'Õ', 'ũ', 'Ũ', 'ỹ', 'Ỹ', 'ç', 'Ç' },
		to   = {     'a',     'A',     'e',     'E', 'i', 'I', 'o', 'O', 'u', 'U', 'y', 'Y', 'c', 'C' } } ,
}

m["ss"] = {
	canonicalName = "ဆွာဇဳ",
	otherNames = {"Swazi", "Swati"},
	scripts = {"Latn"},
	family = "bnt-ngu",
	entry_name = {
		from = {"[āàáâǎ]", "[ēèéêě]", "[īìíîǐ]", "[ōòóôǒ]", "[ūùúûǔ]", "ḿ", "[ǹńň]", MACRON, ACUTE, GRAVE, CIRC, CARON},
		to   = {"a"      , "e"      , "i"      , "o"      , "u"      , "m", "n"    }},
}

m["st"] = {
	canonicalName = "သူထူ",
	otherNames = {"Sotho", "Sesotho", "Southern Sesotho", "Southern Sotho"},
	scripts = {"Latn"},
	family = "bnt",
}

m["su"] = {
	canonicalName = "သာန်ဓနဳ",
	otherNames = {"Sundanese"},
	scripts = {"Latn", "Sund"},
	family = "poz-msa",
	translit_module = "su-translit",
}

m["sv"] = {
	canonicalName = "သွဳဒေန်",
	otherNames = {"Swedish"},
	scripts = {"Latn"},
	family = "gmq",
	ancestors = {"gmq-osw"},
}

m["sw"] = {
	canonicalName = "သဝါတ်ဟဳလဳ",
	otherNames = {"Swahili", "Settler Swahili", "KiSetla", "KiSettla", "Setla", "Settla", "Kitchen Swahili", "Kihindi", "Indian Swahili", "KiShamba", "Kishamba", "Field Swahili", "Kibabu", "Asian Swahili", "Kimanga", "Arab Swahili", "Kitvita", "Army Swahili"},
	scripts = {"Latn", "Arab"},
	family = "bnt",
	sort_key = {
		from = {"ng'", "^-"},
		to   = {"ngz"}} ,
}

m["ta"] = {
	canonicalName = "တမဳလ်",
	otherNames = {"Tamil"},
	scripts = {"Taml"},
	family = "dra",
	ancestors = {"oty"},
	translit_module = "ta-translit",
	override_translit = true,
}

m["te"] = {
	canonicalName = "တေလုဂု",
	otherNames = {"Telugu"},
	scripts = {"Telu"},
	family = "dra",
	translit_module = "te-translit",
	override_translit = true,
}

m["tg"] = {
	canonicalName = "တာဇိက်",
	otherNames = {"Tajik", "Tadjik", "Tadzhik", "Tajiki", "Tajik Persian"},
	scripts = {"Cyrl", "fa-Arab", "Latn"},
	family = "ira-wes",
	ancestors = {"fa"},
	translit_module = "tg-translit",
	override_translit = true,
	sort_key = {
		from = {"Ё", "ё"},
		to   = {"Е" , "е"}} ,
	entry_name = {
		from = {ACUTE},
		to   = {}} ,
}

m["th"] = {
	canonicalName = "သေံ",
	otherNames = {"Thai", "Siamese", "Central Thai", "သေံထိုၚ်"},
	scripts = {"Thai", "Brai"},
	family = "tai-swe",
	translit_module = "th-translit",
	sort_key = {
		from = {"%p", "([เแโใไ])([ก-ฮ])"},
		to   = {"", "%2%1"}},
}

m["ti"] = {
	canonicalName = "တဳဂျရေဝ်ယျာ",
	otherNames = {"Tigrinya"},
	scripts = {"Ethi"},
	family = "sem-eth",
	translit_module = "Ethi-translit",
}

m["tk"] = {
	canonicalName = "တာ့ခ်မေန်",
	otherNames = {"Turkmen"},
	scripts = {"Latn", "Cyrl"},
	family = "trk-ogz",
	entry_name = {
		from = {"ā", "ē", "ī", "ō", "ū", "ȳ", "ȫ", "ǖ", MACRON},
		to   = {"a", "e", "i", "o", "u", "y", "ö", "ü", ""}},
}

m["tl"] = {
	canonicalName = "တာဂါလံက်",
	otherNames = {"Tagalog"},
	scripts = {"Latn", "Tglg"},
	family = "phi",
	entry_name = {
		from = {"[áàâ]", "[éèê]", "[íìî]", "[óòô]", "[úùû]", ACUTE, GRAVE, CIRC},
		to   = {"a"    , "e"    , "i"    , "o"    , "u"    }},
	translit_module = "tl-translit",
	override_translit = true
}

m["tn"] = {
	canonicalName = "တဳဆဝါနာ",
	otherNames = {"Tswana", "Setswana"},
	scripts = {"Latn"},
	family = "bnt",
}

m["to"] = {
	canonicalName = "တွန်ဂါ",
	otherNames = {"Tongan"},
	scripts = {"Latn"},
	family = "poz-pol",
}

m["tr"] = {
	canonicalName = "တူရကဳ",
	otherNames = {"Turkish"},
	scripts = {"Latn"},
	family = "trk-ogz",
	ancestors = {"ota"},
}

m["ts"] = {
	canonicalName = "ဆွန်ဂါ",
	otherNames = {"Tsonga"},
	scripts = {"Latn"},
	family = "bnt",
}

m["tt"] = {
	canonicalName = "တာတာ",
	otherNames = {"Tatar"},
	scripts = {"Cyrl", "Latn", "Arab", "tt-Arab"},
	family = "trk-kip",
	translit_module = "tt-translit",
	override_translit = true,
}

-- "tw" IS TREATED AS "ak", SEE WT:LT

m["ty"] = {
	canonicalName = "တဟဳတဳ",
	otherNames = {"Tahitian"},
	scripts = {"Latn"},
	family = "poz-pol",
}

m["ug"] = {
	canonicalName = "ဥူဃူရ်",
	otherNames = {"Uigur", "Uighur", "Uygur"},
	scripts = {"ug-Arab", "Latn", "Cyrl"},
	family = "trk",
	ancestors = {"chg"},
	translit_module = "ug-translit",
	override_translit = true,
}

m["uk"] = {
	canonicalName = "ယူကရိန်",
	otherNames = {"Ukrainian"},
	scripts = {"Cyrl"},
	family = "zle",
	ancestors = {"orv"},
	translit_module = "uk-translit",
	entry_name = {
		from = {"Ѐ", "ѐ", "Ѝ", "ѝ", GRAVE, ACUTE},
		to   = {"Е", "е", "И", "и"}},
	standardChars = "ЄІЇА-ЩЫЬЮ-щыьюяєії" .. PUNCTUATION
} 
m["ur"] = {
	"အူရဒူ",
	1617,
	"inc-hnd",
	{"ur-Arab"},
	ancestors = {"inc-ohi"},
	entry_name = {
		from = {u(0x0640), u(0x064B), u(0x064C), u(0x064D), u(0x064E), u(0x064F), u(0x0650), u(0x0651), u(0x0652), u(0x0658)},
		to   = {}} ,
}

m["uz"] = {
	canonicalName = "ဥုသဗဝ်",
	otherNames = {"Uzbek", "Northern Uzbek", "Southern Uzbek"},
	scripts = {"Latn", "Cyrl", "fa-Arab"},
	family = "trk",
	ancestors = {"chg"},
	translit_module = "uz-translit"
}

m["ve"] = {
	canonicalName = "ဗန်ဒါ",
	otherNames = {"Venda"},
	scripts = {"Latn"},
	family = "bnt",
}

m["vi"] = {
	canonicalName = "ဗဳယေတ်နာမ်",
	otherNames = {"Vietnamese", "Annamese", "Annamite"},
	scripts = {"Latn", "Hani"},
	family = "mkh-vie",
	ancestors = {"mkh-mvi"},
	sort_key = "vi-sortkey",
}

m["vo"] = {
	canonicalName = "ဝဝ်လပုက်",
	otherNames = {"Volapük"},
	scripts = {"Latn"},
	family = "art",
	wikipedia_article = "Volapük",
}

m["wa"] = {
	canonicalName = "ဝါဠူ",
	otherNames = {"Walloon", "Liégeois", "Namurois", "Wallo-Picard", "Wallo-Lorrain"},
	scripts = {"Latn"},
	family = "roa-oil",
	ancestors = {"fro"},
	sort_key = {
		from = {"[áàâäå]", "[éèêë]", "[íìîï]", "[óòôö]", "[úùûü]", "[ýỳŷÿ]", "ç", "'"},
		to   = {"a"	  , "e"	 , "i"	 , "o"	 , "u"	 , "y"	 , "c"}} ,
}

m["wo"] = {
	canonicalName = "ဝဝ်လံက်",
	otherNames = {"Wolof", "Gambian Wolof"}, -- the subsumed dialect 'wof'
	scripts = {"Latn", "Arab"},
	family = "alv-sng",
}

m["xh"] = {
	canonicalName = "ဇိုစာ",
	otherNames = {"Xhosa"},
	scripts = {"Latn"},
	family = "bnt-ngu",
	entry_name = {
		from = {"[āàáâǎ]", "[ēèéêě]", "[īìíîǐ]", "[ōòóôǒ]", "[ūùúûǔ]", "ḿ", "[ǹńň]", MACRON, ACUTE, GRAVE, CIRC, CARON},
		to   = {"a"      , "e"      , "i"      , "o"      , "u"      , "m", "n"    }},
}

m["yi"] = {
	canonicalName = "ယိဒ်ဒိသ်",
	otherNames = {"Yiddish"},
	scripts = {"Hebr"},
	family = "gmw",
	ancestors = {"gmh"},
	translit_module = "yi-translit",
	wikipedia_article = "Yiddish",
}

m["yo"] = {
	canonicalName = "ရိုရုဗာ",
	otherNames = {"Yoruba"},
	scripts = {"Latn"},
	family = "alv-von",
}

m["za"] = {
	canonicalName = "ဇြုန်",
	otherNames = {"Standard Zhuang"},
	scripts = {"Latn", "Hani"},
	family = "tai",
	wikipedia_article = "Zhuang languages",
}

m["zh"] = {
	canonicalName = "ကြုက်",
	otherNames = {"Chinese"},
	scripts = {"Hani", "Brai"},
	family = "sit",
	ancestors = {"ltc"},
	sort_key = "zh-sortkey",
}

m["zu"] = {
	canonicalName = "ဇြူလူ",
	otherNames = {"Zulu", "isiZulu"},
	scripts = {"Latn"},
	family = "bnt-ngu",
	entry_name = {
                from = {"[āàáâǎ]", "[ēèéêě]", "[īìíîǐ]", "[ōòóôǒ]", "[ūùúûǔ]", "ḿ", "[ǹńň]", MACRON, ACUTE, GRAVE, CIRC, CARON},
                to   = {"a"      , "e"      , "i"      , "o"      , "u"      , "m", "n"    }},
}

return m