-- Wiki page: ഘടകം:languages/datax
-- (Wiki notice: documentation for this module can be created on the page ഘടകം:languages/datax/വിവരണം)
-- Combining diacritics, written as the UTF-8 byte sequence of each code point.
-- They are referenced by the entry_name / sort_key rules further down the file.
local GRAVE     = "\204\128" -- U+0300 combining grave accent
local ACUTE     = "\204\129" -- U+0301 combining acute accent
local CIRC      = "\204\130" -- U+0302 combining circumflex accent
local TILDE     = "\204\131" -- U+0303 combining tilde
local MACRON    = "\204\132" -- U+0304 combining macron
local BREVE     = "\204\134" -- U+0306 combining breve
local DOTABOVE  = "\204\135" -- U+0307 combining dot above
local DIAER     = "\204\136" -- U+0308 combining diaeresis
local CARON     = "\204\140" -- U+030C combining caron
local DGRAVE    = "\204\143" -- U+030F combining double grave accent
local INVBREVE  = "\204\145" -- U+0311 combining inverted breve
local DOTBELOW  = "\204\163" -- U+0323 combining dot below
local RINGBELOW = "\204\165" -- U+0325 combining ring below
local CEDILLA   = "\204\167" -- U+0327 combining cedilla
-- Table of language records keyed by language code; it is returned at the end
-- of the file. Each record carries `names`, `type`, `scripts` and `family`.
local m = {}

-- Reconstructed proto-languages with codes starting in "a".
m["aav-pro"] = {
    names = {"Proto-Austro-Asiatic"},
    type = "reconstructed",
    scripts = {"unicode"},
    family = "aav",
}
m["afa-pro"] = {
    names = {"Proto-Afro-Asiatic"},
    type = "reconstructed",
    scripts = {"unicode"},
    family = "afa",
}
m["alg-pro"] = {
    names = {"Proto-Algonquian"},
    type = "reconstructed",
    scripts = {"unicode"},
    family = "alg",
}
m["aql-pro"] = {
    names = {"Proto-Algic"},
    type = "reconstructed",
    scripts = {"unicode"},
    family = "aql",
}
-- "art-" codes: every record here has type "appendix-constructed" and
-- family "art".
m["art-blk"] = {
    names = {"Bolak"},
    type = "appendix-constructed",
    scripts = {"Latn"},
    family = "art",
}
m["art-com"] = {
    names = {"Communicationssprache"},
    type = "appendix-constructed",
    scripts = {"Latn"},
    family = "art",
}
m["art-elo"] = {
    names = {"Eloi"},
    type = "appendix-constructed",
    scripts = {"Latn"},
    family = "art",
}
m["art-gld"] = {
    names = {"Goa'uld"},
    type = "appendix-constructed",
    scripts = {"Latn", "Egyp", "Mero"},
    family = "art",
}
m["art-lap"] = {
    names = {"Lapine"},
    type = "appendix-constructed",
    scripts = {"Latn"},
    family = "art",
}
m["art-man"] = {
    names = {"Mandalorian"},
    type = "appendix-constructed",
    scripts = {"Latn"},
    family = "art",
}
m["art-mun"] = {
    names = {"Mundolinco"},
    type = "appendix-constructed",
    scripts = {"Latn"},
    family = "art",
}
m["art-nav"] = {
    names = {"Na'vi"},
    type = "appendix-constructed",
    scripts = {"Latn"},
    family = "art",
}
m["art-nox"] = {
    names = {"Noxilo"},
    type = "appendix-constructed",
    scripts = {"Latn"},
    family = "art",
}
m["art-top"] = {
    names = {"Toki Pona"},
    type = "appendix-constructed",
    scripts = {"Latn"},
    family = "art",
}
m["art-una"] = {
    names = {"Unas"},
    type = "appendix-constructed",
    scripts = {"Latn"},
    family = "art",
}
-- "ath-", "aus-" and "azc-" codes: a mix of reconstructed proto-languages
-- and regular languages.
m["ath-pro"] = {
    names = {"Proto-Athabaskan"},
    type = "reconstructed",
    scripts = {"unicode"},
    family = "ath",
}
m["aus-bun"] = {
    names = {"Bunurong"},
    type = "regular",
    scripts = {"None"},
    family = "aus-pam",
}
m["aus-cww-pro"] = {
    names = {"Proto-Central New South Wales"},
    type = "reconstructed",
    scripts = {"unicode"},
    family = "aus-cww",
}
m["aus-dar"] = {
    names = {"Darkinjung"},
    type = "regular",
    scripts = {"Latn"},
    family = "aus-yuk",
}
m["aus-gab"] = {
    names = {"Gabi"},
    type = "regular",
    scripts = {"Latn"},
    family = "aus-pam",
}
m["aus-pam-pro"] = {
    names = {"Proto-Pama-Nyungan"},
    type = "reconstructed",
    scripts = {"unicode"},
    family = "aus-pam",
}
m["azc-nah-pro"] = {
    names = {"Proto-Nahuan"},
    type = "reconstructed",
    scripts = {"unicode"},
    family = "azc-nah",
}
m["azc-pro"] = {
    names = {"Proto-Uto-Aztecan"},
    type = "reconstructed",
    scripts = {"unicode"},
    family = "azc",
}
-- "bat-", "ber-" and "bnt-" codes.
m["bat-olt"] = {
    names = {"Old Lithuanian"},
    type = "regular",
    scripts = {"None"},
    family = "bat",
    -- Entry-name rules: `from` holds patterns and `to` the replacement at the
    -- same index. The last three `from` items (combining acute, grave and
    -- tilde) have no `to` counterpart; presumably the consumer replaces them
    -- with the empty string -- confirm against the module that applies these.
    entry_name = {
        from = {"[áãà]", "[éẽè]", "[íĩì]", "[ýỹ]", "ñ", "[óõò]", "[úù]", ACUTE, GRAVE, TILDE},
        to = {"a", "e", "i", "y", "n", "o", "u"},
    },
}
m["bat-pro"] = {
    names = {"Proto-Baltic"},
    type = "reconstructed",
    scripts = {"unicode"},
    family = "bat",
}
m["ber-pro"] = {
    names = {"Proto-Berber"},
    type = "reconstructed",
    scripts = {"None"},
    family = "ber",
}
m["bnt-phu"] = {
    names = {"Phuthi"},
    type = "regular",
    scripts = {"None"},
    family = "bnt",
}
m["bnt-pro"] = {
    names = {"Proto-Bantu"},
    type = "reconstructed",
    scripts = {"unicode"},
    family = "bnt",
}
-- "cau-", "cbk-", "ccn-", "ccs-", "cel-" and "cmc-" codes.
m["cau-nec-pro"] = {
    names = {"Proto-Northeast Caucasian"},
    type = "reconstructed",
    scripts = {"unicode"},
    family = "cau-nec",
}
m["cbk-zam"] = {
    names = {"Zamboanga Chavacano"},
    type = "regular",
    scripts = {"None"},
    family = "crp",
}
m["ccn-pro"] = {
    names = {"Proto-North Caucasian"},
    type = "reconstructed",
    scripts = {"unicode"},
    family = "ccn",
}
m["ccs-pro"] = {
    names = {"Proto-Kartvelian"},
    type = "reconstructed",
    scripts = {"unicode"},
    family = "ccs",
}
m["cel-bry-pro"] = {
    names = {"Proto-Brythonic", "Proto-Brittonic"},
    type = "reconstructed",
    scripts = {"unicode"},
    family = "cel-bry",
}
m["cel-gau"] = {
    names = {"Gaulish"},
    type = "regular",
    scripts = {"Latn", "Grek"},
    family = "cel",
}
m["cel-pro"] = {
    names = {"Proto-Celtic"},
    type = "reconstructed",
    scripts = {"unicode"},
    family = "cel",
}
m["cmc-pro"] = {
    names = {"Proto-Chamic"},
    type = "reconstructed",
    scripts = {"unicode"},
    family = "cmc",
}
-- "cpe-" and "crp-" codes: all regular languages filed under family "crp".
m["cpe-mar"] = {
    names = {"Maroon Spirit Language", "Jamaican Maroon Spirit Possession Language"},
    type = "regular",
    scripts = {"Latn"},
    family = "crp",
}
m["cpe-spp"] = {
    names = {"Samoan Plantation Pidgin"},
    type = "regular",
    scripts = {"Latn"},
    family = "crp",
}
m["crp-gep"] = {
    names = {"Greenlandic Eskimo Pidgin"},
    type = "regular",
    scripts = {"Latn"},
    family = "crp",
}
m["crp-rsn"] = {
    names = {"Russenorsk"},
    type = "regular",
    scripts = {"Cyrl", "Latn"},
    family = "crp",
}
m["crp-tpr"] = {
    names = {"Taimyr Pidgin Russian"},
    type = "regular",
    scripts = {"Cyrl"},
    family = "crp",
}
-- "dra-", "dru-", "esx-" and "euq-" codes: all reconstructed proto-languages.
m["dra-pro"] = {
    names = {"Proto-Dravidian"},
    type = "reconstructed",
    scripts = {"unicode"},
    family = "dra",
}
m["dru-pro"] = {
    names = {"Proto-Rukai"},
    type = "reconstructed",
    scripts = {"unicode"},
    family = "map",
}
m["esx-esk-pro"] = {
    names = {"Proto-Eskimo"},
    type = "reconstructed",
    scripts = {"unicode"},
    family = "esx-esk",
}
m["esx-inu-pro"] = {
    names = {"Proto-Inupik"},
    type = "reconstructed",
    scripts = {"unicode"},
    family = "esx-inu",
}
m["esx-pro"] = {
    names = {"Proto-Eskimo-Aleut"},
    type = "reconstructed",
    scripts = {"unicode"},
    family = "esx",
}
m["euq-pro"] = {
    names = {"Proto-Basque"},
    type = "reconstructed",
    scripts = {"unicode"},
    family = "euq",
}
-- "fiu-" and "fra-" codes.
m["fiu-fin-pro"] = {
    names = {"Proto-Finnic"},
    type = "reconstructed",
    scripts = {"Latn"},
    family = "fiu-fin",
    -- Sort-key rules: each `from` pattern maps to the `to` string at the
    -- same index (umlauted vowels to their plain counterparts).
    sort_key = {
        from = {"ä", "ö", "ü"},
        to = {"a", "o", "u"},
    },
}
m["fiu-fpr-pro"] = {
    names = {"Proto-Finno-Permic"},
    type = "reconstructed",
    scripts = {"unicode"},
    family = "fiu-fpr",
}
m["fiu-pro"] = {
    names = {"Proto-Finno-Ugric"},
    type = "reconstructed",
    scripts = {"unicode"},
    family = "fiu",
}
m["fiu-ugr-pro"] = {
    names = {"Proto-Ugric"},
    type = "reconstructed",
    scripts = {"unicode"},
    family = "fiu-ugr",
}
m["fra-aca"] = {
    names = {"Acadian French"},
    type = "regular",
    scripts = {"Latn"},
    family = "roa",
}
-- "gem-", "gme-", "gmq-" and "gmw-" codes.
m["gem-pro"] = {
    names = {"Proto-Germanic", "Common Germanic"},
    type = "reconstructed",
    scripts = {"unicode"},
    family = "gem",
    -- Sort-key rules: `from[i]` maps to `to[i]`. The trailing combining
    -- circumflex and macron have no `to` counterpart; presumably they are
    -- replaced by the empty string -- confirm against the consuming module.
    sort_key = {
        from = {"ā", "[ēê]", "ī", "[ōô]", "ū", "ą", "į", "ǫ", "ų", CIRC, MACRON},
        to = {"a", "e", "i", "o", "u", "an", "in", "on", "un"},
    },
}
m["gme-cgo"] = {
    names = {"Crimean Gothic"},
    type = "regular",
    scripts = {"Latn"},
    family = "gme",
}
m["gmq-gut"] = {
    names = {"Gutnish"},
    type = "regular",
    scripts = {"Latn"},
    family = "gmq",
}
m["gmq-mno"] = {
    names = {"Middle Norwegian"},
    type = "regular",
    scripts = {"Latn"},
    family = "gmq",
}
m["gmq-oda"] = {
    names = {"Old Danish"},
    type = "regular",
    scripts = {"Latn"},
    family = "gmq",
}
m["gmq-osw"] = {
    names = {"Old Swedish"},
    type = "regular",
    scripts = {"Latn"},
    family = "gmq",
}
-- Note: despite the "-pro" suffix, this record is typed "regular" and is the
-- only one in this group that names a transliteration module.
m["gmq-pro"] = {
    names = {"Proto-Norse"},
    type = "regular",
    scripts = {"Runr"},
    family = "gmq",
    translit_module = "Runr-translit",
}
m["gmw-jdt"] = {
    names = {"Jersey Dutch"},
    type = "regular",
    scripts = {"Latn"},
    family = "gmw",
}
-- "grk-", "hmn-", "hmx-" and "hyx-" codes.
m["grk-cal"] = {
    names = {"Calabrian Greek", "Italian Greek", "Bova"},
    type = "regular",
    scripts = {"Latn"},
    family = "grk",
}
m["grk-pro"] = {
    names = {"Proto-Hellenic"},
    type = "reconstructed",
    scripts = {"unicode"},
    family = "grk",
}
m["hmn-pro"] = {
    names = {"Proto-Hmong"},
    type = "reconstructed",
    scripts = {"unicode"},
    family = "hmn",
}
m["hmx-mie-pro"] = {
    names = {"Proto-Mien"},
    type = "reconstructed",
    scripts = {"unicode"},
    family = "hmx-mie",
}
m["hmx-pro"] = {
    names = {"Proto-Hmong-Mien"},
    type = "reconstructed",
    scripts = {"unicode"},
    family = "hmx",
}
m["hyx-pro"] = {
    names = {"Proto-Armenian"},
    type = "reconstructed",
    scripts = {"Latn"},
    family = "hyx",
}
-- "iir-", "inc-", "ine-" and "ira-" codes: all reconstructed proto-languages.
m["iir-pro"] = {
    names = {"Proto-Indo-Iranian"},
    type = "reconstructed",
    scripts = {"unicode"},
    family = "iir",
}
m["inc-pro"] = {
    names = {"Proto-Indo-Aryan"},
    type = "reconstructed",
    scripts = {"unicode"},
    family = "inc",
}
m["ine-ana-pro"] = {
    names = {"Proto-Anatolian"},
    type = "reconstructed",
    scripts = {"unicode"},
    family = "ine-ana",
}
m["ine-bsl-pro"] = {
    names = {"Proto-Balto-Slavic"},
    type = "reconstructed",
    scripts = {"unicode"},
    family = "ine-bsl",
}
m["ine-pro"] = {
    names = {"Proto-Indo-European"},
    type = "reconstructed",
    scripts = {"unicode"},
    family = "ine",
    -- Sort-key rules: `from[i]` maps to `to[i]`. The trailing combining ring
    -- below, acute and macron have no `to` counterpart; presumably they are
    -- replaced by the empty string -- confirm against the consuming module.
    sort_key = {
        from = {"[áā]", "[éēḗ]", "[íī]", "[óōṓ]", "[úū]", "ĺ", "ḿ", "ń", "ŕ", "ǵ", "ḱ", "ʰ", "ʷ", "₁", "₂", "₃", RINGBELOW, ACUTE, MACRON},
        to = {"a", "e", "i", "o", "u", "l", "m", "n", "r", "g'", "k'", "h", "w", "1", "2", "3"},
    },
}
m["ine-toc-pro"] = {
    names = {"Proto-Tocharian"},
    type = "reconstructed",
    scripts = {"unicode"},
    family = "ine-toc",
}
m["ira-pro"] = {
    names = {"Proto-Iranian"},
    type = "reconstructed",
    scripts = {"unicode"},
    family = "ira",
}
-- "iro-", "itc-", "jpx-" and "khi-" codes.
m["iro-min"] = {
    names = {"Mingo"},
    type = "regular",
    scripts = {"Latn"},
    family = "iro",
}
m["itc-pro"] = {
    names = {"Proto-Italic"},
    type = "reconstructed",
    scripts = {"unicode"},
    family = "itc",
}
m["jpx-pro"] = {
    names = {"Proto-Japonic"},
    type = "reconstructed",
    scripts = {"unicode"},
    family = "jpx",
}
-- Several of the names below begin with the click letter "ǃ" (not an ASCII
-- exclamation mark); keep the characters as they are.
m["khi-kun"] = {
    names = {"ǃKung", "ǃOǃKung", "ǃ'OǃKung", "Kung", "Ekoka ǃKung", "Ekoka Kung", "Sekele"},
    type = "regular",
    scripts = {"Latn"},
    family = "khi",
}
-- "map-" and "mkh-" codes.
m["map-ata-pro"] = {
    names = {"Proto-Atayalic"},
    type = "reconstructed",
    scripts = {"unicode"},
    family = "map-ata",
}
m["map-bms"] = {
    names = {"Banyumasan"},
    type = "regular",
    scripts = {"None"},
    family = "qfa-und",
}
m["map-pro"] = {
    names = {"Proto-Austronesian"},
    type = "reconstructed",
    scripts = {"unicode"},
    family = "map",
}
m["mkh-pro"] = {
    names = {"Proto-Mon-Khmer"},
    type = "reconstructed",
    scripts = {"unicode"},
    family = "mkh",
}
m["mkh-vie-pro"] = {
    names = {"Proto-Vietic"},
    type = "reconstructed",
    scripts = {"unicode"},
    family = "mkh-vie",
}
-- "nai-", "nds-" and "phi-" codes.
m["nai-pic"] = {
    names = {"Picuris"},
    type = "regular",
    scripts = {"Latn"},
    family = "qfa-kta",
}
m["nds-de"] = {
    names = {"German Low German"},
    type = "regular",
    scripts = {"Latn"},
    family = "gmw",
}
m["nds-nl"] = {
    names = {"Dutch Low Saxon"},
    type = "regular",
    scripts = {"Latn"},
    family = "gmw",
}
m["phi-pro"] = {
    names = {"Proto-Philippine"},
    type = "reconstructed",
    scripts = {"unicode"},
    family = "phi",
}
-- "plf-" and the first run of "poz-" codes: all reconstructed proto-languages.
m["plf-pro"] = {
    names = {"Proto-Central Malayo-Polynesian"},
    type = "reconstructed",
    scripts = {"unicode"},
    family = "plf",
}
m["poz-btk-pro"] = {
    names = {"Proto-Bungku-Tolaki"},
    type = "reconstructed",
    scripts = {"unicode"},
    family = "poz-btk",
}
m["poz-cet-pro"] = {
    names = {"Proto-Central-Eastern Malayo-Polynesian"},
    type = "reconstructed",
    scripts = {"unicode"},
    family = "poz",
}
m["poz-hce-pro"] = {
    names = {"Proto-Halmahera-Cenderawasih", "Proto-South Halmahera - West New Guinea"},
    type = "reconstructed",
    scripts = {"unicode"},
    family = "poz-hce",
}
m["poz-lgx-pro"] = {
    names = {"Proto-Lampungic"},
    type = "reconstructed",
    scripts = {"unicode"},
    family = "poz-lgx",
}
m["poz-mcm-pro"] = {
    names = {"Proto-Malayo-Chamic"},
    type = "reconstructed",
    scripts = {"unicode"},
    family = "poz-msa",
}
m["poz-mly-pro"] = {
    names = {"Proto-Malayic"},
    type = "reconstructed",
    scripts = {"unicode"},
    family = "poz-mly",
}
m["poz-msa-pro"] = {
    names = {"Proto-Malayo-Sumbawan"},
    type = "reconstructed",
    scripts = {"unicode"},
    family = "poz-msa",
}
m["poz-oce-pro"] = {
    names = {"Proto-Oceanic"},
    type = "reconstructed",
    scripts = {"unicode"},
    family = "poz-oce",
}
-- Remaining "poz-" codes plus "pqe-" and "pqw-": all reconstructed
-- proto-languages.
m["poz-pep-pro"] = {
    names = {"Proto-Eastern Polynesian"},
    type = "reconstructed",
    scripts = {"unicode"},
    family = "poz-pol",
}
m["poz-pnp-pro"] = {
    names = {"Proto-Nuclear Polynesian"},
    type = "reconstructed",
    scripts = {"unicode"},
    family = "poz-pol",
}
m["poz-pol-pro"] = {
    names = {"Proto-Polynesian"},
    type = "reconstructed",
    scripts = {"unicode"},
    family = "poz-pol",
}
m["poz-pro"] = {
    names = {"Proto-Malayo-Polynesian"},
    type = "reconstructed",
    scripts = {"unicode"},
    family = "poz",
}
m["poz-ssw-pro"] = {
    names = {"Proto-South Sulawesi"},
    type = "reconstructed",
    scripts = {"unicode"},
    family = "poz-ssw",
}
m["poz-sus-pro"] = {
    names = {"Proto-Sunda-Sulawesi"},
    type = "reconstructed",
    scripts = {"unicode"},
    family = "poz-sus",
}
m["poz-swa-pro"] = {
    names = {"Proto-North Sarawak"},
    type = "reconstructed",
    scripts = {"unicode"},
    family = "poz-swa",
}
m["pqe-pol-pro"] = {
    names = {"Proto-East-Polynesian"},
    type = "reconstructed",
    scripts = {"unicode"},
    family = "pqe-pol",
}
m["pqe-pro"] = {
    names = {"Proto-Eastern Malayo-Polynesian"},
    type = "reconstructed",
    scripts = {"unicode"},
    family = "pqe",
}
m["pqw-pro"] = {
    names = {"Proto-Western Malayo-Polynesian"},
    type = "reconstructed",
    scripts = {"unicode"},
    family = "pqw",
}
-- "qfa-" codes: all reconstructed proto-languages.
m["qfa-cka-pro"] = {
    names = {"Proto-Chukotko-Kamchatkan"},
    type = "reconstructed",
    scripts = {"unicode"},
    family = "qfa-cka",
}
m["qfa-kor-pro"] = {
    names = {"Proto-Korean"},
    type = "reconstructed",
    scripts = {"None"},
    family = "qfa-kor",
}
m["qfa-yen-pro"] = {
    names = {"Proto-Yeniseian"},
    type = "reconstructed",
    scripts = {"unicode"},
    family = "qfa-yen",
}
-- "roa-" codes: all regular languages written in "Latn", family "roa".
do
    -- Sort-key rules used by Gallo, Guernésiais, Jèrriais and Norman. They
    -- were previously spelled out four times with identical contents; one
    -- shared table keeps the four records from drifting apart.
    -- `from[i]` maps to `to[i]`; the final apostrophe pattern has no `to`
    -- counterpart -- presumably it is replaced by the empty string; confirm
    -- against the module that applies these rules.
    local shared_sort_key = {
        from = {"[áàâä]", "[éèêë]", "[íìîï]", "[óòôö]", "[úùûü]", "[ýỳŷÿ]", "ç", "'"},
        to = {"a", "e", "i", "o", "u", "y", "c"},
    }

    m["roa-gal"] = {
        names = {"Gallo"},
        type = "regular",
        scripts = {"Latn"},
        family = "roa",
        sort_key = shared_sort_key,
    }
    m["roa-grn"] = {
        names = {"Guernésiais", "Dgèrnésiais", "Guernsey French", "Guernsey Norman French"},
        type = "regular",
        scripts = {"Latn"},
        family = "roa",
        sort_key = shared_sort_key,
    }
    m["roa-jer"] = {
        names = {"Jèrriais", "Jersey French", "Jersey Norman", "Jersey Norman French"},
        type = "regular",
        scripts = {"Latn"},
        family = "roa",
        sort_key = shared_sort_key,
    }
    m["roa-leo"] = {
        names = {"Leonese"},
        type = "regular",
        scripts = {"Latn"},
        family = "roa",
    }
    m["roa-nor"] = {
        names = {"Norman"},
        type = "regular",
        scripts = {"Latn"},
        family = "roa",
        sort_key = shared_sort_key,
    }
end
m["roa-oit"] = {
    names = {"Old Italian"},
    type = "regular",
    scripts = {"Latn"},
    family = "roa",
}
m["roa-ptg"] = {
    names = {"Old Portuguese", "Galician-Portuguese", "Galician Portuguese"},
    type = "regular",
    scripts = {"Latn"},
    family = "roa",
}
m["roa-tar"] = {
    names = {"Tarantino"},
    type = "regular",
    scripts = {"Latn"},
    family = "roa",
}
-- "sca-", "sem-", "sio-" and "sit-" codes.

-- The family is called Siouan, but sio-pro (Proto-Siouan) is the proto-language
-- of Western Siouan only; this record is the ancestor of the wider grouping.
m["sca-pro"] = {
    names = {"Proto-Siouan-Catawban"},
    type = "reconstructed",
    scripts = {"unicode"},
    family = "qfa-sca",
}
m["sem-amm"] = {
    names = {"Ammonite"},
    type = "regular",
    scripts = {"Phnx"},
    family = "sem-can",
}
m["sem-pro"] = {
    names = {"Proto-Semitic"},
    type = "reconstructed",
    scripts = {"unicode"},
    family = "sem",
}
m["sem-srb"] = {
    names = {"Old South Arabian"},
    type = "regular",
    scripts = {"Sarb"},
    family = "sem-osa",
}
m["sem-syr"] = {
    names = {"Syrian Arabic"},
    type = "regular",
    scripts = {"Arab"},
    family = "sem-arb",
}
-- Though the whole family is called Siouan, this is the proto-language of
-- Western Siouan only; compare sca-pro.
m["sio-pro"] = {
    names = {"Proto-Siouan"},
    type = "reconstructed",
    scripts = {"unicode"},
    family = "sio",
}
m["sit-pro"] = {
    names = {"Proto-Sino-Tibetan"},
    type = "reconstructed",
    scripts = {"Latn"},
    family = "sit",
}
-- "sla-", "smi-", "sqj-", "syd-", "tai-", "trk-" and "tut-" codes: all
-- reconstructed proto-languages.
m["sla-pro"] = {
    names = {"Proto-Slavic", "Common Slavic"},
    type = "reconstructed",
    scripts = {"unicode"},
    family = "sla",
}
m["smi-pro"] = {
    names = {"Proto-Samic", "Proto-Sami"},
    type = "reconstructed",
    scripts = {"Latn"},
    family = "smi",
}
m["sqj-pro"] = {
    names = {"Proto-Albanian"},
    type = "reconstructed",
    scripts = {"unicode"},
    family = "sqj",
}
m["syd-pro"] = {
    names = {"Proto-Samoyedic"},
    type = "reconstructed",
    scripts = {"None"},
    family = "syd",
}
m["tai-pro"] = {
    names = {"Proto-Tai"},
    type = "reconstructed",
    scripts = {"unicode"},
    family = "tai",
}
m["tai-swe-pro"] = {
    names = {"Proto-Southwestern Tai"},
    type = "reconstructed",
    scripts = {"unicode"},
    family = "tai-swe",
}
m["trk-pro"] = {
    names = {"Proto-Turkic"},
    type = "reconstructed",
    scripts = {"unicode"},
    family = "trk",
}
m["tut-pro"] = {
    names = {"Proto-Altaic"},
    type = "reconstructed",
    scripts = {"unicode"},
    family = "tut",
}
-- "und-", "urj-", "xgn-", "zhx-" and "zlw-" codes, followed by the module's
-- return value.
m["und-ibe"] = {
    names = {"pre-Roman (Iberia)"},
    type = "reconstructed",
    scripts = {"unicode"},
    family = "qfa-sub",
}
m["und-bal"] = {
    names = {"pre-Roman (Balkans)"},
    type = "reconstructed",
    scripts = {"unicode"},
    family = "qfa-sub",
}
m["urj-pro"] = {
    names = {"Proto-Uralic"},
    type = "reconstructed",
    scripts = {"unicode"},
    family = "urj",
}
m["xgn-pro"] = {
    names = {"Proto-Mongolic"},
    type = "reconstructed",
    scripts = {"unicode"},
    family = "xgn",
}
m["zhx-mid"] = {
    names = {"Middle Chinese"},
    type = "regular",
    scripts = {"Hani"},
    family = "qfa-und",
}
m["zlw-opl"] = {
    names = {"Old Polish"},
    type = "regular",
    scripts = {"Latn"},
    family = "zlw",
}
m["zlw-pom"] = {
    names = {"Pomeranian"},
    type = "regular",
    scripts = {"None"},
    family = "qfa-und",
}
m["zlw-slv"] = {
    names = {"Slovincian"},
    type = "regular",
    scripts = {"Latn"},
    family = "zlw",
}

-- Hand the completed table of language records back to whoever loads this module.
return m