မော်ဂျူး:scripts/data: ခြပ်ချော်ꩻမုꩻခါႏ ဗိုန်ပီတဝ်းဒါႏဖိုင်ႏ

Content deleted Content added
အရေꩻတန်တဝ်း ၂ revisions imported: [TEST] importing blkwiktionary via a tool
No edit summary
လိတ်တွယ်ꩻ: နောက်ပြန်ပြင်ခဲ့ပြီး
လိတ်ရဲဉ်ႏ ၁:
--[=[
When adding new scripts to this file, please don't forget to add
style definitions for the script in [[MediaWiki:Common.css]].
]=]
-- Module-level locals. `u` is a shorthand for mw.ustring.char, used further
-- down to build character ranges from code points; `m` is the table that
-- collects every script entry. `u` was declared three times; one declaration
-- is enough.
local u = mw.ustring.char
local m = {}
 
m["Adlm"] = {
canonicalName = "Adlam",
"alphabet",
characters = "؟ـ𞤀-𞥟",
capitalized = true,
လိတ်ရဲဉ်ႏ ၁၆:
 
m["Afak"] = {
canonicalName = "Afaka",
"syllabary",
}
 
m["Aghb"] = {
canonicalName = "Caucasian Albanian",
"alphabet",
characters = "𐔰-𐕯",
}
 
m["Ahom"] = {
canonicalName = "Ahom",
"abugida",
characters = "𑜀-𑝏",
systems = {"abugida"},
}
 
m["Arab"] = {
canonicalName = "Arabic",
"abjad", -- more precisely, impure abjad
varieties = {"Jawi", {"Nastaliq", "Nastaleeq"}},
characters = "؀-ۿݐ-ݿࡰ-ࣿﭐ-﷏ﷰ-﷿ﹰ-﻾𐋠-𐋻𐹠-𐹿𐻀-𐻿𞸀-𞻿",
direction = "rtl",
systems = {"abjad"}, -- more precisely, impure abjad
normalizationFixes = {
from = {"ٳ"},
Line ၄၃ ⟶ ၄၅:
 
m["fa-Arab"] = {
canonicalName = "Arabic",
m["Arab"][2],
otherNames = {"Perso-Arabic"},
characters = m["Arab"].characters,
otherNames = {"Perso-Arabic"},
direction = "rtl",
parent = "Arab",
Line ၅၂ ⟶ ၅၅:
 
m["kk-Arab"] = {
canonicalName = "Arabic",
m["Arab"][2],
characters = m["Arab"].characters,
direction = "rtl",
Line ၆၀ ⟶ ၆၄:
 
m["ks-Arab"] = {
canonicalName = "Arabic",
m["Arab"][2],
characters = m["Arab"].characters,
direction = "rtl",
Line ၆၈ ⟶ ၇၃:
 
m["ku-Arab"] = {
canonicalName = "Arabic",
m["Arab"][2],
characters = m["Arab"].characters,
direction = "rtl",
Line ၇၆ ⟶ ၈၂:
 
m["ms-Arab"] = {
canonicalName = "Arabic",
m["Arab"][2],
characters = m["Arab"].characters,
direction = "rtl",
Line ၈၄ ⟶ ၉၁:
 
m["mzn-Arab"] = {
canonicalName = "Arabic",
m["Arab"][2],
characters = m["Arab"].characters,
direction = "rtl",
Line ၉၂ ⟶ ၁၀၀:
 
m["ota-Arab"] = {
canonicalName = "Arabic",
m["Arab"][2],
characters = m["Arab"].characters,
direction = "rtl",
Line ၁၀၀ ⟶ ၁၀၉:
 
m["pa-Arab"] = {
canonicalName = "Shahmukhi",
m["Arab"][2],
otherNames = {"Arabic"},
characters = m["Arab"].characters,
otherNames = {"Arabic"},
direction = "rtl",
parent = "Arab",
Line ၁၀၉ ⟶ ၁၁၉:
 
m["ps-Arab"] = {
canonicalName = "Arabic",
m["Arab"][2],
characters = m["Arab"].characters,
direction = "rtl",
Line ၁၁၇ ⟶ ၁၂၈:
 
m["sd-Arab"] = {
canonicalName = "Arabic",
m["Arab"][2],
characters = m["Arab"].characters,
direction = "rtl",
Line ၁၂၅ ⟶ ၁၃၇:
 
m["tt-Arab"] = {
canonicalName = "Arabic",
m["Arab"][2],
characters = m["Arab"].characters,
direction = "rtl",
Line ၁၃၃ ⟶ ၁၄၆:
 
m["ug-Arab"] = {
canonicalName = "Arabic",
m["Arab"][2],
characters = m["Arab"].characters,
direction = "rtl",
Line ၁၄၁ ⟶ ၁၅၅:
 
m["ur-Arab"] = {
canonicalName = "Arabic",
m["Arab"][2],
characters = m["Arab"].characters,
direction = "rtl",
Line ၁၄၉ ⟶ ၁၆၄:
 
m["xka-Arab"] = {
canonicalName = "Arabic",
m["Arab"][2],
characters = m["Arab"].characters,
direction = "rtl",
Line ၁၅၉ ⟶ ၁၇၅:
 
m["Armi"] = {
canonicalName = "Imperial Aramaic",
"abjad",
characters = "𐡀-𐡟",
direction = "rtl",
systems = {"abjad"},
}
 
m["Armn"] = {
canonicalName = "Armenian",
"alphabet",
characters = "԰-֏ﬓ-ﬗ",
capitalized = true,
systems = {"alphabet"},
}
 
m["Avst"] = {
canonicalName = "Avestan",
"alphabet",
characters = "𐬀-𐬿",
direction = "rtl",
Line ၁၇၉ ⟶ ၁၉၆:
 
m["pal-Avst"] = {
canonicalName = "Pazend",
m["Avst"][2],
characters = m["Avst"].characters,
direction = "rtl",
Line ၁၈၆ ⟶ ၂၀၄:
 
m["Bali"] = {
canonicalName = "Balinese",
"abugida",
characters = "ᬀ-᭿",
systems = {"abugida"},
}
 
m["Bamu"] = {
canonicalName = "Bamum",
"syllabary",
characters = "ꚠ-꛿𖠀-𖨿",
}
 
m["Bass"] = {
canonicalName = "Bassa",
"alphabet",
aliases = {"Bassa Vah", "Vah"},
characters = "𖫐-𖫿",
Line ၂၀၃ ⟶ ၂၂၃:
 
m["Batk"] = {
canonicalName = "Batak",
"abugida",
characters = "ᯀ-᯿",
systems = {"abugida"},
}
 
m["Beng"] = {
canonicalName = "Bengali",
"abugida",
characters = "॒॑।॥ঀ-৯৲-৿᳕᳖᳘᳐᳒᳡ᳪ᳭ᳲᳵ-᳷꣱",
systems = {"abugida"},
normalizationFixes = {
from = {"অা", "ঋৃ", "ঌৢ"},
Line ၂၁၉ ⟶ ၂၃၉:
 
m["as-Beng"] = {
canonicalName = "Assamese",
m["Beng"][2],
otherNames = {"Bengali-Assamese", "Eastern Nagari"},
characters = "॒॑।॥ঀ-য঱-৿᳕᳖᳘᳐᳒᳡ᳪ᳭ᳲᳵ-᳷꣱",
systems = {"abugida"},
normalizationFixes = m["Beng"].normalizationFixes,
}
 
m["Bhks"] = {
canonicalName = "Bhaiksuki",
"abugida",
characters = "𑰀-𑱯",
systems = {"abugida"},
}
 
m["Blis"] = {
canonicalName = "Blissymbols",
"logography",
aliases = {"Blissymbolics"},
systems = {"logography"},
-- Not in Unicode
}
 
m["Bopo"] = {
canonicalName = "Zhuyin",
"semisyllabary",
aliases = {"Zhuyin Fuhao", "Bopomofo"},
characters = "ˇˉˊˋ˙˪˫、-〃〈-】〓-〟〪-〭〰〷・㄀-ㄯ﹅﹆。-・",
Line ၂၄၆ ⟶ ၂၆၇:
 
m["Brah"] = {
canonicalName = "Brahmi",
"abugida",
characters = "𑀀-𑁿",
systems = {"abugida"},
normalizationFixes = {
from = {"𑀅𑀸", "𑀋𑀾", "𑀏𑁂"},
Line ၂၅၆ ⟶ ၂၇၇:
 
m["Brai"] = {
canonicalName = "Braille",
"alphabet",
characters = "⠀-⣿",
}
 
m["Bugi"] = {
canonicalName = "Buginese",
"abugida",
aliases = {"Lontara"},
characters = "ᨀ-᨟ꧏ",
systems = {"abugida"},
}
 
m["Buhd"] = {
canonicalName = "Buhid",
"abugida",
characters = "᜵᜶ᝀ-᝟ꧏ",
systems = {"abugida"},
}
 
m["Cakm"] = {
canonicalName = "Chakma",
"abugida",
characters = "০-৯၀-၉𑄀-𑅏",
systems = {"abugida"},
}
 
m["Cans"] = {
canonicalName = "Canadian syllabics",
"abugida",
characters = "᐀-ᙿᢰ-᣿𑪰-𑪿",
systems = {"abugida"},
}
 
m["Cari"] = {
canonicalName = "Carian",
"alphabet",
characters = "𐊠-𐋟",
systems = {"alphabet"},
}
 
m["Cham"] = {
canonicalName = "Cham",
"abugida",
characters = "ꨀ-꩟",
systems = {"abugida"},
}
 
m["Cher"] = {
canonicalName = "Cherokee",
"syllabary",
characters = "Ꭰ-᏿ꭰ-ꮿ",
systems = {"syllabary"},
}
 
m["Chrs"] = {
canonicalName = "Chorasmian",
"abjad",
characters = "𐾰-𐿟",
direction = "rtl",
systems = {"abjad"},
}
 
m["Copt"] = {
canonicalName = "Coptic",
"alphabet",
characters = "Ϣ-ϯⲀ-⳿𐋠-𐋻", -- this is mostly "Coptic", not unified "Greek and Coptic"
capitalized = true,
systems = {"alphabet"},
}
 
m["Cpmn"] = {
canonicalName = "Cypro-Minoan",
"syllabary",
aliases = {"Cypro Minoan"},
characters = "𐄀𐄁𒾐-𒿿",
systems = {"syllabary"},
}
 
m["Cprt"] = {
canonicalName = "Cypriot",
"syllabary",
characters = "𐄀-𐄂𐄇-𐄳𐄷-𐄿𐠀-𐠿",
direction = "rtl",
systems = {"syllabary"},
}
 
m["Cyrl"] = {
canonicalName = "Cyrillic",
"alphabet",
characters = "Ѐ-ԯᲀ-᲏ᴫᵸ᷸ⷠ-ⷿ⹃Ꙁ-ꚟ︮︯𞀰-𞂏",
capitalized = true,
systems = {"alphabet"},
}
 
m["Cyrs"] = {
canonicalName = "Old Cyrillic",
m["Cyrl"][2],
aliases = {"Early Cyrillic"},
characters = m["Cyrl"].characters,
capitalized = m["Cyrl"].capitalized,
wikipedia_article = "Early Cyrillic alphabet",
systems = {"alphabet"},
}
 
m["Deva"] = {
canonicalName = "Devanagari",
"abugida",
characters = "ऀ-ॿ꣠-ꣿ𑬀-𑬉",
systems = {"abugida"},
normalizationFixes = {
from = {"ॆॆ", "ेे", "ाॅ", "ाॆ", "ाꣿ", "ॊॆ", "ाे", "ाै", "ोे", "ाऺ", "ॖॖ", "अॅ", "अॆ", "अा", "एॅ", "एॆ", "एे", "एꣿ", "ऎॆ", "अॉ", "आॅ", "अॊ", "आॆ", "अो", "आे", "अौ", "आै", "ओे", "अऺ", "अऻ", "आऺ", "अाꣿ", "आꣿ", "ऒॆ", "अॖ", "अॗ", "ॶॖ", "्‍?ा"},
Line ၃၅၈ ⟶ ၃၈၀:
 
m["Diak"] = {
canonicalName = "Dhives Akuru",
"abugida",
aliases = {"Dives Akuru"},
characters = "𑤀-𑤆𑤉𑤌-𑤓𑤕𑤖𑤘-𑤵𑤷𑤸𑤻-𑥆𑥐-𑥙",
systems = {"abugida"},
}
 
m["Dogr"] = {
canonicalName = "Dogra",
"abugida",
characters = "𑠀-𑠻",
systems = {"abugida"},
}
 
m["Dsrt"] = {
canonicalName = "Deseret",
"alphabet",
characters = "𐐀-𐑏",
capitalized = true,
systems = {"alphabet"},
}
 
m["Dupl"] = {
canonicalName = "Duployan",
"alphabet",
characters = "𛰀-𛱪𛱰-𛱼𛲀-𛲈𛲐-𛲙𛲜-𛲟",
}
 
m["Egyd"] = {
canonicalName = "Demotic",
systems = {"abjad", "logography"},
}
 
m["Egyh"] = {
canonicalName = "Hieratic",
systems = { "abjad", "logography"},
}
 
-- Script entry "Egyp" (Egyptian hieroglyphic).
-- `varieties` appeared twice with the same value; it is listed once here.
m["Egyp"] = {
	canonicalName = "Egyptian hieroglyphic",
	"abjad, logography",
	varieties = {"Hieratic"},
	characters = "𓀀-𓑕",
	wikipedia_article = "Egyptian hieroglyphs",
	systems = {"abjad", "logography"},
	-- Parallel lists: from[i] is paired with to[i].
	normalizationFixes = {
		from = {"𓈗", "𓃁", "𓆖"},
		to = {"𓈖𓐰𓈖𓐰𓈖", "𓃀𓐶𓂝", "𓆓𓐳𓐷𓏏𓐰𓇿𓐸"}
	},
}
 
-- Script entry "Elba" (Elbasan).
-- The `systems` field had ended up after the closing brace, which is a syntax
-- error at file level; it belongs inside the entry.
m["Elba"] = {
	canonicalName = "Elbasan",
	"alphabet",
	characters = "𐔀-𐔧",
	systems = {"alphabet"},
}
 
m["Elym"] = {
"Elymaic",
"abjad",
characters = "𐿠-𐿶",
direction = "rtl",
}
 
m["Ethi"] = {
canonicalName = "Ethiopic",
"abugida",
aliases = {"Ge'ez"},
characters = "ሀ-ቈቊ-ቍቐ-ቖቘቚ-ቝበ-ኈኊ-ኍነ-ኰኲ-ኵኸ-ኾዀዂ-ዅወ-ዖዘ-ጐጒ-ጕጘ-ፚ፝-፼ᎀ-᎙ⶀ-ⶖⶠ-ⶦⶨ-ⶮⶰ-ⶶⶸ-ⶾⷀ-ⷆⷈ-ⷎⷐ-ⷖⷘ-ⷞꬁ-ꬆꬉ-ꬎꬑ-ꬖꬠ-ꬦꬨ-ꬮ𞟠-𞟦𞟨-𞟫𞟭𞟮𞟰-𞟾",
systems = {"abugida"},
}
 
-- Script entry "Geok" (Khutsuri).
-- `varieties` appeared twice with the same value; it is listed once here.
m["Geok"] = {
	canonicalName = "Khutsuri",
	"alphabet",
	varieties = {"Nuskhuri", "Asomtavruli"},
	characters = "Ⴀ-ჅჇჍ჻ⴀ-ⴥⴧⴭ", -- Ⴀ-Ⴭ is Asomtavruli, ⴀ-ⴭ is Nuskhuri
	capitalized = true,
	systems = {"alphabet"},
}
 
-- Script entry "Geor" (Georgian).
-- `varieties` appeared twice with the same value; it is listed once here.
m["Geor"] = {
	canonicalName = "Georgian",
	"alphabet",
	varieties = {"Mkhedruli", "Mtavruli"},
	characters = "ა-ჿᲐ-ᲺᲽ-Ჿ", -- ა-ჿ is lowercase Mkhedruli; Ა-Ჿ is uppercase Mkhedruli (Mtavruli)
	capitalized = true,
	systems = {"alphabet"},
}
 
m["Glag"] = {
canonicalName = "Glagolitic",
"alphabet",
characters = "Ⰰ-ⱟ𞀀-𞀆𞀈-𞀘𞀛-𞀡𞀣𞀤𞀦-𞀪",
capitalized = true,
systems = {"alphabet"},
}
 
m["Gong"] = {
canonicalName = "Gunjala Gondi",
"abugida",
characters = "𑵠-𑵥𑵧𑵨𑵪-𑶎𑶐𑶑𑶓-𑶘𑶠-𑶩",
systems = {"abugida"},
}
 
m["Gonm"] = {
canonicalName = "Masaram Gondi",
"abugida",
characters = "𑴀-𑴆𑴈𑴉𑴋-𑴶𑴺𑴼𑴽𑴿-𑵇𑵐-𑵙",
systems = {"abugida"},
}
 
m["Goth"] = {
canonicalName = "Gothic",
"alphabet",
characters = "𐌰-𐍊",
systems = {"alphabet"},
}
 
m["Gran"] = {
canonicalName = "Grantha",
"abugida",
characters = "𑌀-𑌃𑌅-𑌌𑌏-𑌐𑌓-𑌨𑌪-𑌰𑌲𑌳𑌵-𑌹𑌼-𑍄𑍇𑍈𑍋-𑍍𑍐𑍗𑍝-𑍣𑍦-𑍬𑍰-𑍴",
systems = {"abugida"},
}
 
m["Grek"] = {
canonicalName = "Greek",
"alphabet",
characters = "Ͱ-ͷͺ-Ϳ΄-ΊΌΎ-ΡΣ-ϡϰ-Ͽᴦ-ᴪᵝ-ᵡᵦ-ᵪᶿΩ℩ꭥ𐅀-𐆎𐆠𝈀-𝉅",
capitalized = true,
systems = {"alphabet"},
}
 
-- Polytonic Greek: the Greek entry's characters extended with the range ἀ-῾.
-- The key read "polytonicPolyt", two identifiers ("polytonic" and "Polyt")
-- fused together; the earlier one is kept.
-- NOTE(review): confirm which code the consumers of this table look up.
-- NOTE(review): m["Grek"] as written in this file has a single positional
-- entry, so m["Grek"][2] evaluates to nil here - confirm whether [1] was meant.
m["polytonic"] = {
	canonicalName = "Greek",
	m["Grek"][2],
	characters = "ἀ-῾" .. m["Grek"].characters,
	capitalized = m["Grek"].capitalized,
	parent = "Grek",
	systems = {"alphabet"},
}
 
m["Gujr"] = {
canonicalName = "Gujarati",
"abugida",
characters = "ઁ-ઃઅ-ઍએ-ઑઓ-નપ-રલળવ-હ઼-ૅે-ૉો-્ૐૠ-ૣ૦-૱ૺ-૿",
systems = {"abugida"},
normalizationFixes = {
from = {"ઓ", "અાૈ", "અા", "અૅ", "અે", "અૈ", "અૉ", "અો", "અૌ", "આૅ", "આૈ", "ૅા"},
Line ၄၉၀ ⟶ ၅၂၀:
 
m["Guru"] = {
canonicalName = "Gurmukhi",
"abugida",
characters = "ਁ-ਃਅ-ਊਏਐਓ-ਨਪ-ਰਲਲ਼ਵਸ਼ਸਹ਼ਾ-ੂੇੈੋ-੍ੑਖ਼-ੜਫ਼੦-੶",
systems = {"abugida"},
normalizationFixes = {
from = {"ਅਾ", "ਅੈ", "ਅੌ", "ੲਿ", "ੲੀ", "ੲੇ", "ੳੁ", "ੳੂ", "ੳੋ"},
Line ၅၀၀ ⟶ ၅၃၀:
 
m["Hang"] = {
canonicalName = "Hangul",
"syllabary",
aliases = {"Hangeul"},
characters = (
Line ၅၁၀ ⟶ ၅၄၁:
"ᅠ-ᅵ" -- Halfwidth
),
systems = {"syllabary"},
}
 
m["Hani"] = {
canonicalName = "Han",
"logography",
varieties = {"Hanzi", "Kanji", "Hanja", "Chu Nom"},
characters = (
"一-鿿" ..
"㐀-䶿" .. -- ExtA
"𠀀-𮯯𪛟" .. -- SIP ExtB
"𰀀𪜀-𲎯𮹟" .. -- ExtGExtC-HF & I
"𰀀-𲎯" .. -- ExtG-H
"﨎﨏﨑﨓﨔﨟﨡﨣﨤﨧﨨﨩" ..
"-⻿" .. -- RadicalsKangxi SupplementRadicals
" -⻿" .. -- CJK Symbols andRadicals PunctuationSupplement
"𖿢𖿣𖿰𖿱 -〿" .. -- IdeographicCJK Symbols and Punctuation
"𖿢𖿣𖿰𖿱" .. -- Ideographic Symbols and Punctuation
"㇀-㇯".. -- Strokes
"-㍿㋿" .. -- 組文字Strokes
"㋿㍻-㍿" .. -- 組文字
"㈠-㉇㊀-㊰㋀-㋋㍘-㍰㏠-㏾🈐-🈒🈔-🈻🉀-🉈🉐🉑🉠-🉥" ..
-- Saved as bytes to stop normalization on save.
"\239\164\128-\239\171\191" .. -- Compatibility Ideographs
"\240\175\160\128-\240\175\168\159" -- Compatibility Ideographs Supplement
),
varieties = {"Hanzi", "Kanji", "Hanja", "Chu Nom"},
systems = {"logography"},
spaces = false,
}
 
-- Script entry "Hans" (Simplified Han); reuses the character set of "Hani".
-- The line `systemsspaces = {m["logographyHani"}].spaces,` was two fields
-- fused into one (and not valid Lua); both are written out separately.
m["Hans"] = {
	canonicalName = "Simplified Han",
	m["Hani"][2],
	characters = m["Hani"].characters,
	systems = {"logography"},
	spaces = m["Hani"].spaces,
	parent = "Hani",
}
 
-- Script entry "Hant" (Traditional Han); reuses the character set of "Hani".
-- The line `systemsspaces = {m["logographyHani"}].spaces,` was two fields
-- fused into one (and not valid Lua); both are written out separately.
m["Hant"] = {
	canonicalName = "Traditional Han",
	m["Hani"][2],
	characters = m["Hani"].characters,
	systems = {"logography"},
	spaces = m["Hani"].spaces,
	parent = "Hani",
}
 
m["Hano"] = {
canonicalName = "Hanunoo",
"abugida",
characters = "ᜠ-᜴",
systems = {"abugida"},
}
 
m["Hatr"] = {
canonicalName = "Hatran",
"abjad",
characters = "𐣠-𐣿",
direction = "rtl",
systems = {"abjad"},
}
 
m["Hebr"] = {
canonicalName = "Hebrew",
"abjad", -- more precisely, impure abjad
characters = u(0x0590) .. "-" .. u(0x05FF) .. u(0xFB1D) .. "-" .. u(0xFB4F),
direction = "rtl",
systems = {"abjad"}, -- more precisely, impure abjad
}
 
-- Script entry "Hira" (Hiragana).
-- The line `systemsvarieties = {"syllabaryHentaigana"},` fused a `systems`
-- field with a second copy of `varieties`; `systems` is restored and the
-- duplicate `varieties` dropped.
m["Hira"] = {
	canonicalName = "Hiragana",
	"syllabary",
	varieties = {"Hentaigana"},
	characters = "ぁ-ゟ𛀁-𛄞𛅐𛅑𛅒🈀",
	systems = {"syllabary"},
	spaces = false,
}
 
m["Hluw"] = {
canonicalName = "Anatolian Hieroglyphs",
"logography, syllabary",
characters = "𔐀-𔙆",
wikipedia_article = "Anatolian hieroglyphs",
Line ၅၇၉ ⟶ ၆၂၀:
 
-- Script entry "Hmng".
-- The name line read `canonicalName"Pahawh = "Hmong",` (not valid Lua) and
-- `aliases` was given twice with different values. Two namings were fused:
--   canonicalName "Hmong" with alias "Pahawh Hmong", and
--   name "Pahawh Hmong" with alias "Hmong".
-- The first pairing is kept.
-- NOTE(review): confirm which name should be canonical.
m["Hmng"] = {
	canonicalName = "Hmong",
	"semisyllabary",
	aliases = {"Pahawh Hmong"},
	characters = "𖬀-𖮏",
}
 
m["Hmnp"] = {
"Nyiakeng Puachue Hmong",
"alphabet",
characters = "𞄀‎-𞅏",
}
 
m["Hung"] = {
canonicalName = "Old Hungarian",
"alphabet",
aliases = {"Hungarian runic"},
characters = "𐲀-𐲲",
Line ၅၉၃ ⟶ ၆၄၂:
 
m["Ibrn"] = {
canonicalName = "Iberian",
"semisyllabary",
}
 
m["Imag"] = {
-- To be used to avoid any formatting or link processing
canonicalName = "Image-rendered",
-- This should not have any characters listed
translit = false,
character_category = false,
}
 
m["Inds"] = {
canonicalName = "Indus",
aliases = {"Harappan", "Indus Valley"},
}
 
-- International Phonetic Alphabet entry.
-- The key read "IPAcharIpach", two identifiers ("IPAchar" and "Ipach") fused
-- together; the earlier one is kept.
-- NOTE(review): confirm which code the consumers of this table look up.
m["IPAchar"] = {
	canonicalName = "International Phonetic Alphabet",
	aliases = {"IPA"},
}
 
m["Ital"] = {
canonicalName = "Old Italic",
"alphabet",
characters = "𐌀-𐌯",
systems = {"alphabet"},
}
 
m["Java"] = {
canonicalName = "Javanese",
"abugida",
characters = "ꦀ-꧟",
systems = {"abugida"},
}
 
m["Jurc"] = {
canonicalName = "Jurchen",
spaces = false,
}
 
m["Kali"] = {
canonicalName = "Kayah Li",
"abugida",
characters = "꤀-꤯",
systems = {"abugida"},
}
 
m["Kana"] = {
canonicalName = "Katakana",
"syllabary",
characters = "゠-ヿㇰ-ㇿ㌀-㍗ヲ-゚𛀀𛅤𛅥𛅦𛅧",
spaces = false,
systems = {"syllabary"},
}
 
m["Kawi"] = {
canonicalName = "Kawi",
"abugida",
characters = "𑼀-𑽙",
systems = {"abugida"},
}
 
m["Khar"] = {
canonicalName = "Kharoshthi",
"abugida",
characters = "𐨀-𐩘",
systems = {"abugida"},
direction = "rtl",
}
 
m["Khmr"] = {
canonicalName = "Khmer",
"abugida",
characters = "ក-៹᧠-᧿",
characters = "ក-៝០-៩៰-៹᧠-᧿",
systems = {"abugida"},
spaces = false,
normalizationFixes = {
from = {"ឣ", "ឤ"},
Line ၆၆၅ ⟶ ၇၁၉:
 
m["Khoj"] = {
canonicalName = "Khojki",
"abugida",
characters = "𑈀-𑈾",
systems = {"abugida"},
normalizationFixes = {
from = {"𑈀𑈬𑈱", "𑈀𑈬", "𑈀𑈱", "𑈀𑈳", "𑈁𑈱", "𑈆𑈬", "𑈬𑈰", "𑈬𑈱", "𑉀𑈮"},
Line ၆၇၅ ⟶ ၇၂၉:
 
m["Kitl"] = {
canonicalName = "Khitan Large",
systems = {"logography", "syllabary"},
spaces = false,
}
 
m["Kits"] = {
canonicalName = "Khitan Small",
"logography, syllabary",
characters = "𘬀-𘳕"..u(0x16FE4),
spaces = false,
systems = {"logography", "syllabary"},
}
 
m["Knda"] = {
canonicalName = "Kannada",
"abugida",
characters = "ಀ-ೲ",
systems = {"abugida"},
normalizationFixes = {
from = {"ಉಾ", "ಋಾ", "ಒೌ"},
Line ၆၉၆ ⟶ ၇၅၂:
 
m["Kpel"] = {
canonicalName = "Kpelle",
systems = {"syllabary"},
-- Not in Unicode
}
 
m["Kthi"] = {
canonicalName = "Kaithi",
"abugida",
characters = "𑂀-𑃍",
systems = {"abugida"},
}
 
-- Script entry "Lana" (Tai Tham).
-- The line `systemsspaces = {"abugida"}false,` was two fields fused into one
-- (and not valid Lua); both are written out separately.
m["Lana"] = {
	canonicalName = "Tai Tham",
	"abugida",
	aliases = {"Tham", "Tua Mueang", "Lanna"},
	characters = "ᨠ-ᩞ᩠-᩿᩼᪀-᪉᪐-᪙᪠-᪭",
	systems = {"abugida"},
	spaces = false,
}
 
-- Script entry "Laoo" (Lao).
-- `characters` was assigned twice with different values. Lua leaves the order
-- of assignments in a table constructor undefined, so which one won was not
-- guaranteed. The first (block-wide) range is kept; the other value was
--   "ກຂຄຆ-ຊຌ-ຣລວ-ຽເ-ໄໆ່-໎໐-໙ໜ-ໟ"
-- NOTE(review): switch to the narrower set if unassigned code points must be
-- excluded.
m["Laoo"] = {
	canonicalName = "Lao",
	"abugida",
	characters = "ກ-ໟ",
	systems = {"abugida"},
	spaces = false,
}
 
-- Script entry "Latn" (Latin). Other entries in this file copy its
-- `characters`, `capitalized` and `translit` fields.
-- `varieties` appeared twice with the same value; it is listed once here.
m["Latn"] = {
	canonicalName = "Latin",
	"alphabet",
	aliases = {"Roman"},
	varieties = {"Rumi", "Romaji", "Rōmaji", "Romaja"},
	characters = "A-Za-zªºÀ-ÖØ-öø-ɏḀ-ỿ",
	capitalized = true,
	translit = false,
	systems = {"alphabet"},
}
 
-- Script entry "Latf" (Fraktur); copies its character data from "Latn".
-- `otherNames` appeared twice with the same value; it is listed once here.
m["Latf"] = {
	canonicalName = "Fraktur",
	m["Latn"][2],
	otherNames = {"Blackletter"}, -- Blackletter is actually the parent "script"
	characters = m["Latn"].characters,
	capitalized = m["Latn"].capitalized,
	translit = m["Latn"].translit,
	parent = "Latn",
}
-- Script entry "Latg" (Gaelic); copies its character data from "Latn".
-- `otherNames` appeared twice with the same value; it is listed once here.
m["Latg"] = {
	canonicalName = "Gaelic",
	m["Latn"][2],
	otherNames = {"Irish"},
	characters = m["Latn"].characters,
	capitalized = m["Latn"].capitalized,
	translit = m["Latn"].translit,
	parent = "Latn",
}
 
-- Extended Latin: the "Latn" character set plus the additional ranges
-- appended below.
-- The key read "LatinxLatnx", two identifiers ("Latinx" and "Latnx") fused
-- together; the earlier one is kept.
-- NOTE(review): confirm which code the consumers of this table look up.
m["Latinx"] = {
	canonicalName = "Latin",
	m["Latn"][2],
	characters = m["Latn"].characters .. "ɐ-ʸˠ-ˤᴀ-ᴥᴬ-ᵜᵢ-ᵥᵫ-ᵷᵹ-ᶾⁱⁿₐ-ₜKÅℲⅎⅠ-ↈⱠ-ⱿꜢ-ꞇꞋ-ꟊꟐꟑꟓꟕ-ꟙꟲ-ꟿꬰ-ꭚꭜ-ꭤꭦ-ꭩff-stA-Za-z𐞀-𐞅𐞇-𐞰𐞲-𐞺𝼀-𝼞𝼥-𝼪",
	capitalized = m["Latn"].capitalized,
	translit = m["Latn"].translit,
	parent = "Latn",
}
 
m["pjt-Latn"] = {
canonicalName = "Latin",
m["Latn"][2],
characters = m["Latn"].characters,
capitalized = m["Latn"].capitalized,
translit = m["Latn"].translit,
parent = "Latn",
}
 
m["Leke"] = {
canonicalName = "Leke",
systems = {"abugida"},
}
 
m["Lepc"] = {
canonicalName = "Lepcha",
"abugida",
characters = "ᰀ-ᱏ",
systems = {"abugida"},
}
 
m["Limb"] = {
canonicalName = "Limbu",
"abugida",
characters = "ᤀ-᥏",
systems = {"abugida"},
}
 
m["Lina"] = {
canonicalName = "Linear A",
characters = "𐘀-𐝧",
}
 
m["Linb"] = {
canonicalName = "Linear B",
characters = "𐀀-𐃺",
}
 
-- Script entry "Lisu".
-- `systems` had ended up inside `normalizationFixes`, where it sat next to the
-- from/to lists instead of describing the script; it is moved to the entry
-- itself, matching every other entry in this file.
m["Lisu"] = {
	canonicalName = "Lisu",
	"alphabet",
	aliases = {"Fraser"},
	characters = "ꓐ-꓿𑾰",
	systems = {"alphabet"},
	-- Parallel lists: from[i] is paired with to[i].
	normalizationFixes = {
		from = {"['’]", "[.ꓸ][.ꓸ]", "[.ꓸ][,ꓹ]"},
		to = {"ʼ", "ꓺ", "ꓻ"}
	},
}
 
m["Loma"] = {
canonicalName = "Loma",
systems = {"syllabary"},
-- Not in Unicode
}
 
m["Lyci"] = {
canonicalName = "Lycian",
"alphabet",
characters = "𐊀-𐊜",
systems = {"alphabet"},
}
 
m["Lydi"] = {
canonicalName = "Lydian",
"alphabet",
characters = "𐤠-𐤿",
direction = "rtl",
systems = {"alphabet"},
}
 
m["Mahj"] = {
canonicalName = "Mahajani",
"abugida",
characters = "𑅐-𑅶",
systems = {"abugida"},
}
 
m["Maka"] = {
canonicalName = "Lontara",
"abugida",
aliases = {"Makasar"},
characters = "𑻠-𑻸",
systems = {"abugida"},
}
 
m["Mand"] = {
canonicalName = "Mandaic",
aliases = {"Mandaean"},
characters = "ࡀ-࡞",
Line ၈၃၂ ⟶ ၉၀၄:
 
m["Mani"] = {
canonicalName = "Manichaean",
"abjad",
characters = "𐫀-𐫶",
direction = "rtl",
systems = {"abjad"},
}
 
m["Marc"] = {
canonicalName = "Marchen",
"abugida",
characters = "𑱰-𑲶",
systems = {"abugida"},
}
 
m["Maya"] = {
canonicalName = "Maya",
aliases = {"Maya hieroglyphic", "Mayan", "Mayan hieroglyphic"},
characters = "𝋠-𝋳",
Line ၈၅၁ ⟶ ၉၂၃:
 
m["Medf"] = {
canonicalName = "Medefaidrin",
aliases = {"Oberi Okaime", "Oberi Ɔkaimɛ"},
characters = "𖹀-𖺚",
Line ၈၅၈ ⟶ ၉၃၀:
 
m["Mend"] = {
canonicalName = "Mende",
aliases = {"Mende Kikakui"},
characters = "𞠀-𞣖",
Line ၈၆၅ ⟶ ၉၃၇:
 
m["Merc"] = {
canonicalName = "Meroitic cursive",
"abugida",
characters = "𐦠-𐦿",
direction = "rtl",
systems = {"abugida"},
}
 
m["Mero"] = {
canonicalName = "Meroitic hieroglyphic",
"abugida",
characters = "𐦀-𐦟",
direction = "rtl",
systems = {"abugida"},
}
 
m["Mlym"] = {
canonicalName = "Malayalam",
"abugida",
characters = "ഀ-ൿ",
systems = {"abugida"},
normalizationFixes = {
from = {"ഇൗ", "ഉൗ", "എെ", "ഒാ", "ഒൗ", "ക്‍", "ണ്‍", "ന്‍റ", "ന്‍", "മ്‍", "യ്‍", "ര്‍", "ല്‍", "ള്‍", "ഴ്‍", "െെ", "ൻ്റ"},
Line ၈၈၉ ⟶ ၉၆၁:
 
m["Modi"] = {
canonicalName = "Modi",
"abugida",
characters = "𑘀-𑙙",
systems = {"abugida"},
normalizationFixes = {
from = {"𑘀𑘹", "𑘀𑘺", "𑘁𑘹", "𑘁𑘺"},
Line ၈၉၉ ⟶ ၉၇၁:
 
m["Mong"] = {
canonicalName = "Mongolian",
"alphabet",
aliases = {"Mongol bichig", "Hudum Mongol bichig"},
characters = "᠀-᠅᠊-᠙ᠠ-ᡂᡸᢀ-ᢗᢦᢩ‌‍ 𑙠-𑙨",
direction = "down",
systems = {"alphabet"},
}
 
m["mnc-Mong"] = {
canonicalName = "Manchu",
m["Mong"][2],
characters = "᠁᠄᠈-᠏ᠠᠣᠨ-ᠪᠮ-ᠰᠴ-ᠸᠺᡝᡟ-ᡡᡤ-ᡩᡬ-ᡱᡳ-ᡷᢀ-ᢈᢏᢚ-ᢥᢨᢪ‌‍ ",
direction = "down",
systems = {"alphabet"},
parent = "Mong",
}
m["sjo-Mong"] = {
canonicalName = "Xibe",
m["Mong"][2],
aliases = {"Sibe"},
characters = "᠄᠇᠊-᠏ᠠᠣᠨᠪᠮ-ᠰᠴ-ᠸᠺᡝ-ᡲ‌‍ ",
direction = "down",
systems = {"alphabet"},
parent = "mnc-Mong",
}
m["xwo-Mong"] = {
canonicalName = "Clear Script",
m["Mong"][2],
aliases = {"Todo", "Todo bichig"},
characters = "᠀᠁᠄-᠆᠊-ᠠᠨᠯ-ᠱᠴᠷᠸᠺᠻᡀᡃ-ᡜᢀ-ᢇᢉ-ᢏᢔᢖ-ᢙᢧ‌‍ 𑙩-𑙬",
direction = "down",
systems = {"alphabet"},
parent = "Mong",
}
 
m["Moon"] = {
canonicalName = "Moon",
"alphabet",
aliases = {"Moon System of Embossed Reading", "Moon type", "Moon writing", "Moon alphabet", "Moon code"},
systems = {"alphabet"},
-- Not in Unicode
}
 
m["Morse"] = {
canonicalName = "Morse code",
}
 
m["Mroo"] = {
canonicalName = "Mro",
characters = "𖩀-𖩯",
}
 
m["Mtei"] = {
canonicalName = "Meitei Mayek",
"abugida",
aliases = {"Meetei Mayek", "Manipuri"},
characters = "ꯀ-꯹ꫠ-꫶",
systems = {"abugida"},
}
 
m["Mult"] = {
canonicalName = "Multani",
"abugida",
characters = "𑊀-𑊩",
systems = {"abugida"},
}
 
-- Musical notation entry.
-- The key read "musicalMusic", two identifiers ("musical" and "Music") fused
-- together; the earlier one is kept.
-- NOTE(review): confirm which code the consumers of this table look up.
m["musical"] = {
	canonicalName = "Musical notation",
	"pictography",
	characters = "𝄀-𝇨",
	translit = false,
	systems = {"pictography"},
}
 
-- Script entry "Mymr" (Burmese / Myanmar).
-- The line `systemsspaces = {"abugida"}false,` was two fields fused into one
-- (and not valid Lua); both are written out separately.
m["Mymr"] = {
	"Burmese",
	canonicalName = "မန်း",
	"abugida",
	aliases = {"Myanmar"},
	characters = "က-႟ꩠ-ꩿꧠ-ꧾ",
	systems = {"abugida"},
	spaces = false,
}
 
m["Nagm"] = {
canonicalName = "Nag Mundari",
"alphabet",
characters = "𞓐-𞓹",
systems = {"alphabet"},
}
 
m["Nand"] = {
canonicalName = "Nandinagari",
"abugida",
characters = "𑦠-𑧤",
systems = {"abugida"},
}
 
m["Narb"] = {
canonicalName = "Old North Arabian",
"abjad",
characters = "𐪀-𐪟",
direction = "rtl",
systems = {"abjad"},
}
 
m["Nbat"] = {
canonicalName = "Nabataean",
"abjad",
aliases = {"Nabatean"},
characters = "𐢀-𐢯",
direction = "rtl",
systems = {"abjad"},
}
 
m["Newa"] = {
canonicalName = "Newa",
"abugida",
aliases = {"Newar", "Newari", "Prachalit Nepal"},
characters = "𑐀-𑑡",
systems = {"abugida"},
}
 
m["Nkdb"] = {
canonicalName = "Naxi Dongba",
systems = {"pictography"},
aliases = {"Naxi Dongba", "Nakhi Dongba", "Tomba", "Tompa", "Mo-so"},
spaces = false,
-- Not in Unicode
}
 
m["Nkgb"] = {
canonicalName = "Nakhi Geba",
systems = {"syllabary"},
aliases = {"Nakhi Geba", "Naxi Geba"},
spaces = false,
-- Not in Unicode
}
 
m["Nkoo"] = {
canonicalName = "N'Ko",
"alphabet",
characters = "߀-߿",
direction = "rtl",
systems = {"alphabet"},
}
 
-- Placeholder entry "None" for text with no specified script.
-- The line `character_categorytranslit = false, -- none` fused two field
-- names (it would have created a field called `character_categorytranslit`),
-- and `character_category` was then repeated. Each field is listed once.
m["None"] = {
	canonicalName = "Unspecified", -- renders as 'unspecified script'
	-- This should not have any characters listed
	translit = false,
	character_category = false, -- none
}
 
m["Nshu"] = {
canonicalName = "Nüshu",
"syllabary",
aliases = {"Nushu"},
characters = "𖿡𛅰-𛋻",
spaces = false,
systems = {"syllabary"},
}
 
m["Ogam"] = {
canonicalName = "Ogham",
characters = " -᚜",
}
 
m["Olck"] = {
canonicalName = "Ol Chiki",
characters = "᱐-᱿",
}
 
m["Orkh"] = {
canonicalName = "Orkhon runes",
aliases = {"Old Turkic"},
characters = "𐰀-𐱈",
direction = "rtl",
Line ၁၀၅၇ ⟶ ၁၁၃၈:
 
m["Orya"] = {
canonicalName = "Oriya",
"abugida",
aliases = {"Odia"},
characters = "ଁ-୷",
systems = {"abugida"},
normalizationFixes = {
from = {"ଅା", "ଏୗ", "ଓୗ"},
Line ၁၀၆၈ ⟶ ၁၁၄၉:
 
m["Osge"] = {
canonicalName = "Osage",
characters = "𐒰-𐓻",
capitalized = true,
Line ၁၀၇၄ ⟶ ၁၁၅၅:
 
m["Osma"] = {
canonicalName = "Osmanya",
characters = "𐒀-𐒩",
}
 
m["Ougr"] = {
canonicalName = "Old Uyghur",
"abjad, alphabet",
characters = "𐽰-𐾉",
direction = "down",
systems = {"abjad", "alphabet"},
}
 
m["Palm"] = {
canonicalName = "Palmyrene",
characters = "𐡠-𐡿",
direction = "rtl",
Line ၁၀၉၂ ⟶ ၁၁၇၃:
 
m["Pauc"] = {
canonicalName = "Pau Cin Hau",
characters = "𑫀-𑫸",
}
 
m["Perm"] = {
canonicalName = "Old Permic",
characters = "𐍐-𐍺",
}
 
m["Phag"] = {
canonicalName = "Phags-pa",
"abugida",
characters = "᠂᠃᠅‌‍ 。ꡀ-꡷",
direction = "down",
systems = {"abugida"},
}
 
m["Phli"] = {
canonicalName = "Inscriptional Pahlavi",
"abjad",
characters = "𐭠-𐭿",
direction = "rtl",
systems = {"abjad"},
}
 
m["Phlp"] = {
canonicalName = "Psalter Pahlavi",
"abjad",
characters = "𐮀-𐮯",
direction = "rtl",
systems = {"abjad"},
}
 
m["Phlv"] = {
canonicalName = "Book Pahlavi",
"abjad",
direction = "rtl",
systems = {"abjad"},
-- Not in Unicode
}
 
m["Phnx"] = {
canonicalName = "Phoenician",
"abjad",
characters = "𐤀-𐤟",
direction = "rtl",
systems = {"abjad"},
}
 
m["Plrd"] = {
canonicalName = "Pollard",
"abugida",
aliases = {"Miao"},
characters = "𖼀-𖾟",
systems = {"abugida"},
}
 
m["Prti"] = {
canonicalName = "Inscriptional Parthian",
characters = "𐭀-𐭟",
direction = "rtl",
Line ၁၁၄၉ ⟶ ၁၂၃၁:
 
m["Ranj"] = {
canonicalName = "Ranjana",
systems = {"abugida"},
-- Not in Unicode
}
 
m["Rjng"] = {
canonicalName = "Rejang",
"abugida",
characters = "ꤰ-꥟",
systems = {"abugida"},
}
 
m["Rohg"] = {
canonicalName = "Hanifi Rohingya",
"alphabet",
characters = "𐴀-𐴹",
direction = "rtl",
systems = {"alphabet"},
}
 
m["Roro"] = {
canonicalName = "Rongorongo",
-- Not in Unicode
}
 
m["RuminumeralsRumin"] = {
canonicalName = "Rumi numerals",
characters = "𐹠-𐹾",
character_category = "Rumi numerals",
Line ၁၁၇၉ ⟶ ၁၂၆၁:
 
m["Runr"] = {
canonicalName = "Runic",
"alphabet",
characters = "ᚠ-ᛰ",
systems = {"alphabet"},
}
 
m["Samr"] = {
canonicalName = "Samaritan",
"abjad",
characters = "ࠀ-࠾",
direction = "rtl",
systems = {"abjad"},
}
 
m["Sarb"] = {
canonicalName = "Old South Arabian",
"abjad",
characters = "𐩠-𐩿",
direction = "rtl",
systems = {"abjad"},
}
 
m["Saur"] = {
canonicalName = "Saurashtra",
"abugida",
characters = "ꢀ-꣙",
systems = {"abugida"},
}
 
m["Semap"] = {
canonicalName = "flag semaphore",
systems = {"pictography"},
}
 
m["Sgnw"] = {
canonicalName = "SignWriting",
"pictography",
characters = "𝠀-𝪯",
translit = false,
systems = {"pictography"},
}
 
m["Shaw"] = {
canonicalName = "Shavian",
characters = "𐑐-𐑿",
}
 
m["Shrd"] = {
canonicalName = "Sharada",
"abugida",
characters = "𑆀-𑇙",
systems = {"abugida"},
}
 
m["Shui"] = {
canonicalName = "Sui",
systems = {"logography"},
spaces = false,
-- Not in Unicode
}
 
m["Sidd"] = {
canonicalName = "Siddham",
"abugida",
characters = "𑖀-𑗝",
systems = {"abugida"},
}
 
m["Sind"] = {
canonicalName = "Khudawadi",
"abugida",
characters = "𑊰-𑋹",
systems = {"abugida"},
normalizationFixes = {
from = {"𑊰𑋠", "𑊰𑋥", "𑊰𑋦", "𑊰𑋧", "𑊰𑋨"},
Line ၁၂၄၉ ⟶ ၁၃၃၃:
 
m["Sinh"] = {
canonicalName = "Sinhalese",
"abugida",
aliases = {"Sinhala"},
characters = "ං-෴",
systems = {"abugida"},
normalizationFixes = {
from = {"අා", "අැ", "අෑ", "උෟ", "ඍෘ", "ඏෟ", "එ්", "එෙ", "ඔෟ", "ෘෘ"},
Line ၁၂၆၀ ⟶ ၁၃၄၄:
 
m["Sogd"] = {
canonicalName = "Sogdian",
"abjad",
characters = "𐼰-𐽙",
direction = "rtl",
systems = {"abjad"},
}
 
m["Sogo"] = {
canonicalName = "Old Sogdian",
"abjad",
characters = "𐼀-𐼧",
direction = "rtl",
systems = {"abjad"},
}
 
m["Sora"] = {
canonicalName = "Sorang Sompeng",
aliases = {"Sora Sompeng"},
characters = "𑃐-𑃹",
Line ၁၂၈၀ ⟶ ၁၃၆၄:
 
m["Soyo"] = {
canonicalName = "Soyombo",
"abugida",
characters = "𑩐-𑪢",
systems = {"abugida"},
}
 
m["Sund"] = {
canonicalName = "Sundanese",
"abugida",
characters = "ᮀ-ᮿ",
systems = {"abugida"},
}
 
m["Sylo"] = {
canonicalName = "Syloti Nagri",
"abugida",
aliases = {"Sylheti Nagari"},
characters = "ꠀ-꠫",
systems = {"abugida"},
}
 
m["Syrc"] = {
canonicalName = "Syriac",
"abjad", -- more precisely, impure abjad
characters = "܀-ݏ"..u(0x0860).."-"..u(0x086A),
direction = "rtl",
systems = {"abjad"}, -- more precisely, impure abjad
}
 
Line ၁၃၀၈ ⟶ ၁၃၉၂:
 
m["Tagb"] = {
canonicalName = "Tagbanwa",
"abugida",
characters = "ᝠ-ᝳ",
systems = {"abugida"},
}
 
m["Takr"] = {
canonicalName = "Takri",
"abugida",
characters = "𑚀-𑛉",
systems = {"abugida"},
normalizationFixes = {
from = {"𑚀𑚭", "𑚀𑚴", "𑚀𑚵", "𑚆𑚲"},
Line ၁၃၂၄ ⟶ ၁၄၀၈:
 
-- Script entry "Tale" (Tai Nüa).
-- The line `systemsspaces = {"abugida"}false,` was two fields fused into one
-- (and not valid Lua); both are written out separately.
m["Tale"] = {
	canonicalName = "Tai Nüa",
	"abugida",
	aliases = {"Tai Nuea", "New Tai Nüa", "New Tai Nuea", "Dehong Dai", "Tai Dehong", "Tai Le"},
	characters = "ᥐ-ᥭᥰ-ᥴ",
	systems = {"abugida"},
	spaces = false,
}
 
-- Script entry "Talu" (New Tai Lue).
-- `characters` was assigned twice with different values. Lua leaves the order
-- of assignments in a table constructor undefined, so which one won was not
-- guaranteed. The first (block-wide) range is kept; the other value was
--   "ᦀ-ᦫᦰ-ᧉ᧐-᧚᧞᧟"
-- NOTE(review): switch to the narrower set if unassigned code points must be
-- excluded.
m["Talu"] = {
	canonicalName = "New Tai Lue",
	"abugida",
	characters = "ᦀ-᧟",
	systems = {"abugida"},
	spaces = false,
}
 
m["Taml"] = {
canonicalName = "Tamil",
"abugida",
characters = "ஂ-௺𑿀-𑿿",
systems = {"abugida"},
normalizationFixes = {
from = {"அூ", "ஸ்ரீ"},
Line ၁၃၄၇ ⟶ ၁၄၃၃:
 
m["Tang"] = {
canonicalName = "Tangut",
"logography, syllabary",
characters = "𖿠𗀀-𘫿𘴀-𘴈",
spaces = false,
systems = {"logography", "syllabary"},
}
 
-- Script entry "Tavt" (Tai Viet).
-- The line `systemscharacters = {"abugidaꪀ-ꫂꫛ-꫟"},` fused a `systems` field
-- with a second `characters` value (it would have created a field called
-- `systemscharacters`). `systems` is restored and the first `characters`
-- range kept; the other value was
--   "ꪀ-ꫂꫛ-꫟"
-- NOTE(review): switch to the narrower set if unassigned code points must be
-- excluded.
m["Tavt"] = {
	canonicalName = "Tai Viet",
	"abugida",
	characters = "ꪀ-꫟",
	systems = {"abugida"},
	spaces = false,
}
 
m["Telu"] = {
canonicalName = "Telugu",
"abugida",
characters = "ఀ-౿",
systems = {"abugida"},
normalizationFixes = {
from = {"ఒౌ", "ఒౕ", "ిౕ", "ెౕ", "ొౕ"},
Line ၁၃၆၉ ⟶ ၁၄၅၇:
 
m["Teng"] = {
canonicalName = "Tengwar",
}
 
-- Script entry "Tfng" (Tifinagh).
-- `otherNames` appeared twice with the same value; it is listed once here.
m["Tfng"] = {
	canonicalName = "Tifinagh",
	"abjad, alphabet",
	otherNames = {"Libyco-Berber", "Berber"}, -- per Wikipedia, Libyco-Berber is the parent
	characters = "ⴰ-⵿",
	systems = {"abjad", "alphabet"},
}
 
m["Tglg"] = {
canonicalName = "Baybayin",
"abugida",
aliases = {"Tagalog"},
characters = "ᜀ-᜔",
systems = {"abugida"},
}
 
m["Thaa"] = {
canonicalName = "Thaana",
"abugida",
characters = "ހ-ޱ",
systems = {"abugida"},
direction = "rtl",
}
 
-- Script entry "Thai".
-- The line `systemscharacters = {"abugidaก-ฺเ-๛"},` fused a `systems` field
-- with a second `characters` value (it would have created a field called
-- `systemscharacters`). `systems` is restored and the first `characters`
-- range kept; the other value was
--   "ก-ฺเ-๛"
-- NOTE(review): switch to the narrower set if unassigned code points must be
-- excluded.
m["Thai"] = {
	canonicalName = "Thai",
	"abugida",
	characters = "ก-๛",
	systems = {"abugida"},
	spaces = false,
}
 
m["Tibt"] = {
canonicalName = "Tibetan",
"abugida",
characters = "ༀ-࿚",
systems = {"abugida"},
normalizationFixes = {
combiningClasses = {["༹"] = 1},
Line ၁၄၁၁ ⟶ ၁၅၀၀:
 
m["sit-tam-Tibt"] = {
canonicalName = "Tamyig",
m["Tibt"][2],
characters = m["Tibt"].characters,
systems = {"abugida"},
parent = "Tibt",
normalizationFixes = m["Tibt"].normalizationFixes,
Line ၁၄၁၉ ⟶ ၁၅၀၈:
 
m["xzh-Tibt"] = {
canonicalName = "Zhang-Zhung",
m["Tibt"][2],
systems = {"abugida"},
characters = m["Tibt"].characters,
parent = "Tibt",
normalizationFixes = m["Tibt"].normalizationFixes,
Line ၁၄၂၆ ⟶ ၁၅၁၆:
 
m["Tirh"] = {
canonicalName = "Tirhuta",
"abugida",
characters = "𑒀-𑓙",
systems = {"abugida"},
normalizationFixes = {
from = {"𑒁𑒰", "𑒋𑒺", "𑒍𑒺", "𑒪𑒵", "𑒪𑒶"},
Line ၁၄၃၆ ⟶ ၁၅၂၆:
 
m["Tnsa"] = {
canonicalName = "Tangsa",
"alphabet",
characters = "𖩰-𖫉",
systems = {"alphabet"},
}
 
m["Toto"] = {
canonicalName = "Toto",
"abugida",
characters = "𞊐-𞊮",
systems = {"abugida"},
}
 
m["Ugar"] = {
canonicalName = "Ugaritic",
"abjad",
characters = "𐎀-𐎟",
systems = {"abjad"},
}
 
m["Vaii"] = {
canonicalName = "Vai",
"syllabary",
characters = "ꔀ-ꘫ",
systems = {"syllabary"},
}
 
m["Visp"] = {
canonicalName = "Visible Speech",
systems = {"alphabet"},
-- Not in Unicode
}
 
m["Vith"] = {
canonicalName = "Vithkuqi",
"alphabet",
characters = "𐕰-𐖼",
capitalized = true,
systems = {"alphabet"},
}
 
m["Wara"] = {
canonicalName = "Varang Kshiti",
aliases = {"Warang Citi"},
characters = "𑢠-𑣿",
capitalized = true,
Line ၁၄၇၉ ⟶ ၁၅၇၀:
 
m["Wcho"] = {
canonicalName = "Wancho",
"alphabet",
characters = "𞋀-𞋿",
systems = {"alphabet"},
}
 
m["Wole"] = {
canonicalName = "Woleai",
systems = {"syllabary"},
-- Not in Unicode
}
 
m["Xpeo"] = {
canonicalName = "Old Persian",
characters = "𐎠-𐏕",
}
 
m["Xsux"] = {
canonicalName = "Cuneiform",
aliases = {"Sumero-Akkadian Cuneiform"},
characters = "𒀀-𒎙𒐀-𒑳",
}
 
m["Yezi"] = {
"Yezidi",
"alphabet",
characters = "𐺀-𐺱",
direction = "rtl",
}
 
m["Yiii"] = {
canonicalName = "Yi",
"syllabary",
characters = "ꀀ-꓆",
systems = {"syllabary"},
}
 
m["Zanb"] = {
canonicalName = "Zanabazar Square",
characters = u(0x11A00).."-"..u(0x11A47),
}
 
m["Zmth"] = {
canonicalName = "mathematical notation",
characters = "ℵ∀-⋿⟀-⟯⦀-⫿𝐀-𝟿",
translit = false,
character_category = "Mathematical notation symbols", -- ?
}
 
m["Zsym"] = {
canonicalName = "symbol",
"pictography",
characters = "─-➿←-⇿⌀-⏿⬀-⯾🀀-🃵🌀-🩭",
translit = false,
character_category = false, -- none
systems = {"pictography"},
}
 
m["Zyyy"] = {
canonicalName = "undetermined",
-- This should not have any characters listed, probably
translit = false,
character_category = false, -- none
characters = m["Latn"].characters,
}
 
m["Zzzz"] = {
canonicalName = "uncoded",
-- This should not have any characters listed
translit = false,
character_category = false, -- none
}
 
-- These should be defined after the scripts they are composed of.
 
m["Hrkt"] = { -- TODO: add hentaigana
"Kana",
"syllabary",
aliases = {"Japanese syllabaries"},
characters = m["Hira"].characters .. m["Kana"].characters,
spaces = false,
}
 
-- Script entry "Jpan" (Japanese): the union of the Hiragana, Katakana, Han
-- and Latin character sets. It has to come after those entries because it
-- reads their `characters` fields while this table is being built.
-- `characters` was assigned twice. The second value indexed m["Latnx"], which
-- is not a key defined in this file as written, so evaluating it would raise
-- an "attempt to index a nil value" error. The first value, which only uses
-- keys that exist, is kept.
m["Jpan"] = {
	canonicalName = "Japanese",
	"logography, syllabary",
	characters = m["Hira"].characters .. m["Kana"].characters .. m["Hani"].characters .. m["Latn"].characters,
	systems = {"syllabary", "logography"},
	spaces = false,
	sort_by_scraping = true,
}
 
m["Kore"] = {
canonicalName = "Korean",
"logography, syllabary",
characters = m["Hang"].characters .. m["Hani"].characters,
systems = {"syllabary", "logography"},
}