မော်ဂျူး:scripts/data: ခြပ်ချော်ꩻမုꩻခါႏ ဗိုန်ပီတဝ်းဒါႏဖိုင်ႏ
အပွိုင်အငုဲင်ꩻ
Content deleted Content added
အရေꩻတန်တဝ်း ၂ revisions imported: [TEST] importing blkwiktionary via a tool |
No edit summary လိတ်တွယ်ꩻ: နောက်ပြန်ပြင်ခဲ့ပြီး |
||
လိတ်ရဲဉ်ႏ ၁: | လိတ်ရဲဉ်ႏ ၁: | ||
--[=[ |
--[=[ |
||
When adding new scripts to this file, please don't forget to add |
When adding new scripts to this file, please don't forget to add |
||
style definitions for the script in [[ |
style definitions for the script in [[MediaWiki:Common.css]]. |
||
]=] |
]=] |
||
local u = mw.ustring.char |
|||
local u = mw.ustring.char |
|||
local m = {} |
local m = {} |
||
local u = mw.ustring.char |
|||
m["Adlm"] = { |
m["Adlm"] = { |
||
"Adlam", |
|||
"alphabet", |
|||
characters = "؟ـ𞤀-𞥟", |
characters = "؟ـ𞤀-𞥟", |
||
capitalized = true, |
capitalized = true, |
||
လိတ်ရဲဉ်ႏ ၁၆: | လိတ်ရဲဉ်ႏ ၁၆: | ||
m["Afak"] = { |
m["Afak"] = { |
||
"Afaka", |
|||
"syllabary", |
|||
} |
} |
||
m["Aghb"] = { |
m["Aghb"] = { |
||
"Caucasian Albanian", |
|||
"alphabet", |
|||
characters = "𐔰-𐕯", |
characters = "𐔰-𐕯", |
||
} |
} |
||
m["Ahom"] = { |
m["Ahom"] = { |
||
"Ahom", |
|||
"abugida", |
|||
characters = "𑜀-", |
characters = "𑜀-", |
||
systems = {"abugida"}, |
|||
} |
} |
||
m["Arab"] = { |
m["Arab"] = { |
||
"Arabic", |
|||
"abjad", -- more precisely, impure abjad |
|||
varieties = {"Jawi", {"Nastaliq", "Nastaleeq"}}, |
varieties = {"Jawi", {"Nastaliq", "Nastaleeq"}}, |
||
characters = "-ۿݐ-ݿࡰ-ࣿﭐ-﷏ﷰ-﷿ﹰ-𐋠-𐋻𐹠--𐻿𞸀-", |
characters = "-ۿݐ-ݿࡰ-ࣿﭐ-﷏ﷰ-﷿ﹰ-𐋠-𐋻𐹠--𐻿𞸀-", |
||
direction = "rtl", |
direction = "rtl", |
||
systems = {"abjad"}, -- more precisely, impure abjad |
|||
normalizationFixes = { |
normalizationFixes = { |
||
from = {"ٳ"}, |
from = {"ٳ"}, |
||
လိတ်ရဲဉ်ႏ ၄၃: | လိတ်ရဲဉ်ႏ ၄၅: | ||
m["fa-Arab"] = { |
m["fa-Arab"] = { |
||
"Arabic", |
|||
m["Arab"][2], |
|||
otherNames = {"Perso-Arabic"}, |
|||
characters = m["Arab"].characters, |
characters = m["Arab"].characters, |
||
otherNames = {"Perso-Arabic"}, |
|||
direction = "rtl", |
direction = "rtl", |
||
parent = "Arab", |
parent = "Arab", |
||
လိတ်ရဲဉ်ႏ ၅၂: | လိတ်ရဲဉ်ႏ ၅၅: | ||
m["kk-Arab"] = { |
m["kk-Arab"] = { |
||
"Arabic", |
|||
m["Arab"][2], |
|||
characters = m["Arab"].characters, |
characters = m["Arab"].characters, |
||
direction = "rtl", |
direction = "rtl", |
||
လိတ်ရဲဉ်ႏ ၆၀: | လိတ်ရဲဉ်ႏ ၆၄: | ||
m["ks-Arab"] = { |
m["ks-Arab"] = { |
||
"Arabic", |
|||
m["Arab"][2], |
|||
characters = m["Arab"].characters, |
characters = m["Arab"].characters, |
||
direction = "rtl", |
direction = "rtl", |
||
လိတ်ရဲဉ်ႏ ၆၈: | လိတ်ရဲဉ်ႏ ၇၃: | ||
m["ku-Arab"] = { |
m["ku-Arab"] = { |
||
"Arabic", |
|||
m["Arab"][2], |
|||
characters = m["Arab"].characters, |
characters = m["Arab"].characters, |
||
direction = "rtl", |
direction = "rtl", |
||
လိတ်ရဲဉ်ႏ ၇၆: | လိတ်ရဲဉ်ႏ ၈၂: | ||
m["ms-Arab"] = { |
m["ms-Arab"] = { |
||
"Arabic", |
|||
m["Arab"][2], |
|||
characters = m["Arab"].characters, |
characters = m["Arab"].characters, |
||
direction = "rtl", |
direction = "rtl", |
||
လိတ်ရဲဉ်ႏ ၈၄: | လိတ်ရဲဉ်ႏ ၉၁: | ||
m["mzn-Arab"] = { |
m["mzn-Arab"] = { |
||
"Arabic", |
|||
m["Arab"][2], |
|||
characters = m["Arab"].characters, |
characters = m["Arab"].characters, |
||
direction = "rtl", |
direction = "rtl", |
||
လိတ်ရဲဉ်ႏ ၉၂: | လိတ်ရဲဉ်ႏ ၁၀၀: | ||
m["ota-Arab"] = { |
m["ota-Arab"] = { |
||
"Arabic", |
|||
m["Arab"][2], |
|||
characters = m["Arab"].characters, |
characters = m["Arab"].characters, |
||
direction = "rtl", |
direction = "rtl", |
||
လိတ်ရဲဉ်ႏ ၁၀၀: | လိတ်ရဲဉ်ႏ ၁၀၉: | ||
m["pa-Arab"] = { |
m["pa-Arab"] = { |
||
"Shahmukhi", |
|||
m["Arab"][2], |
|||
otherNames = {"Arabic"}, |
|||
characters = m["Arab"].characters, |
characters = m["Arab"].characters, |
||
otherNames = {"Arabic"}, |
|||
direction = "rtl", |
direction = "rtl", |
||
parent = "Arab", |
parent = "Arab", |
||
လိတ်ရဲဉ်ႏ ၁၀၉: | လိတ်ရဲဉ်ႏ ၁၁၉: | ||
m["ps-Arab"] = { |
m["ps-Arab"] = { |
||
"Arabic", |
|||
m["Arab"][2], |
|||
characters = m["Arab"].characters, |
characters = m["Arab"].characters, |
||
direction = "rtl", |
direction = "rtl", |
||
လိတ်ရဲဉ်ႏ ၁၁၇: | လိတ်ရဲဉ်ႏ ၁၂၈: | ||
m["sd-Arab"] = { |
m["sd-Arab"] = { |
||
"Arabic", |
|||
m["Arab"][2], |
|||
characters = m["Arab"].characters, |
characters = m["Arab"].characters, |
||
direction = "rtl", |
direction = "rtl", |
||
လိတ်ရဲဉ်ႏ ၁၂၅: | လိတ်ရဲဉ်ႏ ၁၃၇: | ||
m["tt-Arab"] = { |
m["tt-Arab"] = { |
||
"Arabic", |
|||
m["Arab"][2], |
|||
characters = m["Arab"].characters, |
characters = m["Arab"].characters, |
||
direction = "rtl", |
direction = "rtl", |
||
လိတ်ရဲဉ်ႏ ၁၃၃: | လိတ်ရဲဉ်ႏ ၁၄၆: | ||
m["ug-Arab"] = { |
m["ug-Arab"] = { |
||
"Arabic", |
|||
m["Arab"][2], |
|||
characters = m["Arab"].characters, |
characters = m["Arab"].characters, |
||
direction = "rtl", |
direction = "rtl", |
||
လိတ်ရဲဉ်ႏ ၁၄၁: | လိတ်ရဲဉ်ႏ ၁၅၅: | ||
m["ur-Arab"] = { |
m["ur-Arab"] = { |
||
"Arabic", |
|||
m["Arab"][2], |
|||
characters = m["Arab"].characters, |
characters = m["Arab"].characters, |
||
direction = "rtl", |
direction = "rtl", |
||
လိတ်ရဲဉ်ႏ ၁၄၉: | လိတ်ရဲဉ်ႏ ၁၆၄: | ||
m["xka-Arab"] = { |
m["xka-Arab"] = { |
||
"Arabic", |
|||
m["Arab"][2], |
|||
characters = m["Arab"].characters, |
characters = m["Arab"].characters, |
||
direction = "rtl", |
direction = "rtl", |
||
လိတ်ရဲဉ်ႏ ၁၅၉: | လိတ်ရဲဉ်ႏ ၁၇၅: | ||
m["Armi"] = { |
m["Armi"] = { |
||
"Imperial Aramaic", |
|||
"abjad", |
|||
characters = "𐡀-𐡟", |
characters = "𐡀-𐡟", |
||
direction = "rtl", |
direction = "rtl", |
||
systems = {"abjad"}, |
|||
} |
} |
||
m["Armn"] = { |
m["Armn"] = { |
||
"Armenian", |
|||
"alphabet", |
|||
characters = "-֏ﬓ-ﬗ", |
characters = "-֏ﬓ-ﬗ", |
||
capitalized = true, |
capitalized = true, |
||
systems = {"alphabet"}, |
|||
} |
} |
||
m["Avst"] = { |
m["Avst"] = { |
||
"Avestan", |
|||
"alphabet", |
|||
characters = "𐬀-𐬿", |
characters = "𐬀-𐬿", |
||
direction = "rtl", |
direction = "rtl", |
||
လိတ်ရဲဉ်ႏ ၁၇၉: | လိတ်ရဲဉ်ႏ ၁၉၆: | ||
m["pal-Avst"] = { |
m["pal-Avst"] = { |
||
"Pazend", |
|||
m["Avst"][2], |
|||
characters = m["Avst"].characters, |
characters = m["Avst"].characters, |
||
direction = "rtl", |
direction = "rtl", |
||
လိတ်ရဲဉ်ႏ ၁၈၆: | လိတ်ရဲဉ်ႏ ၂၀၄: | ||
m["Bali"] = { |
m["Bali"] = { |
||
"Balinese", |
|||
"abugida", |
|||
characters = "ᬀ-", |
characters = "ᬀ-", |
||
systems = {"abugida"}, |
|||
} |
} |
||
m["Bamu"] = { |
m["Bamu"] = { |
||
"Bamum", |
|||
"syllabary", |
|||
characters = "ꚠ-𖠀-", |
characters = "ꚠ-𖠀-", |
||
} |
} |
||
m["Bass"] = { |
m["Bass"] = { |
||
"Bassa", |
|||
"alphabet", |
|||
aliases = {"Bassa Vah", "Vah"}, |
aliases = {"Bassa Vah", "Vah"}, |
||
characters = "𖫐-", |
characters = "𖫐-", |
||
လိတ်ရဲဉ်ႏ ၂၀၃: | လိတ်ရဲဉ်ႏ ၂၂၃: | ||
m["Batk"] = { |
m["Batk"] = { |
||
"Batak", |
|||
"abugida", |
|||
characters = "ᯀ-᯿", |
characters = "ᯀ-᯿", |
||
systems = {"abugida"}, |
|||
} |
} |
||
m["Beng"] = { |
m["Beng"] = { |
||
"Bengali", |
|||
"abugida", |
|||
characters = "॒॑।॥ঀ-৯৲-᳕᳖᳘᳐᳒᳡ᳪ᳭ᳲᳵ-᳷꣱", |
characters = "॒॑।॥ঀ-৯৲-᳕᳖᳘᳐᳒᳡ᳪ᳭ᳲᳵ-᳷꣱", |
||
systems = {"abugida"}, |
|||
normalizationFixes = { |
normalizationFixes = { |
||
from = {"অা", "ঋৃ", "ঌৢ"}, |
from = {"অা", "ঋৃ", "ঌৢ"}, |
||
လိတ်ရဲဉ်ႏ ၂၁၉: | လိတ်ရဲဉ်ႏ ၂၃၉: | ||
m["as-Beng"] = { |
m["as-Beng"] = { |
||
"Assamese", |
|||
m["Beng"][2], |
|||
otherNames = {"Bengali-Assamese", "Eastern Nagari"}, |
otherNames = {"Bengali-Assamese", "Eastern Nagari"}, |
||
characters = "॒॑।॥ঀ-য-᳕᳖᳘᳐᳒᳡ᳪ᳭ᳲᳵ-᳷꣱", |
characters = "॒॑।॥ঀ-য-᳕᳖᳘᳐᳒᳡ᳪ᳭ᳲᳵ-᳷꣱", |
||
systems = {"abugida"}, |
|||
normalizationFixes = m["Beng"].normalizationFixes, |
normalizationFixes = m["Beng"].normalizationFixes, |
||
} |
} |
||
m["Bhks"] = { |
m["Bhks"] = { |
||
"Bhaiksuki", |
|||
"abugida", |
|||
characters = "𑰀-", |
characters = "𑰀-", |
||
systems = {"abugida"}, |
|||
} |
} |
||
m["Blis"] = { |
m["Blis"] = { |
||
"Blissymbols", |
|||
"logography", |
|||
aliases = {"Blissymbolics"}, |
aliases = {"Blissymbolics"}, |
||
systems = {"logography"}, |
|||
-- Not in Unicode |
-- Not in Unicode |
||
} |
} |
||
m["Bopo"] = { |
m["Bopo"] = { |
||
"Zhuyin", |
|||
"semisyllabary", |
|||
aliases = {"Zhuyin Fuhao", "Bopomofo"}, |
aliases = {"Zhuyin Fuhao", "Bopomofo"}, |
||
characters = "ˇˉˊˋ˙˪˫、-〃〈-】〓-〟〪-〭〰〷・-ㄯ﹅﹆。-・", |
characters = "ˇˉˊˋ˙˪˫、-〃〈-】〓-〟〪-〭〰〷・-ㄯ﹅﹆。-・", |
||
လိတ်ရဲဉ်ႏ ၂၄၆: | လိတ်ရဲဉ်ႏ ၂၆၇: | ||
m["Brah"] = { |
m["Brah"] = { |
||
"Brahmi", |
|||
"abugida", |
|||
characters = "𑀀-𑁿", |
characters = "𑀀-𑁿", |
||
systems = {"abugida"}, |
|||
normalizationFixes = { |
normalizationFixes = { |
||
from = {"𑀅𑀸", "𑀋𑀾", "𑀏𑁂"}, |
from = {"𑀅𑀸", "𑀋𑀾", "𑀏𑁂"}, |
||
လိတ်ရဲဉ်ႏ ၂၅၆: | လိတ်ရဲဉ်ႏ ၂၇၇: | ||
m["Brai"] = { |
m["Brai"] = { |
||
"Braille", |
|||
"alphabet", |
|||
characters = "⠀-⣿", |
characters = "⠀-⣿", |
||
} |
} |
||
m["Bugi"] = { |
m["Bugi"] = { |
||
"Buginese", |
|||
"abugida", |
|||
aliases = {"Lontara"}, |
aliases = {"Lontara"}, |
||
characters = "ᨀ-᨟ꧏ", |
characters = "ᨀ-᨟ꧏ", |
||
systems = {"abugida"}, |
|||
} |
} |
||
m["Buhd"] = { |
m["Buhd"] = { |
||
"Buhid", |
|||
"abugida", |
|||
characters = "᜵᜶ᝀ-ꧏ", |
characters = "᜵᜶ᝀ-ꧏ", |
||
systems = {"abugida"}, |
|||
} |
} |
||
m["Cakm"] = { |
m["Cakm"] = { |
||
"Chakma", |
|||
"abugida", |
|||
characters = "০-৯၀-၉𑄀-", |
characters = "০-৯၀-၉𑄀-", |
||
systems = {"abugida"}, |
|||
} |
} |
||
m["Cans"] = { |
m["Cans"] = { |
||
"Canadian syllabics", |
|||
"abugida", |
|||
characters = "᐀-ᙿᢰ-𑪰-𑪿", |
characters = "᐀-ᙿᢰ-𑪰-𑪿", |
||
systems = {"abugida"}, |
|||
} |
} |
||
m["Cari"] = { |
m["Cari"] = { |
||
"Carian", |
|||
"alphabet", |
|||
characters = "𐊠-", |
characters = "𐊠-", |
||
systems = {"alphabet"}, |
|||
} |
} |
||
m["Cham"] = { |
m["Cham"] = { |
||
"Cham", |
|||
"abugida", |
|||
characters = "ꨀ-꩟", |
characters = "ꨀ-꩟", |
||
systems = {"abugida"}, |
|||
} |
} |
||
m["Cher"] = { |
m["Cher"] = { |
||
"Cherokee", |
|||
"syllabary", |
|||
characters = "Ꭰ-ꭰ-ꮿ", |
characters = "Ꭰ-ꭰ-ꮿ", |
||
systems = {"syllabary"}, |
|||
} |
} |
||
m["Chrs"] = { |
m["Chrs"] = { |
||
"Chorasmian", |
|||
"abjad", |
|||
characters = "𐾰-", |
characters = "𐾰-", |
||
direction = "rtl", |
direction = "rtl", |
||
systems = {"abjad"}, |
|||
} |
} |
||
m["Copt"] = { |
m["Copt"] = { |
||
"Coptic", |
|||
"alphabet", |
|||
characters = "Ϣ-ϯⲀ-⳿𐋠-𐋻", -- this is mostly "Coptic", not unified "Greek and Coptic" |
characters = "Ϣ-ϯⲀ-⳿𐋠-𐋻", -- this is mostly "Coptic", not unified "Greek and Coptic" |
||
capitalized = true, |
capitalized = true, |
||
systems = {"alphabet"}, |
|||
} |
} |
||
m["Cpmn"] = { |
m["Cpmn"] = { |
||
"Cypro-Minoan", |
|||
"syllabary", |
|||
aliases = {"Cypro Minoan"}, |
aliases = {"Cypro Minoan"}, |
||
characters = "𐄀𐄁𒾐-", |
characters = "𐄀𐄁𒾐-", |
||
systems = {"syllabary"}, |
|||
} |
} |
||
m["Cprt"] = { |
m["Cprt"] = { |
||
"Cypriot", |
|||
"syllabary", |
|||
characters = "𐄀-𐄂𐄇-𐄳𐄷-𐄿𐠀-𐠿", |
characters = "𐄀-𐄂𐄇-𐄳𐄷-𐄿𐠀-𐠿", |
||
direction = "rtl", |
direction = "rtl", |
||
systems = {"syllabary"}, |
|||
} |
} |
||
m["Cyrl"] = { |
m["Cyrl"] = { |
||
"Cyrillic", |
|||
"alphabet", |
|||
characters = "Ѐ-ԯᲀ-ᴫᵸ᷸ⷠ-ⷿ⹃Ꙁ-ꚟ︮︯𞀰-𞂏", |
characters = "Ѐ-ԯᲀ-ᴫᵸ᷸ⷠ-ⷿ⹃Ꙁ-ꚟ︮︯𞀰-𞂏", |
||
capitalized = true, |
capitalized = true, |
||
systems = {"alphabet"}, |
|||
} |
} |
||
m["Cyrs"] = { |
m["Cyrs"] = { |
||
"Old Cyrillic", |
|||
m["Cyrl"][2], |
|||
aliases = {"Early Cyrillic"}, |
aliases = {"Early Cyrillic"}, |
||
characters = m["Cyrl"].characters, |
characters = m["Cyrl"].characters, |
||
capitalized = m["Cyrl"].capitalized, |
capitalized = m["Cyrl"].capitalized, |
||
wikipedia_article = "Early Cyrillic alphabet", |
wikipedia_article = "Early Cyrillic alphabet", |
||
systems = {"alphabet"}, |
|||
} |
} |
||
m["Deva"] = { |
m["Deva"] = { |
||
"Devanagari", |
|||
"abugida", |
|||
characters = "ऀ-ॿ꣠-ꣿ𑬀-𑬉", |
characters = "ऀ-ॿ꣠-ꣿ𑬀-𑬉", |
||
systems = {"abugida"}, |
|||
normalizationFixes = { |
normalizationFixes = { |
||
from = {"ॆॆ", "ेे", "ाॅ", "ाॆ", "ाꣿ", "ॊॆ", "ाे", "ाै", "ोे", "ाऺ", "ॖॖ", "अॅ", "अॆ", "अा", "एॅ", "एॆ", "एे", "एꣿ", "ऎॆ", "अॉ", "आॅ", "अॊ", "आॆ", "अो", "आे", "अौ", "आै", "ओे", "अऺ", "अऻ", "आऺ", "अाꣿ", "आꣿ", "ऒॆ", "अॖ", "अॗ", "ॶॖ", "्?ा"}, |
from = {"ॆॆ", "ेे", "ाॅ", "ाॆ", "ाꣿ", "ॊॆ", "ाे", "ाै", "ोे", "ाऺ", "ॖॖ", "अॅ", "अॆ", "अा", "एॅ", "एॆ", "एे", "एꣿ", "ऎॆ", "अॉ", "आॅ", "अॊ", "आॆ", "अो", "आे", "अौ", "आै", "ओे", "अऺ", "अऻ", "आऺ", "अाꣿ", "आꣿ", "ऒॆ", "अॖ", "अॗ", "ॶॖ", "्?ा"}, |
||
လိတ်ရဲဉ်ႏ ၃၅၈: | လိတ်ရဲဉ်ႏ ၃၈၀: | ||
m["Diak"] = { |
m["Diak"] = { |
||
"Dhives Akuru", |
|||
"abugida", |
|||
aliases = {"Dives Akuru"}, |
aliases = {"Dives Akuru"}, |
||
characters = "𑤀-𑤆𑤉𑤌-𑤓𑤕𑤖𑤘-𑤵𑤷𑤸𑤻-𑥆𑥐-𑥙", |
characters = "𑤀-𑤆𑤉𑤌-𑤓𑤕𑤖𑤘-𑤵𑤷𑤸𑤻-𑥆𑥐-𑥙", |
||
systems = {"abugida"}, |
|||
} |
} |
||
m["Dogr"] = { |
m["Dogr"] = { |
||
"Dogra", |
|||
"abugida", |
|||
characters = "𑠀-𑠻", |
characters = "𑠀-𑠻", |
||
systems = {"abugida"}, |
|||
} |
} |
||
m["Dsrt"] = { |
m["Dsrt"] = { |
||
"Deseret", |
|||
"alphabet", |
|||
characters = "𐐀-𐑏", |
characters = "𐐀-𐑏", |
||
capitalized = true, |
capitalized = true, |
||
systems = {"alphabet"}, |
|||
} |
} |
||
m["Dupl"] = { |
m["Dupl"] = { |
||
"Duployan", |
|||
"alphabet", |
|||
characters = "𛰀-𛱪𛱰-𛱼𛲀-𛲈𛲐-𛲙𛲜-𛲟", |
characters = "𛰀-𛱪𛱰-𛱼𛲀-𛲈𛲐-𛲙𛲜-𛲟", |
||
} |
} |
||
m["Egyd"] = { |
m["Egyd"] = { |
||
"Demotic", |
|||
"abjad, logography", |
|||
} |
} |
||
m["Egyh"] = { |
m["Egyh"] = { |
||
"Hieratic", |
|||
"abjad, logography", |
|||
} |
} |
||
m["Egyp"] = { |
m["Egyp"] = { |
||
"Egyptian hieroglyphic", |
|||
"abjad, logography", |
|||
varieties = {"Hieratic"}, |
|||
characters = "𓀀-𓑕", |
characters = "𓀀-𓑕", |
||
varieties = {"Hieratic"}, |
|||
wikipedia_article = "Egyptian hieroglyphs", |
wikipedia_article = "Egyptian hieroglyphs", |
||
systems = {"abjad", "logography"}, |
|||
normalizationFixes = { |
normalizationFixes = { |
||
from = { |
from = {"𓃁", "𓆖"}, |
||
to = { |
to = {"𓃀𓂝", "𓆓𓏏𓇿"} |
||
}, |
}, |
||
} |
} |
||
m["Elba"] = { |
m["Elba"] = { |
||
"Elbasan", |
|||
"alphabet", |
|||
characters = "𐔀-𐔧", |
characters = "𐔀-𐔧", |
||
} |
|||
systems = {"alphabet"}, |
|||
m["Elym"] = { |
|||
"Elymaic", |
|||
"abjad", |
|||
characters = "𐿠-𐿶", |
|||
direction = "rtl", |
|||
} |
} |
||
m["Ethi"] = { |
m["Ethi"] = { |
||
"Ethiopic", |
|||
"abugida", |
|||
aliases = {"Ge'ez"}, |
aliases = {"Ge'ez"}, |
||
characters = "ሀ-ቈቊ-ቍቐ-ቖቘቚ-ቝበ-ኈኊ-ኍነ-ኰኲ-ኵኸ-ኾዀዂ-ዅወ-ዖዘ-ጐጒ-ጕጘ-ፚ፝-፼ᎀ-᎙ⶀ-ⶖⶠ-ⶦⶨ-ⶮⶰ-ⶶⶸ-ⶾⷀ-ⷆⷈ-ⷎⷐ-ⷖⷘ-ⷞꬁ-ꬆꬉ-ꬎꬑ-ꬖꬠ-ꬦꬨ-ꬮ𞟠-𞟦𞟨-𞟫𞟭𞟮𞟰-𞟾", |
characters = "ሀ-ቈቊ-ቍቐ-ቖቘቚ-ቝበ-ኈኊ-ኍነ-ኰኲ-ኵኸ-ኾዀዂ-ዅወ-ዖዘ-ጐጒ-ጕጘ-ፚ፝-፼ᎀ-᎙ⶀ-ⶖⶠ-ⶦⶨ-ⶮⶰ-ⶶⶸ-ⶾⷀ-ⷆⷈ-ⷎⷐ-ⷖⷘ-ⷞꬁ-ꬆꬉ-ꬎꬑ-ꬖꬠ-ꬦꬨ-ꬮ𞟠-𞟦𞟨-𞟫𞟭𞟮𞟰-𞟾", |
||
systems = {"abugida"}, |
|||
} |
} |
||
m["Geok"] = { |
m["Geok"] = { |
||
"Khutsuri", |
|||
"alphabet", |
|||
varieties = {"Nuskhuri", "Asomtavruli"}, |
|||
characters = "Ⴀ-ჅჇჍ჻ⴀ-ⴥⴧⴭ", -- Ⴀ-Ⴭ is Asomtavruli, ⴀ-ⴭ is Nuskhuri |
characters = "Ⴀ-ჅჇჍ჻ⴀ-ⴥⴧⴭ", -- Ⴀ-Ⴭ is Asomtavruli, ⴀ-ⴭ is Nuskhuri |
||
varieties = {"Nuskhuri", "Asomtavruli"}, |
|||
capitalized = true, |
capitalized = true, |
||
systems = {"alphabet"}, |
|||
} |
} |
||
m["Geor"] = { |
m["Geor"] = { |
||
"Georgian", |
|||
"alphabet", |
|||
varieties = {"Mkhedruli", "Mtavruli"}, |
|||
characters = "ა-ჿᲐ-ᲺᲽ-Ჿ", -- ა-ჿ is lowercase Mkhedruli; Ა-Ჿ is uppercase Mkhedruli (Mtavruli) |
characters = "ა-ჿᲐ-ᲺᲽ-Ჿ", -- ა-ჿ is lowercase Mkhedruli; Ა-Ჿ is uppercase Mkhedruli (Mtavruli) |
||
varieties = {"Mkhedruli", "Mtavruli"}, |
|||
capitalized = true, |
capitalized = true, |
||
systems = {"alphabet"}, |
|||
} |
} |
||
m["Glag"] = { |
m["Glag"] = { |
||
"Glagolitic", |
|||
"alphabet", |
|||
characters = "Ⰰ-ⱟ𞀀-𞀆𞀈-𞀘𞀛-𞀡𞀣𞀤𞀦-𞀪", |
characters = "Ⰰ-ⱟ𞀀-𞀆𞀈-𞀘𞀛-𞀡𞀣𞀤𞀦-𞀪", |
||
capitalized = true, |
capitalized = true, |
||
systems = {"alphabet"}, |
|||
} |
} |
||
m["Gong"] = { |
m["Gong"] = { |
||
"Gunjala Gondi", |
|||
"abugida", |
|||
characters = "𑵠-𑵥𑵧𑵨𑵪-𑶎𑶐𑶑𑶓-𑶘𑶠-𑶩", |
characters = "𑵠-𑵥𑵧𑵨𑵪-𑶎𑶐𑶑𑶓-𑶘𑶠-𑶩", |
||
systems = {"abugida"}, |
|||
} |
} |
||
m["Gonm"] = { |
m["Gonm"] = { |
||
"Masaram Gondi", |
|||
"abugida", |
|||
characters = "𑴀-𑴆𑴈𑴉𑴋-𑴶𑴺𑴼𑴽𑴿-𑵇𑵐-𑵙", |
characters = "𑴀-𑴆𑴈𑴉𑴋-𑴶𑴺𑴼𑴽𑴿-𑵇𑵐-𑵙", |
||
systems = {"abugida"}, |
|||
} |
} |
||
m["Goth"] = { |
m["Goth"] = { |
||
"Gothic", |
|||
"alphabet", |
|||
characters = "𐌰-𐍊", |
characters = "𐌰-𐍊", |
||
systems = {"alphabet"}, |
|||
} |
} |
||
m["Gran"] = { |
m["Gran"] = { |
||
"Grantha", |
|||
"abugida", |
|||
characters = "𑌀-𑌃𑌅-𑌌𑌏-𑌐𑌓-𑌨𑌪-𑌰𑌲𑌳𑌵-𑌹𑌼-𑍄𑍇𑍈𑍋-𑍍𑍐𑍗𑍝-𑍣𑍦-𑍬𑍰-𑍴", |
characters = "𑌀-𑌃𑌅-𑌌𑌏-𑌐𑌓-𑌨𑌪-𑌰𑌲𑌳𑌵-𑌹𑌼-𑍄𑍇𑍈𑍋-𑍍𑍐𑍗𑍝-𑍣𑍦-𑍬𑍰-𑍴", |
||
systems = {"abugida"}, |
|||
} |
} |
||
m["Grek"] = { |
m["Grek"] = { |
||
"Greek", |
|||
"alphabet", |
|||
characters = "Ͱ-ͷͺ-Ϳ΄-ΊΌΎ-ΡΣ-ϡϰ-Ͽᴦ-ᴪᵝ-ᵡᵦ-ᵪᶿΩ℩ꭥ𐅀-𐆎𐆠𝈀-𝉅", |
characters = "Ͱ-ͷͺ-Ϳ΄-ΊΌΎ-ΡΣ-ϡϰ-Ͽᴦ-ᴪᵝ-ᵡᵦ-ᵪᶿΩ℩ꭥ𐅀-𐆎𐆠𝈀-𝉅", |
||
capitalized = true, |
capitalized = true, |
||
systems = {"alphabet"}, |
|||
} |
} |
||
m[" |
m["Polyt"] = { |
||
"Greek", |
|||
m["Grek"][2], |
|||
characters = "ἀ-῾" .. m["Grek"].characters, |
characters = "ἀ-῾" .. m["Grek"].characters, |
||
capitalized = m["Grek"].capitalized, |
capitalized = m["Grek"].capitalized, |
||
parent = "Grek", |
parent = "Grek", |
||
systems = {"alphabet"}, |
|||
} |
} |
||
m["Gujr"] = { |
m["Gujr"] = { |
||
"Gujarati", |
|||
"abugida", |
|||
characters = "ઁ-ઃઅ-ઍએ-ઑઓ-નપ-રલળવ-હ઼-ૅે-ૉો-્ૐૠ-ૣ૦-૱ૺ-૿", |
characters = "ઁ-ઃઅ-ઍએ-ઑઓ-નપ-રલળવ-હ઼-ૅે-ૉો-્ૐૠ-ૣ૦-૱ૺ-૿", |
||
systems = {"abugida"}, |
|||
normalizationFixes = { |
normalizationFixes = { |
||
from = {"ઓ", "અાૈ", "અા", "અૅ", "અે", "અૈ", "અૉ", "અો", "અૌ", "આૅ", "આૈ", "ૅા"}, |
from = {"ઓ", "અાૈ", "અા", "અૅ", "અે", "અૈ", "અૉ", "અો", "અૌ", "આૅ", "આૈ", "ૅા"}, |
||
လိတ်ရဲဉ်ႏ ၄၉၀: | လိတ်ရဲဉ်ႏ ၅၂၀: | ||
m["Guru"] = { |
m["Guru"] = { |
||
"Gurmukhi", |
|||
"abugida", |
|||
characters = "ਁ-ਃਅ-ਊਏਐਓ-ਨਪ-ਰਲਲ਼ਵਸ਼ਸਹ਼ਾ-ੂੇੈੋ-੍ੑਖ਼-ੜਫ਼੦-੶", |
characters = "ਁ-ਃਅ-ਊਏਐਓ-ਨਪ-ਰਲਲ਼ਵਸ਼ਸਹ਼ਾ-ੂੇੈੋ-੍ੑਖ਼-ੜਫ਼੦-੶", |
||
systems = {"abugida"}, |
|||
normalizationFixes = { |
normalizationFixes = { |
||
from = {"ਅਾ", "ਅੈ", "ਅੌ", "ੲਿ", "ੲੀ", "ੲੇ", "ੳੁ", "ੳੂ", "ੳੋ"}, |
from = {"ਅਾ", "ਅੈ", "ਅੌ", "ੲਿ", "ੲੀ", "ੲੇ", "ੳੁ", "ੳੂ", "ੳੋ"}, |
||
လိတ်ရဲဉ်ႏ ၅၀၀: | လိတ်ရဲဉ်ႏ ၅၃၀: | ||
m["Hang"] = { |
m["Hang"] = { |
||
"Hangul", |
|||
"syllabary", |
|||
aliases = {"Hangeul"}, |
aliases = {"Hangeul"}, |
||
characters = ( |
characters = ( |
||
လိတ်ရဲဉ်ႏ ၅၁၀: | လိတ်ရဲဉ်ႏ ၅၄၁: | ||
"ᅠ-ᅵ" -- Halfwidth |
"ᅠ-ᅵ" -- Halfwidth |
||
), |
), |
||
systems = {"syllabary"}, |
|||
} |
} |
||
m["Hani"] = { |
m["Hani"] = { |
||
"Han", |
|||
"logography", |
|||
varieties = {"Hanzi", "Kanji", "Hanja", "Chu Nom"}, |
|||
characters = ( |
characters = ( |
||
"一-鿿".. |
"一-鿿" .. |
||
"㐀-䶿".. -- ExtA |
"㐀-䶿" .. -- ExtA |
||
"𠀀- |
"𠀀-𪛟" .. -- ExtB |
||
" |
"𪜀-" .. -- ExtC-F & I |
||
"﨎﨏﨑﨓﨔﨟﨡﨣﨤﨧﨨﨩".. |
"𰀀-𲎯" .. -- ExtG-H |
||
"﨎﨏﨑﨓﨔﨟﨡﨣﨤﨧﨨﨩" .. |
|||
" |
"⼀-" .. -- Kangxi Radicals |
||
" |
"⺀-" .. -- Radicals Supplement |
||
" |
" -〿" .. -- CJK Symbols and Punctuation |
||
"𖿢𖿣𖿰𖿱" .. -- Ideographic Symbols and Punctuation |
|||
"㇀-".. -- Strokes |
|||
" |
"㇀-" .. -- Strokes |
||
"㋿㍻-㍿" .. -- 組文字 |
|||
"㈠-㉇㊀-㊰㋀-㋋㍘-㍰㏠-㏾🈐-🈒🈔-🈻🉀-🉈🉐🉑🉠-🉥" .. |
|||
-- Saved as bytes to stop normalization on save. |
|||
"\239\164\128-\239\171\191" .. -- Compatibility Ideographs |
|||
"\240\175\160\128-\240\175\168\159" -- Compatibility Ideographs Supplement |
|||
), |
), |
||
varieties = {"Hanzi", "Kanji", "Hanja", "Chu Nom"}, |
|||
systems = {"logography"}, |
|||
spaces = false, |
|||
} |
} |
||
m["Hans"] = { |
m["Hans"] = { |
||
"Simplified Han", |
|||
m["Hani"][2], |
|||
characters = m["Hani"].characters, |
characters = m["Hani"].characters, |
||
spaces = m["Hani"].spaces, |
|||
parent = "Hani", |
parent = "Hani", |
||
} |
} |
||
m["Hant"] = { |
m["Hant"] = { |
||
"Traditional Han", |
|||
m["Hani"][2], |
|||
characters = m["Hani"].characters, |
characters = m["Hani"].characters, |
||
spaces = m["Hani"].spaces, |
|||
parent = "Hani", |
parent = "Hani", |
||
} |
} |
||
m["Hano"] = { |
m["Hano"] = { |
||
"Hanunoo", |
|||
"abugida", |
|||
characters = "ᜠ-᜴", |
characters = "ᜠ-᜴", |
||
systems = {"abugida"}, |
|||
} |
} |
||
m["Hatr"] = { |
m["Hatr"] = { |
||
"Hatran", |
|||
"abjad", |
|||
characters = "𐣠-𐣿", |
characters = "𐣠-𐣿", |
||
direction = "rtl", |
direction = "rtl", |
||
systems = {"abjad"}, |
|||
} |
} |
||
m["Hebr"] = { |
m["Hebr"] = { |
||
"Hebrew", |
|||
"abjad", -- more precisely, impure abjad |
|||
characters = u(0x0590) .. "-" .. u(0x05FF) .. u(0xFB1D) .. "-" .. u(0xFB4F), |
characters = u(0x0590) .. "-" .. u(0x05FF) .. u(0xFB1D) .. "-" .. u(0xFB4F), |
||
direction = "rtl", |
direction = "rtl", |
||
systems = {"abjad"}, -- more precisely, impure abjad |
|||
} |
} |
||
m["Hira"] = { |
m["Hira"] = { |
||
"Hiragana", |
|||
"syllabary", |
|||
varieties = {"Hentaigana"}, |
|||
characters = "ぁ-ゟ𛀁-𛄞𛅐𛅑𛅒🈀", |
characters = "ぁ-ゟ𛀁-𛄞𛅐𛅑𛅒🈀", |
||
varieties = {"Hentaigana"}, |
|||
spaces = false, |
|||
} |
} |
||
m["Hluw"] = { |
m["Hluw"] = { |
||
"Anatolian Hieroglyphs", |
|||
"logography, syllabary", |
|||
characters = "𔐀-𔙆", |
characters = "𔐀-𔙆", |
||
wikipedia_article = "Anatolian hieroglyphs", |
wikipedia_article = "Anatolian hieroglyphs", |
||
လိတ်ရဲဉ်ႏ ၅၇၉: | လိတ်ရဲဉ်ႏ ၆၂၀: | ||
m["Hmng"] = { |
m["Hmng"] = { |
||
"Pahawh Hmong", |
|||
"semisyllabary", |
|||
aliases = {"Pahawh Hmong"}, |
|||
aliases = {"Hmong"}, |
|||
characters = "𖬀-𖮏", |
characters = "𖬀-𖮏", |
||
} |
|||
m["Hmnp"] = { |
|||
"Nyiakeng Puachue Hmong", |
|||
"alphabet", |
|||
characters = "𞄀-𞅏", |
|||
} |
} |
||
m["Hung"] = { |
m["Hung"] = { |
||
"Old Hungarian", |
|||
"alphabet", |
|||
aliases = {"Hungarian runic"}, |
aliases = {"Hungarian runic"}, |
||
characters = "𐲀-𐲲", |
characters = "𐲀-𐲲", |
||
လိတ်ရဲဉ်ႏ ၅၉၃: | လိတ်ရဲဉ်ႏ ၆၄၂: | ||
m["Ibrn"] = { |
m["Ibrn"] = { |
||
"Iberian", |
|||
"semisyllabary", |
|||
} |
} |
||
m["Imag"] = { |
m["Imag"] = { |
||
-- To be used to avoid any formatting or link processing |
-- To be used to avoid any formatting or link processing |
||
"Image-rendered", |
|||
-- This should not have any characters listed |
-- This should not have any characters listed |
||
translit = false, |
|||
character_category = false, |
character_category = false, |
||
} |
} |
||
m["Inds"] = { |
m["Inds"] = { |
||
"Indus", |
|||
aliases = {"Harappan", "Indus Valley"}, |
aliases = {"Harappan", "Indus Valley"}, |
||
} |
} |
||
m[" |
m["Ipach"] = { |
||
"International Phonetic Alphabet", |
|||
aliases = {"IPA"}, |
aliases = {"IPA"}, |
||
} |
} |
||
m["Ital"] = { |
m["Ital"] = { |
||
"Old Italic", |
|||
"alphabet", |
|||
characters = "𐌀-𐌯", |
characters = "𐌀-𐌯", |
||
systems = {"alphabet"}, |
|||
} |
} |
||
m["Java"] = { |
m["Java"] = { |
||
"Javanese", |
|||
"abugida", |
|||
characters = "ꦀ-꧟", |
characters = "ꦀ-꧟", |
||
systems = {"abugida"}, |
|||
} |
} |
||
m["Jurc"] = { |
m["Jurc"] = { |
||
"Jurchen", |
|||
spaces = false, |
|||
} |
} |
||
m["Kali"] = { |
m["Kali"] = { |
||
"Kayah Li", |
|||
"abugida", |
|||
characters = "꤀-꤯", |
characters = "꤀-꤯", |
||
systems = {"abugida"}, |
|||
} |
} |
||
m["Kana"] = { |
m["Kana"] = { |
||
"Katakana", |
|||
"syllabary", |
|||
characters = "゠-ヿㇰ-ㇿ㌀-㍗ヲ-゚𛀀𛅤𛅥𛅦𛅧", |
characters = "゠-ヿㇰ-ㇿ㌀-㍗ヲ-゚𛀀𛅤𛅥𛅦𛅧", |
||
spaces = false, |
|||
systems = {"syllabary"}, |
|||
} |
} |
||
m["Kawi"] = { |
m["Kawi"] = { |
||
"Kawi", |
|||
"abugida", |
|||
characters = "𑼀-𑽙", |
characters = "𑼀-𑽙", |
||
systems = {"abugida"}, |
|||
} |
} |
||
m["Khar"] = { |
m["Khar"] = { |
||
"Kharoshthi", |
|||
"abugida", |
|||
characters = "𐨀-𐩘", |
characters = "𐨀-𐩘", |
||
systems = {"abugida"}, |
|||
direction = "rtl", |
direction = "rtl", |
||
} |
} |
||
m["Khmr"] = { |
m["Khmr"] = { |
||
"Khmer", |
|||
"abugida", |
|||
characters = "ក-៹᧠-᧿", |
|||
characters = "ក-៝០-៩៰-៹᧠-᧿", |
|||
systems = {"abugida"}, |
|||
spaces = false, |
|||
normalizationFixes = { |
normalizationFixes = { |
||
from = {"ឣ", "ឤ"}, |
from = {"ឣ", "ឤ"}, |
||
လိတ်ရဲဉ်ႏ ၆၆၅: | လိတ်ရဲဉ်ႏ ၇၁၉: | ||
m["Khoj"] = { |
m["Khoj"] = { |
||
"Khojki", |
|||
"abugida", |
|||
characters = "𑈀-𑈾", |
characters = "𑈀-𑈾", |
||
systems = {"abugida"}, |
|||
normalizationFixes = { |
normalizationFixes = { |
||
from = {"𑈀𑈬𑈱", "𑈀𑈬", "𑈀𑈱", "𑈀𑈳", "𑈁𑈱", "𑈆𑈬", "𑈬𑈰", "𑈬𑈱", "𑉀𑈮"}, |
from = {"𑈀𑈬𑈱", "𑈀𑈬", "𑈀𑈱", "𑈀𑈳", "𑈁𑈱", "𑈆𑈬", "𑈬𑈰", "𑈬𑈱", "𑉀𑈮"}, |
||
လိတ်ရဲဉ်ႏ ၆၇၅: | လိတ်ရဲဉ်ႏ ၇၂၉: | ||
m["Kitl"] = { |
m["Kitl"] = { |
||
"Khitan Large", |
|||
"logography, syllabary", |
|||
spaces = false, |
|||
} |
} |
||
m["Kits"] = { |
m["Kits"] = { |
||
"Khitan Small", |
|||
"logography, syllabary", |
|||
characters = "𘬀-𘳕"..u(0x16FE4), |
characters = "𘬀-𘳕"..u(0x16FE4), |
||
spaces = false, |
|||
systems = {"logography", "syllabary"}, |
|||
} |
} |
||
m["Knda"] = { |
m["Knda"] = { |
||
"Kannada", |
|||
"abugida", |
|||
characters = "ಀ-ೲ", |
characters = "ಀ-ೲ", |
||
systems = {"abugida"}, |
|||
normalizationFixes = { |
normalizationFixes = { |
||
from = {"ಉಾ", "ಋಾ", "ಒೌ"}, |
from = {"ಉಾ", "ಋಾ", "ಒೌ"}, |
||
လိတ်ရဲဉ်ႏ ၆၉၆: | လိတ်ရဲဉ်ႏ ၇၅၂: | ||
m["Kpel"] = { |
m["Kpel"] = { |
||
"Kpelle", |
|||
"syllabary", |
|||
-- Not in Unicode |
-- Not in Unicode |
||
} |
} |
||
m["Kthi"] = { |
m["Kthi"] = { |
||
"Kaithi", |
|||
"abugida", |
|||
characters = "𑂀-", |
characters = "𑂀-", |
||
systems = {"abugida"}, |
|||
} |
} |
||
m["Lana"] = { |
m["Lana"] = { |
||
"Tai Tham", |
|||
"abugida", |
|||
aliases = {"Tham", "Tua Mueang", "Lanna"}, |
aliases = {"Tham", "Tua Mueang", "Lanna"}, |
||
characters = "ᨠ-᪭", |
characters = "ᨠ-ᩞ᩠-᩿᩼᪀-᪉᪐-᪙᪠-᪭", |
||
spaces = false, |
|||
} |
} |
||
m["Laoo"] = { |
m["Laoo"] = { |
||
"Lao", |
|||
"abugida", |
|||
characters = "ກ-ໟ", |
|||
characters = "ກຂຄຆ-ຊຌ-ຣລວ-ຽເ-ໄໆ່-໎໐-໙ໜ-ໟ", |
|||
systems = {"abugida"}, |
|||
spaces = false, |
|||
} |
} |
||
m["Latn"] = { |
m["Latn"] = { |
||
"Latin", |
|||
"alphabet", |
|||
aliases = {"Roman"}, |
aliases = {"Roman"}, |
||
varieties = {"Rumi", "Romaji", "Rōmaji", "Romaja"}, |
|||
characters = "A-Za-zªºÀ-ÖØ-öø-ɏḀ-ỿ", |
characters = "A-Za-zªºÀ-ÖØ-öø-ɏḀ-ỿ", |
||
varieties = {"Rumi", "Romaji", "Rōmaji", "Romaja"}, |
|||
capitalized = true, |
capitalized = true, |
||
translit = false, |
|||
systems = {"alphabet"}, |
|||
} |
} |
||
m["Latf"] = { |
m["Latf"] = { |
||
"Fraktur", |
|||
m["Latn"][2], |
|||
otherNames = {"Blackletter"}, -- Blackletter is actually the parent "script" |
|||
characters = m["Latn"].characters, |
characters = m["Latn"].characters, |
||
otherNames = {"Blackletter"}, -- Blackletter is actually the parent "script" |
|||
capitalized = m["Latn"].capitalized, |
capitalized = m["Latn"].capitalized, |
||
translit = m["Latn"].translit, |
|||
parent = "Latn", |
parent = "Latn", |
||
} |
} |
||
m["Latg"] = { |
m["Latg"] = { |
||
"Gaelic", |
|||
m["Latn"][2], |
|||
otherNames = {"Irish"}, |
|||
characters = m["Latn"].characters, |
characters = m["Latn"].characters, |
||
otherNames = {"Irish"}, |
|||
capitalized = m["Latn"].capitalized, |
capitalized = m["Latn"].capitalized, |
||
translit = m["Latn"].translit, |
|||
parent = "Latn", |
parent = "Latn", |
||
} |
} |
||
m[" |
m["Latnx"] = { |
||
"Latin", |
|||
m["Latn"][2], |
|||
characters = m["Latn"].characters .. "ɐ-ʸˠ-ˤᴀ-ᴥᴬ-ᵜᵢ-ᵥᵫ-ᵷᵹ-ᶾⁱⁿₐ-ₜKÅℲⅎⅠ-ↈⱠ-ⱿꜢ-ꞇꞋ-ꟊꟐꟑꟓꟕ-ꟙꟲ-ꟿꬰ-ꭚꭜ-ꭤꭦ-ꭩff-stA-Za-z𐞀-𐞅𐞇-𐞰𐞲-𐞺𝼀-𝼞𝼥-𝼪", |
characters = m["Latn"].characters .. "ɐ-ʸˠ-ˤᴀ-ᴥᴬ-ᵜᵢ-ᵥᵫ-ᵷᵹ-ᶾⁱⁿₐ-ₜKÅℲⅎⅠ-ↈⱠ-ⱿꜢ-ꞇꞋ-ꟊꟐꟑꟓꟕ-ꟙꟲ-ꟿꬰ-ꭚꭜ-ꭤꭦ-ꭩff-stA-Za-z𐞀-𐞅𐞇-𐞰𐞲-𐞺𝼀-𝼞𝼥-𝼪", |
||
capitalized = m["Latn"].capitalized, |
capitalized = m["Latn"].capitalized, |
||
translit = m["Latn"].translit, |
|||
parent = "Latn", |
parent = "Latn", |
||
} |
} |
||
m["pjt-Latn"] = { |
m["pjt-Latn"] = { |
||
"Latin", |
|||
m["Latn"][2], |
|||
characters = m["Latn"].characters, |
characters = m["Latn"].characters, |
||
capitalized = m["Latn"].capitalized, |
|||
translit = m["Latn"].translit, |
|||
parent = "Latn", |
parent = "Latn", |
||
} |
} |
||
m["Leke"] = { |
m["Leke"] = { |
||
"Leke", |
|||
"abugida", |
|||
} |
} |
||
m["Lepc"] = { |
m["Lepc"] = { |
||
"Lepcha", |
|||
"abugida", |
|||
characters = "ᰀ-ᱏ", |
characters = "ᰀ-ᱏ", |
||
systems = {"abugida"}, |
|||
} |
} |
||
m["Limb"] = { |
m["Limb"] = { |
||
"Limbu", |
|||
"abugida", |
|||
characters = "ᤀ-᥏", |
characters = "ᤀ-᥏", |
||
systems = {"abugida"}, |
|||
} |
} |
||
m["Lina"] = { |
m["Lina"] = { |
||
"Linear A", |
|||
characters = "𐘀-𐝧", |
characters = "𐘀-𐝧", |
||
} |
} |
||
m["Linb"] = { |
m["Linb"] = { |
||
"Linear B", |
|||
characters = "𐀀-𐃺", |
characters = "𐀀-𐃺", |
||
} |
} |
||
m["Lisu"] = { |
m["Lisu"] = { |
||
"Lisu", |
|||
"alphabet", |
|||
aliases = {"Fraser"}, |
aliases = {"Fraser"}, |
||
characters = "ꓐ-꓿𑾰", |
characters = "ꓐ-꓿𑾰", |
||
normalizationFixes = { |
|||
systems = {"alphabet"}, |
|||
from = {"['’]", "[.ꓸ][.ꓸ]", "[.ꓸ][,ꓹ]"}, |
|||
to = {"ʼ", "ꓺ", "ꓻ"} |
|||
}, |
|||
} |
} |
||
m["Loma"] = { |
m["Loma"] = { |
||
"Loma", |
|||
"syllabary", |
|||
-- Not in Unicode |
-- Not in Unicode |
||
} |
} |
||
m["Lyci"] = { |
m["Lyci"] = { |
||
"Lycian", |
|||
"alphabet", |
|||
characters = "𐊀-𐊜", |
characters = "𐊀-𐊜", |
||
systems = {"alphabet"}, |
|||
} |
} |
||
m["Lydi"] = { |
m["Lydi"] = { |
||
"Lydian", |
|||
"alphabet", |
|||
characters = "𐤠-𐤿", |
characters = "𐤠-𐤿", |
||
direction = "rtl", |
direction = "rtl", |
||
systems = {"alphabet"}, |
|||
} |
} |
||
m["Mahj"] = { |
m["Mahj"] = { |
||
"Mahajani", |
|||
"abugida", |
|||
characters = "𑅐-𑅶", |
characters = "𑅐-𑅶", |
||
systems = {"abugida"}, |
|||
} |
} |
||
m["Maka"] = { |
m["Maka"] = { |
||
"Lontara", |
|||
"abugida", |
|||
aliases = {"Makasar"}, |
aliases = {"Makasar"}, |
||
characters = "𑻠-𑻸", |
characters = "𑻠-𑻸", |
||
systems = {"abugida"}, |
|||
} |
} |
||
m["Mand"] = { |
m["Mand"] = { |
||
"Mandaic", |
|||
aliases = {"Mandaean"}, |
aliases = {"Mandaean"}, |
||
characters = "ࡀ-࡞", |
characters = "ࡀ-࡞", |
||
လိတ်ရဲဉ်ႏ ၈၃၂: | လိတ်ရဲဉ်ႏ ၉၀၄: | ||
m["Mani"] = { |
m["Mani"] = { |
||
"Manichaean", |
|||
"abjad", |
|||
characters = "𐫀-𐫶", |
characters = "𐫀-𐫶", |
||
direction = "rtl", |
direction = "rtl", |
||
systems = {"abjad"}, |
|||
} |
} |
||
m["Marc"] = { |
m["Marc"] = { |
||
"Marchen", |
|||
"abugida", |
|||
characters = "𑱰-𑲶", |
characters = "𑱰-𑲶", |
||
systems = {"abugida"}, |
|||
} |
} |
||
m["Maya"] = { |
m["Maya"] = { |
||
"Maya", |
|||
aliases = {"Maya hieroglyphic", "Mayan", "Mayan hieroglyphic"}, |
aliases = {"Maya hieroglyphic", "Mayan", "Mayan hieroglyphic"}, |
||
characters = "𝋠-𝋳", |
characters = "𝋠-𝋳", |
||
လိတ်ရဲဉ်ႏ ၈၅၁: | လိတ်ရဲဉ်ႏ ၉၂၃: | ||
m["Medf"] = { |
m["Medf"] = { |
||
"Medefaidrin", |
|||
aliases = {"Oberi Okaime", "Oberi Ɔkaimɛ"}, |
aliases = {"Oberi Okaime", "Oberi Ɔkaimɛ"}, |
||
characters = "𖹀-𖺚", |
characters = "𖹀-𖺚", |
||
လိတ်ရဲဉ်ႏ ၈၅၈: | လိတ်ရဲဉ်ႏ ၉၃၀: | ||
m["Mend"] = { |
m["Mend"] = { |
||
"Mende", |
|||
aliases = {"Mende Kikakui"}, |
aliases = {"Mende Kikakui"}, |
||
characters = "𞠀-𞣖", |
characters = "𞠀-𞣖", |
||
လိတ်ရဲဉ်ႏ ၈၆၅: | လိတ်ရဲဉ်ႏ ၉၃၇: | ||
m["Merc"] = { |
m["Merc"] = { |
||
"Meroitic cursive", |
|||
"abugida", |
|||
characters = "𐦠-𐦿", |
characters = "𐦠-𐦿", |
||
direction = "rtl", |
direction = "rtl", |
||
systems = {"abugida"}, |
|||
} |
} |
||
m["Mero"] = { |
m["Mero"] = { |
||
"Meroitic hieroglyphic", |
|||
"abugida", |
|||
characters = "𐦀-𐦟", |
characters = "𐦀-𐦟", |
||
direction = "rtl", |
direction = "rtl", |
||
systems = {"abugida"}, |
|||
} |
} |
||
m["Mlym"] = { |
m["Mlym"] = { |
||
"Malayalam", |
|||
"abugida", |
|||
characters = "ഀ-ൿ", |
characters = "ഀ-ൿ", |
||
systems = {"abugida"}, |
|||
normalizationFixes = { |
normalizationFixes = { |
||
from = {"ഇൗ", "ഉൗ", "എെ", "ഒാ", "ഒൗ", "ക്", "ണ്", "ന്റ", "ന്", "മ്", "യ്", "ര്", "ല്", "ള്", "ഴ്", "െെ", "ൻ്റ"}, |
from = {"ഇൗ", "ഉൗ", "എെ", "ഒാ", "ഒൗ", "ക്", "ണ്", "ന്റ", "ന്", "മ്", "യ്", "ര്", "ല്", "ള്", "ഴ്", "െെ", "ൻ്റ"}, |
||
လိတ်ရဲဉ်ႏ ၈၈၉: | လိတ်ရဲဉ်ႏ ၉၆၁: | ||
m["Modi"] = { |
m["Modi"] = { |
||
"Modi", |
|||
"abugida", |
|||
characters = "𑘀-𑙙", |
characters = "𑘀-𑙙", |
||
systems = {"abugida"}, |
|||
normalizationFixes = { |
normalizationFixes = { |
||
from = {"𑘀𑘹", "𑘀𑘺", "𑘁𑘹", "𑘁𑘺"}, |
from = {"𑘀𑘹", "𑘀𑘺", "𑘁𑘹", "𑘁𑘺"}, |
||
လိတ်ရဲဉ်ႏ ၈၉၉: | လိတ်ရဲဉ်ႏ ၉၇၁: | ||
m["Mong"] = { |
m["Mong"] = { |
||
"Mongolian", |
|||
"alphabet", |
|||
aliases = {"Mongol bichig", "Hudum Mongol bichig"}, |
aliases = {"Mongol bichig", "Hudum Mongol bichig"}, |
||
characters = "᠀-᠅᠊-᠙ᠠ-ᡂᡸᢀ-ᢗᢦᢩ 𑙠-𑙨", |
characters = "᠀-᠅᠊-᠙ᠠ-ᡂᡸᢀ-ᢗᢦᢩ 𑙠-𑙨", |
||
direction = "down", |
direction = "down", |
||
systems = {"alphabet"}, |
|||
} |
} |
||
m["mnc-Mong"] = { |
m["mnc-Mong"] = { |
||
"Manchu", |
|||
m["Mong"][2], |
|||
characters = "᠁᠄᠈-᠏ᠠᠣᠨ-ᠪᠮ-ᠰᠴ-ᠸᠺᡝᡟ-ᡡᡤ-ᡩᡬ-ᡱᡳ-ᡷᢀ-ᢈᢏᢚ-ᢥᢨᢪ ", |
characters = "᠁᠄᠈-᠏ᠠᠣᠨ-ᠪᠮ-ᠰᠴ-ᠸᠺᡝᡟ-ᡡᡤ-ᡩᡬ-ᡱᡳ-ᡷᢀ-ᢈᢏᢚ-ᢥᢨᢪ ", |
||
direction = "down", |
direction = "down", |
||
systems = {"alphabet"}, |
|||
parent = "Mong", |
parent = "Mong", |
||
} |
} |
||
m["sjo-Mong"] = { |
m["sjo-Mong"] = { |
||
"Xibe", |
|||
m["Mong"][2], |
|||
aliases = {"Sibe"}, |
aliases = {"Sibe"}, |
||
characters = "᠄᠇᠊-᠏ᠠᠣᠨᠪᠮ-ᠰᠴ-ᠸᠺᡝ-ᡲ ", |
characters = "᠄᠇᠊-᠏ᠠᠣᠨᠪᠮ-ᠰᠴ-ᠸᠺᡝ-ᡲ ", |
||
direction = "down", |
direction = "down", |
||
systems = {"alphabet"}, |
|||
parent = "mnc-Mong", |
parent = "mnc-Mong", |
||
} |
} |
||
m["xwo-Mong"] = { |
m["xwo-Mong"] = { |
||
"Clear Script", |
|||
m["Mong"][2], |
|||
aliases = {"Todo", "Todo bichig"}, |
aliases = {"Todo", "Todo bichig"}, |
||
characters = "᠀᠁᠄-᠆᠊-ᠠᠨᠯ-ᠱᠴᠷᠸᠺᠻᡀᡃ-ᡜᢀ-ᢇᢉ-ᢏᢔᢖ-ᢙᢧ 𑙩-𑙬", |
characters = "᠀᠁᠄-᠆᠊-ᠠᠨᠯ-ᠱᠴᠷᠸᠺᠻᡀᡃ-ᡜᢀ-ᢇᢉ-ᢏᢔᢖ-ᢙᢧ 𑙩-𑙬", |
||
direction = "down", |
direction = "down", |
||
systems = {"alphabet"}, |
|||
parent = "Mong", |
parent = "Mong", |
||
} |
} |
||
m["Moon"] = { |
m["Moon"] = { |
||
"Moon", |
|||
"alphabet", |
|||
aliases = {"Moon System of Embossed Reading", "Moon type", "Moon writing", "Moon alphabet", "Moon code"}, |
aliases = {"Moon System of Embossed Reading", "Moon type", "Moon writing", "Moon alphabet", "Moon code"}, |
||
systems = {"alphabet"}, |
|||
-- Not in Unicode |
-- Not in Unicode |
||
} |
} |
||
m["Morse"] = { |
m["Morse"] = { |
||
"Morse code", |
|||
} |
} |
||
m["Mroo"] = { |
m["Mroo"] = { |
||
"Mro", |
|||
characters = "𖩀-𖩯", |
characters = "𖩀-𖩯", |
||
} |
} |
||
m["Mtei"] = { |
m["Mtei"] = { |
||
"Meitei Mayek", |
|||
"abugida", |
|||
aliases = {"Meetei Mayek", "Manipuri"}, |
aliases = {"Meetei Mayek", "Manipuri"}, |
||
characters = "ꯀ-꯹ꫠ-꫶", |
characters = "ꯀ-꯹ꫠ-꫶", |
||
systems = {"abugida"}, |
|||
} |
} |
||
m["Mult"] = { |
m["Mult"] = { |
||
"Multani", |
|||
"abugida", |
|||
characters = "𑊀-𑊩", |
characters = "𑊀-𑊩", |
||
systems = {"abugida"}, |
|||
} |
} |
||
m[" |
m["Music"] = { |
||
"Musical notation", |
|||
"pictography", |
|||
characters = "𝄀-𝇨", |
characters = "𝄀-𝇨", |
||
translit = false, |
|||
systems = {"pictography"}, |
|||
} |
} |
||
m["Mymr"] = { |
m["Mymr"] = { |
||
"Burmese", |
|||
canonicalName = "မန်း", |
|||
"abugida", |
|||
aliases = {"Myanmar"}, |
aliases = {"Myanmar"}, |
||
characters = "က-႟ꩠ-ꩿꧠ-ꧾ", |
characters = "က-႟ꩠ-ꩿꧠ-ꧾ", |
||
spaces = false, |
|||
} |
} |
||
m["Nagm"] = { |
m["Nagm"] = { |
||
"Nag Mundari", |
|||
"alphabet", |
|||
characters = "𞓐-𞓹", |
characters = "𞓐-𞓹", |
||
systems = {"alphabet"}, |
|||
} |
} |
||
m["Nand"] = { |
m["Nand"] = { |
||
"Nandinagari", |
|||
"abugida", |
|||
characters = "𑦠-𑧤", |
characters = "𑦠-𑧤", |
||
systems = {"abugida"}, |
|||
} |
} |
||
m["Narb"] = { |
m["Narb"] = { |
||
"Old North Arabian", |
|||
"abjad", |
|||
characters = "𐪀-𐪟", |
characters = "𐪀-𐪟", |
||
direction = "rtl", |
direction = "rtl", |
||
systems = {"abjad"}, |
|||
} |
} |
||
m["Nbat"] = { |
m["Nbat"] = { |
||
"Nabataean", |
|||
"abjad", |
|||
aliases = {"Nabatean"}, |
aliases = {"Nabatean"}, |
||
characters = "𐢀-𐢯", |
characters = "𐢀-𐢯", |
||
direction = "rtl", |
direction = "rtl", |
||
systems = {"abjad"}, |
|||
} |
} |
||
m["Newa"] = { |
m["Newa"] = { |
||
"Newa", |
|||
"abugida", |
|||
aliases = {"Newar", "Newari", "Prachalit Nepal"}, |
aliases = {"Newar", "Newari", "Prachalit Nepal"}, |
||
characters = "𑐀-𑑡", |
characters = "𑐀-𑑡", |
||
systems = {"abugida"}, |
|||
} |
} |
||
m["Nkdb"] = { |
m["Nkdb"] = { |
||
"Dongba", |
|||
"pictography", |
|||
aliases = {"Naxi Dongba", "Nakhi Dongba", "Tomba", "Tompa", "Mo-so"}, |
|||
spaces = false, |
|||
-- Not in Unicode |
-- Not in Unicode |
||
} |
} |
||
m["Nkgb"] = { |
m["Nkgb"] = { |
||
"Geba", |
|||
"syllabary", |
|||
aliases = {"Nakhi Geba", "Naxi Geba"}, |
|||
spaces = false, |
|||
-- Not in Unicode |
-- Not in Unicode |
||
} |
} |
||
m["Nkoo"] = { |
m["Nkoo"] = { |
||
"N'Ko", |
|||
"alphabet", |
|||
characters = "߀-߿", |
characters = "߀-߿", |
||
direction = "rtl", |
direction = "rtl", |
||
systems = {"alphabet"}, |
|||
} |
} |
||
m["None"] = { |
m["None"] = { |
||
"Unspecified", -- renders as 'unspecified script' |
|||
-- This should not have any characters listed |
-- This should not have any characters listed |
||
translit = false, |
|||
character_category = false, |
|||
} |
} |
||
m["Nshu"] = { |
m["Nshu"] = { |
||
"Nüshu", |
|||
"syllabary", |
|||
aliases = {"Nushu"}, |
aliases = {"Nushu"}, |
||
characters = "𖿡𛅰-𛋻", |
characters = "𖿡𛅰-𛋻", |
||
spaces = false, |
|||
systems = {"syllabary"}, |
|||
} |
} |
||
m["Ogam"] = { |
m["Ogam"] = { |
||
"Ogham", |
|||
characters = " -᚜", |
characters = " -᚜", |
||
} |
} |
||
m["Olck"] = { |
m["Olck"] = { |
||
"Ol Chiki", |
|||
characters = "᱐-᱿", |
characters = "᱐-᱿", |
||
} |
} |
||
m["Orkh"] = { |
m["Orkh"] = { |
||
"Orkhon runes", |
|||
aliases = {"Old Turkic"}, |
|||
characters = "𐰀-𐱈", |
characters = "𐰀-𐱈", |
||
direction = "rtl", |
direction = "rtl", |
||
လိတ်ရဲဉ်ႏ ၁၀၅၇: | လိတ်ရဲဉ်ႏ ၁၁၃၈: | ||
m["Orya"] = { |
m["Orya"] = { |
||
"Oriya", |
|||
"abugida", |
|||
aliases = {"Odia"}, |
aliases = {"Odia"}, |
||
characters = "ଁ-୷", |
characters = "ଁ-୷", |
||
systems = {"abugida"}, |
|||
normalizationFixes = { |
normalizationFixes = { |
||
from = {"ଅା", "ଏୗ", "ଓୗ"}, |
from = {"ଅା", "ଏୗ", "ଓୗ"}, |
||
လိတ်ရဲဉ်ႏ ၁၀၆၈: | လိတ်ရဲဉ်ႏ ၁၁၄၉: | ||
m["Osge"] = { |
m["Osge"] = { |
||
"Osage", |
|||
characters = "𐒰-𐓻", |
characters = "𐒰-𐓻", |
||
capitalized = true, |
capitalized = true, |
||
လိတ်ရဲဉ်ႏ ၁၀၇၄: | လိတ်ရဲဉ်ႏ ၁၁၅၅: | ||
m["Osma"] = { |
m["Osma"] = { |
||
"Osmanya", |
|||
characters = "𐒀-𐒩", |
characters = "𐒀-𐒩", |
||
} |
} |
||
m["Ougr"] = { |
m["Ougr"] = { |
||
"Old Uyghur", |
|||
"abjad, alphabet", |
|||
characters = "𐽰-𐾉", |
characters = "𐽰-𐾉", |
||
direction = "down", |
direction = "down", |
||
systems = {"abjad", "alphabet"}, |
|||
} |
} |
||
m["Palm"] = { |
m["Palm"] = { |
||
"Palmyrene", |
|||
characters = "𐡠-𐡿", |
characters = "𐡠-𐡿", |
||
direction = "rtl", |
direction = "rtl", |
||
လိတ်ရဲဉ်ႏ ၁၀၉၂: | လိတ်ရဲဉ်ႏ ၁၁၇၃: | ||
m["Pauc"] = { |
m["Pauc"] = { |
||
"Pau Cin Hau", |
|||
characters = "𑫀-𑫸", |
characters = "𑫀-𑫸", |
||
} |
} |
||
m["Perm"] = { |
m["Perm"] = { |
||
"Old Permic", |
|||
characters = "𐍐-𐍺", |
characters = "𐍐-𐍺", |
||
} |
} |
||
m["Phag"] = { |
m["Phag"] = { |
||
"Phags-pa", |
|||
"abugida", |
|||
characters = "᠂᠃᠅ 。ꡀ-꡷", |
characters = "᠂᠃᠅ 。ꡀ-꡷", |
||
direction = "down", |
direction = "down", |
||
systems = {"abugida"}, |
|||
} |
} |
||
m["Phli"] = { |
m["Phli"] = { |
||
"Inscriptional Pahlavi", |
|||
"abjad", |
|||
characters = "𐭠-𐭿", |
characters = "𐭠-𐭿", |
||
direction = "rtl", |
direction = "rtl", |
||
systems = {"abjad"}, |
|||
} |
} |
||
m["Phlp"] = { |
m["Phlp"] = { |
||
"Psalter Pahlavi", |
|||
"abjad", |
|||
characters = "𐮀-𐮯", |
characters = "𐮀-𐮯", |
||
direction = "rtl", |
direction = "rtl", |
||
systems = {"abjad"}, |
|||
} |
} |
||
m["Phlv"] = { |
m["Phlv"] = { |
||
"Book Pahlavi", |
|||
"abjad", |
|||
direction = "rtl", |
direction = "rtl", |
||
systems = {"abjad"}, |
|||
-- Not in Unicode |
-- Not in Unicode |
||
} |
} |
||
m["Phnx"] = { |
m["Phnx"] = { |
||
"Phoenician", |
|||
"abjad", |
|||
characters = "𐤀-𐤟", |
characters = "𐤀-𐤟", |
||
direction = "rtl", |
direction = "rtl", |
||
systems = {"abjad"}, |
|||
} |
} |
||
m["Plrd"] = { |
m["Plrd"] = { |
||
"Pollard", |
|||
"abugida", |
|||
aliases = {"Miao"}, |
|||
characters = "𖼀-𖾟", |
characters = "𖼀-𖾟", |
||
systems = {"abugida"}, |
|||
} |
} |
||
m["Prti"] = { |
m["Prti"] = { |
||
"Inscriptional Parthian", |
|||
characters = "𐭀-𐭟", |
characters = "𐭀-𐭟", |
||
direction = "rtl", |
direction = "rtl", |
||
လိတ်ရဲဉ်ႏ ၁၁၄၉: | လိတ်ရဲဉ်ႏ ၁၂၃၁: | ||
m["Ranj"] = { |
m["Ranj"] = { |
||
"Ranjana", |
|||
"abugida", |
|||
-- Not in Unicode |
-- Not in Unicode |
||
} |
} |
||
m["Rjng"] = { |
m["Rjng"] = { |
||
"Rejang", |
|||
"abugida", |
|||
characters = "ꤰ-꥟", |
characters = "ꤰ-꥟", |
||
systems = {"abugida"}, |
|||
} |
} |
||
m["Rohg"] = { |
m["Rohg"] = { |
||
"Hanifi Rohingya", |
|||
"alphabet", |
|||
characters = "𐴀-𐴹", |
characters = "𐴀-𐴹", |
||
direction = "rtl", |
direction = "rtl", |
||
systems = {"alphabet"}, |
|||
} |
} |
||
m["Roro"] = { |
m["Roro"] = { |
||
"Rongorongo", |
|||
-- Not in Unicode |
-- Not in Unicode |
||
} |
} |
||
m[" |
m["Rumin"] = { |
||
"Rumi numerals", |
|||
characters = "𐹠-𐹾", |
characters = "𐹠-𐹾", |
||
character_category = "Rumi numerals", |
character_category = "Rumi numerals", |
||
လိတ်ရဲဉ်ႏ ၁၁၇၉: | လိတ်ရဲဉ်ႏ ၁၂၆၁: | ||
m["Runr"] = { |
m["Runr"] = { |
||
"Runic", |
|||
"alphabet", |
|||
characters = "ᚠ-ᛰ", |
characters = "ᚠ-ᛰ", |
||
systems = {"alphabet"}, |
|||
} |
} |
||
m["Samr"] = { |
m["Samr"] = { |
||
"Samaritan", |
|||
"abjad", |
|||
characters = "ࠀ-࠾", |
characters = "ࠀ-࠾", |
||
direction = "rtl", |
direction = "rtl", |
||
systems = {"abjad"}, |
|||
} |
} |
||
m["Sarb"] = { |
m["Sarb"] = { |
||
"Old South Arabian", |
|||
"abjad", |
|||
characters = "𐩠-𐩿", |
characters = "𐩠-𐩿", |
||
direction = "rtl", |
direction = "rtl", |
||
systems = {"abjad"}, |
|||
} |
} |
||
m["Saur"] = { |
m["Saur"] = { |
||
"Saurashtra", |
|||
"abugida", |
|||
characters = "ꢀ-꣙", |
characters = "ꢀ-꣙", |
||
systems = {"abugida"}, |
|||
} |
} |
||
m["Semap"] = { |
m["Semap"] = { |
||
"flag semaphore", |
|||
"pictography", |
|||
} |
} |
||
m["Sgnw"] = { |
m["Sgnw"] = { |
||
"SignWriting", |
|||
"pictography", |
|||
characters = "𝠀-𝪯", |
characters = "𝠀-𝪯", |
||
translit = false, |
|||
systems = {"pictography"}, |
|||
} |
} |
||
m["Shaw"] = { |
m["Shaw"] = { |
||
"Shavian", |
|||
characters = "𐑐-𐑿", |
characters = "𐑐-𐑿", |
||
} |
} |
||
m["Shrd"] = { |
m["Shrd"] = { |
||
"Sharada", |
|||
"abugida", |
|||
characters = "𑆀-𑇙", |
characters = "𑆀-𑇙", |
||
systems = {"abugida"}, |
|||
} |
} |
||
m["Shui"] = { |
m["Shui"] = { |
||
"Sui", |
|||
"logography", |
|||
spaces = false, |
|||
-- Not in Unicode |
-- Not in Unicode |
||
} |
} |
||
m["Sidd"] = { |
m["Sidd"] = { |
||
"Siddham", |
|||
"abugida", |
|||
characters = "𑖀-𑗝", |
characters = "𑖀-𑗝", |
||
systems = {"abugida"}, |
|||
} |
} |
||
m["Sind"] = { |
m["Sind"] = { |
||
"Khudawadi", |
|||
"abugida", |
|||
characters = "𑊰-𑋹", |
characters = "𑊰-𑋹", |
||
systems = {"abugida"}, |
|||
normalizationFixes = { |
normalizationFixes = { |
||
from = {"𑊰𑋠", "𑊰𑋥", "𑊰𑋦", "𑊰𑋧", "𑊰𑋨"}, |
from = {"𑊰𑋠", "𑊰𑋥", "𑊰𑋦", "𑊰𑋧", "𑊰𑋨"}, |
||
လိတ်ရဲဉ်ႏ ၁၂၄၉: | လိတ်ရဲဉ်ႏ ၁၃၃၃: | ||
m["Sinh"] = { |
m["Sinh"] = { |
||
"Sinhalese", |
|||
"abugida", |
|||
aliases = {"Sinhala"}, |
aliases = {"Sinhala"}, |
||
characters = "ං-෴", |
characters = "ං-෴", |
||
systems = {"abugida"}, |
|||
normalizationFixes = { |
normalizationFixes = { |
||
from = {"අා", "අැ", "අෑ", "උෟ", "ඍෘ", "ඏෟ", "එ්", "එෙ", "ඔෟ", "ෘෘ"}, |
from = {"අා", "අැ", "අෑ", "උෟ", "ඍෘ", "ඏෟ", "එ්", "එෙ", "ඔෟ", "ෘෘ"}, |
||
လိတ်ရဲဉ်ႏ ၁၂၆၀: | လိတ်ရဲဉ်ႏ ၁၃၄၄: | ||
m["Sogd"] = { |
m["Sogd"] = { |
||
"Sogdian", |
|||
"abjad", |
|||
characters = "𐼰-𐽙", |
characters = "𐼰-𐽙", |
||
direction = "rtl", |
direction = "rtl", |
||
systems = {"abjad"}, |
|||
} |
} |
||
m["Sogo"] = { |
m["Sogo"] = { |
||
"Old Sogdian", |
|||
"abjad", |
|||
characters = "𐼀-𐼧", |
characters = "𐼀-𐼧", |
||
direction = "rtl", |
direction = "rtl", |
||
systems = {"abjad"}, |
|||
} |
} |
||
m["Sora"] = { |
m["Sora"] = { |
||
"Sorang Sompeng", |
|||
aliases = {"Sora Sompeng"}, |
aliases = {"Sora Sompeng"}, |
||
characters = "𑃐-𑃹", |
characters = "𑃐-𑃹", |
||
လိတ်ရဲဉ်ႏ ၁၂၈၀: | လိတ်ရဲဉ်ႏ ၁၃၆၄: | ||
m["Soyo"] = { |
m["Soyo"] = { |
||
"Soyombo", |
|||
"abugida", |
|||
characters = "𑩐-𑪢", |
characters = "𑩐-𑪢", |
||
systems = {"abugida"}, |
|||
} |
} |
||
m["Sund"] = { |
m["Sund"] = { |
||
"Sundanese", |
|||
"abugida", |
|||
characters = "ᮀ-ᮿ", |
characters = "ᮀ-ᮿ", |
||
systems = {"abugida"}, |
|||
} |
} |
||
m["Sylo"] = { |
m["Sylo"] = { |
||
"Syloti Nagri", |
|||
"abugida", |
|||
aliases = {"Sylheti Nagari"}, |
aliases = {"Sylheti Nagari"}, |
||
characters = "ꠀ-꠫", |
characters = "ꠀ-꠫", |
||
systems = {"abugida"}, |
|||
} |
} |
||
m["Syrc"] = { |
m["Syrc"] = { |
||
"Syriac", |
|||
"abjad", -- more precisely, impure abjad |
|||
characters = "܀-ݏ"..u(0x0860).."-"..u(0x086A), |
characters = "܀-ݏ"..u(0x0860).."-"..u(0x086A), |
||
direction = "rtl", |
direction = "rtl", |
||
systems = {"abjad"}, -- more precisely, impure abjad |
|||
} |
} |
||
လိတ်ရဲဉ်ႏ ၁၃၀၈: | လိတ်ရဲဉ်ႏ ၁၃၉၂: | ||
m["Tagb"] = { |
m["Tagb"] = { |
||
"Tagbanwa", |
|||
"abugida", |
|||
characters = "ᝠ-ᝳ", |
characters = "ᝠ-ᝳ", |
||
systems = {"abugida"}, |
|||
} |
} |
||
m["Takr"] = { |
m["Takr"] = { |
||
"Takri", |
|||
"abugida", |
|||
characters = "𑚀-𑛉", |
characters = "𑚀-𑛉", |
||
systems = {"abugida"}, |
|||
normalizationFixes = { |
normalizationFixes = { |
||
from = {"𑚀𑚭", "𑚀𑚴", "𑚀𑚵", "𑚆𑚲"}, |
from = {"𑚀𑚭", "𑚀𑚴", "𑚀𑚵", "𑚆𑚲"}, |
||
လိတ်ရဲဉ်ႏ ၁၃၂၄: | လိတ်ရဲဉ်ႏ ၁၄၀၈: | ||
m["Tale"] = { |
m["Tale"] = { |
||
"Tai Nüa", |
|||
"abugida", |
|||
aliases = {"Tai Nuea", "New Tai Nüa", "New Tai Nuea", "Dehong Dai", "Tai Dehong", "Tai Le"}, |
aliases = {"Tai Nuea", "New Tai Nüa", "New Tai Nuea", "Dehong Dai", "Tai Dehong", "Tai Le"}, |
||
characters = "ᥐ-ᥴ", |
characters = "ᥐ-ᥭᥰ-ᥴ", |
||
spaces = false, |
|||
} |
} |
||
m["Talu"] = { |
m["Talu"] = { |
||
"New Tai Lue", |
|||
"abugida", |
|||
characters = "ᦀ-᧟", |
|||
characters = "ᦀ-ᦫᦰ-ᧉ᧐-᧚᧞᧟", |
|||
systems = {"abugida"}, |
|||
spaces = false, |
|||
} |
} |
||
m["Taml"] = { |
m["Taml"] = { |
||
"Tamil", |
|||
"abugida", |
|||
characters = "ஂ-௺𑿀-𑿿", |
characters = "ஂ-௺𑿀-𑿿", |
||
systems = {"abugida"}, |
|||
normalizationFixes = { |
normalizationFixes = { |
||
from = {"அூ", "ஸ்ரீ"}, |
from = {"அூ", "ஸ்ரீ"}, |
||
လိတ်ရဲဉ်ႏ ၁၃၄၇: | လိတ်ရဲဉ်ႏ ၁၄၃၃: | ||
m["Tang"] = { |
m["Tang"] = { |
||
"Tangut", |
|||
"logography, syllabary", |
|||
characters = "𖿠𗀀-𘫿𘴀-𘴈", |
characters = "𖿠𗀀-𘫿𘴀-𘴈", |
||
spaces = false, |
|||
systems = {"logography", "syllabary"}, |
|||
} |
} |
||
m["Tavt"] = { |
m["Tavt"] = { |
||
"Tai Viet", |
|||
"abugida", |
|||
characters = "ꪀ-꫟", |
|||
characters = "ꪀ-ꫂꫛ-꫟", |
|||
spaces = false, |
|||
} |
} |
||
m["Telu"] = { |
m["Telu"] = { |
||
"Telugu", |
|||
"abugida", |
|||
characters = "ఀ-౿", |
characters = "ఀ-౿", |
||
systems = {"abugida"}, |
|||
normalizationFixes = { |
normalizationFixes = { |
||
from = {"ఒౌ", "ఒౕ", "ిౕ", "ెౕ", "ొౕ"}, |
from = {"ఒౌ", "ఒౕ", "ిౕ", "ెౕ", "ొౕ"}, |
||
လိတ်ရဲဉ်ႏ ၁၃၆၉: | လိတ်ရဲဉ်ႏ ၁၄၅၇: | ||
m["Teng"] = { |
m["Teng"] = { |
||
"Tengwar", |
|||
} |
} |
||
m["Tfng"] = { |
m["Tfng"] = { |
||
"Tifinagh", |
|||
"abjad, alphabet", |
|||
otherNames = {"Libyco-Berber", "Berber"}, -- per Wikipedia, Libyco-Berber is the parent |
|||
characters = "ⴰ-⵿", |
characters = "ⴰ-⵿", |
||
otherNames = {"Libyco-Berber", "Berber"}, -- per Wikipedia, Libyco-Berber is the parent |
|||
systems = {"abjad", "alphabet"}, |
|||
} |
} |
||
m["Tglg"] = { |
m["Tglg"] = { |
||
"Baybayin", |
|||
"abugida", |
|||
aliases = {"Tagalog"}, |
aliases = {"Tagalog"}, |
||
characters = "ᜀ-᜔", |
characters = "ᜀ-᜔", |
||
systems = {"abugida"}, |
|||
} |
} |
||
m["Thaa"] = { |
m["Thaa"] = { |
||
"Thaana", |
|||
"abugida", |
|||
characters = "ހ-ޱ", |
characters = "ހ-ޱ", |
||
systems = {"abugida"}, |
|||
direction = "rtl", |
direction = "rtl", |
||
} |
} |
||
m["Thai"] = { |
m["Thai"] = { |
||
"Thai", |
|||
"abugida", |
|||
characters = "ก-๛", |
|||
characters = "ก-ฺเ-๛", |
|||
spaces = false, |
|||
} |
} |
||
m["Tibt"] = { |
m["Tibt"] = { |
||
"Tibetan", |
|||
"abugida", |
|||
characters = "ༀ-࿚", |
characters = "ༀ-࿚", |
||
systems = {"abugida"}, |
|||
normalizationFixes = { |
normalizationFixes = { |
||
combiningClasses = {["༹"] = 1}, |
combiningClasses = {["༹"] = 1}, |
||
လိတ်ရဲဉ်ႏ ၁၄၁၁: | လိတ်ရဲဉ်ႏ ၁၅၀၀: | ||
m["sit-tam-Tibt"] = { |
m["sit-tam-Tibt"] = { |
||
"Tamyig", |
|||
m["Tibt"][2], |
|||
characters = m["Tibt"].characters, |
characters = m["Tibt"].characters, |
||
systems = {"abugida"}, |
|||
parent = "Tibt", |
parent = "Tibt", |
||
normalizationFixes = m["Tibt"].normalizationFixes, |
normalizationFixes = m["Tibt"].normalizationFixes, |
||
လိတ်ရဲဉ်ႏ ၁၄၁၉: | လိတ်ရဲဉ်ႏ ၁၅၀၈: | ||
m["xzh-Tibt"] = { |
m["xzh-Tibt"] = { |
||
"Zhang-Zhung", |
|||
m["Tibt"][2], |
|||
systems = {"abugida"}, |
|||
characters = m["Tibt"].characters, |
|||
parent = "Tibt", |
parent = "Tibt", |
||
normalizationFixes = m["Tibt"].normalizationFixes, |
normalizationFixes = m["Tibt"].normalizationFixes, |
||
လိတ်ရဲဉ်ႏ ၁၄၂၆: | လိတ်ရဲဉ်ႏ ၁၅၁၆: | ||
m["Tirh"] = { |
m["Tirh"] = { |
||
"Tirhuta", |
|||
"abugida", |
|||
characters = "𑒀-𑓙", |
characters = "𑒀-𑓙", |
||
systems = {"abugida"}, |
|||
normalizationFixes = { |
normalizationFixes = { |
||
from = {"𑒁𑒰", "𑒋𑒺", "𑒍𑒺", "𑒪𑒵", "𑒪𑒶"}, |
from = {"𑒁𑒰", "𑒋𑒺", "𑒍𑒺", "𑒪𑒵", "𑒪𑒶"}, |
||
လိတ်ရဲဉ်ႏ ၁၄၃၆: | လိတ်ရဲဉ်ႏ ၁၅၂၆: | ||
m["Tnsa"] = { |
m["Tnsa"] = { |
||
"Tangsa", |
|||
"alphabet", |
|||
characters = "𖩰-𖫉", |
characters = "𖩰-𖫉", |
||
systems = {"alphabet"}, |
|||
} |
} |
||
m["Toto"] = { |
m["Toto"] = { |
||
"Toto", |
|||
"abugida", |
|||
characters = "𞊐-𞊮", |
characters = "𞊐-𞊮", |
||
systems = {"abugida"}, |
|||
} |
} |
||
m["Ugar"] = { |
m["Ugar"] = { |
||
"Ugaritic", |
|||
"abjad", |
|||
characters = "𐎀-𐎟", |
characters = "𐎀-𐎟", |
||
systems = {"abjad"}, |
|||
} |
} |
||
m["Vaii"] = { |
m["Vaii"] = { |
||
"Vai", |
|||
"syllabary", |
|||
characters = "ꔀ-ꘫ", |
characters = "ꔀ-ꘫ", |
||
systems = {"syllabary"}, |
|||
} |
} |
||
m["Visp"] = { |
m["Visp"] = { |
||
"Visible Speech", |
|||
"alphabet", |
|||
-- Not in Unicode |
-- Not in Unicode |
||
} |
} |
||
m["Vith"] = { |
m["Vith"] = { |
||
"Vithkuqi", |
|||
"alphabet", |
|||
characters = "𐕰-𐖼", |
characters = "𐕰-𐖼", |
||
capitalized = true, |
capitalized = true, |
||
systems = {"alphabet"}, |
|||
} |
} |
||
m["Wara"] = { |
m["Wara"] = { |
||
"Varang Kshiti", |
|||
aliases = {"Warang Citi"}, |
|||
characters = "𑢠-𑣿", |
characters = "𑢠-𑣿", |
||
capitalized = true, |
capitalized = true, |
||
လိတ်ရဲဉ်ႏ ၁၄၇၉: | လိတ်ရဲဉ်ႏ ၁၅၇၀: | ||
m["Wcho"] = { |
m["Wcho"] = { |
||
"Wancho", |
|||
"alphabet", |
|||
characters = "𞋀-𞋿", |
characters = "𞋀-𞋿", |
||
systems = {"alphabet"}, |
|||
} |
} |
||
m["Wole"] = { |
m["Wole"] = { |
||
"Woleai", |
|||
"syllabary", |
|||
-- Not in Unicode |
-- Not in Unicode |
||
} |
} |
||
m["Xpeo"] = { |
m["Xpeo"] = { |
||
"Old Persian", |
|||
characters = "𐎠-𐏕", |
characters = "𐎠-𐏕", |
||
} |
} |
||
m["Xsux"] = { |
m["Xsux"] = { |
||
"Cuneiform", |
|||
aliases = {"Sumero-Akkadian Cuneiform"}, |
aliases = {"Sumero-Akkadian Cuneiform"}, |
||
characters = "𒀀-𒎙𒐀-𒑳", |
characters = "𒀀-𒎙𒐀-𒑳", |
||
} |
|||
m["Yezi"] = { |
|||
"Yezidi", |
|||
"alphabet", |
|||
characters = "𐺀-𐺱", |
|||
direction = "rtl", |
|||
} |
} |
||
m["Yiii"] = { |
m["Yiii"] = { |
||
"Yi", |
|||
"syllabary", |
|||
characters = "ꀀ-꓆", |
characters = "ꀀ-꓆", |
||
systems = {"syllabary"}, |
|||
} |
} |
||
m["Zanb"] = { |
m["Zanb"] = { |
||
"Zanabazar Square", |
|||
characters = u(0x11A00).."-"..u(0x11A47), |
characters = u(0x11A00).."-"..u(0x11A47), |
||
} |
} |
||
m["Zmth"] = { |
m["Zmth"] = { |
||
"mathematical notation", |
|||
characters = "ℵ∀-⋿⟀-⟯⦀-⫿𝐀-𝟿", |
characters = "ℵ∀-⋿⟀-⟯⦀-⫿𝐀-𝟿", |
||
translit = false, |
|||
character_category = "Mathematical notation symbols", -- ? |
character_category = "Mathematical notation symbols", -- ? |
||
} |
} |
||
m["Zsym"] = { |
m["Zsym"] = { |
||
"symbol", |
|||
"pictography", |
|||
characters = "─-➿←-⇿⌀-⏿⬀-⯾🀀-🃵🌀-🩭", |
characters = "─-➿←-⇿⌀-⏿⬀-⯾🀀-🃵🌀-🩭", |
||
translit = false, |
|||
character_category = false, -- none |
character_category = false, -- none |
||
systems = {"pictography"}, |
|||
} |
} |
||
m["Zyyy"] = { |
m["Zyyy"] = { |
||
"undetermined", |
|||
-- This should not have any characters listed, probably |
-- This should not have any characters listed, probably |
||
translit = false, |
|||
character_category = false, -- none |
character_category = false, -- none |
||
characters = m["Latn"].characters, |
|||
} |
} |
||
m["Zzzz"] = { |
m["Zzzz"] = { |
||
"uncoded", |
|||
-- This should not have any characters listed |
-- This should not have any characters listed |
||
translit = false, |
|||
character_category = false, -- none |
character_category = false, -- none |
||
} |
} |
||
-- These should be defined after the scripts they are composed of |
-- These should be defined after the scripts they are composed of. |
||
m["Hrkt"] = { -- TODO: add hentaigana |
|||
"Kana", |
|||
"syllabary", |
|||
aliases = {"Japanese syllabaries"}, |
|||
characters = m["Hira"].characters .. m["Kana"].characters, |
|||
spaces = false, |
|||
} |
|||
m["Jpan"] = { |
m["Jpan"] = { |
||
"Japanese", |
|||
"logography, syllabary", |
|||
characters = m["Hira"].characters .. m["Kana"].characters .. m["Hani"].characters .. m["Latn"].characters, |
|||
characters = m["Hrkt"].characters .. m["Hani"].characters .. m["Latnx"].characters, |
|||
systems = {"syllabary", "logography"}, |
|||
spaces = false, |
|||
sort_by_scraping = true, |
|||
} |
} |
||
m["Kore"] = { |
m["Kore"] = { |
||
"Korean", |
|||
"logography, syllabary", |
|||
characters = m["Hang"].characters .. m["Hani"].characters, |
characters = m["Hang"].characters .. m["Hani"].characters, |
||
systems = {"syllabary", "logography"}, |
|||
} |
} |
||
ခြပ်ထွားချာ ၁၀:၂၂၊ ၂၁ သဲက်တဲဉ်ဗာ ၂၀၂၃ နီꩻကိုကာႏ
Documentation for this module may be created at မော်ဂျူး:scripts/data/doc
--[=[
When adding new scripts to this file, please don't forget to add
style definitions for the script in [[MediaWiki:Common.css]].
]=]
-- Shorthand for building a string from code points; used further down for
-- characters that are awkward to keep as literals.
local u = mw.ustring.char
-- Table of script definitions, filled in entry by entry below.
local m = {}
-- Adlam: cased, right-to-left alphabet.
m["Adlm"] = {
	"Adlam",
	"alphabet",
	direction = "rtl",
	capitalized = true,
	characters = "؟ـ𞤀-𞥟",
}

-- Afaka: syllabary with no character set listed.
m["Afak"] = {
	"Afaka",
	"syllabary",
}

-- Caucasian Albanian alphabet.
m["Aghb"] = {
	"Caucasian Albanian",
	"alphabet",
	characters = "𐔰-𐕯",
}
-- Ahom abugida.
m["Ahom"] = {
	"Ahom",
	"abugida",
	-- The range used to end in a bare "-" (upper bound missing). Restored to
	-- the end of the Unicode Ahom block (U+11700-U+1174F) and written with
	-- u() so the bound survives re-saving.
	-- NOTE(review): confirm the intended upper bound against upstream.
	characters = "𑜀-" .. u(0x1174F),
}
-- Arabic script. The language-specific "xx-Arab" entries reuse this entry's
-- type, characters and normalizationFixes.
m["Arab"] = {
	"Arabic",
	"abjad", -- more precisely, impure abjad
	varieties = {"Jawi", {"Nastaliq", "Nastaleeq"}},
	-- Five range endpoints were missing from this string (it began with "-",
	-- contained "--" and ended with "-"). Each one is restored from the bounds
	-- of the Unicode block the surviving endpoint belongs to and written with
	-- u() so it cannot be dropped again.
	-- NOTE(review): confirm the restored bounds against upstream, in
	-- particular the U+FEFE end chosen to stop short of U+FEFF.
	characters =
		u(0x0600) .. "-ۿ" .. -- Arabic
		"ݐ-ݿ" .. -- Arabic Supplement
		"ࡰ-ࣿ" .. -- Arabic Extended-B, Extended-A
		"ﭐ-﷏ﷰ-﷿" .. -- Arabic Presentation Forms-A
		"ﹰ-" .. u(0xFEFE) .. -- Arabic Presentation Forms-B
		"𐋠-𐋻" .. -- Coptic Epact Numbers
		"𐹠-" .. u(0x10E7F) .. -- Rumi Numeral Symbols
		u(0x10EC0) .. "-𐻿" .. -- Arabic Extended-C
		"𞸀-" .. u(0x1EEFF), -- Arabic Mathematical Alphabetic Symbols
	direction = "rtl",
	normalizationFixes = {
		from = {"ٳ"},
		to = {"اٟ"}
	},
}
-- Language-specific Arabic entries. Each one takes its type, character set and
-- normalization fixes from m["Arab"] and names "Arab" as its parent.

m["fa-Arab"] = {
	"Arabic",
	m["Arab"][2],
	otherNames = {"Perso-Arabic"},
	parent = "Arab",
	direction = "rtl",
	characters = m["Arab"].characters,
	normalizationFixes = m["Arab"].normalizationFixes,
}

m["kk-Arab"] = {
	"Arabic",
	m["Arab"][2],
	parent = "Arab",
	direction = "rtl",
	characters = m["Arab"].characters,
	normalizationFixes = m["Arab"].normalizationFixes,
}

m["ks-Arab"] = {
	"Arabic",
	m["Arab"][2],
	parent = "Arab",
	direction = "rtl",
	characters = m["Arab"].characters,
	normalizationFixes = m["Arab"].normalizationFixes,
}

m["ku-Arab"] = {
	"Arabic",
	m["Arab"][2],
	parent = "Arab",
	direction = "rtl",
	characters = m["Arab"].characters,
	normalizationFixes = m["Arab"].normalizationFixes,
}

m["ms-Arab"] = {
	"Arabic",
	m["Arab"][2],
	parent = "Arab",
	direction = "rtl",
	characters = m["Arab"].characters,
	normalizationFixes = m["Arab"].normalizationFixes,
}

m["mzn-Arab"] = {
	"Arabic",
	m["Arab"][2],
	parent = "Arab",
	direction = "rtl",
	characters = m["Arab"].characters,
	normalizationFixes = m["Arab"].normalizationFixes,
}

m["ota-Arab"] = {
	"Arabic",
	m["Arab"][2],
	parent = "Arab",
	direction = "rtl",
	characters = m["Arab"].characters,
	normalizationFixes = m["Arab"].normalizationFixes,
}

-- Unlike its siblings, this entry is named "Shahmukhi" and lists "Arabic" as
-- an other name.
m["pa-Arab"] = {
	"Shahmukhi",
	m["Arab"][2],
	otherNames = {"Arabic"},
	parent = "Arab",
	direction = "rtl",
	characters = m["Arab"].characters,
	normalizationFixes = m["Arab"].normalizationFixes,
}

m["ps-Arab"] = {
	"Arabic",
	m["Arab"][2],
	parent = "Arab",
	direction = "rtl",
	characters = m["Arab"].characters,
	normalizationFixes = m["Arab"].normalizationFixes,
}

m["sd-Arab"] = {
	"Arabic",
	m["Arab"][2],
	parent = "Arab",
	direction = "rtl",
	characters = m["Arab"].characters,
	normalizationFixes = m["Arab"].normalizationFixes,
}

m["tt-Arab"] = {
	"Arabic",
	m["Arab"][2],
	parent = "Arab",
	direction = "rtl",
	characters = m["Arab"].characters,
	normalizationFixes = m["Arab"].normalizationFixes,
}

m["ug-Arab"] = {
	"Arabic",
	m["Arab"][2],
	parent = "Arab",
	direction = "rtl",
	characters = m["Arab"].characters,
	normalizationFixes = m["Arab"].normalizationFixes,
}

m["ur-Arab"] = {
	"Arabic",
	m["Arab"][2],
	parent = "Arab",
	direction = "rtl",
	characters = m["Arab"].characters,
	normalizationFixes = m["Arab"].normalizationFixes,
}

m["xka-Arab"] = {
	"Arabic",
	m["Arab"][2],
	parent = "Arab",
	direction = "rtl",
	characters = m["Arab"].characters,
	normalizationFixes = m["Arab"].normalizationFixes,
}

-- Aran (Nastaliq) is subsumed into Arab
-- Imperial Aramaic: right-to-left abjad.
m["Armi"] = {
	"Imperial Aramaic",
	"abjad",
	direction = "rtl",
	characters = "𐡀-𐡟",
}
-- Armenian: cased alphabet.
m["Armn"] = {
	"Armenian",
	"alphabet",
	-- The first range had lost its lower bound (the string began with "-").
	-- Restored to the start of the Unicode Armenian block (U+0530-U+058F)
	-- and written with u() so it survives re-saving.
	-- NOTE(review): confirm the intended lower bound against upstream.
	characters = u(0x0530) .. "-֏ﬓ-ﬗ",
	capitalized = true,
}
-- Avestan: right-to-left alphabet.
m["Avst"] = {
	"Avestan",
	"alphabet",
	direction = "rtl",
	characters = "𐬀-𐬿",
}

-- Pazend: reuses the Avestan type and character set, with Avst as parent.
m["pal-Avst"] = {
	"Pazend",
	m["Avst"][2],
	parent = "Avst",
	direction = "rtl",
	characters = m["Avst"].characters,
}
-- Balinese abugida.
m["Bali"] = {
	"Balinese",
	"abugida",
	-- The range used to end in a bare "-" (upper bound missing). Restored to
	-- the end of the Unicode Balinese block (U+1B00-U+1B7F) via u().
	-- NOTE(review): confirm the intended upper bound against upstream.
	characters = "ᬀ-" .. u(0x1B7F),
}
-- Bamum syllabary.
m["Bamu"] = {
	"Bamum",
	"syllabary",
	-- Both ranges had lost their upper bounds ("ꚠ-𖠀-"), so the first one ran
	-- on into the start of the second. Restored to the ends of the Unicode
	-- Bamum (U+A6A0-U+A6FF) and Bamum Supplement (U+16800-U+16A3F) blocks.
	-- NOTE(review): confirm the intended upper bounds against upstream.
	characters = "ꚠ-" .. u(0xA6FF) .. "𖠀-" .. u(0x16A3F),
}
-- Bassa Vah alphabet.
m["Bass"] = {
	"Bassa",
	"alphabet",
	aliases = {"Bassa Vah", "Vah"},
	-- The range used to end in a bare "-" (upper bound missing). Restored to
	-- the end of the Unicode Bassa Vah block (U+16AD0-U+16AFF) via u().
	-- NOTE(review): confirm the intended upper bound against upstream.
	characters = "𖫐-" .. u(0x16AFF),
}
-- Batak abugida.
m["Batk"] = {
	"Batak",
	"abugida",
	characters = "ᯀ-᯿",
}
-- Bengali abugida. m["as-Beng"] reuses this entry's type and
-- normalizationFixes.
m["Beng"] = {
	"Bengali",
	"abugida",
	-- The range starting at "৲" had lost its upper bound, so it ran on into
	-- the Vedic marks that follow (up to U+1CD5). Restored to the end of the
	-- Unicode Bengali block (U+09FF) and written with u().
	-- NOTE(review): confirm the intended upper bound against upstream.
	characters = "॒॑।॥ঀ-৯৲-" .. u(0x09FF) .. "᳕᳖᳘᳐᳒᳡ᳪ᳭ᳲᳵ-᳷꣱",
	normalizationFixes = {
		from = {"অা", "ঋৃ", "ঌৢ"},
		to = {"আ", "ৠ", "ৡ"}
	},
}
-- Assamese: Bengali type and normalization fixes with its own character set.
m["as-Beng"] = {
	"Assamese",
	m["Beng"][2],
	otherNames = {"Bengali-Assamese", "Eastern Nagari"},
	-- The text after "ঀ-য" had collapsed to a bare "-" followed by the Vedic
	-- marks, i.e. both endpoints of a second range were missing. Restored as
	-- U+09B1-U+09FF: the code point directly after the skipped U+09B0 through
	-- the end of the Unicode Bengali block.
	-- NOTE(review): both restored bounds are inferred; confirm against
	-- upstream.
	characters = "॒॑।॥ঀ-য" .. u(0x09B1) .. "-" .. u(0x09FF) .. "᳕᳖᳘᳐᳒᳡ᳪ᳭ᳲᳵ-᳷꣱",
	normalizationFixes = m["Beng"].normalizationFixes,
}
-- Bhaiksuki abugida.
m["Bhks"] = {
	"Bhaiksuki",
	"abugida",
	-- The range used to end in a bare "-" (upper bound missing). Restored to
	-- the end of the Unicode Bhaiksuki block (U+11C00-U+11C6F) via u().
	-- NOTE(review): confirm the intended upper bound against upstream.
	characters = "𑰀-" .. u(0x11C6F),
}
-- Blissymbols: logography with no character set listed.
m["Blis"] = {
	"Blissymbols",
	"logography",
	aliases = {"Blissymbolics"},
	-- Not in Unicode
}
-- Zhuyin (Bopomofo) semisyllabary.
m["Bopo"] = {
	"Zhuyin",
	"semisyllabary",
	aliases = {"Zhuyin Fuhao", "Bopomofo"},
	-- Two ranges in this string were damaged:
	--  * "・-ㄯ" ran from the katakana middle dot to the end of the Bopomofo
	--    block because the range's own lower bound was missing; restored to
	--    the start of the Unicode Bopomofo block (U+3100).
	--  * "。-・" spanned U+3002-U+30FB, taking in all kana, and duplicated
	--    "、-〃"; it reads as the halfwidth punctuation range U+FF61-U+FF65
	--    after width folding.
	-- Both are written with u() so they survive re-saving.
	-- NOTE(review): confirm both ranges against upstream.
	characters = "ˇˉˊˋ˙˪˫、-〃〈-】〓-〟〪-〭〰〷・" .. u(0x3100) .. "-ㄯ﹅﹆" .. u(0xFF61) .. "-" .. u(0xFF65),
}
-- Brahmi abugida, with replacements for three discouraged sequences.
m["Brah"] = {
	"Brahmi",
	"abugida",
	characters = "𑀀-𑁿",
	normalizationFixes = {
		from = {"𑀅𑀸", "𑀋𑀾", "𑀏𑁂"},
		to = {"𑀆", "𑀌", "𑀐"}
	},
}

-- Braille, classed here as an alphabet.
m["Brai"] = {
	"Braille",
	"alphabet",
	characters = "⠀-⣿",
}

-- Buginese (Lontara) abugida.
m["Bugi"] = {
	"Buginese",
	"abugida",
	aliases = {"Lontara"},
	characters = "ᨀ-᨟ꧏ",
}
-- Buhid abugida.
m["Buhd"] = {
	"Buhid",
	"abugida",
	-- The range starting at "ᝀ" had lost its upper bound, so it ran on to the
	-- trailing "ꧏ" (U+1740-U+A9CF). Restored to the end of the Unicode Buhid
	-- block (U+175F) via u(); "ꧏ" is kept as a separate character.
	-- NOTE(review): confirm the intended upper bound against upstream.
	characters = "᜵᜶ᝀ-" .. u(0x175F) .. "ꧏ",
}
-- Chakma abugida.
m["Cakm"] = {
	"Chakma",
	"abugida",
	-- The last range used to end in a bare "-" (upper bound missing).
	-- Restored to the end of the Unicode Chakma block (U+11100-U+1114F).
	-- NOTE(review): confirm the intended upper bound against upstream.
	characters = "০-৯၀-၉𑄀-" .. u(0x1114F),
}
-- Canadian syllabics.
m["Cans"] = {
	"Canadian syllabics",
	"abugida",
	-- The range starting at "ᢰ" had lost its upper bound, so it ran on into
	-- "𑪰" and left "-𑪿" dangling. Restored to the end of the Unified
	-- Canadian Aboriginal Syllabics Extended block (U+18B0-U+18FF) via u().
	-- NOTE(review): confirm the intended upper bound against upstream.
	characters = "᐀-ᙿᢰ-" .. u(0x18FF) .. "𑪰-𑪿",
}
-- Carian alphabet.
m["Cari"] = {
	"Carian",
	"alphabet",
	-- The range used to end in a bare "-" (upper bound missing). Restored to
	-- the end of the Unicode Carian block (U+102A0-U+102DF) via u().
	-- NOTE(review): confirm the intended upper bound against upstream.
	characters = "𐊠-" .. u(0x102DF),
}
-- Cham abugida.
m["Cham"] = {
	"Cham",
	"abugida",
	characters = "ꨀ-꩟",
}
-- Cherokee syllabary.
m["Cher"] = {
	"Cherokee",
	"syllabary",
	-- The first range had lost its upper bound, so it ran on into "ꭰ" and
	-- left "-ꮿ" dangling. Restored to the end of the Unicode Cherokee block
	-- (U+13A0-U+13FF) via u().
	-- NOTE(review): confirm the intended upper bound against upstream.
	characters = "Ꭰ-" .. u(0x13FF) .. "ꭰ-ꮿ",
}
-- Chorasmian: right-to-left abjad.
m["Chrs"] = {
	"Chorasmian",
	"abjad",
	-- The range used to end in a bare "-" (upper bound missing). Restored to
	-- the end of the Unicode Chorasmian block (U+10FB0-U+10FDF) via u().
	-- NOTE(review): confirm the intended upper bound against upstream.
	characters = "𐾰-" .. u(0x10FDF),
	direction = "rtl",
}
-- Coptic: cased alphabet.
m["Copt"] = {
	"Coptic",
	"alphabet",
	capitalized = true,
	characters = "Ϣ-ϯⲀ-⳿𐋠-𐋻", -- this is mostly "Coptic", not unified "Greek and Coptic"
}
-- Cypro-Minoan syllabary.
m["Cpmn"] = {
	"Cypro-Minoan",
	"syllabary",
	aliases = {"Cypro Minoan"},
	-- The range used to end in a bare "-" (upper bound missing). Restored to
	-- the end of the Unicode Cypro-Minoan block (U+12F90-U+12FFF) via u().
	-- NOTE(review): confirm the intended upper bound against upstream.
	characters = "𐄀𐄁𒾐-" .. u(0x12FFF),
}
-- Cypriot: right-to-left syllabary.
m["Cprt"] = {
	"Cypriot",
	"syllabary",
	direction = "rtl",
	characters = "𐄀-𐄂𐄇-𐄳𐄷-𐄿𐠀-𐠿",
}
-- Cyrillic: cased alphabet. m["Cyrs"] reuses this entry's type, characters
-- and capitalization.
m["Cyrl"] = {
	"Cyrillic",
	"alphabet",
	-- "ᲀ-ᴫ" was a single range from U+1C80 to U+1D2B, which also covers the
	-- Georgian Mtavruli letters listed under m["Geor"] and other unrelated
	-- blocks: the upper bound of the "ᲀ-" range was missing. Restored to the
	-- end of the Cyrillic Extended-C block (U+1C8F); "ᴫ" stays as a separate
	-- character.
	-- NOTE(review): confirm the intended upper bound against upstream.
	characters = "Ѐ-ԯᲀ-" .. u(0x1C8F) .. "ᴫᵸ᷸ⷠ-ⷿ⹃Ꙁ-ꚟ︮︯𞀰-𞂏",
	capitalized = true,
}
-- Old (Early) Cyrillic: type, characters and capitalization come from
-- m["Cyrl"].
m["Cyrs"] = {
	"Old Cyrillic",
	m["Cyrl"][2],
	aliases = {"Early Cyrillic"},
	wikipedia_article = "Early Cyrillic alphabet",
	capitalized = m["Cyrl"].capitalized,
	characters = m["Cyrl"].characters,
}
-- Devanagari abugida, with a table of discouraged sequences and their
-- replacements.
m["Deva"] = {
	"Devanagari",
	"abugida",
	characters = "ऀ-ॿ꣠-ꣿ𑬀-𑬉",
	-- NOTE(review): `from` has 38 entries and `to` has 37, so the last
	-- `from` item has no counterpart. Presumably the consumer treats a missing
	-- `to` as "remove"; confirm before editing these lists.
	normalizationFixes = {
		from = {"ॆॆ", "ेे", "ाॅ", "ाॆ", "ाꣿ", "ॊॆ", "ाे", "ाै", "ोे", "ाऺ", "ॖॖ", "अॅ", "अॆ", "अा", "एॅ", "एॆ", "एे", "एꣿ", "ऎॆ", "अॉ", "आॅ", "अॊ", "आॆ", "अो", "आे", "अौ", "आै", "ओे", "अऺ", "अऻ", "आऺ", "अाꣿ", "आꣿ", "ऒॆ", "अॖ", "अॗ", "ॶॖ", "्?ा"},
		to = {"ꣿ", "ै", "ॉ", "ॊ", "ॏ", "ॏ", "ो", "ौ", "ौ", "ऻ", "ॗ", "ॲ", "ऄ", "आ", "ऍ", "ऎ", "ऐ", "ꣾ", "ꣾ", "ऑ", "ऑ", "ऒ", "ऒ", "ओ", "ओ", "औ", "औ", "औ", "ॳ", "ॴ", "ॴ", "ॵ", "ॵ", "ॵ", "ॶ", "ॷ", "ॷ"}
	},
}
-- Dhives Akuru abugida.
m["Diak"] = {
	"Dhives Akuru",
	"abugida",
	aliases = {"Dives Akuru"},
	characters = "𑤀-𑤆𑤉𑤌-𑤓𑤕𑤖𑤘-𑤵𑤷𑤸𑤻-𑥆𑥐-𑥙",
}

-- Dogra abugida.
m["Dogr"] = {
	"Dogra",
	"abugida",
	characters = "𑠀-𑠻",
}

-- Deseret: cased alphabet.
m["Dsrt"] = {
	"Deseret",
	"alphabet",
	capitalized = true,
	characters = "𐐀-𐑏",
}

-- Duployan, classed here as an alphabet.
m["Dupl"] = {
	"Duployan",
	"alphabet",
	characters = "𛰀-𛱪𛱰-𛱼𛲀-𛲈𛲐-𛲙𛲜-𛲟",
}
-- Egyptian scripts. Demotic and Hieratic list no characters of their own.
m["Egyd"] = {
	"Demotic",
	"abjad, logography",
}

m["Egyh"] = {
	"Hieratic",
	"abjad, logography",
}

-- Egyptian hieroglyphic, with replacements for two signs.
m["Egyp"] = {
	"Egyptian hieroglyphic",
	"abjad, logography",
	varieties = {"Hieratic"},
	wikipedia_article = "Egyptian hieroglyphs",
	characters = "𓀀-𓑕",
	normalizationFixes = {
		from = {"𓃁", "𓆖"},
		to = {"𓃀𓂝", "𓆓𓏏𓇿"}
	},
}
-- Elbasan alphabet.
m["Elba"] = {
	"Elbasan",
	"alphabet",
	characters = "𐔀-𐔧",
}

-- Elymaic: right-to-left abjad.
m["Elym"] = {
	"Elymaic",
	"abjad",
	direction = "rtl",
	characters = "𐿠-𐿶",
}

-- Ethiopic (Ge'ez) abugida.
m["Ethi"] = {
	"Ethiopic",
	"abugida",
	aliases = {"Ge'ez"},
	characters = "ሀ-ቈቊ-ቍቐ-ቖቘቚ-ቝበ-ኈኊ-ኍነ-ኰኲ-ኵኸ-ኾዀዂ-ዅወ-ዖዘ-ጐጒ-ጕጘ-ፚ፝-፼ᎀ-᎙ⶀ-ⶖⶠ-ⶦⶨ-ⶮⶰ-ⶶⶸ-ⶾⷀ-ⷆⷈ-ⷎⷐ-ⷖⷘ-ⷞꬁ-ꬆꬉ-ꬎꬑ-ꬖꬠ-ꬦꬨ-ꬮ𞟠-𞟦𞟨-𞟫𞟭𞟮𞟰-𞟾",
}
-- Khutsuri: cased alphabet covering Asomtavruli and Nuskhuri.
m["Geok"] = {
	"Khutsuri",
	"alphabet",
	varieties = {"Nuskhuri", "Asomtavruli"},
	capitalized = true,
	characters = "Ⴀ-ჅჇჍ჻ⴀ-ⴥⴧⴭ", -- Ⴀ-Ⴭ is Asomtavruli, ⴀ-ⴭ is Nuskhuri
}

-- Georgian: cased alphabet covering Mkhedruli and Mtavruli.
m["Geor"] = {
	"Georgian",
	"alphabet",
	varieties = {"Mkhedruli", "Mtavruli"},
	capitalized = true,
	characters = "ა-ჿᲐ-ᲺᲽ-Ჿ", -- ა-ჿ is lowercase Mkhedruli; Ა-Ჿ is uppercase Mkhedruli (Mtavruli)
}

-- Glagolitic: cased alphabet.
m["Glag"] = {
	"Glagolitic",
	"alphabet",
	capitalized = true,
	characters = "Ⰰ-ⱟ𞀀-𞀆𞀈-𞀘𞀛-𞀡𞀣𞀤𞀦-𞀪",
}
-- Gunjala Gondi abugida.
m["Gong"] = {
	"Gunjala Gondi",
	"abugida",
	characters = "𑵠-𑵥𑵧𑵨𑵪-𑶎𑶐𑶑𑶓-𑶘𑶠-𑶩",
}

-- Masaram Gondi abugida.
m["Gonm"] = {
	"Masaram Gondi",
	"abugida",
	characters = "𑴀-𑴆𑴈𑴉𑴋-𑴶𑴺𑴼𑴽𑴿-𑵇𑵐-𑵙",
}

-- Gothic alphabet.
m["Goth"] = {
	"Gothic",
	"alphabet",
	characters = "𐌰-𐍊",
}

-- Grantha abugida.
m["Gran"] = {
	"Grantha",
	"abugida",
	characters = "𑌀-𑌃𑌅-𑌌𑌏-𑌐𑌓-𑌨𑌪-𑌰𑌲𑌳𑌵-𑌹𑌼-𑍄𑍇𑍈𑍋-𑍍𑍐𑍗𑍝-𑍣𑍦-𑍬𑍰-𑍴",
}
-- Greek: cased alphabet. m["Polyt"] builds on this entry's type, characters
-- and capitalization.
m["Grek"] = {
	"Greek",
	"alphabet",
	-- The lone "Ω" between "ᶿ" and "℩" is written as U+2126 OHM SIGN via
	-- u(): a plain capital omega (U+03A9) there would be redundant with the
	-- "Σ-ϡ" range, and its position among the U+1DBF / U+2129 neighbours
	-- points at the ohm sign, which canonical normalization folds to omega.
	-- NOTE(review): confirm against upstream that the ohm sign is intended.
	characters = "Ͱ-ͷͺ-Ϳ΄-ΊΌΎ-ΡΣ-ϡϰ-Ͽᴦ-ᴪᵝ-ᵡᵦ-ᵪᶿ" .. u(0x2126) .. "℩ꭥ𐅀-𐆎𐆠𝈀-𝉅",
	capitalized = true,
}
-- Polytonic Greek: the "ἀ-῾" range prepended to the Greek character set, with
-- Grek as parent.
m["Polyt"] = {
	"Greek",
	m["Grek"][2],
	parent = "Grek",
	capitalized = m["Grek"].capitalized,
	characters = "ἀ-῾" .. m["Grek"].characters,
}
-- Gujarati abugida, with replacements for discouraged sequences.
m["Gujr"] = {
	"Gujarati",
	"abugida",
	characters = "ઁ-ઃઅ-ઍએ-ઑઓ-નપ-રલળવ-હ઼-ૅે-ૉો-્ૐૠ-ૣ૦-૱ૺ-૿",
	normalizationFixes = {
		from = {"ઓ", "અાૈ", "અા", "અૅ", "અે", "અૈ", "અૉ", "અો", "અૌ", "આૅ", "આૈ", "ૅા"},
		to = {"અાૅ", "ઔ", "આ", "ઍ", "એ", "ઐ", "ઑ", "ઓ", "ઔ", "ઓ", "ઔ", "ૉ"}
	},
}

-- Gurmukhi abugida, with replacements for discouraged sequences.
m["Guru"] = {
	"Gurmukhi",
	"abugida",
	characters = "ਁ-ਃਅ-ਊਏਐਓ-ਨਪ-ਰਲਲ਼ਵਸ਼ਸਹ਼ਾ-ੂੇੈੋ-੍ੑਖ਼-ੜਫ਼੦-੶",
	normalizationFixes = {
		from = {"ਅਾ", "ਅੈ", "ਅੌ", "ੲਿ", "ੲੀ", "ੲੇ", "ੳੁ", "ੳੂ", "ੳੋ"},
		to = {"ਆ", "ਐ", "ਔ", "ਇ", "ਈ", "ਏ", "ਉ", "ਊ", "ਓ"}
	},
}
-- Hangul, classed here as a syllabary.
m["Hang"] = {
	"Hangul",
	"syllabary",
	aliases = {"Hangeul"},
	characters = (
		"가-힣" .. -- Syllables
		"ᄀ-ᇿ" .. -- Jamo
		"ꥠ-ꥼ" .. -- Jamo Ext-A
		"ힰ-ퟻ" .. -- Jamo Ext-B
		"ㄱ-ㆎ" .. -- Compat Jamo
		-- The "Halfwidth" line held ordinary jamo (U+1160-U+1175), which the
		-- Jamo range above already covers, so no halfwidth form was listed.
		-- Replaced by the halfwidth Hangul range U+FFA0-U+FFDC, written with
		-- u() so width folding cannot collapse it again.
		-- NOTE(review): confirm the range against upstream.
		u(0xFFA0) .. "-" .. u(0xFFDC) -- Halfwidth
	),
}
-- Han logography. Hans and Hant reuse this entry's type, characters and
-- spaces setting.
m["Hani"] = {
	"Han",
	"logography",
	-- Four ranges below had lost their upper bounds (each ended in a bare "-"
	-- and so ran on into the next line's first character), and the CJK
	-- Symbols and Punctuation range started at what reads as an ordinary
	-- space. Each bound is restored from the Unicode block named in the
	-- line's own comment and written with u().
	-- NOTE(review): confirm the restored bounds against upstream.
	characters = (
		"一-鿿" ..
		"㐀-䶿" .. -- ExtA
		"𠀀-𪛟" .. -- ExtB
		"𪜀-" .. u(0x2EE5F) .. -- ExtC-F & I
		"𰀀-𲎯" .. -- ExtG-H
		"﨎﨏﨑﨓﨔﨟﨡﨣﨤﨧﨨﨩" ..
		"⼀-" .. u(0x2FDF) .. -- Kangxi Radicals
		"⺀-" .. u(0x2EFF) .. -- Radicals Supplement
		u(0x3000) .. "-〿" .. -- CJK Symbols and Punctuation
		"𖿢𖿣𖿰𖿱" .. -- Ideographic Symbols and Punctuation
		"㇀-" .. u(0x31EF) .. -- Strokes
		"㋿㍻-㍿" .. -- 組文字
		"㈠-㉇㊀-㊰㋀-㋋㍘-㍰㏠-㏾🈐-🈒🈔-🈻🉀-🉈🉐🉑🉠-🉥" ..
		-- Saved as bytes to stop normalization on save.
		"\239\164\128-\239\171\191" .. -- Compatibility Ideographs
		"\240\175\160\128-\240\175\168\159" -- Compatibility Ideographs Supplement
	),
	varieties = {"Hanzi", "Kanji", "Hanja", "Chu Nom"},
	spaces = false,
}
-- Simplified and Traditional Han: both take type, characters and the spaces
-- setting from m["Hani"], with Hani as parent.
m["Hans"] = {
	"Simplified Han",
	m["Hani"][2],
	parent = "Hani",
	spaces = m["Hani"].spaces,
	characters = m["Hani"].characters,
}

m["Hant"] = {
	"Traditional Han",
	m["Hani"][2],
	parent = "Hani",
	spaces = m["Hani"].spaces,
	characters = m["Hani"].characters,
}
-- Hanunoo abugida.
m["Hano"] = {
	"Hanunoo",
	"abugida",
	characters = "ᜠ-᜴",
}

-- Hatran: right-to-left abjad.
m["Hatr"] = {
	"Hatran",
	"abjad",
	direction = "rtl",
	characters = "𐣠-𐣿",
}

-- Hebrew: right-to-left abjad; both ranges are built from code points.
m["Hebr"] = {
	"Hebrew",
	"abjad", -- more precisely, impure abjad
	direction = "rtl",
	characters = u(0x0590) .. "-" .. u(0x05FF) .. u(0xFB1D) .. "-" .. u(0xFB4F),
}

-- Hiragana syllabary.
m["Hira"] = {
	"Hiragana",
	"syllabary",
	varieties = {"Hentaigana"},
	spaces = false,
	characters = "ぁ-ゟ𛀁-𛄞𛅐𛅑𛅒🈀",
}
-- Anatolian hieroglyphs.
m["Hluw"] = {
	"Anatolian Hieroglyphs",
	"logography, syllabary",
	wikipedia_article = "Anatolian hieroglyphs",
	characters = "𔐀-𔙆",
}

-- Pahawh Hmong semisyllabary.
m["Hmng"] = {
	"Pahawh Hmong",
	"semisyllabary",
	aliases = {"Hmong"},
	characters = "𖬀-𖮏",
}

-- Nyiakeng Puachue Hmong alphabet.
m["Hmnp"] = {
	"Nyiakeng Puachue Hmong",
	"alphabet",
	characters = "𞄀-𞅏",
}

-- Old Hungarian: cased, right-to-left alphabet.
m["Hung"] = {
	"Old Hungarian",
	"alphabet",
	aliases = {"Hungarian runic"},
	direction = "rtl",
	capitalized = true,
	characters = "𐲀-𐲲",
}

-- Iberian semisyllabary; no character set listed.
m["Ibrn"] = {
	"Iberian",
	"semisyllabary",
}
m["Imag"] = {
	-- To be used to avoid any formatting or link processing
	"Image-rendered",
	-- This should not have any characters listed
	character_category = false,
	translit = false,
}

-- Indus script; only names are given.
m["Inds"] = {
	"Indus",
	aliases = {"Harappan", "Indus Valley"},
}

-- International Phonetic Alphabet; only names are given.
m["Ipach"] = {
	"International Phonetic Alphabet",
	aliases = {"IPA"},
}

-- Old Italic alphabet.
m["Ital"] = {
	"Old Italic",
	"alphabet",
	characters = "𐌀-𐌯",
}

-- Javanese abugida.
m["Java"] = {
	"Javanese",
	"abugida",
	characters = "ꦀ-꧟",
}

-- Jurchen; no type or character set listed.
m["Jurc"] = {
	"Jurchen",
	spaces = false,
}

-- Kayah Li abugida.
m["Kali"] = {
	"Kayah Li",
	"abugida",
	characters = "꤀-꤯",
}
-- Katakana syllabary.
m["Kana"] = {
	"Katakana",
	"syllabary",
	-- The range after "㌀-㍗" read "ヲ-" followed by the combining mark
	-- U+309A, i.e. a range whose end precedes its start. It reads as the
	-- halfwidth katakana range U+FF66-U+FF9F after width folding; restored
	-- with u() so it cannot be folded again.
	-- NOTE(review): confirm the range against upstream.
	characters = "゠-ヿㇰ-ㇿ㌀-㍗" .. u(0xFF66) .. "-" .. u(0xFF9F) .. "𛀀𛅤𛅥𛅦𛅧",
	spaces = false,
}
m["Kawi"] = {
"Kawi",
"abugida",
characters = "𑼀-𑽙",
}
m["Khar"] = {
"Kharoshthi",
"abugida",
characters = "𐨀-𐩘",
direction = "rtl",
}
m["Khmr"] = {
"Khmer",
"abugida",
characters = "ក-៝០-៩៰-៹᧠-᧿",
spaces = false,
normalizationFixes = {
from = {"ឣ", "ឤ"},
to = {"អ", "អា"}
},
}
-- Khojki.
m["Khoj"] = {
	"Khojki",
	"abugida",
	-- The range runs to U+11241 so that it includes U+11240, which the last
	-- normalization rule below takes as input; the previous end point
	-- (U+1123E) left that letter outside the script's own character set.
	characters = "𑈀-" .. u(0x11241),
	-- from[i] is replaced by to[i]; longer sequences are listed before their
	-- prefixes.
	normalizationFixes = {
		from = {"𑈀𑈬𑈱", "𑈀𑈬", "𑈀𑈱", "𑈀𑈳", "𑈁𑈱", "𑈆𑈬", "𑈬𑈰", "𑈬𑈱", "𑉀𑈮"},
		to = {"𑈇", "𑈁", "𑈅", "𑈇", "𑈇", "𑈃", "𑈲", "𑈳", "𑈂"}
	},
}
m["Kitl"] = {
"Khitan Large",
"logography, syllabary",
spaces = false,
}
m["Kits"] = {
"Khitan Small",
"logography, syllabary",
characters = "𘬀-𘳕"..u(0x16FE4),
spaces = false,
}
m["Knda"] = {
"Kannada",
"abugida",
characters = "ಀ-ೲ",
normalizationFixes = {
from = {"ಉಾ", "ಋಾ", "ಒೌ"},
to = {"ಊ", "ೠ", "ಔ"}
},
}
m["Kpel"] = {
"Kpelle",
"syllabary",
-- Not in Unicode
}
-- Kaithi.
m["Kthi"] = {
	"Kaithi",
	"abugida",
	-- Both end points are escapes. The upper bound U+110CD (KAITHI NUMBER SIGN
	-- ABOVE) is an invisible format character that is easily dropped from a
	-- literal, which leaves a dangling "start-" with no range end.
	characters = u(0x11080) .. "-" .. u(0x110CD),
}
-- Tai Tham (Lanna), written without spaces between words.
m["Lana"] = {
	"Tai Tham",
	"abugida",
	aliases = {"Tham", "Tua Mueang", "Lanna"},
	-- Ranges: U+1A20-U+1A5E, U+1A60-U+1A7C, U+1A7F-U+1A89, U+1A90-U+1A99,
	-- U+1AA0-U+1AAD. The combining marks at the range boundaries are escapes:
	-- U+1A7C and U+1A7F sit next to each other and have different combining
	-- classes, so canonical normalization swaps them when they are literals,
	-- which silently moves the range end and pulls in unassigned code points.
	characters = "ᨠ-ᩞ" .. u(0x1A60) .. "-" .. u(0x1A7C) .. u(0x1A7F) .. "-᪉᪐-᪙᪠-᪭",
	spaces = false,
}
m["Laoo"] = {
"Lao",
"abugida",
characters = "ກຂຄຆ-ຊຌ-ຣລວ-ຽເ-ໄໆ່-໎໐-໙ໜ-ໟ",
spaces = false,
}
m["Latn"] = {
"Latin",
"alphabet",
aliases = {"Roman"},
characters = "A-Za-zªºÀ-ÖØ-öø-ɏḀ-ỿ",
varieties = {"Rumi", "Romaji", "Rōmaji", "Romaja"},
capitalized = true,
translit = false,
}
-- Fraktur: a child of "Latn" that copies the parent's script type, character
-- set, capitalization flag and transliteration flag.
do
	local latn = m["Latn"]
	m["Latf"] = {
		"Fraktur",
		latn[2],
		parent = "Latn",
		otherNames = {"Blackletter"}, -- Blackletter is actually the parent "script"
		characters = latn.characters,
		capitalized = latn.capitalized,
		translit = latn.translit,
	}
end
-- Gaelic type: a child of "Latn" that copies the parent's script type,
-- character set, capitalization flag and transliteration flag.
do
	local latn = m["Latn"]
	m["Latg"] = {
		"Gaelic",
		latn[2],
		parent = "Latn",
		otherNames = {"Irish"},
		characters = latn.characters,
		capitalized = latn.capitalized,
		translit = latn.translit,
	}
end
-- Extended Latin: everything in "Latn" plus the additional Latin-derived
-- letters, modifiers, letterlike symbols, ligatures and fullwidth forms.
m["Latnx"] = {
	"Latin",
	m["Latn"][2],
	-- Characters that do not survive text normalization are written as escapes:
	--   U+212A KELVIN SIGN / U+212B ANGSTROM SIGN canonically normalize to
	--     plain "K" / "Å", which "Latn" already contains;
	--   U+FB00-U+FB06 (Latin ligatures) and U+FF21-U+FF3A / U+FF41-U+FF5A
	--     (fullwidth letters) get folded to ASCII by compatibility or width
	--     normalization, leaving redundant ASCII ranges instead.
	-- As literals these had degraded to "KÅ" and "ff-stA-Za-z", so the
	-- intended code points were no longer part of the set.
	characters = m["Latn"].characters
		.. "ɐ-ʸˠ-ˤᴀ-ᴥᴬ-ᵜᵢ-ᵥᵫ-ᵷᵹ-ᶾⁱⁿₐ-ₜ"
		.. u(0x212A) .. u(0x212B)
		.. "ℲⅎⅠ-ↈⱠ-ⱿꜢ-ꞇꞋ-ꟊꟐꟑꟓꟕ-ꟙꟲ-ꟿꬰ-ꭚꭜ-ꭤꭦ-ꭩ"
		.. u(0xFB00) .. "-" .. u(0xFB06)
		.. u(0xFF21) .. "-" .. u(0xFF3A)
		.. u(0xFF41) .. "-" .. u(0xFF5A)
		.. "𐞀-𐞅𐞇-𐞰𐞲-𐞺𝼀-𝼞𝼥-𝼪",
	capitalized = m["Latn"].capitalized,
	translit = m["Latn"].translit,
	parent = "Latn",
}
-- "pjt-Latn": a child of "Latn" that copies the parent's script type,
-- character set, capitalization flag and transliteration flag.
do
	local latn = m["Latn"]
	m["pjt-Latn"] = {
		"Latin",
		latn[2],
		parent = "Latn",
		characters = latn.characters,
		capitalized = latn.capitalized,
		translit = latn.translit,
	}
end
m["Leke"] = {
"Leke",
"abugida",
}
m["Lepc"] = {
"Lepcha",
"abugida",
characters = "ᰀ-ᱏ",
}
m["Limb"] = {
"Limbu",
"abugida",
characters = "ᤀ-᥏",
}
m["Lina"] = {
"Linear A",
characters = "𐘀-𐝧",
}
m["Linb"] = {
"Linear B",
characters = "𐀀-𐃺",
}
m["Lisu"] = {
"Lisu",
"alphabet",
aliases = {"Fraser"},
characters = "ꓐ-꓿𑾰",
normalizationFixes = {
from = {"['’]", "[.ꓸ][.ꓸ]", "[.ꓸ][,ꓹ]"},
to = {"ʼ", "ꓺ", "ꓻ"}
},
}
m["Loma"] = {
"Loma",
"syllabary",
-- Not in Unicode
}
m["Lyci"] = {
"Lycian",
"alphabet",
characters = "𐊀-𐊜",
}
m["Lydi"] = {
"Lydian",
"alphabet",
characters = "𐤠-𐤿",
direction = "rtl",
}
m["Mahj"] = {
"Mahajani",
"abugida",
characters = "𑅐-𑅶",
}
m["Maka"] = {
"Lontara",
"abugida",
aliases = {"Makasar"},
characters = "𑻠-𑻸",
}
m["Mand"] = {
"Mandaic",
aliases = {"Mandaean"},
characters = "ࡀ-࡞",
direction = "rtl",
}
m["Mani"] = {
"Manichaean",
"abjad",
characters = "𐫀-𐫶",
direction = "rtl",
}
m["Marc"] = {
"Marchen",
"abugida",
characters = "𑱰-𑲶",
}
m["Maya"] = {
"Maya",
aliases = {"Maya hieroglyphic", "Mayan", "Mayan hieroglyphic"},
characters = "𝋠-𝋳",
}
m["Medf"] = {
"Medefaidrin",
aliases = {"Oberi Okaime", "Oberi Ɔkaimɛ"},
characters = "𖹀-𖺚",
capitalized = true,
}
m["Mend"] = {
"Mende",
aliases = {"Mende Kikakui"},
characters = "𞠀-𞣖",
direction = "rtl",
}
m["Merc"] = {
"Meroitic cursive",
"abugida",
characters = "𐦠-𐦿",
direction = "rtl",
}
m["Mero"] = {
"Meroitic hieroglyphic",
"abugida",
characters = "𐦀-𐦟",
direction = "rtl",
}
-- Malayalam.
do
	-- ZERO WIDTH JOINER. The legacy chillu spelling is consonant + virama + ZWJ;
	-- the joiner is invisible and is routinely stripped from literals, so it is
	-- appended explicitly. Without it these rules would rewrite every plain
	-- consonant + virama into a chillu, and the "ന്റ" rule would undo the output
	-- of the final rule in the table.
	local zwj = u(0x200D)
	m["Mlym"] = {
		"Malayalam",
		"abugida",
		characters = "ഀ-ൿ",
		-- from[i] is replaced by to[i]; longer sequences are listed before
		-- their prefixes.
		normalizationFixes = {
			from = {
				"ഇൗ", "ഉൗ", "എെ", "ഒാ", "ഒൗ",
				"ക്" .. zwj, "ണ്" .. zwj, "ന്" .. zwj .. "റ", "ന്" .. zwj,
				"മ്" .. zwj, "യ്" .. zwj, "ര്" .. zwj, "ല്" .. zwj,
				"ള്" .. zwj, "ഴ്" .. zwj,
				"െെ", "ൻ്റ",
			},
			to = {"ഈ", "ഊ", "ഐ", "ഓ", "ഔ", "ൿ", "ൺ", "ൻറ", "ൻ", "ൔ", "ൕ", "ർ", "ൽ", "ൾ", "ൖ", "ൈ", "ന്റ"}
		},
	}
end
m["Modi"] = {
"Modi",
"abugida",
characters = "𑘀-𑙙",
normalizationFixes = {
from = {"𑘀𑘹", "𑘀𑘺", "𑘁𑘹", "𑘁𑘺"},
to = {"𑘊", "𑘋", "𑘌", "𑘍"}
},
}
m["Mong"] = {
"Mongolian",
"alphabet",
aliases = {"Mongol bichig", "Hudum Mongol bichig"},
characters = "᠀-᠅᠊-᠙ᠠ-ᡂᡸᢀ-ᢗᢦᢩ 𑙠-𑙨",
direction = "down",
}
m["mnc-Mong"] = {
"Manchu",
m["Mong"][2],
characters = "᠁᠄᠈-᠏ᠠᠣᠨ-ᠪᠮ-ᠰᠴ-ᠸᠺᡝᡟ-ᡡᡤ-ᡩᡬ-ᡱᡳ-ᡷᢀ-ᢈᢏᢚ-ᢥᢨᢪ ",
direction = "down",
parent = "Mong",
}
m["sjo-Mong"] = {
"Xibe",
m["Mong"][2],
aliases = {"Sibe"},
characters = "᠄᠇᠊-᠏ᠠᠣᠨᠪᠮ-ᠰᠴ-ᠸᠺᡝ-ᡲ ",
direction = "down",
parent = "mnc-Mong",
}
m["xwo-Mong"] = {
"Clear Script",
m["Mong"][2],
aliases = {"Todo", "Todo bichig"},
characters = "᠀᠁᠄-᠆᠊-ᠠᠨᠯ-ᠱᠴᠷᠸᠺᠻᡀᡃ-ᡜᢀ-ᢇᢉ-ᢏᢔᢖ-ᢙᢧ 𑙩-𑙬",
direction = "down",
parent = "Mong",
}
m["Moon"] = {
"Moon",
"alphabet",
aliases = {"Moon System of Embossed Reading", "Moon type", "Moon writing", "Moon alphabet", "Moon code"},
-- Not in Unicode
}
m["Morse"] = {
"Morse code",
}
m["Mroo"] = {
"Mro",
characters = "𖩀-𖩯",
}
m["Mtei"] = {
"Meitei Mayek",
"abugida",
aliases = {"Meetei Mayek", "Manipuri"},
characters = "ꯀ-꯹ꫠ-꫶",
}
m["Mult"] = {
"Multani",
"abugida",
characters = "𑊀-𑊩",
}
m["Music"] = {
"Musical notation",
"pictography",
characters = "𝄀-𝇨",
translit = false,
}
m["Mymr"] = {
"Burmese",
"abugida",
aliases = {"Myanmar"},
characters = "က-႟ꩠ-ꩿꧠ-ꧾ",
spaces = false,
}
m["Nagm"] = {
"Nag Mundari",
"alphabet",
characters = "𞓐-𞓹",
}
m["Nand"] = {
"Nandinagari",
"abugida",
characters = "𑦠-𑧤",
}
m["Narb"] = {
"Old North Arabian",
"abjad",
characters = "𐪀-𐪟",
direction = "rtl",
}
m["Nbat"] = {
"Nabataean",
"abjad",
aliases = {"Nabatean"},
characters = "𐢀-𐢯",
direction = "rtl",
}
m["Newa"] = {
"Newa",
"abugida",
aliases = {"Newar", "Newari", "Prachalit Nepal"},
characters = "𑐀-𑑡",
}
m["Nkdb"] = {
"Dongba",
"pictography",
aliases = {"Naxi Dongba", "Nakhi Dongba", "Tomba", "Tompa", "Mo-so"},
spaces = false,
-- Not in Unicode
}
m["Nkgb"] = {
"Geba",
"syllabary",
aliases = {"Nakhi Geba", "Naxi Geba"},
spaces = false,
-- Not in Unicode
}
m["Nkoo"] = {
"N'Ko",
"alphabet",
characters = "߀-߿",
direction = "rtl",
}
m["None"] = {
"Unspecified", -- renders as 'unspecified script'
-- This should not have any characters listed
translit = false,
character_category = false,
}
m["Nshu"] = {
"Nüshu",
"syllabary",
aliases = {"Nushu"},
characters = "𖿡𛅰-𛋻",
spaces = false,
}
-- Ogham.
m["Ogam"] = {
	"Ogham",
	-- The range starts at U+1680 OGHAM SPACE MARK, a whitespace character.
	-- It is written as an escape because a literal is indistinguishable from an
	-- ordinary space and, if whitespace is ever normalized, the range would
	-- begin at U+0020 and swallow most other scripts.
	characters = u(0x1680) .. "-᚜",
}
m["Olck"] = {
"Ol Chiki",
characters = "᱐-᱿",
}
m["Orkh"] = {
"Orkhon runes",
aliases = {"Old Turkic"},
characters = "𐰀-𐱈",
direction = "rtl",
}
m["Orya"] = {
"Oriya",
"abugida",
aliases = {"Odia"},
characters = "ଁ-୷",
normalizationFixes = {
from = {"ଅା", "ଏୗ", "ଓୗ"},
to = {"ଆ", "ଐ", "ଔ"}
},
}
m["Osge"] = {
"Osage",
characters = "𐒰-𐓻",
capitalized = true,
}
m["Osma"] = {
"Osmanya",
characters = "𐒀-𐒩",
}
m["Ougr"] = {
"Old Uyghur",
"abjad, alphabet",
characters = "𐽰-𐾉",
direction = "down",
}
m["Palm"] = {
"Palmyrene",
characters = "𐡠-𐡿",
direction = "rtl",
}
m["Pauc"] = {
"Pau Cin Hau",
characters = "𑫀-𑫸",
}
m["Perm"] = {
"Old Permic",
characters = "𐍐-𐍺",
}
m["Phag"] = {
"Phags-pa",
"abugida",
characters = "᠂᠃᠅ 。ꡀ-꡷",
direction = "down",
}
m["Phli"] = {
"Inscriptional Pahlavi",
"abjad",
characters = "𐭠-𐭿",
direction = "rtl",
}
m["Phlp"] = {
"Psalter Pahlavi",
"abjad",
characters = "𐮀-𐮯",
direction = "rtl",
}
m["Phlv"] = {
"Book Pahlavi",
"abjad",
direction = "rtl",
-- Not in Unicode
}
m["Phnx"] = {
"Phoenician",
"abjad",
characters = "𐤀-𐤟",
direction = "rtl",
}
m["Plrd"] = {
"Pollard",
"abugida",
aliases = {"Miao"},
characters = "𖼀-𖾟",
}
m["Prti"] = {
"Inscriptional Parthian",
characters = "𐭀-𐭟",
direction = "rtl",
}
m["Ranj"] = {
"Ranjana",
"abugida",
-- Not in Unicode
}
m["Rjng"] = {
"Rejang",
"abugida",
characters = "ꤰ-꥟",
}
m["Rohg"] = {
"Hanifi Rohingya",
"alphabet",
characters = "𐴀-𐴹",
direction = "rtl",
}
m["Roro"] = {
"Rongorongo",
-- Not in Unicode
}
m["Rumin"] = {
"Rumi numerals",
characters = "𐹠-𐹾",
character_category = "Rumi numerals",
}
m["Runr"] = {
"Runic",
"alphabet",
characters = "ᚠ-ᛰ",
}
m["Samr"] = {
"Samaritan",
"abjad",
characters = "ࠀ-࠾",
direction = "rtl",
}
m["Sarb"] = {
"Old South Arabian",
"abjad",
characters = "𐩠-𐩿",
direction = "rtl",
}
m["Saur"] = {
"Saurashtra",
"abugida",
characters = "ꢀ-꣙",
}
m["Semap"] = {
"flag semaphore",
"pictography",
}
m["Sgnw"] = {
"SignWriting",
"pictography",
characters = "𝠀-𝪯",
translit = false,
}
m["Shaw"] = {
"Shavian",
characters = "𐑐-𐑿",
}
m["Shrd"] = {
"Sharada",
"abugida",
characters = "𑆀-𑇙",
}
m["Shui"] = {
"Sui",
"logography",
spaces = false,
-- Not in Unicode
}
m["Sidd"] = {
"Siddham",
"abugida",
characters = "𑖀-𑗝",
}
m["Sind"] = {
"Khudawadi",
"abugida",
characters = "𑊰-𑋹",
normalizationFixes = {
from = {"𑊰𑋠", "𑊰𑋥", "𑊰𑋦", "𑊰𑋧", "𑊰𑋨"},
to = {"𑊱", "𑊶", "𑊷", "𑊸", "𑊹"}
},
}
m["Sinh"] = {
"Sinhalese",
"abugida",
aliases = {"Sinhala"},
characters = "ං-෴",
normalizationFixes = {
from = {"අා", "අැ", "අෑ", "උෟ", "ඍෘ", "ඏෟ", "එ්", "එෙ", "ඔෟ", "ෘෘ"},
to = {"ආ", "ඇ", "ඈ", "ඌ", "ඎ", "ඐ", "ඒ", "ඓ", "ඖ", "ෲ"}
},
}
m["Sogd"] = {
"Sogdian",
"abjad",
characters = "𐼰-𐽙",
direction = "rtl",
}
m["Sogo"] = {
"Old Sogdian",
"abjad",
characters = "𐼀-𐼧",
direction = "rtl",
}
m["Sora"] = {
"Sorang Sompeng",
aliases = {"Sora Sompeng"},
characters = "𑃐-𑃹",
}
m["Soyo"] = {
"Soyombo",
"abugida",
characters = "𑩐-𑪢",
}
m["Sund"] = {
"Sundanese",
"abugida",
characters = "ᮀ-ᮿ",
}
m["Sylo"] = {
"Syloti Nagri",
"abugida",
aliases = {"Sylheti Nagari"},
characters = "ꠀ-꠫",
}
m["Syrc"] = {
"Syriac",
"abjad", -- more precisely, impure abjad
characters = "܀-ݏ"..u(0x0860).."-"..u(0x086A),
direction = "rtl",
}
-- Syre, Syrj, Syrn are apparently subsumed into Syrc; discuss if this causes issues
m["Tagb"] = {
"Tagbanwa",
"abugida",
characters = "ᝠ-ᝳ",
}
m["Takr"] = {
"Takri",
"abugida",
characters = "𑚀-𑛉",
normalizationFixes = {
from = {"𑚀𑚭", "𑚀𑚴", "𑚀𑚵", "𑚆𑚲"},
to = {"𑚁", "𑚈", "𑚉", "𑚇"}
},
}
m["Tale"] = {
"Tai Nüa",
"abugida",
aliases = {"Tai Nuea", "New Tai Nüa", "New Tai Nuea", "Dehong Dai", "Tai Dehong", "Tai Le"},
characters = "ᥐ-ᥭᥰ-ᥴ",
spaces = false,
}
m["Talu"] = {
"New Tai Lue",
"abugida",
characters = "ᦀ-ᦫᦰ-ᧉ᧐-᧚᧞᧟",
spaces = false,
}
m["Taml"] = {
"Tamil",
"abugida",
characters = "ஂ-௺𑿀-𑿿",
normalizationFixes = {
from = {"அூ", "ஸ்ரீ"},
to = {"ஆ", "ஶ்ரீ"}
},
}
m["Tang"] = {
"Tangut",
"logography, syllabary",
characters = "𖿠𗀀-𘫿𘴀-𘴈",
spaces = false,
}
m["Tavt"] = {
"Tai Viet",
"abugida",
characters = "ꪀ-ꫂꫛ-꫟",
spaces = false,
}
m["Telu"] = {
"Telugu",
"abugida",
characters = "ఀ-౿",
normalizationFixes = {
from = {"ఒౌ", "ఒౕ", "ిౕ", "ెౕ", "ొౕ"},
to = {"ఔ", "ఓ", "ీ", "ే", "ో"}
},
}
m["Teng"] = {
"Tengwar",
}
m["Tfng"] = {
"Tifinagh",
"abjad, alphabet",
characters = "ⴰ-⵿",
otherNames = {"Libyco-Berber", "Berber"}, -- per Wikipedia, Libyco-Berber is the parent
}
m["Tglg"] = {
"Baybayin",
"abugida",
aliases = {"Tagalog"},
characters = "ᜀ-᜔",
}
m["Thaa"] = {
"Thaana",
"abugida",
characters = "ހ-ޱ",
direction = "rtl",
}
m["Thai"] = {
"Thai",
"abugida",
characters = "ก-ฺเ-๛",
spaces = false,
}
m["Tibt"] = {
"Tibetan",
"abugida",
characters = "ༀ-࿚",
normalizationFixes = {
combiningClasses = {["༹"] = 1},
from = {"ཷ", "ཹ"},
to = {"ྲཱྀ", "ླཱྀ"}
},
}
-- Tamyig: a child of "Tibt" that reuses the parent's script type, character
-- set and normalization table (the same table object, not a copy).
do
	local tibt = m["Tibt"]
	m["sit-tam-Tibt"] = {
		"Tamyig",
		tibt[2],
		parent = "Tibt",
		characters = tibt.characters,
		normalizationFixes = tibt.normalizationFixes,
	}
end
-- Zhang-Zhung: a child of "Tibt" that reuses the parent's script type,
-- character set and normalization table (the same table object, not a copy).
do
	local tibt = m["Tibt"]
	m["xzh-Tibt"] = {
		"Zhang-Zhung",
		tibt[2],
		parent = "Tibt",
		characters = tibt.characters,
		normalizationFixes = tibt.normalizationFixes,
	}
end
m["Tirh"] = {
"Tirhuta",
"abugida",
characters = "𑒀-𑓙",
normalizationFixes = {
from = {"𑒁𑒰", "𑒋𑒺", "𑒍𑒺", "𑒪𑒵", "𑒪𑒶"},
to = {"𑒂", "𑒌", "𑒎", "𑒉", "𑒊"}
},
}
m["Tnsa"] = {
"Tangsa",
"alphabet",
characters = "𖩰-𖫉",
}
m["Toto"] = {
"Toto",
"abugida",
characters = "𞊐-𞊮",
}
m["Ugar"] = {
"Ugaritic",
"abjad",
characters = "𐎀-𐎟",
}
m["Vaii"] = {
"Vai",
"syllabary",
characters = "ꔀ-ꘫ",
}
m["Visp"] = {
"Visible Speech",
"alphabet",
-- Not in Unicode
}
m["Vith"] = {
"Vithkuqi",
"alphabet",
characters = "𐕰-𐖼",
capitalized = true,
}
m["Wara"] = {
"Varang Kshiti",
aliases = {"Warang Citi"},
characters = "𑢠-𑣿",
capitalized = true,
}
m["Wcho"] = {
"Wancho",
"alphabet",
characters = "𞋀-𞋿",
}
m["Wole"] = {
"Woleai",
"syllabary",
-- Not in Unicode
}
m["Xpeo"] = {
"Old Persian",
characters = "𐎠-𐏕",
}
m["Xsux"] = {
"Cuneiform",
aliases = {"Sumero-Akkadian Cuneiform"},
characters = "𒀀-𒎙𒐀-𒑳",
}
m["Yezi"] = {
"Yezidi",
"alphabet",
characters = "𐺀-𐺱",
direction = "rtl",
}
m["Yiii"] = {
"Yi",
"syllabary",
characters = "ꀀ-꓆",
}
-- Zanabazar Square. The character set is the single range U+11A00-U+11A47,
-- built from code point escapes.
m["Zanb"] = {
	"Zanabazar Square",
	characters = table.concat{u(0x11A00), "-", u(0x11A47)},
}
m["Zmth"] = {
"mathematical notation",
characters = "ℵ∀-⋿⟀-⟯⦀-⫿𝐀-𝟿",
translit = false,
character_category = "Mathematical notation symbols", -- ?
}
m["Zsym"] = {
"symbol",
"pictography",
characters = "─-➿←-⇿⌀-⏿⬀-⯾🀀-🃵🌀-🩭",
translit = false,
character_category = false, -- none
}
m["Zyyy"] = {
"undetermined",
-- This should not have any characters listed, probably
translit = false,
character_category = false, -- none
}
m["Zzzz"] = {
"uncoded",
-- This should not have any characters listed
translit = false,
character_category = false, -- none
}
-- These should be defined after the scripts they are composed of.
-- Combined kana: the character set is the Hiragana set followed by the
-- Katakana set, so both of those entries must already exist at this point.
do
	local hiragana = m["Hira"].characters
	local katakana = m["Kana"].characters
	m["Hrkt"] = { -- TODO: add hentaigana
		"Kana",
		"syllabary",
		aliases = {"Japanese syllabaries"},
		spaces = false,
		characters = hiragana .. katakana,
	}
end
-- Japanese: the character set is the concatenation of the "Hrkt", "Hani" and
-- "Latnx" sets (in that order), so those entries must already exist here.
do
	local kana = m["Hrkt"].characters
	local han = m["Hani"].characters
	local latin = m["Latnx"].characters
	m["Jpan"] = {
		"Japanese",
		"logography, syllabary",
		spaces = false,
		sort_by_scraping = true,
		characters = kana .. han .. latin,
	}
end
-- Korean: the character set is the "Hang" set followed by the "Hani" set, so
-- both of those entries must already exist at this point.
do
	local hangul = m["Hang"].characters
	local han = m["Hani"].characters
	m["Kore"] = {
		"Korean",
		"logography, syllabary",
		characters = hangul .. han,
	}
end
return m