Module:scripts/data: Difference between revisions

From Linguifex
Jump to navigation Jump to search
No edit summary
No edit summary
 
(19 intermediate revisions by 3 users not shown)
Line 1: Line 1:
--[=[
--[=[
    This is imported from Wiktionary - it'll be updated for this wiki - the data is left currently as examples.
When adding new scripts to this file, please don't forget to add
When adding new scripts to this file, please don't forget to add
style definitons for the script in [[MediaWiki:Common.css]].
style definitons for the script in [[MediaWiki:Gadget-LanguagesAndScripts.css]].
]=]
]=]
local concat = table.concat
local concat = table.concat
local insert = table.insert
local insert = table.insert
Line 13: Line 10:
local select = select
local select = select
local sort = table.sort
local sort = table.sort
local u = require("Module:string utilities").char
 
-- Loaded on demand, as it may not be needed (depending on the data).
local function u(...)
u = require("Module:string/char")
return u(...)
end
 
-- We can't use mw.loadData() on [[Module:languages/chars]] because [[Module:languages/data]] itself is sometimes loaded
-- using mw.loadData(), and calling mw.loadData() on [[Module:languages/chars]] will insert metatables into the
-- character tables, which the second mw.loadData() will choke on.
local m_chars = require("Module:languages/chars")
 
local c = m_chars.chars
local p = m_chars.puaChars
local cs = m_chars.chars_substitutions


------------------------------------------------------------------------------------
------------------------------------------------------------------------------------
Line 91: Line 102:


local m = {}
local m = {}
--Constructed languages
m["Ayer"] = {
"Tahano Hikamu",
"abugida",
characters = "A-Za-z*ñÑʔəƏꜷꜶ¯ˀ¨ʰʲː[]&+0-9¹²",
character_category = false,
}
m["Roka"] = {
"Rokadong Curakjang",
"abugida",
characters = "A-Za-z*[]{}'\"0-9",
character_category = false,
}
--Natural languages


m["Adlm"] = process_ranges{
m["Adlm"] = process_ranges{
"Adlam",
"Adlam",
19606346,
"alphabet",
"alphabet",
ranges = {
ranges = {
Line 126: Line 120:
m["Afak"] = {
m["Afak"] = {
"Afaka",
"Afaka",
382019,
"syllabary",
"syllabary",
-- Not in Unicode
-- Not in Unicode
Line 132: Line 127:
m["Aghb"] = process_ranges{
m["Aghb"] = process_ranges{
"Caucasian Albanian",
"Caucasian Albanian",
2495716,
"alphabet",
"alphabet",
ranges = {
ranges = {
Line 141: Line 137:
m["Ahom"] = process_ranges{
m["Ahom"] = process_ranges{
"Ahom",
"Ahom",
2839633,
"abugida",
"abugida",
ranges = {
ranges = {
Line 151: Line 148:
m["Arab"] = process_ranges{
m["Arab"] = process_ranges{
"Arabic",
"Arabic",
"abjad", -- more precisely, impure abjad
1828555,
"abjad", -- more precisely, impure abjad
varieties = {"Jawi", {"Nastaliq", "Nastaleeq"}},
varieties = {"Jawi", {"Nastaliq", "Nastaleeq"}},
ranges = {
ranges = {
Line 158: Line 156:
0x0870, 0x088E,
0x0870, 0x088E,
0x0890, 0x0891,
0x0890, 0x0891,
0x0898, 0x08E1,
0x0897, 0x08E1,
0x08E3, 0x08FF,
0x08E3, 0x08FF,
0xFB50, 0xFBC2,
0xFB50, 0xFBC2,
Line 169: Line 167:
0x102E0, 0x102FB,
0x102E0, 0x102FB,
0x10E60, 0x10E7E,
0x10E60, 0x10E7E,
0x10EFD, 0x10EFF,
0x10EC2, 0x10EC4,
0x10EFC, 0x10EFF,
0x1EE00, 0x1EE03,
0x1EE00, 0x1EE03,
0x1EE05, 0x1EE1F,
0x1EE05, 0x1EE1F,
Line 214: Line 213:
m["fa-Arab"] = {
m["fa-Arab"] = {
"Arabic",
"Arabic",
m["Arab"][2],
744068,
m["Arab"][3],
ranges = m["Arab"].ranges,
ranges = m["Arab"].ranges,
characters = m["Arab"].characters,
characters = m["Arab"].characters,
otherNames = {"Perso-Arabic"},
other_names = {"Perso-Arabic"},
direction = "rtl",
direction = "rtl",
parent = "Arab",
parent = "Arab",
Line 225: Line 225:
m["kk-Arab"] = {
m["kk-Arab"] = {
"Arabic",
"Arabic",
m["Arab"][2],
90681452,
m["Arab"][3],
ranges = m["Arab"].ranges,
ranges = m["Arab"].ranges,
characters = m["Arab"].characters,
characters = m["Arab"].characters,
Line 241: Line 242:
m["pa-Arab"] = {
m["pa-Arab"] = {
"Shahmukhi",
"Shahmukhi",
m["Arab"][2],
133800,
m["Arab"][3],
ranges = m["Arab"].ranges,
ranges = m["Arab"].ranges,
characters = m["Arab"].characters,
characters = m["Arab"].characters,
otherNames = {"Arabic"},
other_names = {"Arabic"},
direction = "rtl",
direction = "rtl",
parent = "Arab",
parent = "Arab",
Line 260: Line 262:
m["Armi"] = process_ranges{
m["Armi"] = process_ranges{
"Imperial Aramaic",
"Imperial Aramaic",
26978,
"abjad",
"abjad",
ranges = {
ranges = {
Line 270: Line 273:
m["Armn"] = process_ranges{
m["Armn"] = process_ranges{
"Armenian",
"Armenian",
11932,
"alphabet",
"alphabet",
ranges = {
ranges = {
Line 278: Line 282:
},
},
capitalized = true,
capitalized = true,
translit = "Armn-translit",
}
}


m["Avst"] = process_ranges{
m["Avst"] = process_ranges{
"Avestan",
"Avestan",
790681,
"alphabet",
"alphabet",
ranges = {
ranges = {
Line 292: Line 298:
m["pal-Avst"] = {
m["pal-Avst"] = {
"Pazend",
"Pazend",
m["Avst"][2],
4925073,
m["Avst"][3],
ranges = m["Avst"].ranges,
ranges = m["Avst"].ranges,
characters = m["Avst"].characters,
characters = m["Avst"].characters,
Line 301: Line 308:
m["Bali"] = process_ranges{
m["Bali"] = process_ranges{
"Balinese",
"Balinese",
804984,
"abugida",
"abugida",
ranges = {
ranges = {
0x1B00, 0x1B4C,
0x1B00, 0x1B4C,
0x1B50, 0x1B7E,
0x1B4E, 0x1B7F,
},
},
}
}
Line 310: Line 318:
m["Bamu"] = process_ranges{
m["Bamu"] = process_ranges{
"Bamum",
"Bamum",
806024,
"syllabary",
"syllabary",
ranges = {
ranges = {
Line 319: Line 328:
m["Bass"] = process_ranges{
m["Bass"] = process_ranges{
"Bassa",
"Bassa",
810458,
"alphabet",
"alphabet",
aliases = {"Bassa Vah", "Vah"},
aliases = {"Bassa Vah", "Vah"},
Line 329: Line 339:
m["Batk"] = process_ranges{
m["Batk"] = process_ranges{
"Batak",
"Batak",
51592,
"abugida",
"abugida",
ranges = {
ranges = {
Line 338: Line 349:
m["Beng"] = process_ranges{
m["Beng"] = process_ranges{
"Bengali",
"Bengali",
756802,
"abugida",
"abugida",
ranges = {
ranges = {
Line 376: Line 388:
m["as-Beng"] = process_ranges{
m["as-Beng"] = process_ranges{
"Assamese",
"Assamese",
m["Beng"][2],
191272,
otherNames = {"Bengali-Assamese", "Eastern Nagari"},
m["Beng"][3],
other_names = {"Eastern Nagari"},
ranges = {
ranges = {
0x0951, 0x0952,
0x0951, 0x0952,
Line 411: Line 424:
m["Bhks"] = process_ranges{
m["Bhks"] = process_ranges{
"Bhaiksuki",
"Bhaiksuki",
17017839,
"abugida",
"abugida",
ranges = {
ranges = {
Line 421: Line 435:


m["Blis"] = {
m["Blis"] = {
"Blissymbols",
"Blissymbolic",
609817,
"logography",
"logography",
aliases = {"Blissymbolics"},
aliases = {"Blissymbols"},
-- Not in Unicode
-- Not in Unicode
}
}
Line 429: Line 444:
m["Bopo"] = process_ranges{
m["Bopo"] = process_ranges{
"Zhuyin",
"Zhuyin",
198269,
"semisyllabary",
"semisyllabary",
aliases = {"Zhuyin Fuhao", "Bopomofo"},
aliases = {"Zhuyin Fuhao", "Bopomofo"},
Line 449: Line 465:
m["Brah"] = process_ranges{
m["Brah"] = process_ranges{
"Brahmi",
"Brahmi",
185083,
"abugida",
"abugida",
ranges = {
ranges = {
Line 459: Line 476:
to = {"𑀆", "𑀌", "𑀐"}
to = {"𑀆", "𑀌", "𑀐"}
},
},
translit = "Brah-translit",
}
}


m["Brai"] = process_ranges{
m["Brai"] = process_ranges{
"Braille",
"Braille",
79894,
"alphabet",
"alphabet",
ranges = {
ranges = {
Line 471: Line 490:
m["Bugi"] = process_ranges{
m["Bugi"] = process_ranges{
"Lontara",
"Lontara",
1074947,
"abugida",
"abugida",
aliases = {"Buginese"},
aliases = {"Buginese"},
Line 482: Line 502:
m["Buhd"] = process_ranges{
m["Buhd"] = process_ranges{
"Buhid",
"Buhid",
1002969,
"abugida",
"abugida",
ranges = {
ranges = {
Line 492: Line 513:
m["Cakm"] = process_ranges{
m["Cakm"] = process_ranges{
"Chakma",
"Chakma",
1059328,
"abugida",
"abugida",
ranges = {
ranges = {
Line 502: Line 524:


m["Cans"] = process_ranges{
m["Cans"] = process_ranges{
"Canadian syllabics",
"Canadian syllabic",
2479183,
"abugida",
"abugida",
ranges = {
ranges = {
Line 513: Line 536:
m["Cari"] = process_ranges{
m["Cari"] = process_ranges{
"Carian",
"Carian",
1094567,
"alphabet",
"alphabet",
ranges = {
ranges = {
Line 521: Line 545:
m["Cham"] = process_ranges{
m["Cham"] = process_ranges{
"Cham",
"Cham",
1060381,
"abugida",
"abugida",
ranges = {
ranges = {
Line 532: Line 557:
m["Cher"] = process_ranges{
m["Cher"] = process_ranges{
"Cherokee",
"Cherokee",
26549,
"syllabary",
"syllabary",
ranges = {
ranges = {
Line 542: Line 568:
m["Chis"] = {
m["Chis"] = {
"Chisoi",
"Chisoi",
123173777,
"abugida",
"abugida",
-- Not in Unicode
-- Not in Unicode
Line 547: Line 574:


m["Chrs"] = process_ranges{
m["Chrs"] = process_ranges{
"Chorasmian",
"Khwarezmian",
72386710,
"abjad",
"abjad",
aliases = {"Chorasmian"},
ranges = {
ranges = {
0x10FB0, 0x10FCB,
0x10FB0, 0x10FCB,
Line 557: Line 586:
m["Copt"] = process_ranges{
m["Copt"] = process_ranges{
"Coptic",
"Coptic",
321083,
"alphabet",
"alphabet",
ranges = {
ranges = {
Line 569: Line 599:
m["Cpmn"] = process_ranges{
m["Cpmn"] = process_ranges{
"Cypro-Minoan",
"Cypro-Minoan",
1751985,
"syllabary",
"syllabary",
aliases = {"Cypro Minoan"},
aliases = {"Cypro Minoan"},
Line 579: Line 610:
m["Cprt"] = process_ranges{
m["Cprt"] = process_ranges{
"Cypriot",
"Cypriot",
1757689,
"syllabary",
"syllabary",
ranges = {
ranges = {
Line 596: Line 628:
m["Cyrl"] = process_ranges{
m["Cyrl"] = process_ranges{
"Cyrillic",
"Cyrillic",
8209,
"alphabet",
"alphabet",
ranges = {
ranges = {
0x0400, 0x052F,
0x0400, 0x052F,
0x1C80, 0x1C88,
0x1C80, 0x1C8A,
0x1D2B, 0x1D2B,
0x1D2B, 0x1D2B,
0x1D78, 0x1D78,
0x1D78, 0x1D78,
Line 615: Line 648:
m["Cyrs"] = {
m["Cyrs"] = {
"Old Cyrillic",
"Old Cyrillic",
m["Cyrl"][2],
442244,
m["Cyrl"][3],
aliases = {"Early Cyrillic"},
aliases = {"Early Cyrillic"},
ranges = m["Cyrl"].ranges,
ranges = m["Cyrl"].ranges,
Line 625: Line 659:
to = {"Ꙋ", "ꙋ"}
to = {"Ꙋ", "ꙋ"}
},
},
strip_diacritics = {remove_diacritics = cs.Cyrs_remove_diacritics},
sort_key = {
remove_diacritics = cs.Cyrs_remove_diacritics,
from = {
"ї", "оу", -- 2 chars
"[ґꙣєѕꙃꙅꙁіꙇђꙉѻꙩꙫꙭꙮꚙꚛꙋѡѿꙍѽꙑѣꙗѥꙕѧꙙѩꙝꙛѫѭѯѱѳѵҁ]"
},
to = {
"и" .. p[1], "у", {
["ґ"] = "г" .. p[1], ["ꙣ"] = "д" .. p[1], ["є"] = "е", ["ѕ"] = "ж" .. p[1], ["ꙃ"] = "ж" .. p[1],
["ꙅ"] = "ж" .. p[1], ["ꙁ"] = "з", ["і"] = "и" .. p[1], ["ꙇ"] = "и" .. p[1], ["ђ"] = "и" .. p[2],
["ꙉ"] = "и" .. p[2], ["ѻ"] = "о", ["ꙩ"] = "о", ["ꙫ"] = "о", ["ꙭ"] = "о",
["ꙮ"] = "о", ["ꚙ"] = "о", ["ꚛ"] = "о", ["ꙋ"] = "у", ["ѡ"] = "х" .. p[1],
["ѿ"] = "х" .. p[1], ["ꙍ"] = "х" .. p[1], ["ѽ"] = "х" .. p[1], ["ꙑ"] = "ы", ["ѣ"] = "ь" .. p[1],
["ꙗ"] = "ь" .. p[2], ["ѥ"] = "ь" .. p[3], ["ꙕ"] = "ю", ["ѧ"] = "я", ["ꙙ"] = "я",
["ѩ"] = "я" .. p[1], ["ꙝ"] = "я" .. p[1], ["ꙛ"] = "я" .. p[2], ["ѫ"] = "я" .. p[3], ["ѭ"] = "я" .. p[4],
["ѯ"] = "я" .. p[5], ["ѱ"] = "я" .. p[6], ["ѳ"] = "я" .. p[7], ["ѵ"] = "я" .. p[8], ["ҁ"] = "я" .. p[9],
}
},
}
}
}


m["Deva"] = process_ranges{
m["Deva"] = process_ranges{
"Devanagari",
"Devanagari",
38592,
"abugida",
"abugida",
ranges = {
ranges = {
Line 647: Line 702:
m["Diak"] = process_ranges{
m["Diak"] = process_ranges{
"Dhives Akuru",
"Dhives Akuru",
3307073,
"abugida",
"abugida",
aliases = {"Dhivehi Akuru", "Dives Akuru", "Divehi Akuru"},
aliases = {"Dhivehi Akuru", "Dives Akuru", "Divehi Akuru"},
Line 663: Line 719:
m["Dogr"] = process_ranges{
m["Dogr"] = process_ranges{
"Dogra",
"Dogra",
72402987,
"abugida",
"abugida",
ranges = {
ranges = {
Line 673: Line 730:
m["Dsrt"] = process_ranges{
m["Dsrt"] = process_ranges{
"Deseret",
"Deseret",
1200582,
"alphabet",
"alphabet",
ranges = {
ranges = {
Line 682: Line 740:
m["Dupl"] = process_ranges{
m["Dupl"] = process_ranges{
"Duployan",
"Duployan",
5316025,
"alphabet",
"alphabet",
ranges = {
ranges = {
Line 694: Line 753:
m["Egyd"] = {
m["Egyd"] = {
"Demotic",
"Demotic",
188519,
"abjad, logography",
"abjad, logography",
-- Not in Unicode
-- Not in Unicode
Line 700: Line 760:
m["Egyh"] = {
m["Egyh"] = {
"Hieratic",
"Hieratic",
208111,
"abjad, logography",
"abjad, logography",
-- Unified with Egyptian hieroglyphic in Unicode
-- Unified with Egyptian hieroglyphic in Unicode
Line 706: Line 767:
m["Egyp"] = process_ranges{
m["Egyp"] = process_ranges{
"Egyptian hieroglyphic",
"Egyptian hieroglyphic",
132659,
"abjad, logography",
"abjad, logography",
ranges = {
ranges = {
0x13000, 0x13455,
0x13000, 0x13455,
0x13460, 0x143FA,
},
},
varieties = {"Hieratic"},
varieties = {"Hieratic"},
Line 720: Line 783:
m["Elba"] = process_ranges{
m["Elba"] = process_ranges{
"Elbasan",
"Elbasan",
1036714,
"alphabet",
"alphabet",
ranges = {
ranges = {
Line 728: Line 792:
m["Elym"] = process_ranges{
m["Elym"] = process_ranges{
"Elymaic",
"Elymaic",
60744423,
"abjad",
"abjad",
ranges = {
ranges = {
Line 737: Line 802:
m["Ethi"] = process_ranges{
m["Ethi"] = process_ranges{
"Ethiopic",
"Ethiopic",
257634,
"abugida",
"abugida",
aliases = {"Ge'ez"},
aliases = {"Ge'ez", "Geʽez"},
ranges = {
ranges = {
0x1200, 0x1248,
0x1200, 0x1248,
Line 777: Line 843:
0x1E7F0, 0x1E7FE,
0x1E7F0, 0x1E7FE,
},
},
sort_key = "Ethi-sortkey",
strip_diacritics = {remove_diacritics = u(0x135D) .. u(0x135E) .. u(0x135F)}
}
}


m["Gara"] = {
m["Gara"] = process_ranges{
"Garay",
"Garay",
3095302,
"alphabet",
"alphabet",
capitalized = true,
capitalized = true,
direction = "rtl",
direction = "rtl",
-- Not in Unicode
ranges = {
0x060C, 0x060C,
0x061B, 0x061B,
0x061F, 0x061F,
0x10D40, 0x10D65,
0x10D69, 0x10D85,
0x10D8E, 0x10D8F,
},
}
}


m["Geok"] = process_ranges{
m["Geok"] = process_ranges{
"Khutsuri",
"Khutsuri",
1090055,
"alphabet",
"alphabet",
ranges = { -- Ⴀ-Ⴭ is Asomtavruli, ⴀ-ⴭ is Nuskhuri
ranges = { -- Ⴀ-Ⴭ is Asomtavruli, ⴀ-ⴭ is Nuskhuri
Line 801: Line 878:
varieties = {"Nuskhuri", "Asomtavruli"},
varieties = {"Nuskhuri", "Asomtavruli"},
capitalized = true,
capitalized = true,
translit = "Geok-translit",
}
}


m["Geor"] = process_ranges{
m["Geor"] = process_ranges{
"Georgian",
"Georgian",
3317411,
"alphabet",
"alphabet",
ranges = { -- ა-ჿ is lowercase Mkhedruli; Ა-Ჿ is uppercase Mkhedruli (Mtavruli)
ranges = { -- ა-ჿ is lowercase Mkhedruli; Ა-Ჿ is uppercase Mkhedruli (Mtavruli)
0x0589, 0x0589,
0x10D0, 0x10FF,
0x10D0, 0x10FF,
0x1C90, 0x1CBA,
0x1C90, 0x1CBA,
Line 813: Line 893:
varieties = {"Mkhedruli", "Mtavruli"},
varieties = {"Mkhedruli", "Mtavruli"},
capitalized = true,
capitalized = true,
translit = "Geor-translit",
}
}


m["Glag"] = process_ranges{
m["Glag"] = process_ranges{
"Glagolitic",
"Glagolitic",
145625,
"alphabet",
"alphabet",
ranges = {
ranges = {
0x0484, 0x0484,
0x0484, 0x0484,
0x0487, 0x0487,
0x0487, 0x0487,
0x0589, 0x0589,
0x10FB, 0x10FB,
0x2C00, 0x2C5F,
0x2C00, 0x2C5F,
0x2E43, 0x2E43,
0x2E43, 0x2E43,
Line 835: Line 919:
m["Gong"] = process_ranges{
m["Gong"] = process_ranges{
"Gunjala Gondi",
"Gunjala Gondi",
18125340,
"abugida",
"abugida",
ranges = {
ranges = {
Line 849: Line 934:
m["Gonm"] = process_ranges{
m["Gonm"] = process_ranges{
"Masaram Gondi",
"Masaram Gondi",
16977603,
"abugida",
"abugida",
ranges = {
ranges = {
Line 864: Line 950:
m["Goth"] = process_ranges{
m["Goth"] = process_ranges{
"Gothic",
"Gothic",
467784,
"alphabet",
"alphabet",
ranges = {
ranges = {
Line 873: Line 960:
m["Gran"] = process_ranges{
m["Gran"] = process_ranges{
"Grantha",
"Grantha",
1119274,
"abugida",
"abugida",
ranges = {
ranges = {
Line 905: Line 993:
m["Grek"] = process_ranges{
m["Grek"] = process_ranges{
"Greek",
"Greek",
8216,
"alphabet",
"alphabet",
ranges = {
ranges = {
0x0342, 0x0342,
0x0341, 0x0341,
0x0345, 0x0345,
0x0374, 0x0375,
0x0370, 0x0377,
0x037E, 0x037E,
0x037A, 0x037F,
0x0384, 0x038A,
0x0384, 0x038A,
0x038C, 0x038C,
0x038C, 0x038C,
0x038E, 0x03A1,
0x038E, 0x03A1,
0x03A3, 0x03E1,
0x03A3, 0x03D7,
0x03F0, 0x03FF,
0x03DA, 0x03DB,
0x03DE, 0x03E1,
0x03F0, 0x03F1,
0x03F4, 0x03F4,
0x03FC, 0x03FC,
0x1D26, 0x1D2A,
0x1D26, 0x1D2A,
0x1D5D, 0x1D61,
0x1D5D, 0x1D61,
Line 929: Line 1,021:
},
},
capitalized = true,
capitalized = true,
display_text = cs["Grek-displaytext"],
strip_diacritics = cs["Grek-stripdiacritics"],
sort_key = {
remove_diacritics = "'ʼ;·`¨´῀" .. c.grave .. c.acute .. c.diaer .. c.caron .. c.turnedcommaabove .. c.commaabove .. c.revcommaabove .. c.macron .. c.breve .. c.diaerbelow .. c.brevebelow .. c.perispomeni .. c.ypogegrammeni .. c.RSQuo .. c.prime .. c.keraia .. c.lowerkeraia .. c.tonos .. c.coronis .. c.psili .. c.dasia,
from = {"ϝ", "ͷ", "ϛ", "ͱ", "ͺ", "ϳ", "ϻ", "[ϟϙ]", "[ςϲ]", "ͳ"},
to = {"ε" .. p[1], "ε" .. p[2], "ε" .. p[3], "ζ" .. p[1], "ι", "ι" .. p[1], "π" .. p[1], "π" .. p[2], "σ", "ϡ"},
},
}
}


m["Polyt"] = process_ranges{
m["Polyt"] = process_ranges{
"Greek",
"Greek",
m["Grek"][2],
1475332,
m["Grek"][3],
ranges = union(m["Grek"].ranges, {
ranges = union(m["Grek"].ranges, {
0x0340, 0x0340,
0x0342, 0x0345,
0x0370, 0x0373,
0x0376, 0x0377,
0x037A, 0x037D,
0x037F, 0x037F,
0x03D8, 0x03D9,
0x03DC, 0x03DD,
0x03F2, 0x03F3,
0x03F5, 0x03FB,
0x03FD, 0x03FF,
0x1F00, 0x1F15,
0x1F00, 0x1F15,
0x1F18, 0x1F1D,
0x1F18, 0x1F1D,
Line 955: Line 1,066:
capitalized = m["Grek"].capitalized,
capitalized = m["Grek"].capitalized,
parent = "Grek",
parent = "Grek",
display_text = m["Grek"].display_text,
strip_diacritics = "Polyt-stripdiacritics",
sort_key = m["Grek"].sort_key,
translit = "grc-translit",
}
}


m["Gujr"] = process_ranges{
m["Gujr"] = process_ranges{
"Gujarati",
"Gujarati",
733944,
"abugida",
"abugida",
ranges = {
ranges = {
Line 985: Line 1,101:
}
}


m["Gukh"] = {
m["Gukh"] = process_ranges{
"Khema",
"Khema",
110064239,
"abugida",
"abugida",
aliases = {"Gurung Khema", "Khema Phri", "Khema Lipi"},
aliases = {"Gurung Khema", "Khema Phri", "Khema Lipi"},
-- Not in Unicode
ranges = {
0x0965, 0x0965,
0x16100, 0x16139,
},
}
}


m["Guru"] = process_ranges{
m["Guru"] = process_ranges{
"Gurmukhi",
"Gurmukhi",
689894,
"abugida",
"abugida",
ranges = {
ranges = {
Line 1,024: Line 1,145:
m["Hang"] = process_ranges{
m["Hang"] = process_ranges{
"Hangul",
"Hangul",
8222,
"syllabary",
"syllabary",
aliases = {"Hangeul"},
aliases = {"Hangeul"},
Line 1,053: Line 1,175:
m["Hani"] = process_ranges{
m["Hani"] = process_ranges{
"Han",
"Han",
8201,
"logography",
"logography",
ranges = {
ranges = {
Line 1,066: Line 1,189:
0x3037, 0x303F,
0x3037, 0x303F,
0x3190, 0x319F,
0x3190, 0x319F,
0x31C0, 0x31E3,
0x31C0, 0x31E5,
0x31EF, 0x31EF,
0x31EF, 0x31EF,
0x3220, 0x3247,
0x3220, 0x3247,
Line 1,103: Line 1,226:
m["Hans"] = {
m["Hans"] = {
"Simplified Han",
"Simplified Han",
m["Hani"][2],
185614,
m["Hani"][3],
ranges = m["Hani"].ranges,
ranges = m["Hani"].ranges,
characters = m["Hani"].characters,
characters = m["Hani"].characters,
Line 1,112: Line 1,236:
m["Hant"] = {
m["Hant"] = {
"Traditional Han",
"Traditional Han",
m["Hani"][2],
178528,
m["Hani"][3],
ranges = m["Hani"].ranges,
ranges = m["Hani"].ranges,
characters = m["Hani"].characters,
characters = m["Hani"].characters,
Line 1,121: Line 1,246:
m["Hano"] = process_ranges{
m["Hano"] = process_ranges{
"Hanunoo",
"Hanunoo",
1584045,
"abugida",
"abugida",
aliases = {"Hanunó'o", "Hanuno'o"},
ranges = {
ranges = {
0x1720, 0x1736,
0x1720, 0x1736,
Line 1,129: Line 1,256:
m["Hatr"] = process_ranges{
m["Hatr"] = process_ranges{
"Hatran",
"Hatran",
20813038,
"abjad",
"abjad",
ranges = {
ranges = {
Line 1,140: Line 1,268:
m["Hebr"] = process_ranges{
m["Hebr"] = process_ranges{
"Hebrew",
"Hebrew",
"abjad", -- more precisely, impure abjad
33513,
"abjad", -- more precisely, impure abjad
ranges = {
ranges = {
0x0591, 0x05C7,
0x0591, 0x05C7,
Line 1,154: Line 1,283:
},
},
direction = "rtl",
direction = "rtl",
display_text = "Hebr-common",
sort_key = "Hebr-common",
strip_diacritics = "Hebr-common",
}
}


m["Hira"] = process_ranges{
m["Hira"] = process_ranges{
"Hiragana",
"Hiragana",
48332,
"syllabary",
"syllabary",
ranges = {
ranges = {
Line 1,183: Line 1,316:


m["Hluw"] = process_ranges{
m["Hluw"] = process_ranges{
"Anatolian Hieroglyphs",
"Anatolian hieroglyphic",
521323,
"logography, syllabary",
"logography, syllabary",
ranges = {
ranges = {
Line 1,193: Line 1,327:
m["Hmng"] = process_ranges{
m["Hmng"] = process_ranges{
"Pahawh Hmong",
"Pahawh Hmong",
365954,
"semisyllabary",
"semisyllabary",
aliases = {"Hmong"},
aliases = {"Hmong"},
Line 1,206: Line 1,341:
m["Hmnp"] = process_ranges{
m["Hmnp"] = process_ranges{
"Nyiakeng Puachue Hmong",
"Nyiakeng Puachue Hmong",
33712499,
"alphabet",
"alphabet",
ranges = {
ranges = {
Line 1,217: Line 1,353:
m["Hung"] = process_ranges{
m["Hung"] = process_ranges{
"Old Hungarian",
"Old Hungarian",
446224,
"alphabet",
"alphabet",
aliases = {"Hungarian runic"},
aliases = {"Hungarian runic"},
Line 1,230: Line 1,367:
m["Ibrnn"] = {
m["Ibrnn"] = {
"Northeastern Iberian",
"Northeastern Iberian",
1113155,
"semisyllabary",
"semisyllabary",
ietf_subtag = "Zzzz",
ietf_subtag = "Zzzz",
Line 1,237: Line 1,375:
m["Ibrns"] = {
m["Ibrns"] = {
"Southeastern Iberian",
"Southeastern Iberian",
2305351,
"semisyllabary",
"semisyllabary",
ietf_subtag = "Zzzz",
ietf_subtag = "Zzzz",
Line 1,245: Line 1,384:
-- To be used to avoid any formatting or link processing
-- To be used to avoid any formatting or link processing
"Image-rendered",
"Image-rendered",
478798,
-- This should not have any characters listed
-- This should not have any characters listed
ietf_subtag = "Zyyy",
ietf_subtag = "Zyyy",
translit = false,
translit = false,
character_category = false,
character_category = false, -- none
}
}


m["Inds"] = {
m["Inds"] = {
"Indus",
"Indus",
601388,
aliases = {"Harappan", "Indus Valley"},
aliases = {"Harappan", "Indus Valley"},
}
}
Line 1,258: Line 1,399:
m["Ipach"] = {
m["Ipach"] = {
"International Phonetic Alphabet",
"International Phonetic Alphabet",
21204,
aliases = {"IPA"},
aliases = {"IPA"},
ietf_subtag = "Latn",
ietf_subtag = "Latn",
Line 1,264: Line 1,406:
m["Ital"] = process_ranges{
m["Ital"] = process_ranges{
"Old Italic",
"Old Italic",
4891256,
"alphabet",
"alphabet",
ranges = {
ranges = {
Line 1,269: Line 1,412:
0x1032D, 0x1032F,
0x1032D, 0x1032F,
},
},
translit = "Ital-translit",
}
}


m["Java"] = process_ranges{
m["Java"] = process_ranges{
"Javanese",
"Javanese",
879704,
"abugida",
"abugida",
ranges = {
ranges = {
Line 1,283: Line 1,428:
m["Jurc"] = {
m["Jurc"] = {
"Jurchen",
"Jurchen",
912240,
"logography",
"logography",
spaces = false,
spaces = false,
Line 1,289: Line 1,435:
m["Kali"] = process_ranges{
m["Kali"] = process_ranges{
"Kayah Li",
"Kayah Li",
4919239,
"abugida",
"abugida",
ranges = {
ranges = {
Line 1,297: Line 1,444:
m["Kana"] = process_ranges{
m["Kana"] = process_ranges{
"Katakana",
"Katakana",
82946,
"syllabary",
"syllabary",
ranges = {
ranges = {
Line 1,325: Line 1,473:
m["Kawi"] = process_ranges{
m["Kawi"] = process_ranges{
"Kawi",
"Kawi",
975802,
"abugida",
"abugida",
ranges = {
ranges = {
0x11F00, 0x11F10,
0x11F00, 0x11F10,
0x11F12, 0x11F3A,
0x11F12, 0x11F3A,
0x11F3E, 0x11F59,
0x11F3E, 0x11F5A,
},
},
}
}
Line 1,335: Line 1,484:
m["Khar"] = process_ranges{
m["Khar"] = process_ranges{
"Kharoshthi",
"Kharoshthi",
1161266,
"abugida",
"abugida",
ranges = {
ranges = {
Line 1,351: Line 1,501:
m["Khmr"] = process_ranges{
m["Khmr"] = process_ranges{
"Khmer",
"Khmer",
1054190,
"abugida",
"abugida",
ranges = {
ranges = {
Line 1,367: Line 1,518:
m["Khoj"] = process_ranges{
m["Khoj"] = process_ranges{
"Khojki",
"Khojki",
1740656,
"abugida",
"abugida",
ranges = {
ranges = {
Line 1,378: Line 1,530:
to = {"𑈇", "𑈁", "𑈅", "𑈇", "𑈇", "𑈃", "𑈲", "𑈳", "𑈂"}
to = {"𑈇", "𑈁", "𑈅", "𑈇", "𑈇", "𑈃", "𑈲", "𑈳", "𑈂"}
},
},
}
m["Khomt"] = {
"Khom Thai",
13023788,
"abugida",
-- Not in Unicode
}
}


m["Kitl"] = {
m["Kitl"] = {
"Khitan Large",
"Khitan large",
6401797,
"logography",
"logography",
spaces = false,
spaces = false,
Line 1,387: Line 1,547:


m["Kits"] = process_ranges{
m["Kits"] = process_ranges{
"Khitan Small",
"Khitan small",
6401800,
"logography, syllabary",
"logography, syllabary",
ranges = {
ranges = {
0x16FE4, 0x16FE4,
0x16FE4, 0x16FE4,
0x18B00, 0x18CD5,
0x18B00, 0x18CD5,
0x18CFF, 0x18CFF,
},
},
spaces = false,
spaces = false,
Line 1,398: Line 1,560:
m["Knda"] = process_ranges{
m["Knda"] = process_ranges{
"Kannada",
"Kannada",
839666,
"abugida",
"abugida",
ranges = {
ranges = {
Line 1,416: Line 1,579:
0x0CF1, 0x0CF3,
0x0CF1, 0x0CF3,
0x1CD0, 0x1CD0,
0x1CD0, 0x1CD0,
0x1CD2, 0x1CD2,
0x1CD2, 0x1CD3,
0x1CDA, 0x1CDA,
0x1CDA, 0x1CDA,
0x1CF2, 0x1CF2,
0x1CF2, 0x1CF2,
Line 1,426: Line 1,589:
to = {"ಊ", "ೠ", "ಔ"}
to = {"ಊ", "ೠ", "ಔ"}
},
},
translit = "kn-translit",
}
}


m["Kpel"] = {
m["Kpel"] = {
"Kpelle",
"Kpelle",
1586299,
"syllabary",
"syllabary",
-- Not in Unicode
-- Not in Unicode
}
}


m["Krai"] = {
m["Krai"] = process_ranges{
"Kirat Rai",
"Kirat Rai",
123173834,
"abugida",
"abugida",
aliases = {"Rai", "Khambu Rai", "Rai Barṇamālā", "Kirat Khambu Rai"},
aliases = {"Rai", "Khambu Rai", "Rai Barṇamālā", "Kirat Khambu Rai"},
-- Not in Unicode
ranges = {
0x16D40, 0x16D79,
},
}
}


m["Kthi"] = process_ranges{
m["Kthi"] = process_ranges{
"Kaithi",
"Kaithi",
1253814,
"abugida",
"abugida",
ranges = {
ranges = {
Line 1,450: Line 1,619:
0x110CD, 0x110CD,
0x110CD, 0x110CD,
},
},
}
m["Kulit"] = {
"Kulitan",
6443044,
"abugida",
-- Not in Unicode
}
}


m["Lana"] = process_ranges{
m["Lana"] = process_ranges{
"Tai Tham",
"Tai Tham",
1314503,
"abugida",
"abugida",
aliases = {"Tham", "Tua Mueang", "Lanna"},
aliases = {"Tham", "Tua Mueang", "Lanna"},
Line 1,468: Line 1,645:
m["Laoo"] = process_ranges{
m["Laoo"] = process_ranges{
"Lao",
"Lao",
1815229,
"abugida",
"abugida",
ranges = {
ranges = {
Line 1,487: Line 1,665:
m["Latn"] = process_ranges{
m["Latn"] = process_ranges{
"Latin",
"Latin",
8229,
"alphabet",
"alphabet",
aliases = {"Roman"},
aliases = {"Roman"},
Line 1,508: Line 1,687:
0x1D6B, 0x1D77,
0x1D6B, 0x1D77,
0x1D79, 0x1DBE,
0x1D79, 0x1DBE,
0x1DF8, 0x1DF8,
0x1E00, 0x1EFF,
0x1E00, 0x1EFF,
0x202F, 0x202F,
0x202F, 0x202F,
Line 1,523: Line 1,703:
0xA700, 0xA707,
0xA700, 0xA707,
0xA722, 0xA787,
0xA722, 0xA787,
0xA78B, 0xA7CA,
0xA78B, 0xA7CD,
0xA7D0, 0xA7D1,
0xA7D0, 0xA7D1,
0xA7D3, 0xA7D3,
0xA7D3, 0xA7D3,
0xA7D5, 0xA7D9,
0xA7D5, 0xA7DC,
0xA7F2, 0xA7FF,
0xA7F2, 0xA7FF,
0xA92E, 0xA92E,
0xA92E, 0xA92E,
Line 1,548: Line 1,728:
m["Latf"] = {
m["Latf"] = {
"Fraktur",
"Fraktur",
m["Latn"][2],
148443,
m["Latn"][3],
ranges = m["Latn"].ranges,
ranges = m["Latn"].ranges,
characters = m["Latn"].characters,
characters = m["Latn"].characters,
otherNames = {"Blackletter"}, -- Blackletter is actually the parent "script"
other_names = {"Blackletter"}, -- Blackletter is actually the parent "script"
capitalized = m["Latn"].capitalized,
capitalized = m["Latn"].capitalized,
translit = m["Latn"].translit,
translit = m["Latn"].translit,
Line 1,559: Line 1,740:
m["Latg"] = {
m["Latg"] = {
"Gaelic",
"Gaelic",
m["Latn"][2],
1432616,
m["Latn"][3],
ranges = m["Latn"].ranges,
ranges = m["Latn"].ranges,
characters = m["Latn"].characters,
characters = m["Latn"].characters,
otherNames = {"Irish"},
other_names = {"Irish"},
capitalized = m["Latn"].capitalized,
capitalized = m["Latn"].capitalized,
translit = m["Latn"].translit,
translit = m["Latn"].translit,
Line 1,570: Line 1,752:
m["pjt-Latn"] = {
m["pjt-Latn"] = {
"Latin",
"Latin",
m["Latn"][2],
nil,
m["Latn"][3],
ranges = m["Latn"].ranges,
ranges = m["Latn"].ranges,
characters = m["Latn"].characters,
characters = m["Latn"].characters,
Line 1,580: Line 1,763:
m["Leke"] = {
m["Leke"] = {
"Leke",
"Leke",
19572613,
"abugida",
"abugida",
-- Not in Unicode
-- Not in Unicode
Line 1,586: Line 1,770:
m["Lepc"] = process_ranges{
m["Lepc"] = process_ranges{
"Lepcha",
"Lepcha",
1481626,
"abugida",
"abugida",
aliases = {"Róng"},
ranges = {
ranges = {
0x1C00, 0x1C37,
0x1C00, 0x1C37,
Line 1,596: Line 1,782:
m["Limb"] = process_ranges{
m["Limb"] = process_ranges{
"Limbu",
"Limbu",
933796,
"abugida",
"abugida",
ranges = {
ranges = {
Line 1,609: Line 1,796:
m["Lina"] = process_ranges{
m["Lina"] = process_ranges{
"Linear A",
"Linear A",
30972,
ranges = {
ranges = {
0x10107, 0x10133,
0x10107, 0x10133,
Line 1,619: Line 1,807:
m["Linb"] = process_ranges{
m["Linb"] = process_ranges{
"Linear B",
"Linear B",
190102,
ranges = {
ranges = {
0x10000, 0x1000B,
0x10000, 0x1000B,
Line 1,635: Line 1,824:
m["Lisu"] = process_ranges{
m["Lisu"] = process_ranges{
"Fraser",
"Fraser",
1194621,
"alphabet",
"alphabet",
aliases = {"Old Lisu", "Lisu"},
aliases = {"Old Lisu", "Lisu"},
ranges = {
ranges = {
0x300A, 0x300B,
0xA4D0, 0xA4FF,
0xA4D0, 0xA4FF,
0x11FB0, 0x11FB0,
0x11FB0, 0x11FB0,
Line 1,644: Line 1,835:
from = {"['’]", "[.ꓸ][.ꓸ]", "[.ꓸ][,ꓹ]"},
from = {"['’]", "[.ꓸ][.ꓸ]", "[.ꓸ][,ꓹ]"},
to = {"ʼ", "ꓺ", "ꓻ"}
to = {"ʼ", "ꓺ", "ꓻ"}
},
translit = "Lisu-translit",
sort_key = {
from = {"𑾰"},
to = {"ꓬ" .. p[1]}
},
},
}
}
Line 1,649: Line 1,845:
m["Loma"] = {
m["Loma"] = {
"Loma",
"Loma",
13023816,
"syllabary",
"syllabary",
-- Not in Unicode
-- Not in Unicode
Line 1,655: Line 1,852:
m["Lyci"] = process_ranges{
m["Lyci"] = process_ranges{
"Lycian",
"Lycian",
913587,
"alphabet",
"alphabet",
ranges = {
ranges = {
Line 1,663: Line 1,861:
m["Lydi"] = process_ranges{
m["Lydi"] = process_ranges{
"Lydian",
"Lydian",
4261300,
"alphabet",
"alphabet",
ranges = {
ranges = {
Line 1,673: Line 1,872:
m["Mahj"] = process_ranges{
m["Mahj"] = process_ranges{
"Mahajani",
"Mahajani",
6732850,
"abugida",
"abugida",
ranges = {
ranges = {
Line 1,683: Line 1,883:
m["Maka"] = process_ranges{
m["Maka"] = process_ranges{
"Makasar",
"Makasar",
72947229,
"abugida",
"abugida",
aliases = {"Old Makasar"},
aliases = {"Old Makasar"},
Line 1,692: Line 1,893:
m["Mand"] = process_ranges{
m["Mand"] = process_ranges{
"Mandaic",
"Mandaic",
1812130,
aliases = {"Mandaean"},
aliases = {"Mandaean"},
ranges = {
ranges = {
Line 1,703: Line 1,905:
m["Mani"] = process_ranges{
m["Mani"] = process_ranges{
"Manichaean",
"Manichaean",
3544702,
"abjad",
"abjad",
ranges = {
ranges = {
Line 1,710: Line 1,913:
},
},
direction = "rtl",
direction = "rtl",
translit = "Mani-translit",
}
}


m["Marc"] = process_ranges{
m["Marc"] = process_ranges{
"Marchen",
"Marchen",
72403709,
"abugida",
"abugida",
ranges = {
ranges = {
Line 1,724: Line 1,929:
m["Maya"] = process_ranges{
m["Maya"] = process_ranges{
"Maya",
"Maya",
211248,
aliases = {"Maya hieroglyphic", "Mayan", "Mayan hieroglyphic"},
aliases = {"Maya hieroglyphic", "Mayan", "Mayan hieroglyphic"},
ranges = {
ranges = {
Line 1,732: Line 1,938:
m["Medf"] = process_ranges{
m["Medf"] = process_ranges{
"Medefaidrin",
"Medefaidrin",
1519764,
aliases = {"Oberi Okaime", "Oberi Ɔkaimɛ"},
aliases = {"Oberi Okaime", "Oberi Ɔkaimɛ"},
ranges = {
ranges = {
Line 1,741: Line 1,948:
m["Mend"] = process_ranges{
m["Mend"] = process_ranges{
"Mende",
"Mende",
951069,
aliases = {"Mende Kikakui"},
aliases = {"Mende Kikakui"},
ranges = {
ranges = {
Line 1,751: Line 1,959:
m["Merc"] = process_ranges{
m["Merc"] = process_ranges{
"Meroitic cursive",
"Meroitic cursive",
73028124,
"abugida",
"abugida",
ranges = {
ranges = {
Line 1,762: Line 1,971:
m["Mero"] = process_ranges{
m["Mero"] = process_ranges{
"Meroitic hieroglyphic",
"Meroitic hieroglyphic",
73028623,
"abugida",
"abugida",
ranges = {
ranges = {
Line 1,767: Line 1,977:
},
},
direction = "rtl",
direction = "rtl",
wikipedia_article = "Meroitic hieroglyphs",
}
}


m["Mlym"] = process_ranges{
m["Mlym"] = process_ranges{
"Malayalam",
"Malayalam",
1164129,
"abugida",
"abugida",
ranges = {
ranges = {
Line 1,790: Line 2,002:
to = {"ഈ", "ഊ", "ഐ", "ഓ", "ഔ", "ൿ", "ൺ", "ൻറ", "ൻ", "ൔ", "ൕ", "ർ", "ൽ", "ൾ", "ൖ", "ൈ", "ന്റ"}
to = {"ഈ", "ഊ", "ഐ", "ഓ", "ഔ", "ൿ", "ൺ", "ൻറ", "ൻ", "ൔ", "ൕ", "ർ", "ൽ", "ൾ", "ൖ", "ൈ", "ന്റ"}
},
},
translit = "ml-translit",
}
}


m["Modi"] = process_ranges{
m["Modi"] = process_ranges{
"Modi",
"Modi",
1703713,
"abugida",
"abugida",
ranges = {
ranges = {
Line 1,806: Line 2,020:
}
}


m["Mong"] = process_ranges{
do
"Mongolian",
local Mong_displaytext = {
"alphabet",
from = {"([ᠨ-ᡂᡸ])ᠶ([ᠨ-ᡂᡸ])", "([ᠠ-ᡂᡸ])ᠸ([^᠋ᠠ-])", "([ᠠ-ᡂᡸ])ᠸ$"},
aliases = {"Mongol bichig", "Hudum Mongol bichig"},
to = {"%1ᠢ%2", "%1ᠧ%2", "%1ᠧ"}
ranges = {
0x1800, 0x1805,
0x180A, 0x1819,
0x1820, 0x1842,
0x1878, 0x1878,
0x1880, 0x1897,
0x18A6, 0x18A6,
0x18A9, 0x18A9,
0x200C, 0x200D,
0x202F, 0x202F,
0x11660, 0x11668,
},
direction = "vertical-ltr",
}
 
m["mnc-Mong"] = process_ranges{
"Manchu",
m["Mong"][2],
ranges = {
0x1801, 0x1801,
0x1804, 0x1804,
0x1808, 0x180F,
0x1820, 0x1820,
0x1823, 0x1823,
0x1828, 0x182A,
0x182E, 0x1830,
0x1834, 0x1838,
0x183A, 0x183A,
0x185D, 0x185D,
0x185F, 0x1861,
0x1864, 0x1869,
0x186C, 0x1871,
0x1873, 0x1877,
0x1880, 0x1888,
0x188F, 0x188F,
0x189A, 0x18A5,
0x18A8, 0x18A8,
0x18AA, 0x18AA,
0x200C, 0x200D,
0x202F, 0x202F,
},
direction = "vertical-ltr",
parent = "Mong",
}
}
m["sjo-Mong"] = process_ranges{
m["Mong"] = process_ranges{
"Xibe",
"Mongolian",
m["Mong"][2],
1055705,
aliases = {"Sibe"},
"alphabet",
aliases = {"Mongol bichig", "Hudum Mongol bichig"},
ranges = {
ranges = {
0x1804, 0x1804,
0x1800, 0x1805,
0x1807, 0x1807,
0x180A, 0x1819,
0x180A, 0x180F,
0x1820, 0x1842,
0x1820, 0x1820,
0x1878, 0x1878,
0x1823, 0x1823,
0x1880, 0x1897,
0x1828, 0x1828,
0x18A6, 0x18A6,
0x182A, 0x182A,
0x18A9, 0x18A9,
0x182E, 0x1830,
0x1834, 0x1838,
0x183A, 0x183A,
0x185D, 0x1872,
0x200C, 0x200D,
0x200C, 0x200D,
0x202F, 0x202F,
0x202F, 0x202F,
0x3001, 0x3002,
0x3008, 0x300B,
0x11660, 0x11668,
},
},
direction = "vertical-ltr",
direction = "vertical-ltr",
parent = "mnc-Mong",
display_text = Mong_displaytext,
}
strip_diacritics = Mong_displaytext,
translit = "Mong-translit",
m["xwo-Mong"] = process_ranges{
"Clear Script",
m["Mong"][2],
aliases = {"Todo", "Todo bichig"},
ranges = {
0x1800, 0x1801,
0x1804, 0x1806,
0x180A, 0x1820,
0x1828, 0x1828,
0x182F, 0x1831,
0x1834, 0x1834,
0x1837, 0x1838,
0x183A, 0x183B,
0x1840, 0x1840,
0x1843, 0x185C,
0x1880, 0x1887,
0x1889, 0x188F,
0x1894, 0x1894,
0x1896, 0x1899,
0x18A7, 0x18A7,
0x200C, 0x200D,
0x202F, 0x202F,
0x11669, 0x1166C,
},
direction = "vertical-ltr",
parent = "Mong",
}
}
m["mnc-Mong"] = process_ranges{
"Manchu",
122888,
m["Mong"][3],
ranges = {
0x1801, 0x1801,
0x1804, 0x1804,
0x1808, 0x180F,
0x1820, 0x1820,
0x1823, 0x1823,
0x1828, 0x182A,
0x182E, 0x1830,
0x1834, 0x1838,
0x183A, 0x183A,
0x185D, 0x185D,
0x185F, 0x1861,
0x1864, 0x1869,
0x186C, 0x1871,
0x1873, 0x1877,
0x1880, 0x1888,
0x188F, 0x188F,
0x189A, 0x18A5,
0x18A8, 0x18A8,
0x18AA, 0x18AA,
0x200C, 0x200D,
0x202F, 0x202F,
},
direction = "vertical-ltr",
parent = "Mong",
translit = "mnc-translit",
}
m["sjo-Mong"] = process_ranges{
"Xibe",
113624153,
m["Mong"][3],
aliases = {"Sibe"},
ranges = {
0x1804, 0x1804,
0x1807, 0x1807,
0x180A, 0x180F,
0x1820, 0x1820,
0x1823, 0x1823,
0x1828, 0x1828,
0x182A, 0x182A,
0x182E, 0x1830,
0x1834, 0x1838,
0x183A, 0x183A,
0x185D, 0x1872,
0x200C, 0x200D,
0x202F, 0x202F,
},
direction = "vertical-ltr",
parent = "mnc-Mong",
}
m["xwo-Mong"] = process_ranges{
"Clear Script",
529085,
m["Mong"][3],
aliases = {"Todo", "Todo bichig"},
ranges = {
0x1800, 0x1801,
0x1804, 0x1806,
0x180A, 0x1820,
0x1828, 0x1828,
0x182F, 0x1831,
0x1834, 0x1834,
0x1837, 0x1838,
0x183A, 0x183B,
0x1840, 0x1840,
0x1843, 0x185C,
0x1880, 0x1887,
0x1889, 0x188F,
0x1894, 0x1894,
0x1896, 0x1899,
0x18A7, 0x18A7,
0x200C, 0x200D,
0x202F, 0x202F,
0x11669, 0x1166C,
},
direction = "vertical-ltr",
parent = "Mong",
translit = "xwo-translit",
}
end


m["Moon"] = {
m["Moon"] = {
"Moon",
"Moon",
918391,
"alphabet",
"alphabet",
aliases = {"Moon System of Embossed Reading", "Moon type", "Moon writing", "Moon alphabet", "Moon code"},
aliases = {"Moon System of Embossed Reading", "Moon type", "Moon writing", "Moon alphabet", "Moon code"},
Line 1,915: Line 2,148:
m["Morse"] = {
m["Morse"] = {
"Morse code",
"Morse code",
79897,
ietf_subtag = "Zsym",
ietf_subtag = "Zsym",
}
}


m["Mroo"] = process_ranges{
m["Mroo"] = process_ranges{
"Mro",
"Mru",
75919253,
aliases = {"Mro", "Mrung"},
ranges = {
ranges = {
0x16A40, 0x16A5E,
0x16A40, 0x16A5E,
Line 1,929: Line 2,165:
m["Mtei"] = process_ranges{
m["Mtei"] = process_ranges{
"Meitei Mayek",
"Meitei Mayek",
2981413,
"abugida",
"abugida",
aliases = {"Meetei Mayek", "Manipuri"},
aliases = {"Meetei Mayek", "Manipuri"},
Line 1,940: Line 2,177:
m["Mult"] = process_ranges{
m["Mult"] = process_ranges{
"Multani",
"Multani",
17047906,
"abugida",
"abugida",
ranges = {
ranges = {
Line 1,952: Line 2,190:


m["Music"] = process_ranges{
m["Music"] = process_ranges{
"Musical notation",
"musical notation",
233861,
"pictography",
"pictography",
ranges = {
ranges = {
Line 1,965: Line 2,204:
m["Mymr"] = process_ranges{
m["Mymr"] = process_ranges{
"Burmese",
"Burmese",
43887939,
"abugida",
"abugida",
aliases = {"Myanmar"},
aliases = {"Myanmar"},
Line 1,972: Line 2,212:
0xA9E0, 0xA9FE,
0xA9E0, 0xA9FE,
0xAA60, 0xAA7F,
0xAA60, 0xAA7F,
0x116D0, 0x116E3,
},
},
spaces = false,
spaces = false,
Line 1,977: Line 2,218:


m["Nagm"] = process_ranges{
m["Nagm"] = process_ranges{
"Nag Mundari",
"Mundari Bani",
106917274,
"alphabet",
"alphabet",
aliases = {"Nag Mundari"},
ranges = {
ranges = {
0x1E4D0, 0x1E4F9,
0x1E4D0, 0x1E4F9,
Line 1,986: Line 2,229:
m["Nand"] = process_ranges{
m["Nand"] = process_ranges{
"Nandinagari",
"Nandinagari",
6963324,
"abugida",
"abugida",
ranges = {
ranges = {
Line 2,001: Line 2,245:


m["Narb"] = process_ranges{
m["Narb"] = process_ranges{
"Old North Arabian",
"Ancient North Arabian",
1472213,
"abjad",
"abjad",
aliases = {"Old North Arabian"},
ranges = {
ranges = {
0x10A80, 0x10A9F,
0x10A80, 0x10A9F,
},
},
direction = "rtl",
direction = "rtl",
translit = "Narb-translit",
}
}


m["Nbat"] = process_ranges{
m["Nbat"] = process_ranges{
"Nabataean",
"Nabataean",
855624,
"abjad",
"abjad",
aliases = {"Nabatean"},
aliases = {"Nabatean"},
Line 2,022: Line 2,270:
m["Newa"] = process_ranges{
m["Newa"] = process_ranges{
"Newa",
"Newa",
7237292,
"abugida",
"abugida",
aliases = {"Newar", "Newari", "Prachalit Nepal"},
aliases = {"Newar", "Newari", "Prachalit Nepal"},
Line 2,032: Line 2,281:
m["Nkdb"] = {
m["Nkdb"] = {
"Dongba",
"Dongba",
1190953,
"pictography",
"pictography",
aliases = {"Naxi Dongba", "Nakhi Dongba", "Tomba", "Tompa", "Mo-so"},
aliases = {"Naxi Dongba", "Nakhi Dongba", "Tomba", "Tompa", "Mo-so"},
Line 2,040: Line 2,290:
m["Nkgb"] = {
m["Nkgb"] = {
"Geba",
"Geba",
731189,
"syllabary",
"syllabary",
aliases = {"Nakhi Geba", "Naxi Geba"},
aliases = {"Nakhi Geba", "Naxi Geba"},
Line 2,048: Line 2,299:
m["Nkoo"] = process_ranges{
m["Nkoo"] = process_ranges{
"N'Ko",
"N'Ko",
1062587,
"alphabet",
"alphabet",
ranges = {
ranges = {
Line 2,061: Line 2,313:


m["None"] = {
m["None"] = {
"Unspecified", -- renders as 'unspecified script'
"unspecified",
nil,
-- This should not have any characters listed
-- This should not have any characters listed
ietf_subtag = "Zyyy",
ietf_subtag = "Zyyy",
translit = false,
translit = false,
character_category = false,
character_category = false, -- none
}
}


m["Nshu"] = process_ranges{
m["Nshu"] = process_ranges{
"Nüshu",
"Nüshu",
56436,
"syllabary",
"syllabary",
aliases = {"Nushu"},
aliases = {"Nushu"},
Line 2,081: Line 2,335:
m["Ogam"] = process_ranges{
m["Ogam"] = process_ranges{
"Ogham",
"Ogham",
184661,
ranges = {
ranges = {
0x1680, 0x169C,
0x1680, 0x169C,
Line 2,088: Line 2,343:
m["Olck"] = process_ranges{
m["Olck"] = process_ranges{
"Ol Chiki",
"Ol Chiki",
201688,
aliases = {"Ol Chemetʼ", "Ol", "Santali"},
aliases = {"Ol Chemetʼ", "Ol", "Santali"},
ranges = {
ranges = {
Line 2,094: Line 2,350:
}
}


m["Onao"] = {
m["Onao"] = process_ranges{
"Ol Onal",
"Ol Onal",
108607084,
"alphabet",
"alphabet",
-- Not in Unicode
ranges = {
0x0964, 0x0965,
0x1E5D0, 0x1E5FA,
0x1E5FF, 0x1E5FF,
},
}
}


m["Orkh"] = process_ranges{
m["Orkh"] = process_ranges{
"Orkhon runes",
"Old Turkic",
aliases = {"Old Turkic"},
5058305,
aliases = {"Orkhon runic"},
ranges = {
ranges = {
0x10C00, 0x10C48,
0x10C00, 0x10C48,
},
},
direction = "rtl",
direction = "rtl",
translit = "Orkh-translit",
}
}


m["Orya"] = process_ranges{
m["Orya"] = process_ranges{
"Odia",
"Odia",
1760127,
"abugida",
"abugida",
aliases = {"Oriya"},
aliases = {"Oriya"},
Line 2,141: Line 2,405:
m["Osge"] = process_ranges{
m["Osge"] = process_ranges{
"Osage",
"Osage",
7105529,
ranges = {
ranges = {
0x104B0, 0x104D3,
0x104B0, 0x104D3,
Line 2,150: Line 2,415:
m["Osma"] = process_ranges{
m["Osma"] = process_ranges{
"Osmanya",
"Osmanya",
1377866,
ranges = {
ranges = {
0x10480, 0x1049D,
0x10480, 0x1049D,
Line 2,158: Line 2,424:
m["Ougr"] = process_ranges{
m["Ougr"] = process_ranges{
"Old Uyghur",
"Old Uyghur",
1998938,
"abjad, alphabet",
"abjad, alphabet",
ranges = {
ranges = {
Line 2,170: Line 2,437:
m["Palm"] = process_ranges{
m["Palm"] = process_ranges{
"Palmyrene",
"Palmyrene",
17538100,
ranges = {
ranges = {
0x10860, 0x1087F,
0x10860, 0x1087F,
Line 2,178: Line 2,446:
m["Pauc"] = process_ranges{
m["Pauc"] = process_ranges{
"Pau Cin Hau",
"Pau Cin Hau",
25339852,
ranges = {
ranges = {
0x11AC0, 0x11AF8,
0x11AC0, 0x11AF8,
},
},
}
m["Pcun"] = {
"Proto-Cuneiform",
1650699,
"pictography",
-- Not in Unicode
}
m["Pelm"] = {
"Proto-Elamite",
56305763,
"pictography",
-- Not in Unicode
}
}


m["Perm"] = process_ranges{
m["Perm"] = process_ranges{
"Old Permic",
"Old Permic",
147899,
ranges = {
ranges = {
0x0483, 0x0483,
0x0483, 0x0483,
Line 2,193: Line 2,477:
m["Phag"] = process_ranges{
m["Phag"] = process_ranges{
"Phags-pa",
"Phags-pa",
822836,
"abugida",
"abugida",
ranges = {
ranges = {
Line 2,207: Line 2,492:
m["Phli"] = process_ranges{
m["Phli"] = process_ranges{
"Inscriptional Pahlavi",
"Inscriptional Pahlavi",
24089793,
"abjad",
"abjad",
ranges = {
ranges = {
Line 2,217: Line 2,503:
m["Phlp"] = process_ranges{
m["Phlp"] = process_ranges{
"Psalter Pahlavi",
"Psalter Pahlavi",
7253954,
"abjad",
"abjad",
ranges = {
ranges = {
Line 2,229: Line 2,516:
m["Phlv"] = {
m["Phlv"] = {
"Book Pahlavi",
"Book Pahlavi",
72403118,
"abjad",
"abjad",
direction = "rtl",
direction = "rtl",
wikipedia_article = "Pahlavi scripts#Book Pahlavi",
-- Not in Unicode
-- Not in Unicode
}
}
Line 2,236: Line 2,525:
m["Phnx"] = process_ranges{
m["Phnx"] = process_ranges{
"Phoenician",
"Phoenician",
26752,
"abjad",
"abjad",
ranges = {
ranges = {
Line 2,242: Line 2,532:
},
},
direction = "rtl",
direction = "rtl",
translit = "Phnx-translit",
}
}


m["Plrd"] = process_ranges{
m["Plrd"] = process_ranges{
"Pollard",
"Pollard",
601734,
"abugida",
"abugida",
aliases = {"Miao"},
aliases = {"Miao"},
Line 2,257: Line 2,549:
m["Prti"] = process_ranges{
m["Prti"] = process_ranges{
"Inscriptional Parthian",
"Inscriptional Parthian",
13023804,
ranges = {
ranges = {
0x10B40, 0x10B55,
0x10B40, 0x10B55,
Line 2,262: Line 2,555:
},
},
direction = "rtl",
direction = "rtl",
}
m["Psin"] = {
"Proto-Sinaitic",
1065250,
"abjad",
direction = "rtl",
-- Not in Unicode
}
}


m["Ranj"] = {
m["Ranj"] = {
"Ranjana",
"Ranjana",
2385276,
"abugida",
"abugida",
-- Not in Unicode
-- Not in Unicode
Line 2,272: Line 2,574:
m["Rjng"] = process_ranges{
m["Rjng"] = process_ranges{
"Rejang",
"Rejang",
2007960,
"abugida",
"abugida",
ranges = {
ranges = {
Line 2,281: Line 2,584:
m["Rohg"] = process_ranges{
m["Rohg"] = process_ranges{
"Hanifi Rohingya",
"Hanifi Rohingya",
21028705,
"alphabet",
"alphabet",
ranges = {
ranges = {
Line 2,296: Line 2,600:
m["Roro"] = {
m["Roro"] = {
"Rongorongo",
"Rongorongo",
209764,
-- Not in Unicode
-- Not in Unicode
}
}
Line 2,301: Line 2,606:
m["Rumin"] = process_ranges{
m["Rumin"] = process_ranges{
"Rumi numerals",
"Rumi numerals",
nil,
ranges = {
ranges = {
0x10E60, 0x10E7E,
0x10E60, 0x10E7E,
},
},
ietf_subtag = "Arab",
ietf_subtag = "Arab",
character_category = "Rumi numerals",
}
}


m["Runr"] = process_ranges{
m["Runr"] = process_ranges{
"Runic",
"Runic",
82996,
"alphabet",
"alphabet",
ranges = {
ranges = {
Line 2,317: Line 2,623:
}
}


m["Samr"] = process_ranges{
do
"Samaritan",
local Samr_stripdiacritics = {
"abjad",
remove_diacritics = c.CGJ .. u(0x0816) .. "-" .. u(0x082D),
ranges = {
}
0x0800, 0x082D,
0x0830, 0x083E,
m["Samr"] = process_ranges{
},
"Samaritan",
direction = "rtl",
1550930,
}
"abjad",
ranges = {
0x0800, 0x082D,
0x0830, 0x083E,
},
direction = "rtl",
strip_diacritics = Samr_stripdiacritics,
sort_key = Samr_stripdiacritics,
}
end


m["Sarb"] = process_ranges{
m["Sarb"] = process_ranges{
"Old South Arabian",
"Ancient South Arabian",
446074,
"abjad",
"abjad",
aliases = {"Old South Arabian"},
ranges = {
ranges = {
0x10A60, 0x10A7F,
0x10A60, 0x10A7F,
},
},
direction = "rtl",
direction = "rtl",
translit = "Sarb-translit",
}
}


m["Saur"] = process_ranges{
m["Saur"] = process_ranges{
"Saurashtra",
"Saurashtra",
3535165,
"abugida",
"abugida",
ranges = {
ranges = {
Line 2,347: Line 2,666:
m["Semap"] = {
m["Semap"] = {
"flag semaphore",
"flag semaphore",
250796,
"pictography",
"pictography",
ietf_subtag = "Zsym",
ietf_subtag = "Zsym",
Line 2,353: Line 2,673:
m["Sgnw"] = process_ranges{
m["Sgnw"] = process_ranges{
"SignWriting",
"SignWriting",
1497335,
"pictography",
"pictography",
aliases = {"Sutton SignWriting"},
aliases = {"Sutton SignWriting"},
Line 2,365: Line 2,686:
m["Shaw"] = process_ranges{
m["Shaw"] = process_ranges{
"Shavian",
"Shavian",
1970098,
aliases = {"Shaw"},
aliases = {"Shaw"},
ranges = {
ranges = {
Line 2,373: Line 2,695:
m["Shrd"] = process_ranges{
m["Shrd"] = process_ranges{
"Sharada",
"Sharada",
2047117,
"abugida",
"abugida",
ranges = {
ranges = {
Line 2,384: Line 2,707:
0x11180, 0x111DF,
0x11180, 0x111DF,
},
},
translit = "Shrd-translit",
}
}


m["Shui"] = {
m["Shui"] = {
"Sui",
"Sui",
752854,
"logography",
"logography",
spaces = false,
spaces = false,
Line 2,395: Line 2,720:
m["Sidd"] = process_ranges{
m["Sidd"] = process_ranges{
"Siddham",
"Siddham",
250379,
"abugida",
"abugida",
ranges = {
ranges = {
Line 2,400: Line 2,726:
0x115B8, 0x115DD,
0x115B8, 0x115DD,
},
},
translit = "Sidd-translit",
}
}


m["Sidt"] = {
m["Sidt"] = {
"Sidetic",
"Sidetic",
36659,
"alphabet",
"alphabet",
direction = "rtl",
direction = "rtl",
Line 2,410: Line 2,738:


m["Sind"] = process_ranges{
m["Sind"] = process_ranges{
"Khudawadi",
"Khudabadi",
6402810,
"abugida",
"abugida",
aliases = {"Khudabadi"},
aliases = {"Khudawadi"},
ranges = {
ranges = {
0x0964, 0x0965,
0x0964, 0x0965,
Line 2,427: Line 2,756:
m["Sinh"] = process_ranges{
m["Sinh"] = process_ranges{
"Sinhalese",
"Sinhalese",
1574992,
"abugida",
"abugida",
aliases = {"Sinhala"},
aliases = {"Sinhala"},
Line 2,454: Line 2,784:
m["Sogd"] = process_ranges{
m["Sogd"] = process_ranges{
"Sogdian",
"Sogdian",
578359,
"abjad",
"abjad",
ranges = {
ranges = {
Line 2,464: Line 2,795:
m["Sogo"] = process_ranges{
m["Sogo"] = process_ranges{
"Old Sogdian",
"Old Sogdian",
72403254,
"abjad",
"abjad",
ranges = {
ranges = {
Line 2,473: Line 2,805:
m["Sora"] = process_ranges{
m["Sora"] = process_ranges{
"Sorang Sompeng",
"Sorang Sompeng",
7563292,
aliases = {"Sora Sompeng"},
aliases = {"Sora Sompeng"},
ranges = {
ranges = {
Line 2,482: Line 2,815:
m["Soyo"] = process_ranges{
m["Soyo"] = process_ranges{
"Soyombo",
"Soyombo",
8009382,
"abugida",
"abugida",
ranges = {
ranges = {
Line 2,490: Line 2,824:
m["Sund"] = process_ranges{
m["Sund"] = process_ranges{
"Sundanese",
"Sundanese",
51589,
"abugida",
"abugida",
ranges = {
ranges = {
Line 2,497: Line 2,832:
}
}


m["Sunu"] = {
m["Sunu"] = process_ranges{
"Sunuwar",
"Sunuwar",
109984965,
"alphabet",
"alphabet",
-- Not in Unicode
ranges = {
0x11BC0, 0x11BE1,
0x11BF0, 0x11BF9,
},
}
}


m["Sylo"] = process_ranges{
m["Sylo"] = process_ranges{
"Syloti Nagri",
"Sylheti Nagri",
144128,
"abugida",
"abugida",
aliases = {"Sylheti Nagari"},
aliases = {"Sylheti Nāgarī", "Syloti Nagri"},
ranges = {
ranges = {
0x0964, 0x0965,
0x0964, 0x0965,
Line 2,516: Line 2,856:
m["Syrc"] = process_ranges{
m["Syrc"] = process_ranges{
"Syriac",
"Syriac",
"abjad", -- more precisely, impure abjad
26567,
"abjad", -- more precisely, impure abjad
ranges = {
ranges = {
0x060C, 0x060C,
0x060C, 0x060C,
Line 2,538: Line 2,879:
m["Tagb"] = process_ranges{
m["Tagb"] = process_ranges{
"Tagbanwa",
"Tagbanwa",
977444,
"abugida",
"abugida",
ranges = {
ranges = {
Line 2,549: Line 2,891:
m["Takr"] = process_ranges{
m["Takr"] = process_ranges{
"Takri",
"Takri",
759202,
"abugida",
"abugida",
ranges = {
ranges = {
Line 2,564: Line 2,907:
m["Tale"] = process_ranges{
m["Tale"] = process_ranges{
"Tai Nüa",
"Tai Nüa",
2566326,
"abugida",
"abugida",
aliases = {"Tai Nuea", "New Tai Nüa", "New Tai Nuea", "Dehong Dai", "Tai Dehong", "Tai Le"},
aliases = {"Tai Nuea", "New Tai Nüa", "New Tai Nuea", "Dehong Dai", "Tai Dehong", "Tai Le"},
Line 2,576: Line 2,920:
m["Talu"] = process_ranges{
m["Talu"] = process_ranges{
"New Tai Lue",
"New Tai Lue",
3498863,
"abugida",
"abugida",
ranges = {
ranges = {
Line 2,588: Line 2,933:
m["Taml"] = process_ranges{
m["Taml"] = process_ranges{
"Tamil",
"Tamil",
26803,
"abugida",
"abugida",
ranges = {
ranges = {
Line 2,624: Line 2,970:
m["Tang"] = process_ranges{
m["Tang"] = process_ranges{
"Tangut",
"Tangut",
1373610,
"logography, syllabary",
"logography, syllabary",
ranges = {
ranges = {
0x31EF, 0x31EF,
0x16FE0, 0x16FE0,
0x16FE0, 0x16FE0,
0x17000, 0x187F7,
0x17000, 0x187F7,
Line 2,632: Line 2,980:
},
},
spaces = false,
spaces = false,
translit = "txg-translit",
}
}


m["Tavt"] = process_ranges{
m["Tavt"] = process_ranges{
"Tai Viet",
"Tai Viet",
11818517,
"abugida",
"abugida",
ranges = {
ranges = {
Line 2,644: Line 2,994:
}
}


m["Tayo"] = {
m["Tayo"] = process_ranges{
"Lai Tay",
"Lai Tay",
16306701,
"abugida",
"abugida",
aliases = {"Tai Yo"},
aliases = {"Tai Yo"},
direction = "vertical-rtl",
direction = "vertical-rtl",
-- Not in Unicode
ranges = {
0x1E6C0, 0x1E6DE,
0x1E6E0, 0x1E6F5,
0x1E6FE, 0x1E6FF,
},
spaces = false,
}
}


m["Telu"] = process_ranges{
m["Telu"] = process_ranges{
"Telugu",
"Telugu",
570450,
"abugida",
"abugida",
ranges = {
ranges = {
Line 2,682: Line 3,039:
m["Teng"] = {
m["Teng"] = {
"Tengwar",
"Tengwar",
473725,
}
}


m["Tfng"] = process_ranges{
m["Tfng"] = process_ranges{
"Tifinagh",
"Tifinagh",
208503,
"abjad, alphabet",
"abjad, alphabet",
ranges = {
ranges = {
Line 2,692: Line 3,051:
0x2D7F, 0x2D7F,
0x2D7F, 0x2D7F,
},
},
otherNames = {"Libyco-Berber", "Berber"}, -- per Wikipedia, Libyco-Berber is the parent
other_names = {"Libyco-Berber", "Berber"}, -- per Wikipedia, Libyco-Berber is the parent
}
}


m["Tglg"] = process_ranges{
m["Tglg"] = process_ranges{
"Baybayin",
"Baybayin",
812124,
"abugida",
"abugida",
aliases = {"Tagalog"},
aliases = {"Tagalog"},
varieties = {"Kur-itan"},
ranges = {
ranges = {
0x1700, 0x1715,
0x1700, 0x1715,
Line 2,708: Line 3,069:
m["Thaa"] = process_ranges{
m["Thaa"] = process_ranges{
"Thaana",
"Thaana",
877906,
"abugida",
"abugida",
ranges = {
ranges = {
Line 2,723: Line 3,085:
m["Thai"] = process_ranges{
m["Thai"] = process_ranges{
"Thai",
"Thai",
236376,
"abugida",
"abugida",
ranges = {
ranges = {
Line 2,731: Line 3,094:
}
}


m["Tibt"] = process_ranges{
do
"Tibetan",
local Tibt_displaytext = {
"abugida",
from = {"", "", "།།", "༚༚", "༚༝", "༝༚", "༝༝", "ཷ", "ཹ", "ེེ", "ོོ"},
ranges = {
to = {"ཨོཾ", "་", "༎", "༛", "", "", "", "ྲཱྀ", "ླཱྀ", "ཻ", "ཽ"}
0x0F00, 0x0F47,
}
0x0F49, 0x0F6C,
0x0F71, 0x0F97,
0x0F99, 0x0FBC,
0x0FBE, 0x0FCC,
0x0FCE, 0x0FD4,
0x0FD9, 0x0FDA,
},
normalizationFixes = handle_normalization_fixes{
combiningClasses = {[""] = 1},
from = {"", ""},
to = {"ྲཱྀ", "ླཱྀ"}
},
}


m["sit-tam-Tibt"] = {
m["Tibt"] = process_ranges{
"Tamyig",
"Tibetan",
m["Tibt"][2],
46861,
ranges = m["Tibt"].ranges,
"abugida",
characters = m["Tibt"].characters,
ranges = {
parent = "Tibt",
0x0F00, 0x0F47,
normalizationFixes = m["Tibt"].normalizationFixes,
0x0F49, 0x0F6C,
0x0F71, 0x0F97,
0x0F99, 0x0FBC,
0x0FBE, 0x0FCC,
0x0FCE, 0x0FD4,
0x0FD9, 0x0FDA,
0x3008, 0x300B,
},
normalizationFixes = handle_normalization_fixes{
combiningClasses = {[""] = 1},
from = {"ཷ", "ཹ"},
to = {"ྲཱྀ", "ླཱྀ"}
},
display_text = Tibt_displaytext,
strip_diacritics = Tibt_displaytext,
sort_key = "Tibt-sortkey",
translit = "Tibt-translit",
}
}
m["sit-tam-Tibt"] = {
"Tamyig",
109875213,
m["Tibt"][3],
-- There is no inheritance of properties currently implemented for scripts. Per [[User:Theknightwho]], this
-- is because it's tricky to do since there are several types of child scripts: those that are mere display
-- variants (like fa-Arab, kk-Arab), which should be eliminated in favor of CSS language selectors to
-- handle the font differences; those that are genuinely different scripts that happen to share the same
-- Unicode codepoints but have mostly different properties (e.g. Manchu vs. Mongolian); and those that are
-- somewhere in between (like Tamyig vs. Tibetan). As a result, we currently have to manually specify
-- which properties we want inherited as follows.
ranges = m["Tibt"].ranges,
characters = m["Tibt"].characters,
parent = "Tibt",
normalizationFixes = m["Tibt"].normalizationFixes,
display_text = m["Tibt"].display_text,
strip_diacritics = m["Tibt"].strip_diacritics,
sort_key = m["Tibt"].sort_key,
translit = m["Tibt"].translit,
}
end


m["Tirh"] = process_ranges{
m["Tirh"] = process_ranges{
"Tirhuta",
"Tirhuta",
1765752,
"abugida",
"abugida",
ranges = {
ranges = {
Line 2,778: Line 3,167:
m["Tnsa"] = process_ranges{
m["Tnsa"] = process_ranges{
"Tangsa",
"Tangsa",
105576311,
"alphabet",
"alphabet",
ranges = {
ranges = {
Line 2,785: Line 3,175:
}
}


m["Todr"] = {
m["Todr"] = process_ranges{
"Todhri",
"Todhri",
10274731,
"alphabet",
"alphabet",
direction = "rtl",
direction = "rtl",
-- Not in Unicode
ranges = {
0x105C0, 0x105F3,
},
}
}


m["Tols"] = {
m["Tols"] = {
"Tolong Siki",
"Tolong Siki",
4459822,
"alphabet",
"alphabet",
-- Not in Unicode
-- Not in Unicode
Line 2,800: Line 3,194:
m["Toto"] = process_ranges{
m["Toto"] = process_ranges{
"Toto",
"Toto",
104837516,
"abugida",
"abugida",
ranges = {
ranges = {
Line 2,806: Line 3,201:
}
}


m["Tutg"] = {
m["Tutg"] = process_ranges{
"Tigalari",
"Tigalari",
2604990,
"abugida",
"abugida",
aliases = {"Tulu"},
aliases = {"Tulu"},
-- Not in Unicode
ranges = {
0x1CF2, 0x1CF2,
0x1CF4, 0x1CF4,
0xA8F1, 0xA8F1,
0x11380, 0x11389,
0x1138B, 0x1138B,
0x1138E, 0x1138E,
0x11390, 0x113B5,
0x113B7, 0x113C0,
0x113C2, 0x113C2,
0x113C5, 0x113C5,
0x113C7, 0x113CA,
0x113CC, 0x113D5,
0x113D7, 0x113D8,
0x113E1, 0x113E2,
},
}
}


m["Ugar"] = process_ranges{
m["Ugar"] = process_ranges{
"Ugaritic",
"Ugaritic",
332652,
"abjad",
"abjad",
ranges = {
ranges = {
Line 2,824: Line 3,236:
m["Vaii"] = process_ranges{
m["Vaii"] = process_ranges{
"Vai",
"Vai",
523078,
"syllabary",
"syllabary",
ranges = {
ranges = {
Line 2,832: Line 3,245:
m["Visp"] = {
m["Visp"] = {
"Visible Speech",
"Visible Speech",
1303365,
"alphabet",
"alphabet",
-- Not in Unicode
-- Not in Unicode
Line 2,838: Line 3,252:
m["Vith"] = process_ranges{
m["Vith"] = process_ranges{
"Vithkuqi",
"Vithkuqi",
3301993,
"alphabet",
"alphabet",
ranges = {
ranges = {
Line 2,854: Line 3,269:
m["Wara"] = process_ranges{
m["Wara"] = process_ranges{
"Varang Kshiti",
"Varang Kshiti",
79199,
aliases = {"Warang Citi"},
aliases = {"Warang Citi"},
ranges = {
ranges = {
Line 2,864: Line 3,280:
m["Wcho"] = process_ranges{
m["Wcho"] = process_ranges{
"Wancho",
"Wancho",
33713728,
"alphabet",
"alphabet",
ranges = {
ranges = {
Line 2,873: Line 3,290:
m["Wole"] = {
m["Wole"] = {
"Woleai",
"Woleai",
6643710,
"syllabary",
"syllabary",
-- Not in Unicode
-- Not in Unicode
Line 2,879: Line 3,297:
m["Xpeo"] = process_ranges{
m["Xpeo"] = process_ranges{
"Old Persian",
"Old Persian",
1471822,
ranges = {
ranges = {
0x103A0, 0x103C3,
0x103A0, 0x103C3,
Line 2,887: Line 3,306:
m["Xsux"] = process_ranges{
m["Xsux"] = process_ranges{
"Cuneiform",
"Cuneiform",
401,
aliases = {"Sumero-Akkadian Cuneiform"},
aliases = {"Sumero-Akkadian Cuneiform"},
ranges = {
ranges = {
Line 2,898: Line 3,318:
m["Yezi"] = process_ranges{
m["Yezi"] = process_ranges{
"Yezidi",
"Yezidi",
13175481,
"alphabet",
"alphabet",
ranges = {
ranges = {
Line 2,913: Line 3,334:
m["Yiii"] = process_ranges{
m["Yiii"] = process_ranges{
"Yi",
"Yi",
1197646,
"syllabary",
"syllabary",
ranges = {
ranges = {
Line 2,927: Line 3,349:
m["Zanb"] = process_ranges{
m["Zanb"] = process_ranges{
"Zanabazar Square",
"Zanabazar Square",
50809208,
"abugida",
ranges = {
ranges = {
0x11A00, 0x11A47,
0x11A00, 0x11A47,
Line 2,934: Line 3,358:
m["Zmth"] = process_ranges{
m["Zmth"] = process_ranges{
"mathematical notation",
"mathematical notation",
1140046,
ranges = {
ranges = {
0x00AC, 0x00AC,
0x00AC, 0x00AC,
Line 3,071: Line 3,496:
},
},
translit = false,
translit = false,
character_category = "Mathematical notation symbols", -- ?
}
 
m["Zname"] = process_ranges{
"Znamenny musical notation",
965834,
"pictography",
ranges = {
0x1CF00, 0x1CF2D,
0x1CF30, 0x1CF46,
0x1CF50, 0x1CFC3,
},
ietf_subtag = "Zsym",
translit = false,
}
}


m["Zsym"] = process_ranges{
m["Zsym"] = process_ranges{
"symbol",
"symbolic",
80071,
"pictography",
"pictography",
ranges = {
ranges = {
Line 3,170: Line 3,608:
m["Zyyy"] = {
m["Zyyy"] = {
"undetermined",
"undetermined",
104839687,
-- This should not have any characters listed, probably
-- This should not have any characters listed, probably
translit = false,
translit = false,
Line 3,177: Line 3,616:
m["Zzzz"] = {
m["Zzzz"] = {
"uncoded",
"uncoded",
104839675,
-- This should not have any characters listed
-- This should not have any characters listed
translit = false,
translit = false,
Line 3,186: Line 3,626:
m["Hrkt"] = process_ranges{
m["Hrkt"] = process_ranges{
"Kana",
"Kana",
187659,
"syllabary",
"syllabary",
aliases = {"Japanese syllabaries"},
aliases = {"Japanese syllabaries"},
Line 3,197: Line 3,638:
m["Jpan"] = process_ranges{
m["Jpan"] = process_ranges{
"Japanese",
"Japanese",
190502,
"logography, syllabary",
"logography, syllabary",
ranges = union(
ranges = union(
Line 3,209: Line 3,651:
m["Kore"] = process_ranges{
m["Kore"] = process_ranges{
"Korean",
"Korean",
711797,
"logography, syllabary",
"logography, syllabary",
ranges = union(
ranges = union(
Line 3,215: Line 3,658:
m["Latn"].ranges
m["Latn"].ranges
),
),
-- `漢字(한자)`→`漢字`
-- `가-나-다`→`가나다`, `가--나--다`→`가-나-다`
-- `온돌(溫突/溫堗)`→`온돌` ([[ondol]])
strip_diacritics = {
remove_diacritics = u(0x302E) .. u(0x302F),
from = {"([" .. m["Hani"].characters .. "])%(.-%)", "^%-", "%-$", "%-(%-?)", "\1", "%([" .. m["Hani"].characters .. "/]+%)"},
to = {"%1", "\1", "\1", "%1", "-"}
}
}
}


return m
--Constructed languages
m["Ayer"] = process_ranges{
"Tahano Hikamu",
nil,
"abugida",
ranges = {
0x0041, 0x005A,
0x0061, 0x007A,
0x002A, 0x002A,
0x00F1, 0x00F1,
0x00D1, 0x00D1,
0x0294, 0x0294,
0x0259, 0x0259,
0x018F, 0x018F,
0xA736, 0xA737,
0x0026, 0x0026,
0x002B, 0x002D,
0x005B, 0x005B,
0x005D, 0x005D,
0x00A8, 0x00A8,
0x00AF, 0x00AF,
0x00B2, 0x00B2,
0x00B9, 0x00B9,
0x02B0, 0x2B2,
0x02C0, 0x02C0,
0x02D0, 0x02D0,
},
character_category = false,
}
 
m["Jovl"] = process_ranges{
"Jovlish",
nil,
"alphabet",
ranges = {
0x0041, 0x005A,
0x0061, 0x007A,
0x00AA, 0x00AA,
0x00BA, 0x00BA,
0x00C0, 0x00D6,
0x00D8, 0x00F6,
0x00F8, 0x02B8,
0x022B, 0x022B,
0x02C0, 0x02C1,
0x02E0, 0x02E4,
0x0363, 0x036F,
0x039E, 0x039E,
0x03A8, 0x03A8,
0x03BE, 0x03BE,
0x03C8, 0x03C8,
0x0485, 0x0486,
0x0951, 0x0952,
0x10FB, 0x10FB,
0x1D00, 0x1D25,
0x1D2C, 0x1D5C,
0x1D62, 0x1D65,
0x1D6B, 0x1D77,
0x1D79, 0x1DBE,
0x1DF8, 0x1DF8,
0x1E00, 0x1EFF,
0x202F, 0x202F,
0x2071, 0x2071,
0x207F, 0x207F,
0x2090, 0x209C,
0x20F0, 0x20F0,
0x2100, 0x2125,
0x2128, 0x2128,
0x212A, 0x2134,
0x2139, 0x213B,
0x2141, 0x214E,
0x2160, 0x2188,
0x2C60, 0x2C7F,
0xA700, 0xA707,
0xA722, 0xA787,
0xA78B, 0xA7CD,
0xA7D0, 0xA7D1,
0xA7D3, 0xA7D3,
0xA7D5, 0xA7DC,
0xA7F2, 0xA7FF,
0xA92E, 0xA92E,
0xAB30, 0xAB5A,
0xAB5C, 0xAB64,
0xAB66, 0xAB69,
0xFB00, 0xFB06,
0xFF21, 0xFF3A,
0xFF41, 0xFF5A,
0x10780, 0x10785,
0x10787, 0x107B0,
0x107B2, 0x107BA,
0x1DF00, 0x1DF1E,
0x1DF25, 0x1DF2A,
},
character_category = false,
}
 
m["Gthv"] = process_ranges{
"Gothevian",
nil,
"alphabet",
ranges = {
    0x0041, 0x005A,
    0x0061, 0x007A,
    0x00C1, 0x00C4,
    0x00C8, 0x00CB,
    0x00CD, 0x00CD,
    0x00CF, 0x00CF,
    0x00D2, 0x00D4,
    0x00D6, 0x00D6,
    0x00DA, 0x00DC,
    0x00DD, 0x00DD,
    0x00E1, 0x00E4,
    0x00E8, 0x00EB,
    0x00ED, 0x00ED,
    0x00EF, 0x00EF,
    0x00F2, 0x00F4,
    0x00F6, 0x00F6,
    0x00FA, 0x00FC,
    0x00FD, 0x00FD,
    0x00FF, 0x00FF,
    0x0110, 0x0111,
    0x0160, 0x0161,
    0x0178, 0x0178,
    0x017D, 0x017E,
    0x0186, 0x0186,
    0x0190, 0x0190,
    0x0195, 0x0195,
    0x01F6, 0x01F6,
    0x0254, 0x0254,
    0x025B, 0x025B,
    0x0398, 0x0398,
    0x039E, 0x039E,
    0x03A8, 0x03A8,
    0x03B8, 0x03B8,
    0x03BE, 0x03BE,
    0x03C8, 0x03C8,
},
character_category = false,
}
 
m["Roka"] = process_ranges{
"Rokadong Curakjang",
nil,
"abugida",
ranges = {
0x0041, 0x005A,
0x0061, 0x007A,
0x0022, 0x0022,
0x0027, 0x0027,
0x002A, 0x002A,
0x002D, 0x002D,
0x005B, 0x005D,
0x007B, 0x007B,
0x007D, 0x007D
},
character_category = false,
}
m["Rsnold"] = process_ranges{
"Old Raysian",
nil,
"alphabet",
ranges = {
0x0041, 0x007A
},
character_category = false,
}
m["Pann"] = process_ranges{
"Pannonian",
nil,
"alphabet",
ranges = {
0x0041, 0x005A,
0x0061, 0x007A,
0x1D9C, 0x1D9D,
0x1D47, 0x1D4B,
0x02E1, 0x02E3,
0x0410, 0x044F,
0x0404, 0x0454,
0x04AE, 0x04B1,
0x0250, 0x0254,
0x0265, 0x0278,
0x028C, 0x028D,
0x0224, 0x0225,
0x01BA, 0x01BE,
0x019A, 0x01A3,
0x012D, 0x0131,
0xA793, 0xA794
},
character_category = false,
}
 
m["Teul"] = process_ranges{
"Teulgi",
nil,
"alphabet",
ranges = m["Latn"].ranges,
characters = m["Latn"].characters,
character_category = false,
}
 
m["Tugv"] = process_ranges{
"Tuġvut",
nil,
"alphabet",
ranges = m["Latn"].ranges,
characters = m["Latn"].characters,
character_category = false,
}
 
m["Ucrn"] = process_ranges{
"Draconian",
nil,
"alphabet",
ranges = {
    0x0020, 0x0021,
    0x0023, 0x0023,
    0x0027, 0x0027,
    0x0030, 0x0034,
    0x0040, 0x0040,
    0x0047, 0x0048,
    0x004B, 0x004B,
    0x0050, 0x0050,
    0x0058, 0x0058,
    0x0066, 0x0067,
    0x0069, 0x006A,
    0x006F, 0x0072,
    0x0079, 0x0079,
    0x010D, 0x010D,
    0x014B, 0x014B,
    0x01A9, 0x01A9,
    0x01E7, 0x01E7,
    0x0238, 0x0238,
    0x024F, 0x024F,
    0x1EFA, 0x1EFB,
};
character_category = false,
}
 
 
return require("Module:languages").finalizeData(m, "script")

Latest revision as of 15:47, 21 April 2026



--[=[
	When adding new scripts to this file, please don't forget to add
	style definitons for the script in [[MediaWiki:Gadget-LanguagesAndScripts.css]].
]=]
local concat = table.concat
local insert = table.insert
local ipairs = ipairs
local next = next
local remove = table.remove
local select = select
local sort = table.sort

-- Loaded on demand, as it may not be needed (depending on the data).
local function u(...)
	u = require("Module:string/char")
	return u(...)
end

-- We can't use mw.loadData() on [[Module:languages/chars]] because [[Module:languages/data]] itself is sometimes loaded
-- using mw.loadData(), and calling mw.loadData() on [[Module:languages/chars]] will insert metatables into the
-- character tables, which the second mw.loadData() will choke on.
local m_chars = require("Module:languages/chars")

local c = m_chars.chars
local p = m_chars.puaChars
local cs = m_chars.chars_substitutions

------------------------------------------------------------------------------------
--
-- Helper functions
--
------------------------------------------------------------------------------------

-- Note: a[2] > b[2] means opens are sorted before closes if otherwise equal.
local function sort_ranges(a, b)
	return a[1] < b[1] or a[1] == b[1] and a[2] > b[2]
end

-- Returns the union of two or more range tables.
local function union(...)
	local ranges = {}
	for i = 1, select("#", ...) do
		local argt = select(i, ...)
		for j, v in ipairs(argt) do
			insert(ranges, {v, j % 2 == 1 and 1 or -1})
		end
	end
	sort(ranges, sort_ranges)
	local ret, i = {}, 0
	for _, range in ipairs(ranges) do
		i = i + range[2]
		if i == 0 and range[2] == -1 then -- close
			insert(ret, range[1])
		elseif i == 1 and range[2] == 1 then -- open
			if ret[#ret] and range[1] <= ret[#ret] + 1 then
				remove(ret) -- merge adjacent ranges
			else
				insert(ret, range[1])
			end
		end
	end
	return ret
end

-- Adds the `characters` key, which is determined by a script's `ranges` table.
local function process_ranges(sc)
	local ranges, chars = sc.ranges, {}
	for i = 2, #ranges, 2 do
		if ranges[i] == ranges[i - 1] then
			insert(chars, u(ranges[i]))
		else
			insert(chars, u(ranges[i - 1]))
			if ranges[i] > ranges[i - 1] + 1 then
				insert(chars, "-")
			end
			insert(chars, u(ranges[i]))
		end
	end
	sc.characters = concat(chars)
	ranges.n = #ranges
	return sc
end

local function handle_normalization_fixes(fixes)
	local combiningClasses = fixes.combiningClasses
	if combiningClasses then
		local chars, i = {}, 0
		for char in next, combiningClasses do
			i = i + 1
			chars[i] = char
		end
		fixes.combiningClassCharacters = concat(chars)
	end
	return fixes
end

------------------------------------------------------------------------------------
--
-- Data
--
------------------------------------------------------------------------------------

local m = {}

m["Adlm"] = process_ranges{
	"Adlam",
	19606346,
	"alphabet",
	ranges = {
		0x061F, 0x061F,
		0x0640, 0x0640,
		0x1E900, 0x1E94B,
		0x1E950, 0x1E959,
		0x1E95E, 0x1E95F,
	},
	capitalized = true,
	direction = "rtl",
}

m["Afak"] = {
	"Afaka",
	382019,
	"syllabary",
	-- Not in Unicode
}

m["Aghb"] = process_ranges{
	"Caucasian Albanian",
	2495716,
	"alphabet",
	ranges = {
		0x10530, 0x10563,
		0x1056F, 0x1056F,
	},
}

m["Ahom"] = process_ranges{
	"Ahom",
	2839633,
	"abugida",
	ranges = {
		0x11700, 0x1171A,
		0x1171D, 0x1172B,
		0x11730, 0x11746,
	},
}

m["Arab"] = process_ranges{
	"Arabic",
	1828555,
	"abjad", -- more precisely, impure abjad
	varieties = {"Jawi", {"Nastaliq", "Nastaleeq"}},
	ranges = {
		0x0600, 0x06FF,
		0x0750, 0x077F,
		0x0870, 0x088E,
		0x0890, 0x0891,
		0x0897, 0x08E1,
		0x08E3, 0x08FF,
		0xFB50, 0xFBC2,
		0xFBD3, 0xFD8F,
		0xFD92, 0xFDC7,
		0xFDCF, 0xFDCF,
		0xFDF0, 0xFDFF,
		0xFE70, 0xFE74,
		0xFE76, 0xFEFC,
		0x102E0, 0x102FB,
		0x10E60, 0x10E7E,
		0x10EC2, 0x10EC4,
		0x10EFC, 0x10EFF,
		0x1EE00, 0x1EE03,
		0x1EE05, 0x1EE1F,
		0x1EE21, 0x1EE22,
		0x1EE24, 0x1EE24,
		0x1EE27, 0x1EE27,
		0x1EE29, 0x1EE32,
		0x1EE34, 0x1EE37,
		0x1EE39, 0x1EE39,
		0x1EE3B, 0x1EE3B,
		0x1EE42, 0x1EE42,
		0x1EE47, 0x1EE47,
		0x1EE49, 0x1EE49,
		0x1EE4B, 0x1EE4B,
		0x1EE4D, 0x1EE4F,
		0x1EE51, 0x1EE52,
		0x1EE54, 0x1EE54,
		0x1EE57, 0x1EE57,
		0x1EE59, 0x1EE59,
		0x1EE5B, 0x1EE5B,
		0x1EE5D, 0x1EE5D,
		0x1EE5F, 0x1EE5F,
		0x1EE61, 0x1EE62,
		0x1EE64, 0x1EE64,
		0x1EE67, 0x1EE6A,
		0x1EE6C, 0x1EE72,
		0x1EE74, 0x1EE77,
		0x1EE79, 0x1EE7C,
		0x1EE7E, 0x1EE7E,
		0x1EE80, 0x1EE89,
		0x1EE8B, 0x1EE9B,
		0x1EEA1, 0x1EEA3,
		0x1EEA5, 0x1EEA9,
		0x1EEAB, 0x1EEBB,
		0x1EEF0, 0x1EEF1,
	},
	direction = "rtl",
	normalizationFixes = handle_normalization_fixes{
		from = {"ٳ"},
		to = {"اٟ"}
	},
}

	m["fa-Arab"] = {
		"Arabic",
		744068,
		m["Arab"][3],
		ranges = m["Arab"].ranges,
		characters = m["Arab"].characters,
		other_names = {"Perso-Arabic"},
		direction = "rtl",
		parent = "Arab",
		normalizationFixes = m["Arab"].normalizationFixes,
	}

	m["kk-Arab"] = {
		"Arabic",
		90681452,
		m["Arab"][3],
		ranges = m["Arab"].ranges,
		characters = m["Arab"].characters,
		direction = "rtl",
		parent = "Arab",
		normalizationFixes = m["Arab"].normalizationFixes,
	}
	
	m["ks-Arab"] = m["fa-Arab"]
	m["ku-Arab"] = m["fa-Arab"]
	m["ms-Arab"] = m["kk-Arab"]
	m["mzn-Arab"] = m["fa-Arab"]
	m["ota-Arab"] = m["fa-Arab"]
	
	m["pa-Arab"] = {
		"Shahmukhi",
		133800,
		m["Arab"][3],
		ranges = m["Arab"].ranges,
		characters = m["Arab"].characters,
		other_names = {"Arabic"},
		direction = "rtl",
		parent = "Arab",
		normalizationFixes = m["Arab"].normalizationFixes,
	}
	
	m["ps-Arab"] = m["fa-Arab"]
	m["sd-Arab"] = m["fa-Arab"]
	m["tt-Arab"] = m["fa-Arab"]
	m["ug-Arab"] = m["fa-Arab"]
	m["ur-Arab"] = m["fa-Arab"]

-- Aran (Nastaliq) is subsumed into Arab

m["Armi"] = process_ranges{
	"Imperial Aramaic",
	26978,
	"abjad",
	ranges = {
		0x10840, 0x10855,
		0x10857, 0x1085F,
	},
	direction = "rtl",
}

m["Armn"] = process_ranges{
	"Armenian",
	11932,
	"alphabet",
	ranges = {
		0x0531, 0x0556,
		0x0559, 0x058A,
		0x058D, 0x058F,
		0xFB13, 0xFB17,
	},
	capitalized = true,
	translit = "Armn-translit",
}

m["Avst"] = process_ranges{
	"Avestan",
	790681,
	"alphabet",
	ranges = {
		0x10B00, 0x10B35,
		0x10B39, 0x10B3F,
	},
	direction = "rtl",
}

	m["pal-Avst"] = {
		"Pazend",
		4925073,
		m["Avst"][3],
		ranges = m["Avst"].ranges,
		characters = m["Avst"].characters,
		direction = "rtl",
		parent = "Avst",
	}

m["Bali"] = process_ranges{
	"Balinese",
	804984,
	"abugida",
	ranges = {
		0x1B00, 0x1B4C,
		0x1B4E, 0x1B7F,
	},
}

m["Bamu"] = process_ranges{
	"Bamum",
	806024,
	"syllabary",
	ranges = {
		0xA6A0, 0xA6F7,
		0x16800, 0x16A38,
	},
}

m["Bass"] = process_ranges{
	"Bassa",
	810458,
	"alphabet",
	aliases = {"Bassa Vah", "Vah"},
	ranges = {
		0x16AD0, 0x16AED,
		0x16AF0, 0x16AF5,
	},
}

m["Batk"] = process_ranges{
	"Batak",
	51592,
	"abugida",
	ranges = {
		0x1BC0, 0x1BF3,
		0x1BFC, 0x1BFF,
	},
}

m["Beng"] = process_ranges{
	"Bengali",
	756802,
	"abugida",
	ranges = {
		0x0951, 0x0952,
		0x0964, 0x0965,
		0x0980, 0x0983,
		0x0985, 0x098C,
		0x098F, 0x0990,
		0x0993, 0x09A8,
		0x09AA, 0x09B0,
		0x09B2, 0x09B2,
		0x09B6, 0x09B9,
		0x09BC, 0x09C4,
		0x09C7, 0x09C8,
		0x09CB, 0x09CE,
		0x09D7, 0x09D7,
		0x09DC, 0x09DD,
		0x09DF, 0x09E3,
		0x09E6, 0x09EF,
		0x09F2, 0x09FE,
		0x1CD0, 0x1CD0,
		0x1CD2, 0x1CD2,
		0x1CD5, 0x1CD6,
		0x1CD8, 0x1CD8,
		0x1CE1, 0x1CE1,
		0x1CEA, 0x1CEA,
		0x1CED, 0x1CED,
		0x1CF2, 0x1CF2,
		0x1CF5, 0x1CF7,
		0xA8F1, 0xA8F1,
	},
	normalizationFixes = handle_normalization_fixes{
		from = {"অা", "ঋৃ", "ঌৢ"},
		to = {"আ", "ৠ", "ৡ"}
	},
}

	m["as-Beng"] = process_ranges{
		"Assamese",
		191272,
		m["Beng"][3],
		other_names = {"Eastern Nagari"},
		ranges = {
			0x0951, 0x0952,
			0x0964, 0x0965,
			0x0980, 0x0983,
			0x0985, 0x098C,
			0x098F, 0x0990,
			0x0993, 0x09A8,
			0x09AA, 0x09AF,
			0x09B2, 0x09B2,
			0x09B6, 0x09B9,
			0x09BC, 0x09C4,
			0x09C7, 0x09C8,
			0x09CB, 0x09CE,
			0x09D7, 0x09D7,
			0x09DC, 0x09DD,
			0x09DF, 0x09E3,
			0x09E6, 0x09FE,
			0x1CD0, 0x1CD0,
			0x1CD2, 0x1CD2,
			0x1CD5, 0x1CD6,
			0x1CD8, 0x1CD8,
			0x1CE1, 0x1CE1,
			0x1CEA, 0x1CEA,
			0x1CED, 0x1CED,
			0x1CF2, 0x1CF2,
			0x1CF5, 0x1CF7,
			0xA8F1, 0xA8F1,
		},
		normalizationFixes = m["Beng"].normalizationFixes,
	}

m["Bhks"] = process_ranges{
	"Bhaiksuki",
	17017839,
	"abugida",
	ranges = {
		0x11C00, 0x11C08,
		0x11C0A, 0x11C36,
		0x11C38, 0x11C45,
		0x11C50, 0x11C6C,
	},
}

m["Blis"] = {
	"Blissymbolic",
	609817,
	"logography",
	aliases = {"Blissymbols"},
	-- Not in Unicode
}

m["Bopo"] = process_ranges{
	"Zhuyin",
	198269,
	"semisyllabary",
	aliases = {"Zhuyin Fuhao", "Bopomofo"},
	ranges = {
		0x02EA, 0x02EB,
		0x3001, 0x3003,
		0x3008, 0x3011,
		0x3013, 0x301F,
		0x302A, 0x302D,
		0x3030, 0x3030,
		0x3037, 0x3037,
		0x30FB, 0x30FB,
		0x3105, 0x312F,
		0x31A0, 0x31BF,
		0xFE45, 0xFE46,
		0xFF61, 0xFF65,
	},
}

m["Brah"] = process_ranges{
	"Brahmi",
	185083,
	"abugida",
	ranges = {
		0x11000, 0x1104D,
		0x11052, 0x11075,
		0x1107F, 0x1107F,
	},
	normalizationFixes = handle_normalization_fixes{
		from = {"𑀅𑀸", "𑀋𑀾", "𑀏𑁂"},
		to = {"𑀆", "𑀌", "𑀐"}
	},
	translit = "Brah-translit",
}

m["Brai"] = process_ranges{
	"Braille",
	79894,
	"alphabet",
	ranges = {
		0x2800, 0x28FF,
	},
}

m["Bugi"] = process_ranges{
	"Lontara",
	1074947,
	"abugida",
	aliases = {"Buginese"},
	ranges = {
		0x1A00, 0x1A1B,
		0x1A1E, 0x1A1F,
		0xA9CF, 0xA9CF,
	},
}

m["Buhd"] = process_ranges{
	"Buhid",
	1002969,
	"abugida",
	ranges = {
		0x1735, 0x1736,
		0x1740, 0x1751,
		0x1752, 0x1753,
	},
}

m["Cakm"] = process_ranges{
	"Chakma",
	1059328,
	"abugida",
	ranges = {
		0x09E6, 0x09EF,
		0x1040, 0x1049,
		0x11100, 0x11134,
		0x11136, 0x11147,
	},
}

m["Cans"] = process_ranges{
	"Canadian syllabic",
	2479183,
	"abugida",
	ranges = {
		0x1400, 0x167F,
		0x18B0, 0x18F5,
		0x11AB0, 0x11ABF,
	},
}

m["Cari"] = process_ranges{
	"Carian",
	1094567,
	"alphabet",
	ranges = {
		0x102A0, 0x102D0,
	},
}

m["Cham"] = process_ranges{
	"Cham",
	1060381,
	"abugida",
	ranges = {
		0xAA00, 0xAA36,
		0xAA40, 0xAA4D,
		0xAA50, 0xAA59,
		0xAA5C, 0xAA5F,
	},
}

m["Cher"] = process_ranges{
	"Cherokee",
	26549,
	"syllabary",
	ranges = {
		0x13A0, 0x13F5,
		0x13F8, 0x13FD,
		0xAB70, 0xABBF,
	},
}

m["Chis"] = {
	"Chisoi",
	123173777,
	"abugida",
	-- Not in Unicode
}

m["Chrs"] = process_ranges{
	"Khwarezmian",
	72386710,
	"abjad",
	aliases = {"Chorasmian"},
	ranges = {
		0x10FB0, 0x10FCB,
	},
	direction = "rtl",
}

m["Copt"] = process_ranges{
	"Coptic",
	321083,
	"alphabet",
	ranges = {
		0x03E2, 0x03EF,
		0x2C80, 0x2CF3,
		0x2CF9, 0x2CFF,
		0x102E0, 0x102FB,
	},
	capitalized = true,
}

m["Cpmn"] = process_ranges{
	"Cypro-Minoan",
	1751985,
	"syllabary",
	aliases = {"Cypro Minoan"},
	ranges = {
		0x10100, 0x10101,
		0x12F90, 0x12FF2,
	},
}

m["Cprt"] = process_ranges{
	"Cypriot",
	1757689,
	"syllabary",
	ranges = {
		0x10100, 0x10102,
		0x10107, 0x10133,
		0x10137, 0x1013F,
		0x10800, 0x10805,
		0x10808, 0x10808,
		0x1080A, 0x10835,
		0x10837, 0x10838,
		0x1083C, 0x1083C,
		0x1083F, 0x1083F,
	},
	direction = "rtl",
}

m["Cyrl"] = process_ranges{
	"Cyrillic",
	8209,
	"alphabet",
	ranges = {
		0x0400, 0x052F,
		0x1C80, 0x1C8A,
		0x1D2B, 0x1D2B,
		0x1D78, 0x1D78,
		0x1DF8, 0x1DF8,
		0x2DE0, 0x2DFF,
		0x2E43, 0x2E43,
		0xA640, 0xA69F,
		0xFE2E, 0xFE2F,
		0x1E030, 0x1E06D,
		0x1E08F, 0x1E08F,
	},
	capitalized = true,
}

m["Cyrs"] = {
	"Old Cyrillic",
	442244,
	m["Cyrl"][3],
	aliases = {"Early Cyrillic"},
	ranges = m["Cyrl"].ranges,
	characters = m["Cyrl"].characters,
	capitalized = m["Cyrl"].capitalized,
	wikipedia_article = "Early Cyrillic alphabet",
	normalizationFixes = handle_normalization_fixes{
		from = {"Ѹ", "ѹ"},
		to = {"Ꙋ", "ꙋ"}
	},
	strip_diacritics = {remove_diacritics = cs.Cyrs_remove_diacritics},
	sort_key = {
		remove_diacritics = cs.Cyrs_remove_diacritics,
		from = {
			"ї", "оу", -- 2 chars
			"[ґꙣєѕꙃꙅꙁіꙇђꙉѻꙩꙫꙭꙮꚙꚛꙋѡѿꙍѽꙑѣꙗѥꙕѧꙙѩꙝꙛѫѭѯѱѳѵҁ]"
		},
		to = {
			"и" .. p[1], "у", {
				["ґ"] = "г" .. p[1], ["ꙣ"] = "д" .. p[1], ["є"] = "е", ["ѕ"] = "ж" .. p[1], ["ꙃ"] = "ж" .. p[1],
				["ꙅ"] = "ж" .. p[1], ["ꙁ"] = "з", ["і"] = "и" .. p[1], ["ꙇ"] = "и" .. p[1], ["ђ"] = "и" .. p[2],
				["ꙉ"] = "и" .. p[2], ["ѻ"] = "о", ["ꙩ"] = "о", ["ꙫ"] = "о", ["ꙭ"] = "о",
				["ꙮ"] = "о", ["ꚙ"] = "о", ["ꚛ"] = "о", ["ꙋ"] = "у", ["ѡ"] = "х" .. p[1],
				["ѿ"] = "х" .. p[1], ["ꙍ"] = "х" .. p[1], ["ѽ"] = "х" .. p[1], ["ꙑ"] = "ы", ["ѣ"] = "ь" .. p[1],
				["ꙗ"] = "ь" .. p[2], ["ѥ"] = "ь" .. p[3], ["ꙕ"] = "ю", ["ѧ"] = "я", ["ꙙ"] = "я",
				["ѩ"] = "я" .. p[1], ["ꙝ"] = "я" .. p[1], ["ꙛ"] = "я" .. p[2], ["ѫ"] = "я" .. p[3], ["ѭ"] = "я" .. p[4],
				["ѯ"] = "я" .. p[5], ["ѱ"] = "я" .. p[6], ["ѳ"] = "я" .. p[7], ["ѵ"] = "я" .. p[8], ["ҁ"] = "я" .. p[9],
			}
		},
	}
}

m["Deva"] = process_ranges{
	"Devanagari",
	38592,
	"abugida",
	ranges = {
		0x0900, 0x097F,
		0x1CD0, 0x1CF6,
		0x1CF8, 0x1CF9,
		0x20F0, 0x20F0,
		0xA830, 0xA839,
		0xA8E0, 0xA8FF,
		0x11B00, 0x11B09,
	},
	normalizationFixes = handle_normalization_fixes{
		from = {"ॆॆ", "ेे", "ाॅ", "ाॆ", "ाꣿ", "ॊॆ", "ाे", "ाै", "ोे", "ाऺ", "ॖॖ", "अॅ", "अॆ", "अा", "एॅ", "एॆ", "एे", "एꣿ", "ऎॆ", "अॉ", "आॅ", "अॊ", "आॆ", "अो", "आे", "अौ", "आै", "ओे", "अऺ", "अऻ", "आऺ", "अाꣿ", "आꣿ", "ऒॆ", "अॖ", "अॗ", "ॶॖ", "्‍?ा"},
		to = {"ꣿ", "ै", "ॉ", "ॊ", "ॏ", "ॏ", "ो", "ौ", "ौ", "ऻ", "ॗ", "ॲ", "ऄ", "आ", "ऍ", "ऎ", "ऐ", "ꣾ", "ꣾ", "ऑ", "ऑ", "ऒ", "ऒ", "ओ", "ओ", "औ", "औ", "औ", "ॳ", "ॴ", "ॴ", "ॵ", "ॵ", "ॵ", "ॶ", "ॷ", "ॷ"}
	},
}

m["Diak"] = process_ranges{
	"Dhives Akuru",
	3307073,
	"abugida",
	aliases = {"Dhivehi Akuru", "Dives Akuru", "Divehi Akuru"},
	ranges = {
		0x11900, 0x11906,
		0x11909, 0x11909,
		0x1190C, 0x11913,
		0x11915, 0x11916,
		0x11918, 0x11935,
		0x11937, 0x11938,
		0x1193B, 0x11946,
		0x11950, 0x11959,
	},
}

m["Dogr"] = process_ranges{
	"Dogra",
	72402987,
	"abugida",
	ranges = {
		0x0964, 0x096F,
		0xA830, 0xA839,
		0x11800, 0x1183B,
	},
}

m["Dsrt"] = process_ranges{
	"Deseret",
	1200582,
	"alphabet",
	ranges = {
		0x10400, 0x1044F,
	},
	capitalized = true,
}

m["Dupl"] = process_ranges{
	"Duployan",
	5316025,
	"alphabet",
	ranges = {
		0x1BC00, 0x1BC6A,
		0x1BC70, 0x1BC7C,
		0x1BC80, 0x1BC88,
		0x1BC90, 0x1BC99,
		0x1BC9C, 0x1BCA3,
	},
}

m["Egyd"] = {
	"Demotic",
	188519,
	"abjad, logography",
	-- Not in Unicode
}

m["Egyh"] = {
	"Hieratic",
	208111,
	"abjad, logography",
	-- Unified with Egyptian hieroglyphic in Unicode
}

m["Egyp"] = process_ranges{
	"Egyptian hieroglyphic",
	132659,
	"abjad, logography",
	ranges = {
		0x13000, 0x13455,
		0x13460, 0x143FA,
	},
	varieties = {"Hieratic"},
	wikipedia_article = "Egyptian hieroglyphs",
	normalizationFixes = handle_normalization_fixes{
		from = {"𓃁", "𓆖"},
		to = {"𓃀𓐶𓂝", "𓆓𓐳𓐷𓏏𓐰𓇿𓐸"}
	},
}

m["Elba"] = process_ranges{
	"Elbasan",
	1036714,
	"alphabet",
	ranges = {
		0x10500, 0x10527,
	},
}

m["Elym"] = process_ranges{
	"Elymaic",
	60744423,
	"abjad",
	ranges = {
		0x10FE0, 0x10FF6,
	},
	direction = "rtl",
}

m["Ethi"] = process_ranges{
	"Ethiopic",
	257634,
	"abugida",
	aliases = {"Ge'ez", "Geʽez"},
	ranges = {
		0x1200, 0x1248,
		0x124A, 0x124D,
		0x1250, 0x1256,
		0x1258, 0x1258,
		0x125A, 0x125D,
		0x1260, 0x1288,
		0x128A, 0x128D,
		0x1290, 0x12B0,
		0x12B2, 0x12B5,
		0x12B8, 0x12BE,
		0x12C0, 0x12C0,
		0x12C2, 0x12C5,
		0x12C8, 0x12D6,
		0x12D8, 0x1310,
		0x1312, 0x1315,
		0x1318, 0x135A,
		0x135D, 0x137C,
		0x1380, 0x1399,
		0x2D80, 0x2D96,
		0x2DA0, 0x2DA6,
		0x2DA8, 0x2DAE,
		0x2DB0, 0x2DB6,
		0x2DB8, 0x2DBE,
		0x2DC0, 0x2DC6,
		0x2DC8, 0x2DCE,
		0x2DD0, 0x2DD6,
		0x2DD8, 0x2DDE,
		0xAB01, 0xAB06,
		0xAB09, 0xAB0E,
		0xAB11, 0xAB16,
		0xAB20, 0xAB26,
		0xAB28, 0xAB2E,
		0x1E7E0, 0x1E7E6,
		0x1E7E8, 0x1E7EB,
		0x1E7ED, 0x1E7EE,
		0x1E7F0, 0x1E7FE,
	},
	sort_key = "Ethi-sortkey",
	strip_diacritics = {remove_diacritics = u(0x135D) .. u(0x135E) .. u(0x135F)} 
}

m["Gara"] = process_ranges{
	"Garay",
	3095302,
	"alphabet",
	capitalized = true,
	direction = "rtl",
	ranges = {
		0x060C, 0x060C,
		0x061B, 0x061B,
		0x061F, 0x061F,
		0x10D40, 0x10D65,
		0x10D69, 0x10D85,
		0x10D8E, 0x10D8F,
	},
}

m["Geok"] = process_ranges{
	"Khutsuri",
	1090055,
	"alphabet",
	ranges = { -- Ⴀ-Ⴭ is Asomtavruli, ⴀ-ⴭ is Nuskhuri
		0x10A0, 0x10C5,
		0x10C7, 0x10C7,
		0x10CD, 0x10CD,
		0x10FB, 0x10FB,
		0x2D00, 0x2D25,
		0x2D27, 0x2D27,
		0x2D2D, 0x2D2D,
	},
	varieties = {"Nuskhuri", "Asomtavruli"},
	capitalized = true,
	translit = "Geok-translit",
}

m["Geor"] = process_ranges{
	"Georgian",
	3317411,
	"alphabet",
	ranges = { -- ა-ჿ is lowercase Mkhedruli; Ა-Ჿ is uppercase Mkhedruli (Mtavruli)
		0x0589, 0x0589,
		0x10D0, 0x10FF,
		0x1C90, 0x1CBA,
		0x1CBD, 0x1CBF,
	},
	varieties = {"Mkhedruli", "Mtavruli"},
	capitalized = true,
	translit = "Geor-translit",
}

m["Glag"] = process_ranges{
	"Glagolitic",
	145625,
	"alphabet",
	ranges = {
		0x0484, 0x0484,
		0x0487, 0x0487,
		0x0589, 0x0589,
		0x10FB, 0x10FB,
		0x2C00, 0x2C5F,
		0x2E43, 0x2E43,
		0xA66F, 0xA66F,
		0x1E000, 0x1E006,
		0x1E008, 0x1E018,
		0x1E01B, 0x1E021,
		0x1E023, 0x1E024,
		0x1E026, 0x1E02A,
	},
	capitalized = true,
}

m["Gong"] = process_ranges{
	"Gunjala Gondi",
	18125340,
	"abugida",
	ranges = {
		0x0964, 0x0965,
		0x11D60, 0x11D65,
		0x11D67, 0x11D68,
		0x11D6A, 0x11D8E,
		0x11D90, 0x11D91,
		0x11D93, 0x11D98,
		0x11DA0, 0x11DA9,
	},
}

m["Gonm"] = process_ranges{
	"Masaram Gondi",
	16977603,
	"abugida",
	ranges = {
		0x0964, 0x0965,
		0x11D00, 0x11D06,
		0x11D08, 0x11D09,
		0x11D0B, 0x11D36,
		0x11D3A, 0x11D3A,
		0x11D3C, 0x11D3D,
		0x11D3F, 0x11D47,
		0x11D50, 0x11D59,
	},
}

m["Goth"] = process_ranges{
	"Gothic",
	467784,
	"alphabet",
	ranges = {
		0x10330, 0x1034A,
	},
	wikipedia_article = "Gothic alphabet",
}

m["Gran"] = process_ranges{
	"Grantha",
	1119274,
	"abugida",
	ranges = {
		0x0951, 0x0952,
		0x0964, 0x0965,
		0x0BE6, 0x0BF3,
		0x1CD0, 0x1CD0,
		0x1CD2, 0x1CD3,
		0x1CF2, 0x1CF4,
		0x1CF8, 0x1CF9,
		0x20F0, 0x20F0,
		0x11300, 0x11303,
		0x11305, 0x1130C,
		0x1130F, 0x11310,
		0x11313, 0x11328,
		0x1132A, 0x11330,
		0x11332, 0x11333,
		0x11335, 0x11339,
		0x1133B, 0x11344,
		0x11347, 0x11348,
		0x1134B, 0x1134D,
		0x11350, 0x11350,
		0x11357, 0x11357,
		0x1135D, 0x11363,
		0x11366, 0x1136C,
		0x11370, 0x11374,
		0x11FD0, 0x11FD1,
		0x11FD3, 0x11FD3,
	},
}

m["Grek"] = process_ranges{
	"Greek",
	8216,
	"alphabet",
	ranges = {
		0x0341, 0x0341,
		0x0374, 0x0375,
		0x037E, 0x037E,
		0x0384, 0x038A,
		0x038C, 0x038C,
		0x038E, 0x03A1,
		0x03A3, 0x03D7,
		0x03DA, 0x03DB,
		0x03DE, 0x03E1,
		0x03F0, 0x03F1,
		0x03F4, 0x03F4,
		0x03FC, 0x03FC,
		0x1D26, 0x1D2A,
		0x1D5D, 0x1D61,
		0x1D66, 0x1D6A,
		0x1DBF, 0x1DBF,
		0x2126, 0x2127,
		0x2129, 0x2129,
		0x213C, 0x2140,
		0xAB65, 0xAB65,
		0x10140, 0x1018E,
		0x101A0, 0x101A0,
		0x1D200, 0x1D245,
	},
	capitalized = true,
	display_text = cs["Grek-displaytext"],
	strip_diacritics = cs["Grek-stripdiacritics"],
	sort_key = {
		remove_diacritics = "'ʼ;·`¨´῀" .. c.grave .. c.acute .. c.diaer .. c.caron .. c.turnedcommaabove .. c.commaabove .. c.revcommaabove .. c.macron .. c.breve .. c.diaerbelow .. c.brevebelow .. c.perispomeni .. c.ypogegrammeni .. c.RSQuo .. c.prime .. c.keraia .. c.lowerkeraia .. c.tonos .. c.coronis .. c.psili .. c.dasia,
		from = {"ϝ", "ͷ", "ϛ", "ͱ", "ͺ", "ϳ", "ϻ", "[ϟϙ]", "[ςϲ]", "ͳ"},
		to = {"ε" .. p[1], "ε" .. p[2], "ε" .. p[3], "ζ" .. p[1], "ι", "ι" .. p[1], "π" .. p[1], "π" .. p[2], "σ", "ϡ"},
	},
}

	m["Polyt"] = process_ranges{
		"Greek",
		1475332,
		m["Grek"][3],
		ranges = union(m["Grek"].ranges, {
			0x0340, 0x0340,
			0x0342, 0x0345,
			0x0370, 0x0373,
			0x0376, 0x0377,
			0x037A, 0x037D,
			0x037F, 0x037F,
			0x03D8, 0x03D9,
			0x03DC, 0x03DD,
			0x03F2, 0x03F3,
			0x03F5, 0x03FB,
			0x03FD, 0x03FF,
			0x1F00, 0x1F15,
			0x1F18, 0x1F1D,
			0x1F20, 0x1F45,
			0x1F48, 0x1F4D,
			0x1F50, 0x1F57,
			0x1F59, 0x1F59,
			0x1F5B, 0x1F5B,
			0x1F5D, 0x1F5D,
			0x1F5F, 0x1F7D,
			0x1F80, 0x1FB4,
			0x1FB6, 0x1FC4,
			0x1FC6, 0x1FD3,
			0x1FD6, 0x1FDB,
			0x1FDD, 0x1FEF,
			0x1FF2, 0x1FF4,
			0x1FF6, 0x1FFE,
		}),
		ietf_subtag = "Grek",
		capitalized = m["Grek"].capitalized,
		parent = "Grek",
		display_text = m["Grek"].display_text,
		strip_diacritics = "Polyt-stripdiacritics",
		sort_key = m["Grek"].sort_key,
		translit = "grc-translit",
	}

m["Gujr"] = process_ranges{
	"Gujarati",
	733944,
	"abugida",
	ranges = {
		0x0951, 0x0952,
		0x0964, 0x0965,
		0x0A81, 0x0A83,
		0x0A85, 0x0A8D,
		0x0A8F, 0x0A91,
		0x0A93, 0x0AA8,
		0x0AAA, 0x0AB0,
		0x0AB2, 0x0AB3,
		0x0AB5, 0x0AB9,
		0x0ABC, 0x0AC5,
		0x0AC7, 0x0AC9,
		0x0ACB, 0x0ACD,
		0x0AD0, 0x0AD0,
		0x0AE0, 0x0AE3,
		0x0AE6, 0x0AF1,
		0x0AF9, 0x0AFF,
		0xA830, 0xA839,
	},
	normalizationFixes = handle_normalization_fixes{
		from = {"ઓ", "અાૈ", "અા", "અૅ", "અે", "અૈ", "અૉ", "અો", "અૌ", "આૅ", "આૈ", "ૅા"},
		to = {"અાૅ", "ઔ", "આ", "ઍ", "એ", "ઐ", "ઑ", "ઓ", "ઔ", "ઓ", "ઔ", "ૉ"}
	},
}

m["Gukh"] = process_ranges{
	"Khema",
	110064239,
	"abugida",
	aliases = {"Gurung Khema", "Khema Phri", "Khema Lipi"},
	ranges = {
		0x0965, 0x0965,
		0x16100, 0x16139,
	},
}

m["Guru"] = process_ranges{
	"Gurmukhi",
	689894,
	"abugida",
	ranges = {
		0x0951, 0x0952,
		0x0964, 0x0965,
		0x0A01, 0x0A03,
		0x0A05, 0x0A0A,
		0x0A0F, 0x0A10,
		0x0A13, 0x0A28,
		0x0A2A, 0x0A30,
		0x0A32, 0x0A33,
		0x0A35, 0x0A36,
		0x0A38, 0x0A39,
		0x0A3C, 0x0A3C,
		0x0A3E, 0x0A42,
		0x0A47, 0x0A48,
		0x0A4B, 0x0A4D,
		0x0A51, 0x0A51,
		0x0A59, 0x0A5C,
		0x0A5E, 0x0A5E,
		0x0A66, 0x0A76,
		0xA830, 0xA839,
	},
	normalizationFixes = handle_normalization_fixes{
		from = {"ਅਾ", "ਅੈ", "ਅੌ", "ੲਿ", "ੲੀ", "ੲੇ", "ੳੁ", "ੳੂ", "ੳੋ"},
		to = {"ਆ", "ਐ", "ਔ", "ਇ", "ਈ", "ਏ", "ਉ", "ਊ", "ਓ"}
	},
}

m["Hang"] = process_ranges{
	"Hangul",
	8222,
	"syllabary",
	aliases = {"Hangeul"},
	ranges = {
		0x1100, 0x11FF,
		0x3001, 0x3003,
		0x3008, 0x3011,
		0x3013, 0x301F,
		0x302E, 0x3030,
		0x3037, 0x3037,
		0x30FB, 0x30FB,
		0x3131, 0x318E,
		0x3200, 0x321E,
		0x3260, 0x327E,
		0xA960, 0xA97C,
		0xAC00, 0xD7A3,
		0xD7B0, 0xD7C6,
		0xD7CB, 0xD7FB,
		0xFE45, 0xFE46,
		0xFF61, 0xFF65,
		0xFFA0, 0xFFBE,
		0xFFC2, 0xFFC7,
		0xFFCA, 0xFFCF,
		0xFFD2, 0xFFD7,
		0xFFDA, 0xFFDC,
	},
}

m["Hani"] = process_ranges{
	"Han",
	8201,
	"logography",
	ranges = {
		0x2E80, 0x2E99,
		0x2E9B, 0x2EF3,
		0x2F00, 0x2FD5,
		0x2FF0, 0x2FFF,
		0x3001, 0x3003,
		0x3005, 0x3011,
		0x3013, 0x301F,
		0x3021, 0x302D,
		0x3030, 0x3030,
		0x3037, 0x303F,
		0x3190, 0x319F,
		0x31C0, 0x31E5,
		0x31EF, 0x31EF,
		0x3220, 0x3247,
		0x3280, 0x32B0,
		0x32C0, 0x32CB,
		0x30FB, 0x30FB,
		0x32FF, 0x32FF,
		0x3358, 0x3370,
		0x337B, 0x337F,
		0x33E0, 0x33FE,
		0x3400, 0x4DBF,
		0x4E00, 0x9FFF,
		0xA700, 0xA707,
		0xF900, 0xFA6D,
		0xFA70, 0xFAD9,
		0xFE45, 0xFE46,
		0xFF61, 0xFF65,
		0x16FE2, 0x16FE3,
		0x16FF0, 0x16FF1,
		0x1D360, 0x1D371,
		0x1F250, 0x1F251,
		0x20000, 0x2A6DF,
		0x2A700, 0x2B739,
		0x2B740, 0x2B81D,
		0x2B820, 0x2CEA1,
		0x2CEB0, 0x2EBE0,
		0x2EBF0, 0x2EE5D,
		0x2F800, 0x2FA1D,
		0x30000, 0x3134A,
		0x31350, 0x323AF,
	},
	varieties = {"Hanzi", "Kanji", "Hanja", "Chu Nom"},
	spaces = false,
}

	m["Hans"] = {
		"Simplified Han",
		185614,
		m["Hani"][3],
		ranges = m["Hani"].ranges,
		characters = m["Hani"].characters,
		spaces = m["Hani"].spaces,
		parent = "Hani",
	}

	m["Hant"] = {
		"Traditional Han",
		178528,
		m["Hani"][3],
		ranges = m["Hani"].ranges,
		characters = m["Hani"].characters,
		spaces = m["Hani"].spaces,
		parent = "Hani",
	}

m["Hano"] = process_ranges{
	"Hanunoo",
	1584045,
	"abugida",
	aliases = {"Hanunó'o", "Hanuno'o"},
	ranges = {
		0x1720, 0x1736,
	},
}

m["Hatr"] = process_ranges{
	"Hatran",
	20813038,
	"abjad",
	ranges = {
		0x108E0, 0x108F2,
		0x108F4, 0x108F5,
		0x108FB, 0x108FF,
	},
	direction = "rtl",
}

m["Hebr"] = process_ranges{
	"Hebrew",
	33513,
	"abjad", -- more precisely, impure abjad
	ranges = {
		0x0591, 0x05C7,
		0x05D0, 0x05EA,
		0x05EF, 0x05F4,
		0x2135, 0x2138,
		0xFB1D, 0xFB36,
		0xFB38, 0xFB3C,
		0xFB3E, 0xFB3E,
		0xFB40, 0xFB41,
		0xFB43, 0xFB44,
		0xFB46, 0xFB4F,
	},
	direction = "rtl",
	display_text = "Hebr-common",
	sort_key = "Hebr-common",
	strip_diacritics = "Hebr-common",
}

m["Hira"] = process_ranges{
	"Hiragana",
	48332,
	"syllabary",
	ranges = {
		0x3001, 0x3003,
		0x3008, 0x3011,
		0x3013, 0x301F,
		0x3030, 0x3035,
		0x3037, 0x3037,
		0x303C, 0x303D,
		0x3041, 0x3096,
		0x3099, 0x30A0,
		0x30FB, 0x30FC,
		0xFE45, 0xFE46,
		0xFF61, 0xFF65,
		0xFF70, 0xFF70,
		0xFF9E, 0xFF9F,
		0x1B001, 0x1B11F,
		0x1B132, 0x1B132,
		0x1B150, 0x1B152,
		0x1F200, 0x1F200,
	},
	varieties = {"Hentaigana"},
	spaces = false,
}

m["Hluw"] = process_ranges{
	"Anatolian hieroglyphic",
	521323,
	"logography, syllabary",
	ranges = {
		0x14400, 0x14646,
	},
	wikipedia_article = "Anatolian hieroglyphs",
}

m["Hmng"] = process_ranges{
	"Pahawh Hmong",
	365954,
	"semisyllabary",
	aliases = {"Hmong"},
	ranges = {
		0x16B00, 0x16B45,
		0x16B50, 0x16B59,
		0x16B5B, 0x16B61,
		0x16B63, 0x16B77,
		0x16B7D, 0x16B8F,
	},
}

m["Hmnp"] = process_ranges{
	"Nyiakeng Puachue Hmong",
	33712499,
	"alphabet",
	ranges = {
		0x1E100, 0x1E12C,
		0x1E130, 0x1E13D,
		0x1E140, 0x1E149,
		0x1E14E, 0x1E14F,
	},
}

m["Hung"] = process_ranges{
	"Old Hungarian",
	446224,
	"alphabet",
	aliases = {"Hungarian runic"},
	ranges = {
		0x10C80, 0x10CB2,
		0x10CC0, 0x10CF2,
		0x10CFA, 0x10CFF,
	},
	capitalized = true,
	direction = "rtl",
}

m["Ibrnn"] = {
	"Northeastern Iberian",
	1113155,
	"semisyllabary",
	ietf_subtag = "Zzzz",
	-- Not in Unicode
}

m["Ibrns"] = {
	"Southeastern Iberian",
	2305351,
	"semisyllabary",
	ietf_subtag = "Zzzz",
	-- Not in Unicode
}

m["Image"] = {
	-- To be used to avoid any formatting or link processing
	"Image-rendered",
	478798,
	-- This should not have any characters listed
	ietf_subtag = "Zyyy",
	translit = false,
	character_category = false, -- none
}

m["Inds"] = {
	"Indus",
	601388,
	aliases = {"Harappan", "Indus Valley"},
}

m["Ipach"] = {
	"International Phonetic Alphabet",
	21204,
	aliases = {"IPA"},
	ietf_subtag = "Latn",
}

m["Ital"] = process_ranges{
	"Old Italic",
	4891256,
	"alphabet",
	ranges = {
		0x10300, 0x10323,
		0x1032D, 0x1032F,
	},
	translit = "Ital-translit",
}

m["Java"] = process_ranges{
	"Javanese",
	879704,
	"abugida",
	ranges = {
		0xA980, 0xA9CD,
		0xA9CF, 0xA9D9,
		0xA9DE, 0xA9DF,
	},
}

m["Jurc"] = {
	"Jurchen",
	912240,
	"logography",
	spaces = false,
}

m["Kali"] = process_ranges{
	"Kayah Li",
	4919239,
	"abugida",
	ranges = {
		0xA900, 0xA92F,
	},
}

m["Kana"] = process_ranges{
	"Katakana",
	82946,
	"syllabary",
	ranges = {
		0x3001, 0x3003,
		0x3008, 0x3011,
		0x3013, 0x301F,
		0x3030, 0x3035,
		0x3037, 0x3037,
		0x303C, 0x303D,
		0x3099, 0x309C,
		0x30A0, 0x30FF,
		0x31F0, 0x31FF,
		0x32D0, 0x32FE,
		0x3300, 0x3357,
		0xFE45, 0xFE46,
		0xFF61, 0xFF9F,
		0x1AFF0, 0x1AFF3,
		0x1AFF5, 0x1AFFB,
		0x1AFFD, 0x1AFFE,
		0x1B000, 0x1B000,
		0x1B120, 0x1B122,
		0x1B155, 0x1B155,
		0x1B164, 0x1B167,
	},
	spaces = false,
}

m["Kawi"] = process_ranges{
	"Kawi",
	975802,
	"abugida",
	ranges = {
		0x11F00, 0x11F10,
		0x11F12, 0x11F3A,
		0x11F3E, 0x11F5A,
	},
}

m["Khar"] = process_ranges{
	"Kharoshthi",
	1161266,
	"abugida",
	ranges = {
		0x10A00, 0x10A03,
		0x10A05, 0x10A06,
		0x10A0C, 0x10A13,
		0x10A15, 0x10A17,
		0x10A19, 0x10A35,
		0x10A38, 0x10A3A,
		0x10A3F, 0x10A48,
		0x10A50, 0x10A58,
	},
	direction = "rtl",
}

m["Khmr"] = process_ranges{
	"Khmer",
	1054190,
	"abugida",
	ranges = {
		0x1780, 0x17DD,
		0x17E0, 0x17E9,
		0x17F0, 0x17F9,
		0x19E0, 0x19FF,
	},
	spaces = false,
	normalizationFixes = handle_normalization_fixes{
		from = {"ឣ", "ឤ"},
		to = {"អ", "អា"}
	},
}

m["Khoj"] = process_ranges{
	"Khojki",
	1740656,
	"abugida",
	ranges = {
		0x0AE6, 0x0AEF,
		0xA830, 0xA839,
		0x11200, 0x11211,
		0x11213, 0x11241,
	},
	normalizationFixes = handle_normalization_fixes{
		from = {"𑈀𑈬𑈱", "𑈀𑈬", "𑈀𑈱", "𑈀𑈳", "𑈁𑈱", "𑈆𑈬", "𑈬𑈰", "𑈬𑈱", "𑉀𑈮"},
		to = {"𑈇", "𑈁", "𑈅", "𑈇", "𑈇", "𑈃", "𑈲", "𑈳", "𑈂"}
	},
}

m["Khomt"] = {
	"Khom Thai",
	13023788,
	"abugida",
	-- Not in Unicode
}

m["Kitl"] = {
	"Khitan large",
	6401797,
	"logography",
	spaces = false,
}

m["Kits"] = process_ranges{
	"Khitan small",
	6401800,
	"logography, syllabary",
	ranges = {
		0x16FE4, 0x16FE4,
		0x18B00, 0x18CD5,
		0x18CFF, 0x18CFF,
	},
	spaces = false,
}

m["Knda"] = process_ranges{
	"Kannada",
	839666,
	"abugida",
	ranges = {
		0x0951, 0x0952,
		0x0964, 0x0965,
		0x0C80, 0x0C8C,
		0x0C8E, 0x0C90,
		0x0C92, 0x0CA8,
		0x0CAA, 0x0CB3,
		0x0CB5, 0x0CB9,
		0x0CBC, 0x0CC4,
		0x0CC6, 0x0CC8,
		0x0CCA, 0x0CCD,
		0x0CD5, 0x0CD6,
		0x0CDD, 0x0CDE,
		0x0CE0, 0x0CE3,
		0x0CE6, 0x0CEF,
		0x0CF1, 0x0CF3,
		0x1CD0, 0x1CD0,
		0x1CD2, 0x1CD3,
		0x1CDA, 0x1CDA,
		0x1CF2, 0x1CF2,
		0x1CF4, 0x1CF4,
		0xA830, 0xA835,
	},
	normalizationFixes = handle_normalization_fixes{
		from = {"ಉಾ", "ಋಾ", "ಒೌ"},
		to = {"ಊ", "ೠ", "ಔ"}
	},
	translit = "kn-translit",
}

m["Kpel"] = {
	"Kpelle",
	1586299,
	"syllabary",
	-- Not in Unicode
}

m["Krai"] = process_ranges{
	"Kirat Rai",
	123173834,
	"abugida",
	aliases = {"Rai", "Khambu Rai", "Rai Barṇamālā", "Kirat Khambu Rai"},
	ranges = {
		0x16D40, 0x16D79,
	},
}

m["Kthi"] = process_ranges{
	"Kaithi",
	1253814,
	"abugida",
	ranges = {
		0x0966, 0x096F,
		0xA830, 0xA839,
		0x11080, 0x110C2,
		0x110CD, 0x110CD,
	},
}

m["Kulit"] = {
	"Kulitan",
	6443044,
	"abugida",
	-- Not in Unicode
}

m["Lana"] = process_ranges{
	"Tai Tham",
	1314503,
	"abugida",
	aliases = {"Tham", "Tua Mueang", "Lanna"},
	ranges = {
		0x1A20, 0x1A5E,
		0x1A60, 0x1A7C,
		0x1A7F, 0x1A89,
		0x1A90, 0x1A99,
		0x1AA0, 0x1AAD,
	},
	spaces = false,
}

m["Laoo"] = process_ranges{
	"Lao",
	1815229,
	"abugida",
	ranges = {
		0x0E81, 0x0E82,
		0x0E84, 0x0E84,
		0x0E86, 0x0E8A,
		0x0E8C, 0x0EA3,
		0x0EA5, 0x0EA5,
		0x0EA7, 0x0EBD,
		0x0EC0, 0x0EC4,
		0x0EC6, 0x0EC6,
		0x0EC8, 0x0ECE,
		0x0ED0, 0x0ED9,
		0x0EDC, 0x0EDF,
	},
	spaces = false,
}

m["Latn"] = process_ranges{
	"Latin",
	8229,
	"alphabet",
	aliases = {"Roman"},
	ranges = {
		0x0041, 0x005A,
		0x0061, 0x007A,
		0x00AA, 0x00AA,
		0x00BA, 0x00BA,
		0x00C0, 0x00D6,
		0x00D8, 0x00F6,
		0x00F8, 0x02B8,
		0x02C0, 0x02C1,
		0x02E0, 0x02E4,
		0x0363, 0x036F,
		0x0485, 0x0486,
		0x0951, 0x0952,
		0x10FB, 0x10FB,
		0x1D00, 0x1D25,
		0x1D2C, 0x1D5C,
		0x1D62, 0x1D65,
		0x1D6B, 0x1D77,
		0x1D79, 0x1DBE,
		0x1DF8, 0x1DF8,
		0x1E00, 0x1EFF,
		0x202F, 0x202F,
		0x2071, 0x2071,
		0x207F, 0x207F,
		0x2090, 0x209C,
		0x20F0, 0x20F0,
		0x2100, 0x2125,
		0x2128, 0x2128,
		0x212A, 0x2134,
		0x2139, 0x213B,
		0x2141, 0x214E,
		0x2160, 0x2188,
		0x2C60, 0x2C7F,
		0xA700, 0xA707,
		0xA722, 0xA787,
		0xA78B, 0xA7CD,
		0xA7D0, 0xA7D1,
		0xA7D3, 0xA7D3,
		0xA7D5, 0xA7DC,
		0xA7F2, 0xA7FF,
		0xA92E, 0xA92E,
		0xAB30, 0xAB5A,
		0xAB5C, 0xAB64,
		0xAB66, 0xAB69,
		0xFB00, 0xFB06,
		0xFF21, 0xFF3A,
		0xFF41, 0xFF5A,
		0x10780, 0x10785,
		0x10787, 0x107B0,
		0x107B2, 0x107BA,
		0x1DF00, 0x1DF1E,
		0x1DF25, 0x1DF2A,
	},
	varieties = {"Rumi", "Romaji", "Rōmaji", "Romaja"},
	capitalized = true,
	translit = false,
}

	m["Latf"] = {
		"Fraktur",
		148443,
		m["Latn"][3],
		ranges = m["Latn"].ranges,
		characters = m["Latn"].characters,
		other_names = {"Blackletter"}, -- Blackletter is actually the parent "script"
		capitalized = m["Latn"].capitalized,
		translit = m["Latn"].translit,
		parent = "Latn",
	}
	
	m["Latg"] = {
		"Gaelic",
		1432616,
		m["Latn"][3],
		ranges = m["Latn"].ranges,
		characters = m["Latn"].characters,
		other_names = {"Irish"},
		capitalized = m["Latn"].capitalized,
		translit = m["Latn"].translit,
		parent = "Latn",
	}
	
	m["pjt-Latn"] = {
		"Latin",
		nil,
		m["Latn"][3],
		ranges = m["Latn"].ranges,
		characters = m["Latn"].characters,
		capitalized = m["Latn"].capitalized,
		translit = m["Latn"].translit,
		parent = "Latn",
	}

m["Leke"] = {
	"Leke",
	19572613,
	"abugida",
	-- Not in Unicode
}

m["Lepc"] = process_ranges{
	"Lepcha",
	1481626,
	"abugida",
	aliases = {"Róng"},
	ranges = {
		0x1C00, 0x1C37,
		0x1C3B, 0x1C49,
		0x1C4D, 0x1C4F,
	},
}

m["Limb"] = process_ranges{
	"Limbu",
	933796,
	"abugida",
	ranges = {
		0x0965, 0x0965,
		0x1900, 0x191E,
		0x1920, 0x192B,
		0x1930, 0x193B,
		0x1940, 0x1940,
		0x1944, 0x194F,
	},
}

m["Lina"] = process_ranges{
	"Linear A",
	30972,
	ranges = {
		0x10107, 0x10133,
		0x10600, 0x10736,
		0x10740, 0x10755,
		0x10760, 0x10767,
	},
}

m["Linb"] = process_ranges{
	"Linear B",
	190102,
	ranges = {
		0x10000, 0x1000B,
		0x1000D, 0x10026,
		0x10028, 0x1003A,
		0x1003C, 0x1003D,
		0x1003F, 0x1004D,
		0x10050, 0x1005D,
		0x10080, 0x100FA,
		0x10100, 0x10102,
		0x10107, 0x10133,
		0x10137, 0x1013F,
	},
}

m["Lisu"] = process_ranges{
	"Fraser",
	1194621,
	"alphabet",
	aliases = {"Old Lisu", "Lisu"},
	ranges = {
		0x300A, 0x300B,
		0xA4D0, 0xA4FF,
		0x11FB0, 0x11FB0,
	},
	normalizationFixes = handle_normalization_fixes{
		from = {"['’]", "[.ꓸ][.ꓸ]", "[.ꓸ][,ꓹ]"},
		to = {"ʼ", "ꓺ", "ꓻ"}
	},
	translit = "Lisu-translit",
	sort_key = {
		from = {"𑾰"},
		to = {"ꓬ" .. p[1]}
	},
}

m["Loma"] = {
	"Loma",
	13023816,
	"syllabary",
	-- Not in Unicode
}

m["Lyci"] = process_ranges{
	"Lycian",
	913587,
	"alphabet",
	ranges = {
		0x10280, 0x1029C,
	},
}

m["Lydi"] = process_ranges{
	"Lydian",
	4261300,
	"alphabet",
	ranges = {
		0x10920, 0x10939,
		0x1093F, 0x1093F,
	},
	direction = "rtl",
}

m["Mahj"] = process_ranges{
	"Mahajani",
	6732850,
	"abugida",
	ranges = {
		0x0964, 0x096F,
		0xA830, 0xA839,
		0x11150, 0x11176,
	},
}

m["Maka"] = process_ranges{
	"Makasar",
	72947229,
	"abugida",
	aliases = {"Old Makasar"},
	ranges = {
		0x11EE0, 0x11EF8,
	},
}

m["Mand"] = process_ranges{
	"Mandaic",
	1812130,
	aliases = {"Mandaean"},
	ranges = {
		0x0640, 0x0640,
		0x0840, 0x085B,
		0x085E, 0x085E,
	},
	direction = "rtl",
}

m["Mani"] = process_ranges{
	"Manichaean",
	3544702,
	"abjad",
	ranges = {
		0x0640, 0x0640,
		0x10AC0, 0x10AE6,
		0x10AEB, 0x10AF6,
	},
	direction = "rtl",
	translit = "Mani-translit",
}

m["Marc"] = process_ranges{
	"Marchen",
	72403709,
	"abugida",
	ranges = {
		0x11C70, 0x11C8F,
		0x11C92, 0x11CA7,
		0x11CA9, 0x11CB6,
	},
}

m["Maya"] = process_ranges{
	"Maya",
	211248,
	aliases = {"Maya hieroglyphic", "Mayan", "Mayan hieroglyphic"},
	ranges = {
		0x1D2E0, 0x1D2F3,
	},
}

m["Medf"] = process_ranges{
	"Medefaidrin",
	1519764,
	aliases = {"Oberi Okaime", "Oberi Ɔkaimɛ"},
	ranges = {
		0x16E40, 0x16E9A,
	},
	capitalized = true,
}

m["Mend"] = process_ranges{
	"Mende",
	951069,
	aliases = {"Mende Kikakui"},
	ranges = {
		0x1E800, 0x1E8C4,
		0x1E8C7, 0x1E8D6,
	},
	direction = "rtl",
}

m["Merc"] = process_ranges{
	"Meroitic cursive",
	73028124,
	"abugida",
	ranges = {
		0x109A0, 0x109B7,
		0x109BC, 0x109CF,
		0x109D2, 0x109FF,
	},
	direction = "rtl",
}

m["Mero"] = process_ranges{
	"Meroitic hieroglyphic",
	73028623,
	"abugida",
	ranges = {
		0x10980, 0x1099F,
	},
	direction = "rtl",
	wikipedia_article = "Meroitic hieroglyphs",
}

m["Mlym"] = process_ranges{
	"Malayalam",
	1164129,
	"abugida",
	ranges = {
		0x0951, 0x0952,
		0x0964, 0x0965,
		0x0D00, 0x0D0C,
		0x0D0E, 0x0D10,
		0x0D12, 0x0D44,
		0x0D46, 0x0D48,
		0x0D4A, 0x0D4F,
		0x0D54, 0x0D63,
		0x0D66, 0x0D7F,
		0x1CDA, 0x1CDA,
		0x1CF2, 0x1CF2,
		0xA830, 0xA832,
	},
	normalizationFixes = handle_normalization_fixes{
		from = {"ഇൗ", "ഉൗ", "എെ", "ഒാ", "ഒൗ", "ക്‍", "ണ്‍", "ന്‍റ", "ന്‍", "മ്‍", "യ്‍", "ര്‍", "ല്‍", "ള്‍", "ഴ്‍", "െെ", "ൻ്റ"},
		to = {"ഈ", "ഊ", "ഐ", "ഓ", "ഔ", "ൿ", "ൺ", "ൻറ", "ൻ", "ൔ", "ൕ", "ർ", "ൽ", "ൾ", "ൖ", "ൈ", "ന്റ"}
	},
	translit = "ml-translit",
}

m["Modi"] = process_ranges{
	"Modi",
	1703713,
	"abugida",
	ranges = {
		0xA830, 0xA839,
		0x11600, 0x11644,
		0x11650, 0x11659,
	},
	normalizationFixes = handle_normalization_fixes{
		from = {"𑘀𑘹", "𑘀𑘺", "𑘁𑘹", "𑘁𑘺"},
		to = {"𑘊", "𑘋", "𑘌", "𑘍"}
	},
}

do
	local Mong_displaytext = {
		from = {"([ᠨ-ᡂᡸ])ᠶ([ᠨ-ᡂᡸ])", "([ᠠ-ᡂᡸ])ᠸ([^᠋ᠠ-ᠧ])", "([ᠠ-ᡂᡸ])ᠸ$"},
		to = {"%1ᠢ%2", "%1ᠧ%2", "%1ᠧ"}
	}
	
	m["Mong"] = process_ranges{
		"Mongolian",
		1055705,
		"alphabet",
		aliases = {"Mongol bichig", "Hudum Mongol bichig"},
		ranges = {
			0x1800, 0x1805,
			0x180A, 0x1819,
			0x1820, 0x1842,
			0x1878, 0x1878,
			0x1880, 0x1897,
			0x18A6, 0x18A6,
			0x18A9, 0x18A9,
			0x200C, 0x200D,
			0x202F, 0x202F,
			0x3001, 0x3002,
			0x3008, 0x300B,
			0x11660, 0x11668,
		},
		direction = "vertical-ltr",
		display_text = Mong_displaytext,
		strip_diacritics = Mong_displaytext,
		translit = "Mong-translit",
	}

		m["mnc-Mong"] = process_ranges{
			"Manchu",
			122888,
			m["Mong"][3],
			ranges = {
				0x1801, 0x1801,
				0x1804, 0x1804,
				0x1808, 0x180F,
				0x1820, 0x1820,
				0x1823, 0x1823,
				0x1828, 0x182A,
				0x182E, 0x1830,
				0x1834, 0x1838,
				0x183A, 0x183A,
				0x185D, 0x185D,
				0x185F, 0x1861,
				0x1864, 0x1869,
				0x186C, 0x1871,
				0x1873, 0x1877,
				0x1880, 0x1888,
				0x188F, 0x188F,
				0x189A, 0x18A5,
				0x18A8, 0x18A8,
				0x18AA, 0x18AA,
				0x200C, 0x200D,
				0x202F, 0x202F,
			},
			direction = "vertical-ltr",
			parent = "Mong",
			translit = "mnc-translit",
		}
		
		m["sjo-Mong"] = process_ranges{
			"Xibe",
			113624153,
			m["Mong"][3],
			aliases = {"Sibe"},
			ranges = {
				0x1804, 0x1804,
				0x1807, 0x1807,
				0x180A, 0x180F,
				0x1820, 0x1820,
				0x1823, 0x1823,
				0x1828, 0x1828,
				0x182A, 0x182A,
				0x182E, 0x1830,
				0x1834, 0x1838,
				0x183A, 0x183A,
				0x185D, 0x1872,
				0x200C, 0x200D,
				0x202F, 0x202F,
			},
			direction = "vertical-ltr",
			parent = "mnc-Mong",
		}
		
		m["xwo-Mong"] = process_ranges{
			"Clear Script",
			529085,
			m["Mong"][3],
			aliases = {"Todo", "Todo bichig"},
			ranges = {
				0x1800, 0x1801,
				0x1804, 0x1806,
				0x180A, 0x1820,
				0x1828, 0x1828,
				0x182F, 0x1831,
				0x1834, 0x1834,
				0x1837, 0x1838,
				0x183A, 0x183B,
				0x1840, 0x1840,
				0x1843, 0x185C,
				0x1880, 0x1887,
				0x1889, 0x188F,
				0x1894, 0x1894,
				0x1896, 0x1899,
				0x18A7, 0x18A7,
				0x200C, 0x200D,
				0x202F, 0x202F,
				0x11669, 0x1166C,
			},
			direction = "vertical-ltr",
			parent = "Mong",
			translit = "xwo-translit",
		}
end

m["Moon"] = {
	"Moon",
	918391,
	"alphabet",
	aliases = {"Moon System of Embossed Reading", "Moon type", "Moon writing", "Moon alphabet", "Moon code"},
	-- Not in Unicode
}

m["Morse"] = {
	"Morse code",
	79897,
	ietf_subtag = "Zsym",
}

m["Mroo"] = process_ranges{
	"Mru",
	75919253,
	aliases = {"Mro", "Mrung"},
	ranges = {
		0x16A40, 0x16A5E,
		0x16A60, 0x16A69,
		0x16A6E, 0x16A6F,
	},
}

m["Mtei"] = process_ranges{
	"Meitei Mayek",
	2981413,
	"abugida",
	aliases = {"Meetei Mayek", "Manipuri"},
	ranges = {
		0xAAE0, 0xAAF6,
		0xABC0, 0xABED,
		0xABF0, 0xABF9,
	},
}

m["Mult"] = process_ranges{
	"Multani",
	17047906,
	"abugida",
	ranges = {
		0x0A66, 0x0A6F,
		0x11280, 0x11286,
		0x11288, 0x11288,
		0x1128A, 0x1128D,
		0x1128F, 0x1129D,
		0x1129F, 0x112A9,
	},
}

m["Music"] = process_ranges{
	"musical notation",
	233861,
	"pictography",
	ranges = {
		0x2669, 0x266F,
		0x1D100, 0x1D126,
		0x1D129, 0x1D1EA,
	},
	ietf_subtag = "Zsym",
	translit = false,
}

m["Mymr"] = process_ranges{
	"Burmese",
	43887939,
	"abugida",
	aliases = {"Myanmar"},
	ranges = {
		0x1000, 0x109F,
		0xA92E, 0xA92E,
		0xA9E0, 0xA9FE,
		0xAA60, 0xAA7F,
		0x116D0, 0x116E3,
	},
	spaces = false,
}

m["Nagm"] = process_ranges{
	"Mundari Bani",
	106917274,
	"alphabet",
	aliases = {"Nag Mundari"},
	ranges = {
		0x1E4D0, 0x1E4F9,
	},
}

m["Nand"] = process_ranges{
	"Nandinagari",
	6963324,
	"abugida",
	ranges = {
		0x0964, 0x0965,
		0x0CE6, 0x0CEF,
		0x1CE9, 0x1CE9,
		0x1CF2, 0x1CF2,
		0x1CFA, 0x1CFA,
		0xA830, 0xA835,
		0x119A0, 0x119A7,
		0x119AA, 0x119D7,
		0x119DA, 0x119E4,
	},
}

m["Narb"] = process_ranges{
	"Ancient North Arabian",
	1472213,
	"abjad",
	aliases = {"Old North Arabian"},
	ranges = {
		0x10A80, 0x10A9F,
	},
	direction = "rtl",
	translit = "Narb-translit",
}

m["Nbat"] = process_ranges{
	"Nabataean",
	855624,
	"abjad",
	aliases = {"Nabatean"},
	ranges = {
		0x10880, 0x1089E,
		0x108A7, 0x108AF,
	},
	direction = "rtl",
}

m["Newa"] = process_ranges{
	"Newa",
	7237292,
	"abugida",
	aliases = {"Newar", "Newari", "Prachalit Nepal"},
	ranges = {
		0x11400, 0x1145B,
		0x1145D, 0x11461,
	},
}

m["Nkdb"] = {
	"Dongba",
	1190953,
	"pictography",
	aliases = {"Naxi Dongba", "Nakhi Dongba", "Tomba", "Tompa", "Mo-so"},
	spaces = false,
	-- Not in Unicode
}

m["Nkgb"] = {
	"Geba",
	731189,
	"syllabary",
	aliases = {"Nakhi Geba", "Naxi Geba"},
	spaces = false,
	-- Not in Unicode
}

m["Nkoo"] = process_ranges{
	"N'Ko",
	1062587,
	"alphabet",
	ranges = {
		0x060C, 0x060C,
		0x061B, 0x061B,
		0x061F, 0x061F,
		0x07C0, 0x07FA,
		0x07FD, 0x07FF,
		0xFD3E, 0xFD3F,
	},
	direction = "rtl",
}

m["None"] = {
	"unspecified",
	nil,
	-- This should not have any characters listed
	ietf_subtag = "Zyyy",
	translit = false,
	character_category = false, -- none
}

m["Nshu"] = process_ranges{
	"Nüshu",
	56436,
	"syllabary",
	aliases = {"Nushu"},
	ranges = {
		0x16FE1, 0x16FE1,
		0x1B170, 0x1B2FB,
	},
	spaces = false,
}

m["Ogam"] = process_ranges{
	"Ogham",
	184661,
	ranges = {
		0x1680, 0x169C,
	},
}

m["Olck"] = process_ranges{
	"Ol Chiki",
	201688,
	aliases = {"Ol Chemetʼ", "Ol", "Santali"},
	ranges = {
		0x1C50, 0x1C7F,
	},
}

m["Onao"] = process_ranges{
	"Ol Onal",
	108607084,
	"alphabet",
	ranges = {
		0x0964, 0x0965,
		0x1E5D0, 0x1E5FA,
		0x1E5FF, 0x1E5FF,
	},
}

m["Orkh"] = process_ranges{
	"Old Turkic",
	5058305,
	aliases = {"Orkhon runic"},
	ranges = {
		0x10C00, 0x10C48,
	},
	direction = "rtl",
	translit = "Orkh-translit",
}

m["Orya"] = process_ranges{
	"Odia",
	1760127,
	"abugida",
	aliases = {"Oriya"},
	ranges = {
		0x0951, 0x0952,
		0x0964, 0x0965,
		0x0B01, 0x0B03,
		0x0B05, 0x0B0C,
		0x0B0F, 0x0B10,
		0x0B13, 0x0B28,
		0x0B2A, 0x0B30,
		0x0B32, 0x0B33,
		0x0B35, 0x0B39,
		0x0B3C, 0x0B44,
		0x0B47, 0x0B48,
		0x0B4B, 0x0B4D,
		0x0B55, 0x0B57,
		0x0B5C, 0x0B5D,
		0x0B5F, 0x0B63,
		0x0B66, 0x0B77,
		0x1CDA, 0x1CDA,
		0x1CF2, 0x1CF2,
	},
	normalizationFixes = handle_normalization_fixes{
		from = {"ଅା", "ଏୗ", "ଓୗ"},
		to = {"ଆ", "ଐ", "ଔ"}
	},
}

m["Osge"] = process_ranges{
	"Osage",
	7105529,
	ranges = {
		0x104B0, 0x104D3,
		0x104D8, 0x104FB,
	},
	capitalized = true,
}

m["Osma"] = process_ranges{
	"Osmanya",
	1377866,
	ranges = {
		0x10480, 0x1049D,
		0x104A0, 0x104A9,
	},
}

m["Ougr"] = process_ranges{
	"Old Uyghur",
	1998938,
	"abjad, alphabet",
	ranges = {
		0x0640, 0x0640,
		0x10AF2, 0x10AF2,
		0x10F70, 0x10F89,
	},
	-- This should ideally be "vertical-ltr", but getting the CSS right is tricky because it's right-to-left horizontally, but left-to-right vertically. Currently, displaying it vertically causes it to display bottom-to-top.
	direction = "rtl",
}

m["Palm"] = process_ranges{
	"Palmyrene",
	17538100,
	ranges = {
		0x10860, 0x1087F,
	},
	direction = "rtl",
}

m["Pauc"] = process_ranges{
	"Pau Cin Hau",
	25339852,
	ranges = {
		0x11AC0, 0x11AF8,
	},
}

m["Pcun"] = {
	"Proto-Cuneiform",
	1650699,
	"pictography",
	-- Not in Unicode
}

m["Pelm"] = {
	"Proto-Elamite",
	56305763,
	"pictography",
	-- Not in Unicode
}

m["Perm"] = process_ranges{
	"Old Permic",
	147899,
	ranges = {
		0x0483, 0x0483,
		0x10350, 0x1037A,
	},
}

m["Phag"] = process_ranges{
	"Phags-pa",
	822836,
	"abugida",
	ranges = {
		0x1802, 0x1803,
		0x1805, 0x1805,
		0x200C, 0x200D,
		0x202F, 0x202F,
		0x3002, 0x3002,
		0xA840, 0xA877,
	},
	direction = "vertical-ltr",
}

m["Phli"] = process_ranges{
	"Inscriptional Pahlavi",
	24089793,
	"abjad",
	ranges = {
		0x10B60, 0x10B72,
		0x10B78, 0x10B7F,
	},
	direction = "rtl",
}

m["Phlp"] = process_ranges{
	"Psalter Pahlavi",
	7253954,
	"abjad",
	ranges = {
		0x0640, 0x0640,
		0x10B80, 0x10B91,
		0x10B99, 0x10B9C,
		0x10BA9, 0x10BAF,
	},
	direction = "rtl",
}

m["Phlv"] = {
	"Book Pahlavi",
	72403118,
	"abjad",
	direction = "rtl",
	wikipedia_article = "Pahlavi scripts#Book Pahlavi",
	-- Not in Unicode
}

m["Phnx"] = process_ranges{
	"Phoenician",
	26752,
	"abjad",
	ranges = {
		0x10900, 0x1091B,
		0x1091F, 0x1091F,
	},
	direction = "rtl",
	translit = "Phnx-translit",
}

m["Plrd"] = process_ranges{
	"Pollard",
	601734,
	"abugida",
	aliases = {"Miao"},
	ranges = {
		0x16F00, 0x16F4A,
		0x16F4F, 0x16F87,
		0x16F8F, 0x16F9F,
	},
}

m["Prti"] = process_ranges{
	"Inscriptional Parthian",
	13023804,
	ranges = {
		0x10B40, 0x10B55,
		0x10B58, 0x10B5F,
	},
	direction = "rtl",
}

m["Psin"] = {
	"Proto-Sinaitic",
	1065250,
	"abjad",
	direction = "rtl",
	-- Not in Unicode
}

m["Ranj"] = {
	"Ranjana",
	2385276,
	"abugida",
	-- Not in Unicode
}

m["Rjng"] = process_ranges{
	"Rejang",
	2007960,
	"abugida",
	ranges = {
		0xA930, 0xA953,
		0xA95F, 0xA95F,
	},
}

m["Rohg"] = process_ranges{
	"Hanifi Rohingya",
	21028705,
	"alphabet",
	ranges = {
		0x060C, 0x060C,
		0x061B, 0x061B,
		0x061F, 0x061F,
		0x0640, 0x0640,
		0x06D4, 0x06D4,
		0x10D00, 0x10D27,
		0x10D30, 0x10D39,
	},
	direction = "rtl",
}

m["Roro"] = {
	"Rongorongo",
	209764,
	-- Not in Unicode
}

m["Rumin"] = process_ranges{
	"Rumi numerals",
	nil,
	ranges = {
		0x10E60, 0x10E7E,
	},
	ietf_subtag = "Arab",
}

m["Runr"] = process_ranges{
	"Runic",
	82996,
	"alphabet",
	ranges = {
		0x16A0, 0x16EA,
		0x16EE, 0x16F8,
	},
}

do
	local Samr_stripdiacritics = {
		remove_diacritics = c.CGJ .. u(0x0816) .. "-" .. u(0x082D),
	}
	
	m["Samr"] = process_ranges{
		"Samaritan",
		1550930,
		"abjad",
		ranges = {
			0x0800, 0x082D,
			0x0830, 0x083E,
		},
		direction = "rtl",
		strip_diacritics = Samr_stripdiacritics,
		sort_key = Samr_stripdiacritics,
	}
end

m["Sarb"] = process_ranges{
	"Ancient South Arabian",
	446074,
	"abjad",
	aliases = {"Old South Arabian"},
	ranges = {
		0x10A60, 0x10A7F,
	},
	direction = "rtl",
	translit = "Sarb-translit",
}

m["Saur"] = process_ranges{
	"Saurashtra",
	3535165,
	"abugida",
	ranges = {
		0xA880, 0xA8C5,
		0xA8CE, 0xA8D9,
	},
}

m["Semap"] = {
	"flag semaphore",
	250796,
	"pictography",
	ietf_subtag = "Zsym",
}

m["Sgnw"] = process_ranges{
	"SignWriting",
	1497335,
	"pictography",
	aliases = {"Sutton SignWriting"},
	ranges = {
		0x1D800, 0x1DA8B,
		0x1DA9B, 0x1DA9F,
		0x1DAA1, 0x1DAAF,
	},
	translit = false,
}

m["Shaw"] = process_ranges{
	"Shavian",
	1970098,
	aliases = {"Shaw"},
	ranges = {
		0x10450, 0x1047F,
	},
}

m["Shrd"] = process_ranges{
	"Sharada",
	2047117,
	"abugida",
	ranges = {
		0x0951, 0x0951,
		0x1CD7, 0x1CD7,
		0x1CD9, 0x1CD9,
		0x1CDC, 0x1CDD,
		0x1CE0, 0x1CE0,
		0xA830, 0xA835,
		0xA838, 0xA838,
		0x11180, 0x111DF,
	},
	translit = "Shrd-translit",
}

m["Shui"] = {
	"Sui",
	752854,
	"logography",
	spaces = false,
	-- Not in Unicode
}

m["Sidd"] = process_ranges{
	"Siddham",
	250379,
	"abugida",
	ranges = {
		0x11580, 0x115B5,
		0x115B8, 0x115DD,
	},
	translit = "Sidd-translit",
}

m["Sidt"] = {
	"Sidetic",
	36659,
	"alphabet",
	direction = "rtl",
	-- Not in Unicode
}

m["Sind"] = process_ranges{
	"Khudabadi",
	6402810,
	"abugida",
	aliases = {"Khudawadi"},
	ranges = {
		0x0964, 0x0965,
		0xA830, 0xA839,
		0x112B0, 0x112EA,
		0x112F0, 0x112F9,
	},
	normalizationFixes = handle_normalization_fixes{
		from = {"𑊰𑋠", "𑊰𑋥", "𑊰𑋦", "𑊰𑋧", "𑊰𑋨"},
		to = {"𑊱", "𑊶", "𑊷", "𑊸", "𑊹"}
	},
}

m["Sinh"] = process_ranges{
	"Sinhalese",
	1574992,
	"abugida",
	aliases = {"Sinhala"},
	ranges = {
		0x0964, 0x0965,
		0x0D81, 0x0D83,
		0x0D85, 0x0D96,
		0x0D9A, 0x0DB1,
		0x0DB3, 0x0DBB,
		0x0DBD, 0x0DBD,
		0x0DC0, 0x0DC6,
		0x0DCA, 0x0DCA,
		0x0DCF, 0x0DD4,
		0x0DD6, 0x0DD6,
		0x0DD8, 0x0DDF,
		0x0DE6, 0x0DEF,
		0x0DF2, 0x0DF4,
		0x1CF2, 0x1CF2,
		0x111E1, 0x111F4,
	},
	normalizationFixes = handle_normalization_fixes{
		from = {"අා", "අැ", "අෑ", "උෟ", "ඍෘ", "ඏෟ", "එ්", "එෙ", "ඔෟ", "ෘෘ"},
		to = {"ආ", "ඇ", "ඈ", "ඌ", "ඎ", "ඐ", "ඒ", "ඓ", "ඖ", "ෲ"}
	},
}

m["Sogd"] = process_ranges{
	"Sogdian",
	578359,
	"abjad",
	ranges = {
		0x0640, 0x0640,
		0x10F30, 0x10F59,
	},
	direction = "rtl",
}

m["Sogo"] = process_ranges{
	"Old Sogdian",
	72403254,
	"abjad",
	ranges = {
		0x10F00, 0x10F27,
	},
	direction = "rtl",
}

m["Sora"] = process_ranges{
	"Sorang Sompeng",
	7563292,
	aliases = {"Sora Sompeng"},
	ranges = {
		0x110D0, 0x110E8,
		0x110F0, 0x110F9,
	},
}

m["Soyo"] = process_ranges{
	"Soyombo",
	8009382,
	"abugida",
	ranges = {
		0x11A50, 0x11AA2,
	},
}

m["Sund"] = process_ranges{
	"Sundanese",
	51589,
	"abugida",
	ranges = {
		0x1B80, 0x1BBF,
		0x1CC0, 0x1CC7,
	},
}

m["Sunu"] = process_ranges{
	"Sunuwar",
	109984965,
	"alphabet",
	ranges = {
		0x11BC0, 0x11BE1,
		0x11BF0, 0x11BF9,
	},
}

m["Sylo"] = process_ranges{
	"Sylheti Nagri",
	144128,
	"abugida",
	aliases = {"Sylheti Nāgarī", "Syloti Nagri"},
	ranges = {
		0x0964, 0x0965,
		0x09E6, 0x09EF,
		0xA800, 0xA82C,
	},
}

m["Syrc"] = process_ranges{
	"Syriac",
	26567,
	"abjad", -- more precisely, impure abjad
	ranges = {
		0x060C, 0x060C,
		0x061B, 0x061C,
		0x061F, 0x061F,
		0x0640, 0x0640,
		0x064B, 0x0655,
		0x0670, 0x0670,
		0x0700, 0x070D,
		0x070F, 0x074A,
		0x074D, 0x074F,
		0x0860, 0x086A,
		0x1DF8, 0x1DF8,
		0x1DFA, 0x1DFA,
	},
	direction = "rtl",
}

-- Syre, Syrj, Syrn are apparently subsumed into Syrc; discuss if this causes issues

m["Tagb"] = process_ranges{
	"Tagbanwa",
	977444,
	"abugida",
	ranges = {
		0x1735, 0x1736,
		0x1760, 0x176C,
		0x176E, 0x1770,
		0x1772, 0x1773,
	},
}

m["Takr"] = process_ranges{
	"Takri",
	759202,
	"abugida",
	ranges = {
		0x0964, 0x0965,
		0xA830, 0xA839,
		0x11680, 0x116B9,
		0x116C0, 0x116C9,
	},
	normalizationFixes = handle_normalization_fixes{
		from = {"𑚀𑚭", "𑚀𑚴", "𑚀𑚵", "𑚆𑚲"},
		to = {"𑚁", "𑚈", "𑚉", "𑚇"}
	},
}

m["Tale"] = process_ranges{
	"Tai Nüa",
	2566326,
	"abugida",
	aliases = {"Tai Nuea", "New Tai Nüa", "New Tai Nuea", "Dehong Dai", "Tai Dehong", "Tai Le"},
	ranges = {
		0x1040, 0x1049,
		0x1950, 0x196D,
		0x1970, 0x1974,
	},
	spaces = false,
}

m["Talu"] = process_ranges{
	"New Tai Lue",
	3498863,
	"abugida",
	ranges = {
		0x1980, 0x19AB,
		0x19B0, 0x19C9,
		0x19D0, 0x19DA,
		0x19DE, 0x19DF,
	},
	spaces = false,
}

m["Taml"] = process_ranges{
	"Tamil",
	26803,
	"abugida",
	ranges = {
		0x0951, 0x0952,
		0x0964, 0x0965,
		0x0B82, 0x0B83,
		0x0B85, 0x0B8A,
		0x0B8E, 0x0B90,
		0x0B92, 0x0B95,
		0x0B99, 0x0B9A,
		0x0B9C, 0x0B9C,
		0x0B9E, 0x0B9F,
		0x0BA3, 0x0BA4,
		0x0BA8, 0x0BAA,
		0x0BAE, 0x0BB9,
		0x0BBE, 0x0BC2,
		0x0BC6, 0x0BC8,
		0x0BCA, 0x0BCD,
		0x0BD0, 0x0BD0,
		0x0BD7, 0x0BD7,
		0x0BE6, 0x0BFA,
		0x1CDA, 0x1CDA,
		0xA8F3, 0xA8F3,
		0x11301, 0x11301,
		0x11303, 0x11303,
		0x1133B, 0x1133C,
		0x11FC0, 0x11FF1,
		0x11FFF, 0x11FFF,
	},
	normalizationFixes = handle_normalization_fixes{
		from = {"அூ", "ஸ்ரீ"},
		to = {"ஆ", "ஶ்ரீ"}
	},
}

m["Tang"] = process_ranges{
	"Tangut",
	1373610,
	"logography, syllabary",
	ranges = {
		0x31EF, 0x31EF,
		0x16FE0, 0x16FE0,
		0x17000, 0x187F7,
		0x18800, 0x18AFF,
		0x18D00, 0x18D08,
	},
	spaces = false,
	translit = "txg-translit",
}

m["Tavt"] = process_ranges{
	"Tai Viet",
	11818517,
	"abugida",
	ranges = {
		0xAA80, 0xAAC2,
		0xAADB, 0xAADF,
	},
	spaces = false,
}

m["Tayo"] = process_ranges{
	"Lai Tay",
	16306701,
	"abugida",
	aliases = {"Tai Yo"},
	direction = "vertical-rtl",
	ranges = {
		0x1E6C0, 0x1E6DE,
		0x1E6E0, 0x1E6F5,
		0x1E6FE, 0x1E6FF,
	},
	spaces = false,
}

m["Telu"] = process_ranges{
	"Telugu",
	570450,
	"abugida",
	ranges = {
		0x0951, 0x0952,
		0x0964, 0x0965,
		0x0C00, 0x0C0C,
		0x0C0E, 0x0C10,
		0x0C12, 0x0C28,
		0x0C2A, 0x0C39,
		0x0C3C, 0x0C44,
		0x0C46, 0x0C48,
		0x0C4A, 0x0C4D,
		0x0C55, 0x0C56,
		0x0C58, 0x0C5A,
		0x0C5D, 0x0C5D,
		0x0C60, 0x0C63,
		0x0C66, 0x0C6F,
		0x0C77, 0x0C7F,
		0x1CDA, 0x1CDA,
		0x1CF2, 0x1CF2,
	},
	normalizationFixes = handle_normalization_fixes{
		from = {"ఒౌ", "ఒౕ", "ిౕ", "ెౕ", "ొౕ"},
		to = {"ఔ", "ఓ", "ీ", "ే", "ో"}
	},
}

m["Teng"] = {
	"Tengwar",
	473725,
}

m["Tfng"] = process_ranges{
	"Tifinagh",
	208503,
	"abjad, alphabet",
	ranges = {
		0x2D30, 0x2D67,
		0x2D6F, 0x2D70,
		0x2D7F, 0x2D7F,
	},
	other_names = {"Libyco-Berber", "Berber"}, -- per Wikipedia, Libyco-Berber is the parent
}

m["Tglg"] = process_ranges{
	"Baybayin",
	812124,
	"abugida",
	aliases = {"Tagalog"},
	varieties = {"Kur-itan"},
	ranges = {
		0x1700, 0x1715,
		0x171F, 0x171F,
		0x1735, 0x1736,
	},
}

m["Thaa"] = process_ranges{
	"Thaana",
	877906,
	"abugida",
	ranges = {
		0x060C, 0x060C,
		0x061B, 0x061C,
		0x061F, 0x061F,
		0x0660, 0x0669,
		0x0780, 0x07B1,
		0xFDF2, 0xFDF2,
		0xFDFD, 0xFDFD,
	},
	direction = "rtl",
}

m["Thai"] = process_ranges{
	"Thai",
	236376,
	"abugida",
	ranges = {
		0x0E01, 0x0E3A,
		0x0E40, 0x0E5B,
	},
	spaces = false,
}

do
	local Tibt_displaytext = {
		from = {"ༀ", "༌", "།།", "༚༚", "༚༝", "༝༚", "༝༝", "ཷ", "ཹ", "ེེ", "ོོ"},
		to = {"ཨོཾ", "་", "༎", "༛", "༟", "࿎", "༞", "ྲཱྀ", "ླཱྀ", "ཻ", "ཽ"}
	}

	m["Tibt"] = process_ranges{
		"Tibetan",
		46861,
		"abugida",
		ranges = {
			0x0F00, 0x0F47,
			0x0F49, 0x0F6C,
			0x0F71, 0x0F97,
			0x0F99, 0x0FBC,
			0x0FBE, 0x0FCC,
			0x0FCE, 0x0FD4,
			0x0FD9, 0x0FDA,
			0x3008, 0x300B,
		},
		normalizationFixes = handle_normalization_fixes{
			combiningClasses = {["༹"] = 1},
			from = {"ཷ", "ཹ"},
			to = {"ྲཱྀ", "ླཱྀ"}
		},
		display_text = Tibt_displaytext,
		strip_diacritics = Tibt_displaytext,
		sort_key = "Tibt-sortkey",
		translit = "Tibt-translit",
	}
	
		m["sit-tam-Tibt"] = {
			"Tamyig",
			109875213,
			m["Tibt"][3],
			-- There is no inheritance of properties currently implemented for scripts. Per [[User:Theknightwho]], this
			-- is because it's tricky to do since there are several types of child scripts: those that are mere display
			-- variants (like fa-Arab, kk-Arab), which should be eliminated in favor of CSS language selectors to
			-- handle the font differences; those that are genuinely different scripts that happen to share the same
			-- Unicode codepoints but have mostly different properties (e.g. Manchu vs. Mongolian); and those that are
			-- somewhere in between (like Tamyig vs. Tibetan). As a result, we currently have to manually specify
			-- which properties we want inherited as follows.
			ranges = m["Tibt"].ranges,
			characters = m["Tibt"].characters,
			parent = "Tibt",
			normalizationFixes = m["Tibt"].normalizationFixes,
			display_text = m["Tibt"].display_text,
			strip_diacritics = m["Tibt"].strip_diacritics,
			sort_key = m["Tibt"].sort_key,
			translit = m["Tibt"].translit,
		}
end

m["Tirh"] = process_ranges{
	"Tirhuta",
	1765752,
	"abugida",
	ranges = {
		0x0951, 0x0952,
		0x0964, 0x0965,
		0x1CF2, 0x1CF2,
		0xA830, 0xA839,
		0x11480, 0x114C7,
		0x114D0, 0x114D9,
	},
	normalizationFixes = handle_normalization_fixes{
		from = {"𑒁𑒰", "𑒋𑒺", "𑒍𑒺", "𑒪𑒵", "𑒪𑒶"},
		to = {"𑒂", "𑒌", "𑒎", "𑒉", "𑒊"}
	},
}

m["Tnsa"] = process_ranges{
	"Tangsa",
	105576311,
	"alphabet",
	ranges = {
		0x16A70, 0x16ABE,
		0x16AC0, 0x16AC9,
	},
}

m["Todr"] = process_ranges{
	"Todhri",
	10274731,
	"alphabet",
	direction = "rtl",
	ranges = {
		0x105C0, 0x105F3,
	},
}

m["Tols"] = {
	"Tolong Siki",
	4459822,
	"alphabet",
	-- Not in Unicode
}

m["Toto"] = process_ranges{
	"Toto",
	104837516,
	"abugida",
	ranges = {
		0x1E290, 0x1E2AE,
	},
}

m["Tutg"] = process_ranges{
	"Tigalari",
	2604990,
	"abugida",
	aliases = {"Tulu"},
	ranges = {
		0x1CF2, 0x1CF2,
		0x1CF4, 0x1CF4,
		0xA8F1, 0xA8F1,
		0x11380, 0x11389,
		0x1138B, 0x1138B,
		0x1138E, 0x1138E,
		0x11390, 0x113B5,
		0x113B7, 0x113C0,
		0x113C2, 0x113C2,
		0x113C5, 0x113C5,
		0x113C7, 0x113CA,
		0x113CC, 0x113D5,
		0x113D7, 0x113D8,
		0x113E1, 0x113E2,
	},
}

m["Ugar"] = process_ranges{
	"Ugaritic",
	332652,
	"abjad",
	ranges = {
		0x10380, 0x1039D,
		0x1039F, 0x1039F,
	},
}

m["Vaii"] = process_ranges{
	"Vai",
	523078,
	"syllabary",
	ranges = {
		0xA500, 0xA62B,
	},
}

m["Visp"] = {
	"Visible Speech",
	1303365,
	"alphabet",
	-- Not in Unicode
}

m["Vith"] = process_ranges{
	"Vithkuqi",
	3301993,
	"alphabet",
	ranges = {
		0x10570, 0x1057A,
		0x1057C, 0x1058A,
		0x1058C, 0x10592,
		0x10594, 0x10595,
		0x10597, 0x105A1,
		0x105A3, 0x105B1,
		0x105B3, 0x105B9,
		0x105BB, 0x105BC,
	},
	capitalized = true,
}

m["Wara"] = process_ranges{
	"Varang Kshiti",
	79199,
	aliases = {"Warang Citi"},
	ranges = {
		0x118A0, 0x118F2,
		0x118FF, 0x118FF,
	},
	capitalized = true,
}

m["Wcho"] = process_ranges{
	"Wancho",
	33713728,
	"alphabet",
	ranges = {
		0x1E2C0, 0x1E2F9,
		0x1E2FF, 0x1E2FF,
	},
}

m["Wole"] = {
	"Woleai",
	6643710,
	"syllabary",
	-- Not in Unicode
}

m["Xpeo"] = process_ranges{
	"Old Persian",
	1471822,
	ranges = {
		0x103A0, 0x103C3,
		0x103C8, 0x103D5,
	},
}

m["Xsux"] = process_ranges{
	"Cuneiform",
	401,
	aliases = {"Sumero-Akkadian Cuneiform"},
	ranges = {
		0x12000, 0x12399,
		0x12400, 0x1246E,
		0x12470, 0x12474,
		0x12480, 0x12543,
	},
}

m["Yezi"] = process_ranges{
	"Yezidi",
	13175481,
	"alphabet",
	ranges = {
		0x060C, 0x060C,
		0x061B, 0x061B,
		0x061F, 0x061F,
		0x0660, 0x0669,
		0x10E80, 0x10EA9,
		0x10EAB, 0x10EAD,
		0x10EB0, 0x10EB1,
	},
	direction = "rtl",
}

m["Yiii"] = process_ranges{
	"Yi",
	1197646,
	"syllabary",
	ranges = {
		0x3001, 0x3002,
		0x3008, 0x3011,
		0x3014, 0x301B,
		0x30FB, 0x30FB,
		0xA000, 0xA48C,
		0xA490, 0xA4C6,
		0xFF61, 0xFF65,
	},
}

m["Zanb"] = process_ranges{
	"Zanabazar Square",
	50809208,
	"abugida",
	ranges = {
		0x11A00, 0x11A47,
	},
}

m["Zmth"] = process_ranges{
	"mathematical notation",
	1140046,
	ranges = {
		0x00AC, 0x00AC,
		0x00B1, 0x00B1,
		0x00D7, 0x00D7,
		0x00F7, 0x00F7,
		0x03D0, 0x03D2,
		0x03D5, 0x03D5,
		0x03F0, 0x03F1,
		0x03F4, 0x03F6,
		0x0606, 0x0608,
		0x2016, 0x2016,
		0x2032, 0x2034,
		0x2040, 0x2040,
		0x2044, 0x2044,
		0x2052, 0x2052,
		0x205F, 0x205F,
		0x2061, 0x2064,
		0x207A, 0x207E,
		0x208A, 0x208E,
		0x20D0, 0x20DC,
		0x20E1, 0x20E1,
		0x20E5, 0x20E6,
		0x20EB, 0x20EF,
		0x2102, 0x2102,
		0x2107, 0x2107,
		0x210A, 0x2113,
		0x2115, 0x2115,
		0x2118, 0x211D,
		0x2124, 0x2124,
		0x2128, 0x2129,
		0x212C, 0x212D,
		0x212F, 0x2131,
		0x2133, 0x2138,
		0x213C, 0x2149,
		0x214B, 0x214B,
		0x2190, 0x21A7,
		0x21A9, 0x21AE,
		0x21B0, 0x21B1,
		0x21B6, 0x21B7,
		0x21BC, 0x21DB,
		0x21DD, 0x21DD,
		0x21E4, 0x21E5,
		0x21F4, 0x22FF,
		0x2308, 0x230B,
		0x2320, 0x2321,
		0x237C, 0x237C,
		0x239B, 0x23B5,
		0x23B7, 0x23B7,
		0x23D0, 0x23D0,
		0x23DC, 0x23E2,
		0x25A0, 0x25A1,
		0x25AE, 0x25B7,
		0x25BC, 0x25C1,
		0x25C6, 0x25C7,
		0x25CA, 0x25CB,
		0x25CF, 0x25D3,
		0x25E2, 0x25E2,
		0x25E4, 0x25E4,
		0x25E7, 0x25EC,
		0x25F8, 0x25FF,
		0x2605, 0x2606,
		0x2640, 0x2640,
		0x2642, 0x2642,
		0x2660, 0x2663,
		0x266D, 0x266F,
		0x27C0, 0x27FF,
		0x2900, 0x2AFF,
		0x2B30, 0x2B44,
		0x2B47, 0x2B4C,
		0xFB29, 0xFB29,
		0xFE61, 0xFE66,
		0xFE68, 0xFE68,
		0xFF0B, 0xFF0B,
		0xFF1C, 0xFF1E,
		0xFF3C, 0xFF3C,
		0xFF3E, 0xFF3E,
		0xFF5C, 0xFF5C,
		0xFF5E, 0xFF5E,
		0xFFE2, 0xFFE2,
		0xFFE9, 0xFFEC,
		0x1D400, 0x1D454,
		0x1D456, 0x1D49C,
		0x1D49E, 0x1D49F,
		0x1D4A2, 0x1D4A2,
		0x1D4A5, 0x1D4A6,
		0x1D4A9, 0x1D4AC,
		0x1D4AE, 0x1D4B9,
		0x1D4BB, 0x1D4BB,
		0x1D4BD, 0x1D4C3,
		0x1D4C5, 0x1D505,
		0x1D507, 0x1D50A,
		0x1D50D, 0x1D514,
		0x1D516, 0x1D51C,
		0x1D51E, 0x1D539,
		0x1D53B, 0x1D53E,
		0x1D540, 0x1D544,
		0x1D546, 0x1D546,
		0x1D54A, 0x1D550,
		0x1D552, 0x1D6A5,
		0x1D6A8, 0x1D7CB,
		0x1D7CE, 0x1D7FF,
		0x1EE00, 0x1EE03,
		0x1EE05, 0x1EE1F,
		0x1EE21, 0x1EE22,
		0x1EE24, 0x1EE24,
		0x1EE27, 0x1EE27,
		0x1EE29, 0x1EE32,
		0x1EE34, 0x1EE37,
		0x1EE39, 0x1EE39,
		0x1EE3B, 0x1EE3B,
		0x1EE42, 0x1EE42,
		0x1EE47, 0x1EE47,
		0x1EE49, 0x1EE49,
		0x1EE4B, 0x1EE4B,
		0x1EE4D, 0x1EE4F,
		0x1EE51, 0x1EE52,
		0x1EE54, 0x1EE54,
		0x1EE57, 0x1EE57,
		0x1EE59, 0x1EE59,
		0x1EE5B, 0x1EE5B,
		0x1EE5D, 0x1EE5D,
		0x1EE5F, 0x1EE5F,
		0x1EE61, 0x1EE62,
		0x1EE64, 0x1EE64,
		0x1EE67, 0x1EE6A,
		0x1EE6C, 0x1EE72,
		0x1EE74, 0x1EE77,
		0x1EE79, 0x1EE7C,
		0x1EE7E, 0x1EE7E,
		0x1EE80, 0x1EE89,
		0x1EE8B, 0x1EE9B,
		0x1EEA1, 0x1EEA3,
		0x1EEA5, 0x1EEA9,
		0x1EEAB, 0x1EEBB,
		0x1EEF0, 0x1EEF1,
	},
	translit = false,
}

m["Zname"] = process_ranges{
	"Znamenny musical notation",
	965834,
	"pictography",
	ranges = {
		0x1CF00, 0x1CF2D,
		0x1CF30, 0x1CF46,
		0x1CF50, 0x1CFC3,
	},
	ietf_subtag = "Zsym",
	translit = false,
}

m["Zsym"] = process_ranges{
	"symbolic",
	80071,
	"pictography",
	ranges = {
		0x20DD, 0x20E0,
		0x20E2, 0x20E4,
		0x20E7, 0x20EA,
		0x20F0, 0x20F0,
		0x2100, 0x2101,
		0x2103, 0x2106,
		0x2108, 0x2109,
		0x2114, 0x2114,
		0x2116, 0x2117,
		0x211E, 0x2123,
		0x2125, 0x2127,
		0x212A, 0x212B,
		0x212E, 0x212E,
		0x2132, 0x2132,
		0x2139, 0x213B,
		0x214A, 0x214A,
		0x214C, 0x214F,
		0x21A8, 0x21A8,
		0x21AF, 0x21AF,
		0x21B2, 0x21B5,
		0x21B8, 0x21BB,
		0x21DC, 0x21DC,
		0x21DE, 0x21E3,
		0x21E6, 0x21F3,
		0x2300, 0x2307,
		0x230C, 0x231F,
		0x2322, 0x237B,
		0x237D, 0x239A,
		0x23B6, 0x23B6,
		0x23B8, 0x23CF,
		0x23D1, 0x23DB,
		0x23E3, 0x23FF,
		0x2500, 0x259F,
		0x25A2, 0x25AD,
		0x25B8, 0x25BB,
		0x25C2, 0x25C5,
		0x25C8, 0x25C9,
		0x25CC, 0x25CE,
		0x25D4, 0x25E1,
		0x25E3, 0x25E3,
		0x25E5, 0x25E6,
		0x25ED, 0x25F7,
		0x2600, 0x2604,
		0x2607, 0x263F,
		0x2641, 0x2641,
		0x2643, 0x265F,
		0x2664, 0x266C,
		0x2670, 0x27BF,
		0x2B00, 0x2B2F,
		0x2B45, 0x2B46,
		0x2B4D, 0x2B73,
		0x2B76, 0x2B95,
		0x2B97, 0x2BFF,
		0x4DC0, 0x4DFF,
		0x1F000, 0x1F02B,
		0x1F030, 0x1F093,
		0x1F0A0, 0x1F0AE,
		0x1F0B1, 0x1F0BF,
		0x1F0C1, 0x1F0CF,
		0x1F0D1, 0x1F0F5,
		0x1F300, 0x1F6D7,
		0x1F6DC, 0x1F6EC,
		0x1F6F0, 0x1F6FC,
		0x1F700, 0x1F776,
		0x1F77B, 0x1F7D9,
		0x1F7E0, 0x1F7EB,
		0x1F7F0, 0x1F7F0,
		0x1F800, 0x1F80B,
		0x1F810, 0x1F847,
		0x1F850, 0x1F859,
		0x1F860, 0x1F887,
		0x1F890, 0x1F8AD,
		0x1F8B0, 0x1F8B1,
		0x1F900, 0x1FA53,
		0x1FA60, 0x1FA6D,
		0x1FA70, 0x1FA7C,
		0x1FA80, 0x1FA88,
		0x1FA90, 0x1FABD,
		0x1FABF, 0x1FAC5,
		0x1FACE, 0x1FADB,
		0x1FAE0, 0x1FAE8,
		0x1FAF0, 0x1FAF8,
		0x1FB00, 0x1FB92,
		0x1FB94, 0x1FBCA,
		0x1FBF0, 0x1FBF9,
	},
	translit = false,
	character_category = false, -- none
}

m["Zyyy"] = {
	"undetermined",
	104839687,
	-- This should not have any characters listed, probably
	translit = false,
	character_category = false, -- none
}

m["Zzzz"] = {
	"uncoded",
	104839675,
	-- This should not have any characters listed
	translit = false,
	character_category = false, -- none
}

-- These should be defined after the scripts they are composed of.

m["Hrkt"] = process_ranges{
	"Kana",
	187659,
	"syllabary",
	aliases = {"Japanese syllabaries"},
	ranges = union(
		m["Hira"].ranges,
		m["Kana"].ranges
	),
	spaces = false,
}

m["Jpan"] = process_ranges{
	"Japanese",
	190502,
	"logography, syllabary",
	ranges = union(
		m["Hrkt"].ranges,
		m["Hani"].ranges,
		m["Latn"].ranges
	),
	spaces = false,
	sort_by_scraping = true,
}

m["Kore"] = process_ranges{
	"Korean",
	711797,
	"logography, syllabary",
	ranges = union(
		m["Hang"].ranges,
		m["Hani"].ranges,
		m["Latn"].ranges
	),
	-- `漢字(한자)`→`漢字`
	-- `가-나-다`→`가나다`, `가--나--다`→`가-나-다`
	-- `온돌(溫突/溫堗)`→`온돌` ([[ondol]])
	strip_diacritics = {
		remove_diacritics = u(0x302E) .. u(0x302F),
		from = {"([" .. m["Hani"].characters .. "])%(.-%)", "^%-", "%-$", "%-(%-?)", "\1", "%([" .. m["Hani"].characters .. "/]+%)"},
		to = {"%1", "\1", "\1", "%1", "-"}
	}
}

--Constructed languages
m["Ayer"] = process_ranges{
	"Tahano Hikamu",
	nil,
	"abugida",
	ranges = {
		0x0041, 0x005A,
		0x0061, 0x007A,
		0x002A, 0x002A,
		0x00F1, 0x00F1,
		0x00D1, 0x00D1,
		0x0294, 0x0294,
		0x0259, 0x0259,
		0x018F, 0x018F,
		0xA736, 0xA737,
		0x0026, 0x0026,
		0x002B, 0x002D,
		0x005B, 0x005B,
		0x005D, 0x005D,
		0x00A8, 0x00A8,
		0x00AF, 0x00AF,
		0x00B2, 0x00B2,
		0x00B9, 0x00B9,
		0x02B0, 0x2B2,
		0x02C0, 0x02C0,
		0x02D0, 0x02D0,
	},
	character_category = false,
}

m["Jovl"] = process_ranges{
	"Jovlish",
	nil,
	"alphabet",
	ranges = {
		0x0041, 0x005A,
		0x0061, 0x007A,
		0x00AA, 0x00AA,
		0x00BA, 0x00BA,
		0x00C0, 0x00D6,
		0x00D8, 0x00F6,
		0x00F8, 0x02B8,
		0x022B, 0x022B,
		0x02C0, 0x02C1,
		0x02E0, 0x02E4,
		0x0363, 0x036F,
		0x039E, 0x039E,
		0x03A8, 0x03A8,
		0x03BE, 0x03BE,
		0x03C8, 0x03C8,
		0x0485, 0x0486,
		0x0951, 0x0952,
		0x10FB, 0x10FB,
		0x1D00, 0x1D25,
		0x1D2C, 0x1D5C,
		0x1D62, 0x1D65,
		0x1D6B, 0x1D77,
		0x1D79, 0x1DBE,
		0x1DF8, 0x1DF8,
		0x1E00, 0x1EFF,
		0x202F, 0x202F,
		0x2071, 0x2071,
		0x207F, 0x207F,
		0x2090, 0x209C,
		0x20F0, 0x20F0,
		0x2100, 0x2125,
		0x2128, 0x2128,
		0x212A, 0x2134,
		0x2139, 0x213B,
		0x2141, 0x214E,
		0x2160, 0x2188,
		0x2C60, 0x2C7F,
		0xA700, 0xA707,
		0xA722, 0xA787,
		0xA78B, 0xA7CD,
		0xA7D0, 0xA7D1,
		0xA7D3, 0xA7D3,
		0xA7D5, 0xA7DC,
		0xA7F2, 0xA7FF,
		0xA92E, 0xA92E,
		0xAB30, 0xAB5A,
		0xAB5C, 0xAB64,
		0xAB66, 0xAB69,
		0xFB00, 0xFB06,
		0xFF21, 0xFF3A,
		0xFF41, 0xFF5A,
		0x10780, 0x10785,
		0x10787, 0x107B0,
		0x107B2, 0x107BA,
		0x1DF00, 0x1DF1E,
		0x1DF25, 0x1DF2A,
	},
	character_category = false,
}

m["Gthv"] = process_ranges{
	"Gothevian",
	nil,
	"alphabet",
	ranges = {
	    0x0041, 0x005A,
	    0x0061, 0x007A,
	    0x00C1, 0x00C4,
	    0x00C8, 0x00CB,
	    0x00CD, 0x00CD,
	    0x00CF, 0x00CF,
	    0x00D2, 0x00D4,
	    0x00D6, 0x00D6,
	    0x00DA, 0x00DC,
	    0x00DD, 0x00DD,
	    0x00E1, 0x00E4,
	    0x00E8, 0x00EB,
	    0x00ED, 0x00ED,
	    0x00EF, 0x00EF,
	    0x00F2, 0x00F4,
	    0x00F6, 0x00F6,
	    0x00FA, 0x00FC,
	    0x00FD, 0x00FD,
	    0x00FF, 0x00FF,
	    0x0110, 0x0111,
	    0x0160, 0x0161,
	    0x0178, 0x0178,
	    0x017D, 0x017E,
	    0x0186, 0x0186,
	    0x0190, 0x0190,
	    0x0195, 0x0195,
	    0x01F6, 0x01F6,
	    0x0254, 0x0254,
	    0x025B, 0x025B,
	    0x0398, 0x0398,
	    0x039E, 0x039E,
	    0x03A8, 0x03A8,
	    0x03B8, 0x03B8,
	    0x03BE, 0x03BE,
	    0x03C8, 0x03C8,
	},
	character_category = false,
}

m["Roka"] = process_ranges{
	"Rokadong Curakjang",
	nil,
	"abugida",
	ranges = {
		0x0041, 0x005A,
		0x0061, 0x007A,
		0x0022, 0x0022,
		0x0027, 0x0027,
		0x002A, 0x002A,
		0x002D, 0x002D,
		0x005B, 0x005D,
		0x007B, 0x007B,
		0x007D, 0x007D
	},
	character_category = false,
}
m["Rsnold"] = process_ranges{
	"Old Raysian",
	nil,
	"alphabet",
	ranges = {
		0x0041, 0x007A
	},
	character_category = false,
}
m["Pann"] = process_ranges{
	"Pannonian",
	nil,
	"alphabet",
	ranges = {
		0x0041, 0x005A,
		0x0061, 0x007A,
		0x1D9C, 0x1D9D,
		0x1D47, 0x1D4B,
		0x02E1, 0x02E3,
		0x0410, 0x044F,
		0x0404, 0x0454,
		0x04AE, 0x04B1,
		0x0250, 0x0254,
		0x0265, 0x0278,
		0x028C, 0x028D,
		0x0224, 0x0225,
		0x01BA, 0x01BE,
		0x019A, 0x01A3,
		0x012D, 0x0131,
		0xA793, 0xA794
	},
	character_category = false,
}

m["Teul"] = process_ranges{
	"Teulgi",
	nil,
	"alphabet",
	ranges = m["Latn"].ranges,
	characters = m["Latn"].characters,
	character_category = false,
}

m["Tugv"] = process_ranges{
	"Tuġvut",
	nil,
	"alphabet",
	ranges = m["Latn"].ranges,
	characters = m["Latn"].characters,
	character_category = false,
}

m["Ucrn"] = process_ranges{
	"Draconian",
	nil,
	"alphabet",
	ranges = {
	    0x0020, 0x0021,
	    0x0023, 0x0023,
	    0x0027, 0x0027,
	    0x0030, 0x0034,
	    0x0040, 0x0040,
	    0x0047, 0x0048,
	    0x004B, 0x004B,
	    0x0050, 0x0050,
	    0x0058, 0x0058,
	    0x0066, 0x0067,
	    0x0069, 0x006A,
	    0x006F, 0x0072,
	    0x0079, 0x0079,
	    0x010D, 0x010D,
	    0x014B, 0x014B,
	    0x01A9, 0x01A9,
	    0x01E7, 0x01E7,
	    0x0238, 0x0238,
	    0x024F, 0x024F,
	    0x1EFA, 0x1EFB,
	};
	character_category = false,
}


return require("Module:languages").finalizeData(m, "script")