Content deleted Content added
Cobaltcigs (talk | contribs) made it this far |
Cobaltcigs (talk | contribs) done unless i fell asleep and missed something in the CJK blocks, pls double-check |
||
Line 1:
--[[-----------------
Values that look like meaningless pass-through assignments actually have the purpose of forcing a dashed box
on printable characters that otherwise would not be identified as needing one. This avoids setting up a second config table for the box status.
The character U+1F3F7 LABEL actually looks like the tags in the Tags block. At least according to the standard. Reality will vary by font. See:
* https://www.unicode.org/charts/PDF/U1F300.pdf
* https://www.unicode.org/charts/PDF/UE0000.pdf
--]]-----------------
local display = {
-- Basic Latin
[0x0000] = "NUL",
Line 73 ⟶ 84:
[0x034F] = "CGJ ◌",
-- Arabic
[0x0600] =
[0x0601] =
[0x0602] =
[0x0603] =
[0x0604] =
[0x061C] = "ALM",
[0x06DD] =
-- Syriac
[0x070F] = mw.ustring.char(0x070F).."
-- Arabic Extended-A
[0x070F] =
-- Kannada
[0x0CF1] =
[0x0CF2] =
-- Malayalam
[0x0D4E] =
-- Tibetan
[0x0F0C] = mw.ustring.char(0x0F0C).."
-- Myanmar
[0x1039] =
-- Hangul Jamo
[0x115F] = "HC F",
Line 101 ⟶ 112:
[0x17B4] = "KIV AQ",
[0x17B5] = "KIV AA",
[0x17D2] =
-- Mongolian
[0x180B] = "FV S1",
Line 108 ⟶ 119:
[0x180E] = "MV S",
-- Tai Tham
[0x1A60] =
-- Vedic Extensions
[0x1CF5] =
[0x1CF6] =
-- General Punctuation
[0x2000] = "NQ SP",
Line 150 ⟶ 161:
[0x206F] = "NO DS",
-- Tifinagh
[0x2D7F] =
-- Supplemental Punctuation
[0x2E3A] = "2M
[0x2E3B] = "3M
-- CJK Symbols and Punctuation
[0x3000] = "ID SP", --whitespace anyway
-- Hangul Compatibility Jamo
[0x3164] = "HF",
-- Meetei Mayek Extensions
[0x3164] = mw.ustring.char(0x3164),
-- Variation Selectors
[0xFE00] = "VS 1",
[0xFE01] = "VS 2",
[0xFE02] = "VS 3",
[0xFE03] = "VS 4",
[0xFE04] = "VS 5",
[0xFE05] = "VS 6",
[0xFE06] = "VS 7",
[0xFE07] = "VS 8",
[0xFE08] = "VS 9",
[0xFE09] = "VS 10",
[0xFE0A] = "VS 11",
[0xFE0B] = "VS 12",
[0xFE0C] = "VS 13",
[0xFE0D] = "VS 14",
[0xFE0E] = "VS 15",
[0xFE0F] = "VS 16",
-- Arabic Presentation Forms-B
[0xFEFF] = "ZWN BSP",
-- Halfwidth and Fullwidth Forms
[0xFFA0] = "HW HF",
-- Specials
[0xFFF9] = "IA A",
[0xFFFA] = "IA S",
[0xFFFB] = "IA T",
[0xFFFC] = "OBJ",
-- Kharoshthi
[0x10A3F] = mw.ustring.char(0x10A3F),
-- Brahmi
[0x11003] = mw.ustring.char(0x11003),
[0x11004] = mw.ustring.char(0x11004),
[0x1107F] = "BNJ",
-- Kaithi
[0x110BD] = mw.ustring.char(0x110BD),
[0x110CD] = mw.ustring.char(0x110CD),
-- Chakma
[0x11133] = mw.ustring.char(0x11133),
-- Sharada
[0x111C2] = mw.ustring.char(0x111C2),
[0x111C3] = mw.ustring.char(0x111C3),
-- Zanabazar Square
[0x11A3A] = mw.ustring.char(0x11A3A),
[0x11A47] = mw.ustring.char(0x11A47),
-- Soyombo
[0x11A84] = mw.ustring.char(0x11A84),
[0x11A85] = mw.ustring.char(0x11A85),
[0x11A86] = mw.ustring.char(0x11A86),
[0x11A87] = mw.ustring.char(0x11A87),
[0x11A88] = mw.ustring.char(0x11A88),
[0x11A89] = mw.ustring.char(0x11A89),
[0x11A47] = mw.ustring.char(0x11A99),
-- Masaram Gondi
[0x11D45] = mw.ustring.char(0x11D45),
[0x11D46] = mw.ustring.char(0x11D46),
-- Gunjala Gondi
[0x11D97] = mw.ustring.char(0x11D97),
-- Egyptian Hieroglyph Format Controls
[0x13430] = mw.ustring.char(0x13430),
[0x13431] = mw.ustring.char(0x13431),
[0x13432] = mw.ustring.char(0x13432),
[0x13433] = mw.ustring.char(0x13433),
[0x13434] = mw.ustring.char(0x13434),
[0x13435] = mw.ustring.char(0x13435),
[0x13436] = mw.ustring.char(0x13436),
[0x13437] = mw.ustring.char(0x13437),
[0x13438] = mw.ustring.char(0x13438),
-- Miao
[0x16F8F] = mw.ustring.char(0x16F8F),
[0x16F90] = mw.ustring.char(0x16F90),
[0x16F91] = mw.ustring.char(0x16F91),
[0x16F92] = mw.ustring.char(0x16F92),
-- Duployan
[0x1BC9D] = "DT LS",
-- Shorthand Format Controls
[0x1BCA0] = "⇸",
[0x1BCA1] = "⮡", -- not a very good approximation of pdf glyph https://www.unicode.org/charts/PDF/U1BCA0.pdf
[0x1BCA2] = "↑",
[0x1BCA3] = "↓",
-- Musical Symbols
[0x1D159] = "NULL NOTE HEAD",
[0x1D173] = "BEGIN BEAM
[0x1D174] = "END BEAM",
[0x1D175] = "BEGIN TIE
[0x1D176] = "END TIE",
[0x1D177] = "BEGIN SLUR
[0x1D178] = "END SLUR",
[0x1D179] = "BEGIN PHR
[0x1D17A] = "END PHR.",
-- Sutton SignWriting
[0x1DA9B] = "SW F2",
[0x1DA9C] = "SW F3",
[0x1DA9D] = "SW F4",
[0x1DA9E] = "SW F5",
[0x1DA9F] = "SW F6",
[0x1DAA1] = "SW R2",
[0x1DAA2] = "SW R3",
[0x1DAA3] = "SW R4",
[0x1DAA4] = "SW R5",
[0x1DAA5] = "SW R6",
[0x1DAA6] = "SW R7",
[0x1DAA7] = "SW R8",
[0x1DAA8] = "SW R9",
[0x1DAA9] = "SW R10",
[0x1DAAA] = "SW R11",
[0x1DAAB] = "SW R12",
[0x1DAAC] = "SW R13",
[0x1DAAD] = "SW R14",
[0x1DAAE] = "SW R15",
[0x1DAAF] = "SW R16",
-- Enclosed Alphanumeric Supplement
[0x1F1E6] = mw.ustring.char(0x1F1E6),
[0x1F1E7] = mw.ustring.char(0x1F1E7),
[0x1F1E8] = mw.ustring.char(0x1F1E8),
[0x1F1E9] = mw.ustring.char(0x1F1E9),
[0x1F1EA] = mw.ustring.char(0x1F1EA),
[0x1F1EB] = mw.ustring.char(0x1F1EB),
[0x1F1EC] = mw.ustring.char(0x1F1EC),
[0x1F1ED] = mw.ustring.char(0x1F1ED),
[0x1F1EE] = mw.ustring.char(0x1F1EE),
[0x1F1EF] = mw.ustring.char(0x1F1EF),
[0x1F1F0] = mw.ustring.char(0x1F1F0),
[0x1F1F1] = mw.ustring.char(0x1F1F1),
[0x1F1F2] = mw.ustring.char(0x1F1F2),
[0x1F1F3] = mw.ustring.char(0x1F1F3),
[0x1F1F4] = mw.ustring.char(0x1F1F4),
[0x1F1F5] = mw.ustring.char(0x1F1F5),
[0x1F1F6] = mw.ustring.char(0x1F1F6),
[0x1F1F7] = mw.ustring.char(0x1F1F7),
[0x1F1F8] = mw.ustring.char(0x1F1F8),
[0x1F1F9] = mw.ustring.char(0x1F1F9),
[0x1F1FA] = mw.ustring.char(0x1F1FA),
[0x1F1FB] = mw.ustring.char(0x1F1FB),
[0x1F1FC] = mw.ustring.char(0x1F1FC),
[0x1F1FD] = mw.ustring.char(0x1F1FD),
[0x1F1FE] = mw.ustring.char(0x1F1FE),
[0x1F1FF] = mw.ustring.char(0x1F1FF),
}
-- Tags
local tag = ' '..mw.ustring.char(0x1F3F7)
display[0xE0001] = "BEGIN"..tag
display[0xE0020] = "SP"..tag
for n = 0xE0021,0xE007F do display[n] = (string.char(n-0xE0000)..tag) end
-- Variation Selectors Supplement
for n = 0xE0100,0x0E01EF do display[n] = "VS "..(n-0xE00EF) end
return display
|