-- Zum Inhalt springen

-- Modul:Sort/utf8max2bytes

-- Faan Wikipedia

-- Die Dokumentation für dieses Modul kann unter Modul:Sort/utf8max2bytes/Doku erstellt werden

-- Version stamp of this data set; exported in the table as `failsafe`.
local Serial = "2018-03-26"
-- Numeric item identifier; exported in the table as `item`.
-- NOTE(review): presumably the Wikidata item of this module -- confirm.
local Item   = 50978956
--[=[
Sort/utf8max2bytes
mw.loadData() table with simplification for characters > 0x7FF

Layout of the returned table:
  * numeric keys  -- code point of a character above 0x7FF
  * string values -- the plain ASCII text that replaces that character
  * failsafe      -- the version stamp (Serial)
  * item          -- the item identifier (Item)

The table holds only numbers and strings.
NOTE(review): presumably consumed by the Sort module while building
sort keys -- confirm against the caller.
]=]
return {
-- Space characters, all reduced to an ASCII space
[  5760] = " ",  -- OGHAM SPACE MARK
[  8192] = " ",  -- EN QUAD
[  8193] = " ",  -- EM QUAD
[  8194] = " ",  -- EN SPACE
[  8195] = " ",  -- EM SPACE
[  8196] = " ",  -- THREE-PER-EM SPACE
[  8197] = " ",  -- FOUR-PER-EM SPACE
[  8198] = " ",  -- SIX-PER-EM SPACE
[  8199] = " ",  -- FIGURE SPACE
[  8200] = " ",  -- PUNCTUATION SPACE
[  8201] = " ",  -- THIN SPACE (thinsp)
[  8202] = " ",  -- HAIR SPACE (english typography)
[  8239] = " ",  -- NARROW NO-BREAK SPACE
[  8287] = " ",  -- MEDIUM MATHEMATICAL SPACE
[917536] = " ",  -- TAG SPACE
-- Hyphens, dashes and minus, all reduced to ASCII hyphen-minus
[  8208] = "-",  -- HYPHEN
[  8209] = "-",  -- NON-BREAKING HYPHEN
[  8210] = "-",  -- FIGURE DASH
[  8211] = "-",  -- EN DASH (ndash)
[  8212] = "-",  -- EM DASH (mdash)
[  8213] = "-",  -- HORIZONTAL BAR
[  8259] = "-",  -- HYPHEN BULLET
[  8722] = "-",  -- MINUS SIGN
-- Typographic single quotes, reduced to ASCII apostrophe
[  8216] = "'",  -- lsquo
[  8217] = "'",  -- rsquo
[  8218] = "'",  -- sbquo
[  8249] = "'",  -- lsaquo
[  8250] = "'",  -- rsaquo
-- Typographic double quotes, reduced to ASCII quotation mark
[  8220] = "\"", -- ldquo
[  8221] = "\"", -- rdquo
[  8222] = "\"", -- bdquo
-- 8260 is U+2044 FRACTION SLASH. The entry used to be keyed 8264, which is
-- U+2048 QUESTION EXCLAMATION MARK and must not be turned into a slash.
[  8260] = "/",  -- FRACTION SLASH
-- Latin letters with diacritics, reduced to their base letter
[  7840] = "A",  -- A with dot below
[  7841] = "a",  -- a with dot below
[  7842] = "A",  -- A with hook above
[  7843] = "a",  -- a with hook above
[  7844] = "A",  -- A with circumflex and acute
[  7845] = "a",  -- a with circumflex and acute
[  7846] = "A",  -- A with circumflex and grave
[  7847] = "a",  -- a with circumflex and grave
[  7848] = "A",  -- A with circumflex and hook above
[  7849] = "a",  -- a with circumflex and hook above
[  7850] = "A",  -- A with circumflex and tilde
[  7851] = "a",  -- a with circumflex and tilde
[  7852] = "A",  -- A with circumflex and dot below
[  7853] = "a",  -- a with circumflex and dot below
[  7854] = "A",  -- A with breve and acute
[  7855] = "a",  -- a with breve and acute
[  7856] = "A",  -- A with breve and grave
[  7857] = "a",  -- a with breve and grave
[  7858] = "A",  -- A with breve and hook above
[  7859] = "a",  -- a with breve and hook above
[  7860] = "A",  -- A with breve and tilde
[  7861] = "a",  -- a with breve and tilde
[  7862] = "A",  -- A with breve and dot below
[  7863] = "a",  -- a with breve and dot below
[  7864] = "E",  -- E with dot below
[  7865] = "e",  -- e with dot below
[  7866] = "E",  -- E with hook above
[  7867] = "e",  -- e with hook above
[  7868] = "E",  -- E with tilde
[  7869] = "e",  -- e with tilde
[  7870] = "E",  -- E with circumflex and acute
[  7871] = "e",  -- e with circumflex and acute
[  7872] = "E",  -- E with circumflex and grave
[  7873] = "e",  -- e with circumflex and grave
[  7874] = "E",  -- E with circumflex and hook above
[  7875] = "e",  -- e with circumflex and hook above
[  7876] = "E",  -- E with circumflex and tilde
[  7877] = "e",  -- e with circumflex and tilde
[  7878] = "E",  -- E with circumflex and dot below
[  7879] = "e",  -- e with circumflex and dot below
[  7880] = "I",  -- I with hook above
[  7881] = "i",  -- i with hook above
[  7882] = "I",  -- I with dot below
[  7883] = "i",  -- i with dot below
[  7884] = "O",  -- O with dot below
[  7885] = "o",  -- o with dot below
[  7886] = "O",  -- O with hook above
[  7887] = "o",  -- o with hook above
[  7888] = "O",  -- O with circumflex and acute
[  7889] = "o",  -- o with circumflex and acute
[  7890] = "O",  -- O with circumflex and grave
[  7891] = "o",  -- o with circumflex and grave
[  7892] = "O",  -- O with circumflex and hook above
[  7893] = "o",  -- o with circumflex and hook above
[  7894] = "O",  -- O with circumflex and tilde
[  7895] = "o",  -- o with circumflex and tilde
[  7896] = "O",  -- O with circumflex and dot below
[  7897] = "o",  -- o with circumflex and dot below
[  7898] = "O",  -- O with horn and acute
[  7899] = "o",  -- o with horn and acute
[  7900] = "O",  -- O with horn and grave
[  7901] = "o",  -- o with horn and grave
[  7902] = "O",  -- O with horn and hook above
[  7903] = "o",  -- o with horn and hook above
[  7904] = "O",  -- O with horn and tilde
[  7905] = "o",  -- o with horn and tilde
[  7906] = "O",  -- O with horn and dot below
[  7907] = "o",  -- o with horn and dot below
[  7838] = "SS", -- CAPITAL SHARP S (the only two-character replacement)
[  7908] = "U",  -- U with dot below
[  7909] = "u",  -- u with dot below
[  7910] = "U",  -- U with hook above
[  7911] = "u",  -- u with hook above
[  7912] = "U",  -- U with horn and acute
[  7913] = "u",  -- u with horn and acute
[  7914] = "U",  -- U with horn and grave
[  7915] = "u",  -- u with horn and grave
[  7916] = "U",  -- U with horn and hook above
[  7917] = "u",  -- u with horn and hook above
[  7918] = "U",  -- U with horn and tilde
[  7919] = "u",  -- u with horn and tilde
[  7920] = "U",  -- U with horn and dot below
[  7921] = "u",  -- u with horn and dot below
[  7922] = "Y",  -- Y with grave
[  7923] = "y",  -- y with grave
[  7924] = "Y",  -- Y with dot below
[  7925] = "y",  -- y with dot below
[  7926] = "Y",  -- Y with hook above
[  7927] = "y",  -- y with hook above
[  7928] = "Y",  -- Y with tilde
[  7929] = "y",  -- y with tilde
[  7932] = "V",  -- V (middle-welsh)
[  7933] = "v",  -- v (middle-welsh)
[  7934] = "Y",  -- Y with loop
[  7935] = "y",  -- y with loop
-- Ideographic space and punctuation, reduced to ASCII counterparts
[ 0x3000] = " ",   -- IDEOGRAPHIC SPACE
[ 0x3001] = ",",   -- IDEOGRAPHIC COMMA
[ 0x3002] = ".",   -- IDEOGRAPHIC FULL STOP
[ 0x303F] = " ",   -- IDEOGRAPHIC HALF FILL SPACE
-- Fullwidth forms 0xFF01..0xFF5E, each reduced to the ASCII character
-- of the same name
[ 0xFF01] = "!",   -- FULLWIDTH EXCLAMATION MARK
[ 0xFF02] = "\"",  -- FULLWIDTH QUOTATION MARK
[ 0xFF03] = "#",   -- FULLWIDTH NUMBER SIGN
[ 0xFF04] = "$",   -- FULLWIDTH DOLLAR SIGN
[ 0xFF05] = "%",   -- FULLWIDTH PERCENT SIGN
[ 0xFF06] = "&",   -- FULLWIDTH AMPERSAND
[ 0xFF07] = "'",   -- FULLWIDTH APOSTROPHE
[ 0xFF08] = "(",   -- FULLWIDTH LEFT PARENTHESIS
[ 0xFF09] = ")",   -- FULLWIDTH RIGHT PARENTHESIS
[ 0xFF0A] = "*",   -- FULLWIDTH ASTERISK
[ 0xFF0B] = "+",   -- FULLWIDTH PLUS SIGN
[ 0xFF0C] = ",",   -- FULLWIDTH COMMA
[ 0xFF0D] = "-",   -- FULLWIDTH HYPHEN-MINUS
[ 0xFF0E] = ".",   -- FULLWIDTH FULL STOP
[ 0xFF0F] = "/",   -- FULLWIDTH SOLIDUS
[ 0xFF10] = "0",   -- FULLWIDTH DIGIT ZERO
[ 0xFF11] = "1",   -- FULLWIDTH DIGIT ONE
[ 0xFF12] = "2",   -- FULLWIDTH DIGIT TWO
[ 0xFF13] = "3",   -- FULLWIDTH DIGIT THREE
[ 0xFF14] = "4",   -- FULLWIDTH DIGIT FOUR
[ 0xFF15] = "5",   -- FULLWIDTH DIGIT FIVE
[ 0xFF16] = "6",   -- FULLWIDTH DIGIT SIX
[ 0xFF17] = "7",   -- FULLWIDTH DIGIT SEVEN
[ 0xFF18] = "8",   -- FULLWIDTH DIGIT EIGHT
[ 0xFF19] = "9",   -- FULLWIDTH DIGIT NINE
[ 0xFF1A] = ":",   -- FULLWIDTH COLON
[ 0xFF1B] = ";",   -- FULLWIDTH SEMICOLON
[ 0xFF1C] = "<",   -- FULLWIDTH LESS-THAN SIGN
[ 0xFF1D] = "=",   -- FULLWIDTH EQUALS SIGN
[ 0xFF1E] = ">",   -- FULLWIDTH GREATER-THAN SIGN
[ 0xFF1F] = "?",   -- FULLWIDTH QUESTION MARK
[ 0xFF20] = "@",   -- FULLWIDTH COMMERCIAL AT
[ 0xFF21] = "A",   -- FULLWIDTH LATIN CAPITAL LETTER A
[ 0xFF22] = "B",   -- FULLWIDTH LATIN CAPITAL LETTER B
[ 0xFF23] = "C",   -- FULLWIDTH LATIN CAPITAL LETTER C
[ 0xFF24] = "D",   -- FULLWIDTH LATIN CAPITAL LETTER D
[ 0xFF25] = "E",   -- FULLWIDTH LATIN CAPITAL LETTER E
[ 0xFF26] = "F",   -- FULLWIDTH LATIN CAPITAL LETTER F
[ 0xFF27] = "G",   -- FULLWIDTH LATIN CAPITAL LETTER G
[ 0xFF28] = "H",   -- FULLWIDTH LATIN CAPITAL LETTER H
[ 0xFF29] = "I",   -- FULLWIDTH LATIN CAPITAL LETTER I
[ 0xFF2A] = "J",   -- FULLWIDTH LATIN CAPITAL LETTER J
[ 0xFF2B] = "K",   -- FULLWIDTH LATIN CAPITAL LETTER K
[ 0xFF2C] = "L",   -- FULLWIDTH LATIN CAPITAL LETTER L
[ 0xFF2D] = "M",   -- FULLWIDTH LATIN CAPITAL LETTER M
[ 0xFF2E] = "N",   -- FULLWIDTH LATIN CAPITAL LETTER N
[ 0xFF2F] = "O",   -- FULLWIDTH LATIN CAPITAL LETTER O
[ 0xFF30] = "P",   -- FULLWIDTH LATIN CAPITAL LETTER P
[ 0xFF31] = "Q",   -- FULLWIDTH LATIN CAPITAL LETTER Q
[ 0xFF32] = "R",   -- FULLWIDTH LATIN CAPITAL LETTER R
[ 0xFF33] = "S",   -- FULLWIDTH LATIN CAPITAL LETTER S
[ 0xFF34] = "T",   -- FULLWIDTH LATIN CAPITAL LETTER T
[ 0xFF35] = "U",   -- FULLWIDTH LATIN CAPITAL LETTER U
[ 0xFF36] = "V",   -- FULLWIDTH LATIN CAPITAL LETTER V
[ 0xFF37] = "W",   -- FULLWIDTH LATIN CAPITAL LETTER W
[ 0xFF38] = "X",   -- FULLWIDTH LATIN CAPITAL LETTER X
[ 0xFF39] = "Y",   -- FULLWIDTH LATIN CAPITAL LETTER Y
[ 0xFF3A] = "Z",   -- FULLWIDTH LATIN CAPITAL LETTER Z
[ 0xFF3B] = "[",   -- FULLWIDTH LEFT SQUARE BRACKET
[ 0xFF3C] = "\\",  -- FULLWIDTH REVERSE SOLIDUS
[ 0xFF3D] = "]",   -- FULLWIDTH RIGHT SQUARE BRACKET
[ 0xFF3E] = "^",   -- FULLWIDTH CIRCUMFLEX ACCENT
[ 0xFF3F] = "_",   -- FULLWIDTH LOW LINE
[ 0xFF40] = "`",   -- FULLWIDTH GRAVE ACCENT
[ 0xFF41] = "a",   -- FULLWIDTH LATIN SMALL LETTER A
[ 0xFF42] = "b",   -- FULLWIDTH LATIN SMALL LETTER B
[ 0xFF43] = "c",   -- FULLWIDTH LATIN SMALL LETTER C
[ 0xFF44] = "d",   -- FULLWIDTH LATIN SMALL LETTER D
[ 0xFF45] = "e",   -- FULLWIDTH LATIN SMALL LETTER E
[ 0xFF46] = "f",   -- FULLWIDTH LATIN SMALL LETTER F
[ 0xFF47] = "g",   -- FULLWIDTH LATIN SMALL LETTER G
[ 0xFF48] = "h",   -- FULLWIDTH LATIN SMALL LETTER H
[ 0xFF49] = "i",   -- FULLWIDTH LATIN SMALL LETTER I
[ 0xFF4A] = "j",   -- FULLWIDTH LATIN SMALL LETTER J
[ 0xFF4B] = "k",   -- FULLWIDTH LATIN SMALL LETTER K
[ 0xFF4C] = "l",   -- FULLWIDTH LATIN SMALL LETTER L
[ 0xFF4D] = "m",   -- FULLWIDTH LATIN SMALL LETTER M
[ 0xFF4E] = "n",   -- FULLWIDTH LATIN SMALL LETTER N
[ 0xFF4F] = "o",   -- FULLWIDTH LATIN SMALL LETTER O
[ 0xFF50] = "p",   -- FULLWIDTH LATIN SMALL LETTER P
[ 0xFF51] = "q",   -- FULLWIDTH LATIN SMALL LETTER Q
[ 0xFF52] = "r",   -- FULLWIDTH LATIN SMALL LETTER R
[ 0xFF53] = "s",   -- FULLWIDTH LATIN SMALL LETTER S
[ 0xFF54] = "t",   -- FULLWIDTH LATIN SMALL LETTER T
[ 0xFF55] = "u",   -- FULLWIDTH LATIN SMALL LETTER U
[ 0xFF56] = "v",   -- FULLWIDTH LATIN SMALL LETTER V
[ 0xFF57] = "w",   -- FULLWIDTH LATIN SMALL LETTER W
[ 0xFF58] = "x",   -- FULLWIDTH LATIN SMALL LETTER X
[ 0xFF59] = "y",   -- FULLWIDTH LATIN SMALL LETTER Y
[ 0xFF5A] = "z",   -- FULLWIDTH LATIN SMALL LETTER Z
[ 0xFF5B] = "{",   -- FULLWIDTH LEFT CURLY BRACKET
[ 0xFF5C] = "|",   -- FULLWIDTH VERTICAL LINE
[ 0xFF5D] = "}",   -- FULLWIDTH RIGHT CURLY BRACKET
[ 0xFF5E] = "~",   -- FULLWIDTH TILDE
-- Halfwidth ideographic punctuation
[ 0xFF61] = ".",   -- HALFWIDTH IDEOGRAPHIC FULL STOP
[ 0xFF64] = ",",   -- HALFWIDTH IDEOGRAPHIC COMMA
-- Metadata fields (string keys, so they cannot collide with code points)
failsafe = Serial,
item     = Item
};