prism 0.13.0

Sign up to get free protection for your applications and to get access to all the features.
Files changed (95) hide show
  1. checksums.yaml +7 -0
  2. data/CHANGELOG.md +172 -0
  3. data/CODE_OF_CONDUCT.md +76 -0
  4. data/CONTRIBUTING.md +62 -0
  5. data/LICENSE.md +7 -0
  6. data/Makefile +84 -0
  7. data/README.md +89 -0
  8. data/config.yml +2481 -0
  9. data/docs/build_system.md +74 -0
  10. data/docs/building.md +22 -0
  11. data/docs/configuration.md +60 -0
  12. data/docs/design.md +53 -0
  13. data/docs/encoding.md +117 -0
  14. data/docs/fuzzing.md +93 -0
  15. data/docs/heredocs.md +36 -0
  16. data/docs/mapping.md +117 -0
  17. data/docs/ripper.md +36 -0
  18. data/docs/ruby_api.md +25 -0
  19. data/docs/serialization.md +181 -0
  20. data/docs/testing.md +55 -0
  21. data/ext/prism/api_node.c +4725 -0
  22. data/ext/prism/api_pack.c +256 -0
  23. data/ext/prism/extconf.rb +136 -0
  24. data/ext/prism/extension.c +626 -0
  25. data/ext/prism/extension.h +18 -0
  26. data/include/prism/ast.h +1932 -0
  27. data/include/prism/defines.h +45 -0
  28. data/include/prism/diagnostic.h +231 -0
  29. data/include/prism/enc/pm_encoding.h +95 -0
  30. data/include/prism/node.h +41 -0
  31. data/include/prism/pack.h +141 -0
  32. data/include/prism/parser.h +418 -0
  33. data/include/prism/regexp.h +19 -0
  34. data/include/prism/unescape.h +48 -0
  35. data/include/prism/util/pm_buffer.h +51 -0
  36. data/include/prism/util/pm_char.h +91 -0
  37. data/include/prism/util/pm_constant_pool.h +78 -0
  38. data/include/prism/util/pm_list.h +67 -0
  39. data/include/prism/util/pm_memchr.h +14 -0
  40. data/include/prism/util/pm_newline_list.h +61 -0
  41. data/include/prism/util/pm_state_stack.h +24 -0
  42. data/include/prism/util/pm_string.h +61 -0
  43. data/include/prism/util/pm_string_list.h +25 -0
  44. data/include/prism/util/pm_strpbrk.h +29 -0
  45. data/include/prism/version.h +4 -0
  46. data/include/prism.h +82 -0
  47. data/lib/prism/compiler.rb +465 -0
  48. data/lib/prism/debug.rb +157 -0
  49. data/lib/prism/desugar_compiler.rb +206 -0
  50. data/lib/prism/dispatcher.rb +2051 -0
  51. data/lib/prism/dsl.rb +750 -0
  52. data/lib/prism/ffi.rb +251 -0
  53. data/lib/prism/lex_compat.rb +838 -0
  54. data/lib/prism/mutation_compiler.rb +718 -0
  55. data/lib/prism/node.rb +14540 -0
  56. data/lib/prism/node_ext.rb +55 -0
  57. data/lib/prism/node_inspector.rb +68 -0
  58. data/lib/prism/pack.rb +185 -0
  59. data/lib/prism/parse_result/comments.rb +172 -0
  60. data/lib/prism/parse_result/newlines.rb +60 -0
  61. data/lib/prism/parse_result.rb +266 -0
  62. data/lib/prism/pattern.rb +239 -0
  63. data/lib/prism/ripper_compat.rb +174 -0
  64. data/lib/prism/serialize.rb +662 -0
  65. data/lib/prism/visitor.rb +470 -0
  66. data/lib/prism.rb +64 -0
  67. data/prism.gemspec +113 -0
  68. data/src/diagnostic.c +287 -0
  69. data/src/enc/pm_big5.c +52 -0
  70. data/src/enc/pm_euc_jp.c +58 -0
  71. data/src/enc/pm_gbk.c +61 -0
  72. data/src/enc/pm_shift_jis.c +56 -0
  73. data/src/enc/pm_tables.c +507 -0
  74. data/src/enc/pm_unicode.c +2324 -0
  75. data/src/enc/pm_windows_31j.c +56 -0
  76. data/src/node.c +2633 -0
  77. data/src/pack.c +493 -0
  78. data/src/prettyprint.c +2136 -0
  79. data/src/prism.c +14587 -0
  80. data/src/regexp.c +580 -0
  81. data/src/serialize.c +1899 -0
  82. data/src/token_type.c +349 -0
  83. data/src/unescape.c +637 -0
  84. data/src/util/pm_buffer.c +103 -0
  85. data/src/util/pm_char.c +272 -0
  86. data/src/util/pm_constant_pool.c +252 -0
  87. data/src/util/pm_list.c +41 -0
  88. data/src/util/pm_memchr.c +33 -0
  89. data/src/util/pm_newline_list.c +134 -0
  90. data/src/util/pm_state_stack.c +19 -0
  91. data/src/util/pm_string.c +200 -0
  92. data/src/util/pm_string_list.c +29 -0
  93. data/src/util/pm_strncasecmp.c +17 -0
  94. data/src/util/pm_strpbrk.c +66 -0
  95. metadata +138 -0
@@ -0,0 +1,2324 @@
1
+ // Note that the UTF-8 decoding code is based on Bjoern Hoehrmann's UTF-8 DFA
2
+ // decoder. See http://bjoern.hoehrmann.de/utf-8/decoder/dfa/ for details.
3
+
4
+ #include "prism/enc/pm_encoding.h"
5
+
6
+ typedef uint32_t pm_unicode_codepoint_t;
7
+
8
+ // Each element of the following table contains a bitfield that indicates a
9
+ // piece of information about the corresponding unicode codepoint. Note that
10
+ // this table is different from other encodings where we used a lookup table
11
+ // because the indices of those tables are the byte representations, not the
12
+ // codepoints themselves.
13
+ const uint8_t pm_encoding_unicode_table[256] = {
14
+ // 0 1 2 3 4 5 6 7 8 9 A B C D E F
15
+ 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, // 0x
16
+ 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, // 1x
17
+ 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, // 2x
18
+ 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 0, 0, 0, 0, 0, 0, // 3x
19
+ 0, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, // 4x
20
+ 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 0, 0, 0, 0, 0, // 5x
21
+ 0, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, // 6x
22
+ 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 0, 0, 0, 0, 0, // 7x
23
+ 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, // 8x
24
+ 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, // 9x
25
+ 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 3, 0, 0, 0, 0, 0, // Ax
26
+ 0, 0, 0, 0, 0, 3, 0, 0, 0, 0, 3, 0, 0, 0, 0, 0, // Bx
27
+ 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, // Cx
28
+ 7, 7, 7, 7, 7, 7, 7, 0, 7, 7, 7, 7, 7, 7, 7, 3, // Dx
29
+ 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, // Ex
30
+ 3, 3, 3, 3, 3, 3, 3, 0, 3, 3, 3, 3, 3, 3, 3, 3, // Fx
31
+ };
32
+
33
+ #define UNICODE_ALPHA_CODEPOINTS_LENGTH 1450
34
+ static const pm_unicode_codepoint_t unicode_alpha_codepoints[UNICODE_ALPHA_CODEPOINTS_LENGTH] = {
35
+ 0x100, 0x2C1,
36
+ 0x2C6, 0x2D1,
37
+ 0x2E0, 0x2E4,
38
+ 0x2EC, 0x2EC,
39
+ 0x2EE, 0x2EE,
40
+ 0x345, 0x345,
41
+ 0x370, 0x374,
42
+ 0x376, 0x377,
43
+ 0x37A, 0x37D,
44
+ 0x37F, 0x37F,
45
+ 0x386, 0x386,
46
+ 0x388, 0x38A,
47
+ 0x38C, 0x38C,
48
+ 0x38E, 0x3A1,
49
+ 0x3A3, 0x3F5,
50
+ 0x3F7, 0x481,
51
+ 0x48A, 0x52F,
52
+ 0x531, 0x556,
53
+ 0x559, 0x559,
54
+ 0x560, 0x588,
55
+ 0x5B0, 0x5BD,
56
+ 0x5BF, 0x5BF,
57
+ 0x5C1, 0x5C2,
58
+ 0x5C4, 0x5C5,
59
+ 0x5C7, 0x5C7,
60
+ 0x5D0, 0x5EA,
61
+ 0x5EF, 0x5F2,
62
+ 0x610, 0x61A,
63
+ 0x620, 0x657,
64
+ 0x659, 0x65F,
65
+ 0x66E, 0x6D3,
66
+ 0x6D5, 0x6DC,
67
+ 0x6E1, 0x6E8,
68
+ 0x6ED, 0x6EF,
69
+ 0x6FA, 0x6FC,
70
+ 0x6FF, 0x6FF,
71
+ 0x710, 0x73F,
72
+ 0x74D, 0x7B1,
73
+ 0x7CA, 0x7EA,
74
+ 0x7F4, 0x7F5,
75
+ 0x7FA, 0x7FA,
76
+ 0x800, 0x817,
77
+ 0x81A, 0x82C,
78
+ 0x840, 0x858,
79
+ 0x860, 0x86A,
80
+ 0x870, 0x887,
81
+ 0x889, 0x88E,
82
+ 0x8A0, 0x8C9,
83
+ 0x8D4, 0x8DF,
84
+ 0x8E3, 0x8E9,
85
+ 0x8F0, 0x93B,
86
+ 0x93D, 0x94C,
87
+ 0x94E, 0x950,
88
+ 0x955, 0x963,
89
+ 0x971, 0x983,
90
+ 0x985, 0x98C,
91
+ 0x98F, 0x990,
92
+ 0x993, 0x9A8,
93
+ 0x9AA, 0x9B0,
94
+ 0x9B2, 0x9B2,
95
+ 0x9B6, 0x9B9,
96
+ 0x9BD, 0x9C4,
97
+ 0x9C7, 0x9C8,
98
+ 0x9CB, 0x9CC,
99
+ 0x9CE, 0x9CE,
100
+ 0x9D7, 0x9D7,
101
+ 0x9DC, 0x9DD,
102
+ 0x9DF, 0x9E3,
103
+ 0x9F0, 0x9F1,
104
+ 0x9FC, 0x9FC,
105
+ 0xA01, 0xA03,
106
+ 0xA05, 0xA0A,
107
+ 0xA0F, 0xA10,
108
+ 0xA13, 0xA28,
109
+ 0xA2A, 0xA30,
110
+ 0xA32, 0xA33,
111
+ 0xA35, 0xA36,
112
+ 0xA38, 0xA39,
113
+ 0xA3E, 0xA42,
114
+ 0xA47, 0xA48,
115
+ 0xA4B, 0xA4C,
116
+ 0xA51, 0xA51,
117
+ 0xA59, 0xA5C,
118
+ 0xA5E, 0xA5E,
119
+ 0xA70, 0xA75,
120
+ 0xA81, 0xA83,
121
+ 0xA85, 0xA8D,
122
+ 0xA8F, 0xA91,
123
+ 0xA93, 0xAA8,
124
+ 0xAAA, 0xAB0,
125
+ 0xAB2, 0xAB3,
126
+ 0xAB5, 0xAB9,
127
+ 0xABD, 0xAC5,
128
+ 0xAC7, 0xAC9,
129
+ 0xACB, 0xACC,
130
+ 0xAD0, 0xAD0,
131
+ 0xAE0, 0xAE3,
132
+ 0xAF9, 0xAFC,
133
+ 0xB01, 0xB03,
134
+ 0xB05, 0xB0C,
135
+ 0xB0F, 0xB10,
136
+ 0xB13, 0xB28,
137
+ 0xB2A, 0xB30,
138
+ 0xB32, 0xB33,
139
+ 0xB35, 0xB39,
140
+ 0xB3D, 0xB44,
141
+ 0xB47, 0xB48,
142
+ 0xB4B, 0xB4C,
143
+ 0xB56, 0xB57,
144
+ 0xB5C, 0xB5D,
145
+ 0xB5F, 0xB63,
146
+ 0xB71, 0xB71,
147
+ 0xB82, 0xB83,
148
+ 0xB85, 0xB8A,
149
+ 0xB8E, 0xB90,
150
+ 0xB92, 0xB95,
151
+ 0xB99, 0xB9A,
152
+ 0xB9C, 0xB9C,
153
+ 0xB9E, 0xB9F,
154
+ 0xBA3, 0xBA4,
155
+ 0xBA8, 0xBAA,
156
+ 0xBAE, 0xBB9,
157
+ 0xBBE, 0xBC2,
158
+ 0xBC6, 0xBC8,
159
+ 0xBCA, 0xBCC,
160
+ 0xBD0, 0xBD0,
161
+ 0xBD7, 0xBD7,
162
+ 0xC00, 0xC0C,
163
+ 0xC0E, 0xC10,
164
+ 0xC12, 0xC28,
165
+ 0xC2A, 0xC39,
166
+ 0xC3D, 0xC44,
167
+ 0xC46, 0xC48,
168
+ 0xC4A, 0xC4C,
169
+ 0xC55, 0xC56,
170
+ 0xC58, 0xC5A,
171
+ 0xC5D, 0xC5D,
172
+ 0xC60, 0xC63,
173
+ 0xC80, 0xC83,
174
+ 0xC85, 0xC8C,
175
+ 0xC8E, 0xC90,
176
+ 0xC92, 0xCA8,
177
+ 0xCAA, 0xCB3,
178
+ 0xCB5, 0xCB9,
179
+ 0xCBD, 0xCC4,
180
+ 0xCC6, 0xCC8,
181
+ 0xCCA, 0xCCC,
182
+ 0xCD5, 0xCD6,
183
+ 0xCDD, 0xCDE,
184
+ 0xCE0, 0xCE3,
185
+ 0xCF1, 0xCF3,
186
+ 0xD00, 0xD0C,
187
+ 0xD0E, 0xD10,
188
+ 0xD12, 0xD3A,
189
+ 0xD3D, 0xD44,
190
+ 0xD46, 0xD48,
191
+ 0xD4A, 0xD4C,
192
+ 0xD4E, 0xD4E,
193
+ 0xD54, 0xD57,
194
+ 0xD5F, 0xD63,
195
+ 0xD7A, 0xD7F,
196
+ 0xD81, 0xD83,
197
+ 0xD85, 0xD96,
198
+ 0xD9A, 0xDB1,
199
+ 0xDB3, 0xDBB,
200
+ 0xDBD, 0xDBD,
201
+ 0xDC0, 0xDC6,
202
+ 0xDCF, 0xDD4,
203
+ 0xDD6, 0xDD6,
204
+ 0xDD8, 0xDDF,
205
+ 0xDF2, 0xDF3,
206
+ 0xE01, 0xE3A,
207
+ 0xE40, 0xE46,
208
+ 0xE4D, 0xE4D,
209
+ 0xE81, 0xE82,
210
+ 0xE84, 0xE84,
211
+ 0xE86, 0xE8A,
212
+ 0xE8C, 0xEA3,
213
+ 0xEA5, 0xEA5,
214
+ 0xEA7, 0xEB9,
215
+ 0xEBB, 0xEBD,
216
+ 0xEC0, 0xEC4,
217
+ 0xEC6, 0xEC6,
218
+ 0xECD, 0xECD,
219
+ 0xEDC, 0xEDF,
220
+ 0xF00, 0xF00,
221
+ 0xF40, 0xF47,
222
+ 0xF49, 0xF6C,
223
+ 0xF71, 0xF83,
224
+ 0xF88, 0xF97,
225
+ 0xF99, 0xFBC,
226
+ 0x1000, 0x1036,
227
+ 0x1038, 0x1038,
228
+ 0x103B, 0x103F,
229
+ 0x1050, 0x108F,
230
+ 0x109A, 0x109D,
231
+ 0x10A0, 0x10C5,
232
+ 0x10C7, 0x10C7,
233
+ 0x10CD, 0x10CD,
234
+ 0x10D0, 0x10FA,
235
+ 0x10FC, 0x1248,
236
+ 0x124A, 0x124D,
237
+ 0x1250, 0x1256,
238
+ 0x1258, 0x1258,
239
+ 0x125A, 0x125D,
240
+ 0x1260, 0x1288,
241
+ 0x128A, 0x128D,
242
+ 0x1290, 0x12B0,
243
+ 0x12B2, 0x12B5,
244
+ 0x12B8, 0x12BE,
245
+ 0x12C0, 0x12C0,
246
+ 0x12C2, 0x12C5,
247
+ 0x12C8, 0x12D6,
248
+ 0x12D8, 0x1310,
249
+ 0x1312, 0x1315,
250
+ 0x1318, 0x135A,
251
+ 0x1380, 0x138F,
252
+ 0x13A0, 0x13F5,
253
+ 0x13F8, 0x13FD,
254
+ 0x1401, 0x166C,
255
+ 0x166F, 0x167F,
256
+ 0x1681, 0x169A,
257
+ 0x16A0, 0x16EA,
258
+ 0x16EE, 0x16F8,
259
+ 0x1700, 0x1713,
260
+ 0x171F, 0x1733,
261
+ 0x1740, 0x1753,
262
+ 0x1760, 0x176C,
263
+ 0x176E, 0x1770,
264
+ 0x1772, 0x1773,
265
+ 0x1780, 0x17B3,
266
+ 0x17B6, 0x17C8,
267
+ 0x17D7, 0x17D7,
268
+ 0x17DC, 0x17DC,
269
+ 0x1820, 0x1878,
270
+ 0x1880, 0x18AA,
271
+ 0x18B0, 0x18F5,
272
+ 0x1900, 0x191E,
273
+ 0x1920, 0x192B,
274
+ 0x1930, 0x1938,
275
+ 0x1950, 0x196D,
276
+ 0x1970, 0x1974,
277
+ 0x1980, 0x19AB,
278
+ 0x19B0, 0x19C9,
279
+ 0x1A00, 0x1A1B,
280
+ 0x1A20, 0x1A5E,
281
+ 0x1A61, 0x1A74,
282
+ 0x1AA7, 0x1AA7,
283
+ 0x1ABF, 0x1AC0,
284
+ 0x1ACC, 0x1ACE,
285
+ 0x1B00, 0x1B33,
286
+ 0x1B35, 0x1B43,
287
+ 0x1B45, 0x1B4C,
288
+ 0x1B80, 0x1BA9,
289
+ 0x1BAC, 0x1BAF,
290
+ 0x1BBA, 0x1BE5,
291
+ 0x1BE7, 0x1BF1,
292
+ 0x1C00, 0x1C36,
293
+ 0x1C4D, 0x1C4F,
294
+ 0x1C5A, 0x1C7D,
295
+ 0x1C80, 0x1C88,
296
+ 0x1C90, 0x1CBA,
297
+ 0x1CBD, 0x1CBF,
298
+ 0x1CE9, 0x1CEC,
299
+ 0x1CEE, 0x1CF3,
300
+ 0x1CF5, 0x1CF6,
301
+ 0x1CFA, 0x1CFA,
302
+ 0x1D00, 0x1DBF,
303
+ 0x1DE7, 0x1DF4,
304
+ 0x1E00, 0x1F15,
305
+ 0x1F18, 0x1F1D,
306
+ 0x1F20, 0x1F45,
307
+ 0x1F48, 0x1F4D,
308
+ 0x1F50, 0x1F57,
309
+ 0x1F59, 0x1F59,
310
+ 0x1F5B, 0x1F5B,
311
+ 0x1F5D, 0x1F5D,
312
+ 0x1F5F, 0x1F7D,
313
+ 0x1F80, 0x1FB4,
314
+ 0x1FB6, 0x1FBC,
315
+ 0x1FBE, 0x1FBE,
316
+ 0x1FC2, 0x1FC4,
317
+ 0x1FC6, 0x1FCC,
318
+ 0x1FD0, 0x1FD3,
319
+ 0x1FD6, 0x1FDB,
320
+ 0x1FE0, 0x1FEC,
321
+ 0x1FF2, 0x1FF4,
322
+ 0x1FF6, 0x1FFC,
323
+ 0x2071, 0x2071,
324
+ 0x207F, 0x207F,
325
+ 0x2090, 0x209C,
326
+ 0x2102, 0x2102,
327
+ 0x2107, 0x2107,
328
+ 0x210A, 0x2113,
329
+ 0x2115, 0x2115,
330
+ 0x2119, 0x211D,
331
+ 0x2124, 0x2124,
332
+ 0x2126, 0x2126,
333
+ 0x2128, 0x2128,
334
+ 0x212A, 0x212D,
335
+ 0x212F, 0x2139,
336
+ 0x213C, 0x213F,
337
+ 0x2145, 0x2149,
338
+ 0x214E, 0x214E,
339
+ 0x2160, 0x2188,
340
+ 0x24B6, 0x24E9,
341
+ 0x2C00, 0x2CE4,
342
+ 0x2CEB, 0x2CEE,
343
+ 0x2CF2, 0x2CF3,
344
+ 0x2D00, 0x2D25,
345
+ 0x2D27, 0x2D27,
346
+ 0x2D2D, 0x2D2D,
347
+ 0x2D30, 0x2D67,
348
+ 0x2D6F, 0x2D6F,
349
+ 0x2D80, 0x2D96,
350
+ 0x2DA0, 0x2DA6,
351
+ 0x2DA8, 0x2DAE,
352
+ 0x2DB0, 0x2DB6,
353
+ 0x2DB8, 0x2DBE,
354
+ 0x2DC0, 0x2DC6,
355
+ 0x2DC8, 0x2DCE,
356
+ 0x2DD0, 0x2DD6,
357
+ 0x2DD8, 0x2DDE,
358
+ 0x2DE0, 0x2DFF,
359
+ 0x2E2F, 0x2E2F,
360
+ 0x3005, 0x3007,
361
+ 0x3021, 0x3029,
362
+ 0x3031, 0x3035,
363
+ 0x3038, 0x303C,
364
+ 0x3041, 0x3096,
365
+ 0x309D, 0x309F,
366
+ 0x30A1, 0x30FA,
367
+ 0x30FC, 0x30FF,
368
+ 0x3105, 0x312F,
369
+ 0x3131, 0x318E,
370
+ 0x31A0, 0x31BF,
371
+ 0x31F0, 0x31FF,
372
+ 0x3400, 0x4DBF,
373
+ 0x4E00, 0xA48C,
374
+ 0xA4D0, 0xA4FD,
375
+ 0xA500, 0xA60C,
376
+ 0xA610, 0xA61F,
377
+ 0xA62A, 0xA62B,
378
+ 0xA640, 0xA66E,
379
+ 0xA674, 0xA67B,
380
+ 0xA67F, 0xA6EF,
381
+ 0xA717, 0xA71F,
382
+ 0xA722, 0xA788,
383
+ 0xA78B, 0xA7CA,
384
+ 0xA7D0, 0xA7D1,
385
+ 0xA7D3, 0xA7D3,
386
+ 0xA7D5, 0xA7D9,
387
+ 0xA7F2, 0xA805,
388
+ 0xA807, 0xA827,
389
+ 0xA840, 0xA873,
390
+ 0xA880, 0xA8C3,
391
+ 0xA8C5, 0xA8C5,
392
+ 0xA8F2, 0xA8F7,
393
+ 0xA8FB, 0xA8FB,
394
+ 0xA8FD, 0xA8FF,
395
+ 0xA90A, 0xA92A,
396
+ 0xA930, 0xA952,
397
+ 0xA960, 0xA97C,
398
+ 0xA980, 0xA9B2,
399
+ 0xA9B4, 0xA9BF,
400
+ 0xA9CF, 0xA9CF,
401
+ 0xA9E0, 0xA9EF,
402
+ 0xA9FA, 0xA9FE,
403
+ 0xAA00, 0xAA36,
404
+ 0xAA40, 0xAA4D,
405
+ 0xAA60, 0xAA76,
406
+ 0xAA7A, 0xAABE,
407
+ 0xAAC0, 0xAAC0,
408
+ 0xAAC2, 0xAAC2,
409
+ 0xAADB, 0xAADD,
410
+ 0xAAE0, 0xAAEF,
411
+ 0xAAF2, 0xAAF5,
412
+ 0xAB01, 0xAB06,
413
+ 0xAB09, 0xAB0E,
414
+ 0xAB11, 0xAB16,
415
+ 0xAB20, 0xAB26,
416
+ 0xAB28, 0xAB2E,
417
+ 0xAB30, 0xAB5A,
418
+ 0xAB5C, 0xAB69,
419
+ 0xAB70, 0xABEA,
420
+ 0xAC00, 0xD7A3,
421
+ 0xD7B0, 0xD7C6,
422
+ 0xD7CB, 0xD7FB,
423
+ 0xF900, 0xFA6D,
424
+ 0xFA70, 0xFAD9,
425
+ 0xFB00, 0xFB06,
426
+ 0xFB13, 0xFB17,
427
+ 0xFB1D, 0xFB28,
428
+ 0xFB2A, 0xFB36,
429
+ 0xFB38, 0xFB3C,
430
+ 0xFB3E, 0xFB3E,
431
+ 0xFB40, 0xFB41,
432
+ 0xFB43, 0xFB44,
433
+ 0xFB46, 0xFBB1,
434
+ 0xFBD3, 0xFD3D,
435
+ 0xFD50, 0xFD8F,
436
+ 0xFD92, 0xFDC7,
437
+ 0xFDF0, 0xFDFB,
438
+ 0xFE70, 0xFE74,
439
+ 0xFE76, 0xFEFC,
440
+ 0xFF21, 0xFF3A,
441
+ 0xFF41, 0xFF5A,
442
+ 0xFF66, 0xFFBE,
443
+ 0xFFC2, 0xFFC7,
444
+ 0xFFCA, 0xFFCF,
445
+ 0xFFD2, 0xFFD7,
446
+ 0xFFDA, 0xFFDC,
447
+ 0x10000, 0x1000B,
448
+ 0x1000D, 0x10026,
449
+ 0x10028, 0x1003A,
450
+ 0x1003C, 0x1003D,
451
+ 0x1003F, 0x1004D,
452
+ 0x10050, 0x1005D,
453
+ 0x10080, 0x100FA,
454
+ 0x10140, 0x10174,
455
+ 0x10280, 0x1029C,
456
+ 0x102A0, 0x102D0,
457
+ 0x10300, 0x1031F,
458
+ 0x1032D, 0x1034A,
459
+ 0x10350, 0x1037A,
460
+ 0x10380, 0x1039D,
461
+ 0x103A0, 0x103C3,
462
+ 0x103C8, 0x103CF,
463
+ 0x103D1, 0x103D5,
464
+ 0x10400, 0x1049D,
465
+ 0x104B0, 0x104D3,
466
+ 0x104D8, 0x104FB,
467
+ 0x10500, 0x10527,
468
+ 0x10530, 0x10563,
469
+ 0x10570, 0x1057A,
470
+ 0x1057C, 0x1058A,
471
+ 0x1058C, 0x10592,
472
+ 0x10594, 0x10595,
473
+ 0x10597, 0x105A1,
474
+ 0x105A3, 0x105B1,
475
+ 0x105B3, 0x105B9,
476
+ 0x105BB, 0x105BC,
477
+ 0x10600, 0x10736,
478
+ 0x10740, 0x10755,
479
+ 0x10760, 0x10767,
480
+ 0x10780, 0x10785,
481
+ 0x10787, 0x107B0,
482
+ 0x107B2, 0x107BA,
483
+ 0x10800, 0x10805,
484
+ 0x10808, 0x10808,
485
+ 0x1080A, 0x10835,
486
+ 0x10837, 0x10838,
487
+ 0x1083C, 0x1083C,
488
+ 0x1083F, 0x10855,
489
+ 0x10860, 0x10876,
490
+ 0x10880, 0x1089E,
491
+ 0x108E0, 0x108F2,
492
+ 0x108F4, 0x108F5,
493
+ 0x10900, 0x10915,
494
+ 0x10920, 0x10939,
495
+ 0x10980, 0x109B7,
496
+ 0x109BE, 0x109BF,
497
+ 0x10A00, 0x10A03,
498
+ 0x10A05, 0x10A06,
499
+ 0x10A0C, 0x10A13,
500
+ 0x10A15, 0x10A17,
501
+ 0x10A19, 0x10A35,
502
+ 0x10A60, 0x10A7C,
503
+ 0x10A80, 0x10A9C,
504
+ 0x10AC0, 0x10AC7,
505
+ 0x10AC9, 0x10AE4,
506
+ 0x10B00, 0x10B35,
507
+ 0x10B40, 0x10B55,
508
+ 0x10B60, 0x10B72,
509
+ 0x10B80, 0x10B91,
510
+ 0x10C00, 0x10C48,
511
+ 0x10C80, 0x10CB2,
512
+ 0x10CC0, 0x10CF2,
513
+ 0x10D00, 0x10D27,
514
+ 0x10E80, 0x10EA9,
515
+ 0x10EAB, 0x10EAC,
516
+ 0x10EB0, 0x10EB1,
517
+ 0x10F00, 0x10F1C,
518
+ 0x10F27, 0x10F27,
519
+ 0x10F30, 0x10F45,
520
+ 0x10F70, 0x10F81,
521
+ 0x10FB0, 0x10FC4,
522
+ 0x10FE0, 0x10FF6,
523
+ 0x11000, 0x11045,
524
+ 0x11071, 0x11075,
525
+ 0x11080, 0x110B8,
526
+ 0x110C2, 0x110C2,
527
+ 0x110D0, 0x110E8,
528
+ 0x11100, 0x11132,
529
+ 0x11144, 0x11147,
530
+ 0x11150, 0x11172,
531
+ 0x11176, 0x11176,
532
+ 0x11180, 0x111BF,
533
+ 0x111C1, 0x111C4,
534
+ 0x111CE, 0x111CF,
535
+ 0x111DA, 0x111DA,
536
+ 0x111DC, 0x111DC,
537
+ 0x11200, 0x11211,
538
+ 0x11213, 0x11234,
539
+ 0x11237, 0x11237,
540
+ 0x1123E, 0x11241,
541
+ 0x11280, 0x11286,
542
+ 0x11288, 0x11288,
543
+ 0x1128A, 0x1128D,
544
+ 0x1128F, 0x1129D,
545
+ 0x1129F, 0x112A8,
546
+ 0x112B0, 0x112E8,
547
+ 0x11300, 0x11303,
548
+ 0x11305, 0x1130C,
549
+ 0x1130F, 0x11310,
550
+ 0x11313, 0x11328,
551
+ 0x1132A, 0x11330,
552
+ 0x11332, 0x11333,
553
+ 0x11335, 0x11339,
554
+ 0x1133D, 0x11344,
555
+ 0x11347, 0x11348,
556
+ 0x1134B, 0x1134C,
557
+ 0x11350, 0x11350,
558
+ 0x11357, 0x11357,
559
+ 0x1135D, 0x11363,
560
+ 0x11400, 0x11441,
561
+ 0x11443, 0x11445,
562
+ 0x11447, 0x1144A,
563
+ 0x1145F, 0x11461,
564
+ 0x11480, 0x114C1,
565
+ 0x114C4, 0x114C5,
566
+ 0x114C7, 0x114C7,
567
+ 0x11580, 0x115B5,
568
+ 0x115B8, 0x115BE,
569
+ 0x115D8, 0x115DD,
570
+ 0x11600, 0x1163E,
571
+ 0x11640, 0x11640,
572
+ 0x11644, 0x11644,
573
+ 0x11680, 0x116B5,
574
+ 0x116B8, 0x116B8,
575
+ 0x11700, 0x1171A,
576
+ 0x1171D, 0x1172A,
577
+ 0x11740, 0x11746,
578
+ 0x11800, 0x11838,
579
+ 0x118A0, 0x118DF,
580
+ 0x118FF, 0x11906,
581
+ 0x11909, 0x11909,
582
+ 0x1190C, 0x11913,
583
+ 0x11915, 0x11916,
584
+ 0x11918, 0x11935,
585
+ 0x11937, 0x11938,
586
+ 0x1193B, 0x1193C,
587
+ 0x1193F, 0x11942,
588
+ 0x119A0, 0x119A7,
589
+ 0x119AA, 0x119D7,
590
+ 0x119DA, 0x119DF,
591
+ 0x119E1, 0x119E1,
592
+ 0x119E3, 0x119E4,
593
+ 0x11A00, 0x11A32,
594
+ 0x11A35, 0x11A3E,
595
+ 0x11A50, 0x11A97,
596
+ 0x11A9D, 0x11A9D,
597
+ 0x11AB0, 0x11AF8,
598
+ 0x11C00, 0x11C08,
599
+ 0x11C0A, 0x11C36,
600
+ 0x11C38, 0x11C3E,
601
+ 0x11C40, 0x11C40,
602
+ 0x11C72, 0x11C8F,
603
+ 0x11C92, 0x11CA7,
604
+ 0x11CA9, 0x11CB6,
605
+ 0x11D00, 0x11D06,
606
+ 0x11D08, 0x11D09,
607
+ 0x11D0B, 0x11D36,
608
+ 0x11D3A, 0x11D3A,
609
+ 0x11D3C, 0x11D3D,
610
+ 0x11D3F, 0x11D41,
611
+ 0x11D43, 0x11D43,
612
+ 0x11D46, 0x11D47,
613
+ 0x11D60, 0x11D65,
614
+ 0x11D67, 0x11D68,
615
+ 0x11D6A, 0x11D8E,
616
+ 0x11D90, 0x11D91,
617
+ 0x11D93, 0x11D96,
618
+ 0x11D98, 0x11D98,
619
+ 0x11EE0, 0x11EF6,
620
+ 0x11F00, 0x11F10,
621
+ 0x11F12, 0x11F3A,
622
+ 0x11F3E, 0x11F40,
623
+ 0x11FB0, 0x11FB0,
624
+ 0x12000, 0x12399,
625
+ 0x12400, 0x1246E,
626
+ 0x12480, 0x12543,
627
+ 0x12F90, 0x12FF0,
628
+ 0x13000, 0x1342F,
629
+ 0x13441, 0x13446,
630
+ 0x14400, 0x14646,
631
+ 0x16800, 0x16A38,
632
+ 0x16A40, 0x16A5E,
633
+ 0x16A70, 0x16ABE,
634
+ 0x16AD0, 0x16AED,
635
+ 0x16B00, 0x16B2F,
636
+ 0x16B40, 0x16B43,
637
+ 0x16B63, 0x16B77,
638
+ 0x16B7D, 0x16B8F,
639
+ 0x16E40, 0x16E7F,
640
+ 0x16F00, 0x16F4A,
641
+ 0x16F4F, 0x16F87,
642
+ 0x16F8F, 0x16F9F,
643
+ 0x16FE0, 0x16FE1,
644
+ 0x16FE3, 0x16FE3,
645
+ 0x16FF0, 0x16FF1,
646
+ 0x17000, 0x187F7,
647
+ 0x18800, 0x18CD5,
648
+ 0x18D00, 0x18D08,
649
+ 0x1AFF0, 0x1AFF3,
650
+ 0x1AFF5, 0x1AFFB,
651
+ 0x1AFFD, 0x1AFFE,
652
+ 0x1B000, 0x1B122,
653
+ 0x1B132, 0x1B132,
654
+ 0x1B150, 0x1B152,
655
+ 0x1B155, 0x1B155,
656
+ 0x1B164, 0x1B167,
657
+ 0x1B170, 0x1B2FB,
658
+ 0x1BC00, 0x1BC6A,
659
+ 0x1BC70, 0x1BC7C,
660
+ 0x1BC80, 0x1BC88,
661
+ 0x1BC90, 0x1BC99,
662
+ 0x1BC9E, 0x1BC9E,
663
+ 0x1D400, 0x1D454,
664
+ 0x1D456, 0x1D49C,
665
+ 0x1D49E, 0x1D49F,
666
+ 0x1D4A2, 0x1D4A2,
667
+ 0x1D4A5, 0x1D4A6,
668
+ 0x1D4A9, 0x1D4AC,
669
+ 0x1D4AE, 0x1D4B9,
670
+ 0x1D4BB, 0x1D4BB,
671
+ 0x1D4BD, 0x1D4C3,
672
+ 0x1D4C5, 0x1D505,
673
+ 0x1D507, 0x1D50A,
674
+ 0x1D50D, 0x1D514,
675
+ 0x1D516, 0x1D51C,
676
+ 0x1D51E, 0x1D539,
677
+ 0x1D53B, 0x1D53E,
678
+ 0x1D540, 0x1D544,
679
+ 0x1D546, 0x1D546,
680
+ 0x1D54A, 0x1D550,
681
+ 0x1D552, 0x1D6A5,
682
+ 0x1D6A8, 0x1D6C0,
683
+ 0x1D6C2, 0x1D6DA,
684
+ 0x1D6DC, 0x1D6FA,
685
+ 0x1D6FC, 0x1D714,
686
+ 0x1D716, 0x1D734,
687
+ 0x1D736, 0x1D74E,
688
+ 0x1D750, 0x1D76E,
689
+ 0x1D770, 0x1D788,
690
+ 0x1D78A, 0x1D7A8,
691
+ 0x1D7AA, 0x1D7C2,
692
+ 0x1D7C4, 0x1D7CB,
693
+ 0x1DF00, 0x1DF1E,
694
+ 0x1DF25, 0x1DF2A,
695
+ 0x1E000, 0x1E006,
696
+ 0x1E008, 0x1E018,
697
+ 0x1E01B, 0x1E021,
698
+ 0x1E023, 0x1E024,
699
+ 0x1E026, 0x1E02A,
700
+ 0x1E030, 0x1E06D,
701
+ 0x1E08F, 0x1E08F,
702
+ 0x1E100, 0x1E12C,
703
+ 0x1E137, 0x1E13D,
704
+ 0x1E14E, 0x1E14E,
705
+ 0x1E290, 0x1E2AD,
706
+ 0x1E2C0, 0x1E2EB,
707
+ 0x1E4D0, 0x1E4EB,
708
+ 0x1E7E0, 0x1E7E6,
709
+ 0x1E7E8, 0x1E7EB,
710
+ 0x1E7ED, 0x1E7EE,
711
+ 0x1E7F0, 0x1E7FE,
712
+ 0x1E800, 0x1E8C4,
713
+ 0x1E900, 0x1E943,
714
+ 0x1E947, 0x1E947,
715
+ 0x1E94B, 0x1E94B,
716
+ 0x1EE00, 0x1EE03,
717
+ 0x1EE05, 0x1EE1F,
718
+ 0x1EE21, 0x1EE22,
719
+ 0x1EE24, 0x1EE24,
720
+ 0x1EE27, 0x1EE27,
721
+ 0x1EE29, 0x1EE32,
722
+ 0x1EE34, 0x1EE37,
723
+ 0x1EE39, 0x1EE39,
724
+ 0x1EE3B, 0x1EE3B,
725
+ 0x1EE42, 0x1EE42,
726
+ 0x1EE47, 0x1EE47,
727
+ 0x1EE49, 0x1EE49,
728
+ 0x1EE4B, 0x1EE4B,
729
+ 0x1EE4D, 0x1EE4F,
730
+ 0x1EE51, 0x1EE52,
731
+ 0x1EE54, 0x1EE54,
732
+ 0x1EE57, 0x1EE57,
733
+ 0x1EE59, 0x1EE59,
734
+ 0x1EE5B, 0x1EE5B,
735
+ 0x1EE5D, 0x1EE5D,
736
+ 0x1EE5F, 0x1EE5F,
737
+ 0x1EE61, 0x1EE62,
738
+ 0x1EE64, 0x1EE64,
739
+ 0x1EE67, 0x1EE6A,
740
+ 0x1EE6C, 0x1EE72,
741
+ 0x1EE74, 0x1EE77,
742
+ 0x1EE79, 0x1EE7C,
743
+ 0x1EE7E, 0x1EE7E,
744
+ 0x1EE80, 0x1EE89,
745
+ 0x1EE8B, 0x1EE9B,
746
+ 0x1EEA1, 0x1EEA3,
747
+ 0x1EEA5, 0x1EEA9,
748
+ 0x1EEAB, 0x1EEBB,
749
+ 0x1F130, 0x1F149,
750
+ 0x1F150, 0x1F169,
751
+ 0x1F170, 0x1F189,
752
+ 0x20000, 0x2A6DF,
753
+ 0x2A700, 0x2B739,
754
+ 0x2B740, 0x2B81D,
755
+ 0x2B820, 0x2CEA1,
756
+ 0x2CEB0, 0x2EBE0,
757
+ 0x2F800, 0x2FA1D,
758
+ 0x30000, 0x3134A,
759
+ 0x31350, 0x323AF,
760
+ };
761
+
762
+ #define UNICODE_ALNUM_CODEPOINTS_LENGTH 1528
763
+ static const pm_unicode_codepoint_t unicode_alnum_codepoints[UNICODE_ALNUM_CODEPOINTS_LENGTH] = {
764
+ 0x100, 0x2C1,
765
+ 0x2C6, 0x2D1,
766
+ 0x2E0, 0x2E4,
767
+ 0x2EC, 0x2EC,
768
+ 0x2EE, 0x2EE,
769
+ 0x345, 0x345,
770
+ 0x370, 0x374,
771
+ 0x376, 0x377,
772
+ 0x37A, 0x37D,
773
+ 0x37F, 0x37F,
774
+ 0x386, 0x386,
775
+ 0x388, 0x38A,
776
+ 0x38C, 0x38C,
777
+ 0x38E, 0x3A1,
778
+ 0x3A3, 0x3F5,
779
+ 0x3F7, 0x481,
780
+ 0x48A, 0x52F,
781
+ 0x531, 0x556,
782
+ 0x559, 0x559,
783
+ 0x560, 0x588,
784
+ 0x5B0, 0x5BD,
785
+ 0x5BF, 0x5BF,
786
+ 0x5C1, 0x5C2,
787
+ 0x5C4, 0x5C5,
788
+ 0x5C7, 0x5C7,
789
+ 0x5D0, 0x5EA,
790
+ 0x5EF, 0x5F2,
791
+ 0x610, 0x61A,
792
+ 0x620, 0x657,
793
+ 0x659, 0x669,
794
+ 0x66E, 0x6D3,
795
+ 0x6D5, 0x6DC,
796
+ 0x6E1, 0x6E8,
797
+ 0x6ED, 0x6FC,
798
+ 0x6FF, 0x6FF,
799
+ 0x710, 0x73F,
800
+ 0x74D, 0x7B1,
801
+ 0x7C0, 0x7EA,
802
+ 0x7F4, 0x7F5,
803
+ 0x7FA, 0x7FA,
804
+ 0x800, 0x817,
805
+ 0x81A, 0x82C,
806
+ 0x840, 0x858,
807
+ 0x860, 0x86A,
808
+ 0x870, 0x887,
809
+ 0x889, 0x88E,
810
+ 0x8A0, 0x8C9,
811
+ 0x8D4, 0x8DF,
812
+ 0x8E3, 0x8E9,
813
+ 0x8F0, 0x93B,
814
+ 0x93D, 0x94C,
815
+ 0x94E, 0x950,
816
+ 0x955, 0x963,
817
+ 0x966, 0x96F,
818
+ 0x971, 0x983,
819
+ 0x985, 0x98C,
820
+ 0x98F, 0x990,
821
+ 0x993, 0x9A8,
822
+ 0x9AA, 0x9B0,
823
+ 0x9B2, 0x9B2,
824
+ 0x9B6, 0x9B9,
825
+ 0x9BD, 0x9C4,
826
+ 0x9C7, 0x9C8,
827
+ 0x9CB, 0x9CC,
828
+ 0x9CE, 0x9CE,
829
+ 0x9D7, 0x9D7,
830
+ 0x9DC, 0x9DD,
831
+ 0x9DF, 0x9E3,
832
+ 0x9E6, 0x9F1,
833
+ 0x9FC, 0x9FC,
834
+ 0xA01, 0xA03,
835
+ 0xA05, 0xA0A,
836
+ 0xA0F, 0xA10,
837
+ 0xA13, 0xA28,
838
+ 0xA2A, 0xA30,
839
+ 0xA32, 0xA33,
840
+ 0xA35, 0xA36,
841
+ 0xA38, 0xA39,
842
+ 0xA3E, 0xA42,
843
+ 0xA47, 0xA48,
844
+ 0xA4B, 0xA4C,
845
+ 0xA51, 0xA51,
846
+ 0xA59, 0xA5C,
847
+ 0xA5E, 0xA5E,
848
+ 0xA66, 0xA75,
849
+ 0xA81, 0xA83,
850
+ 0xA85, 0xA8D,
851
+ 0xA8F, 0xA91,
852
+ 0xA93, 0xAA8,
853
+ 0xAAA, 0xAB0,
854
+ 0xAB2, 0xAB3,
855
+ 0xAB5, 0xAB9,
856
+ 0xABD, 0xAC5,
857
+ 0xAC7, 0xAC9,
858
+ 0xACB, 0xACC,
859
+ 0xAD0, 0xAD0,
860
+ 0xAE0, 0xAE3,
861
+ 0xAE6, 0xAEF,
862
+ 0xAF9, 0xAFC,
863
+ 0xB01, 0xB03,
864
+ 0xB05, 0xB0C,
865
+ 0xB0F, 0xB10,
866
+ 0xB13, 0xB28,
867
+ 0xB2A, 0xB30,
868
+ 0xB32, 0xB33,
869
+ 0xB35, 0xB39,
870
+ 0xB3D, 0xB44,
871
+ 0xB47, 0xB48,
872
+ 0xB4B, 0xB4C,
873
+ 0xB56, 0xB57,
874
+ 0xB5C, 0xB5D,
875
+ 0xB5F, 0xB63,
876
+ 0xB66, 0xB6F,
877
+ 0xB71, 0xB71,
878
+ 0xB82, 0xB83,
879
+ 0xB85, 0xB8A,
880
+ 0xB8E, 0xB90,
881
+ 0xB92, 0xB95,
882
+ 0xB99, 0xB9A,
883
+ 0xB9C, 0xB9C,
884
+ 0xB9E, 0xB9F,
885
+ 0xBA3, 0xBA4,
886
+ 0xBA8, 0xBAA,
887
+ 0xBAE, 0xBB9,
888
+ 0xBBE, 0xBC2,
889
+ 0xBC6, 0xBC8,
890
+ 0xBCA, 0xBCC,
891
+ 0xBD0, 0xBD0,
892
+ 0xBD7, 0xBD7,
893
+ 0xBE6, 0xBEF,
894
+ 0xC00, 0xC0C,
895
+ 0xC0E, 0xC10,
896
+ 0xC12, 0xC28,
897
+ 0xC2A, 0xC39,
898
+ 0xC3D, 0xC44,
899
+ 0xC46, 0xC48,
900
+ 0xC4A, 0xC4C,
901
+ 0xC55, 0xC56,
902
+ 0xC58, 0xC5A,
903
+ 0xC5D, 0xC5D,
904
+ 0xC60, 0xC63,
905
+ 0xC66, 0xC6F,
906
+ 0xC80, 0xC83,
907
+ 0xC85, 0xC8C,
908
+ 0xC8E, 0xC90,
909
+ 0xC92, 0xCA8,
910
+ 0xCAA, 0xCB3,
911
+ 0xCB5, 0xCB9,
912
+ 0xCBD, 0xCC4,
913
+ 0xCC6, 0xCC8,
914
+ 0xCCA, 0xCCC,
915
+ 0xCD5, 0xCD6,
916
+ 0xCDD, 0xCDE,
917
+ 0xCE0, 0xCE3,
918
+ 0xCE6, 0xCEF,
919
+ 0xCF1, 0xCF3,
920
+ 0xD00, 0xD0C,
921
+ 0xD0E, 0xD10,
922
+ 0xD12, 0xD3A,
923
+ 0xD3D, 0xD44,
924
+ 0xD46, 0xD48,
925
+ 0xD4A, 0xD4C,
926
+ 0xD4E, 0xD4E,
927
+ 0xD54, 0xD57,
928
+ 0xD5F, 0xD63,
929
+ 0xD66, 0xD6F,
930
+ 0xD7A, 0xD7F,
931
+ 0xD81, 0xD83,
932
+ 0xD85, 0xD96,
933
+ 0xD9A, 0xDB1,
934
+ 0xDB3, 0xDBB,
935
+ 0xDBD, 0xDBD,
936
+ 0xDC0, 0xDC6,
937
+ 0xDCF, 0xDD4,
938
+ 0xDD6, 0xDD6,
939
+ 0xDD8, 0xDDF,
940
+ 0xDE6, 0xDEF,
941
+ 0xDF2, 0xDF3,
942
+ 0xE01, 0xE3A,
943
+ 0xE40, 0xE46,
944
+ 0xE4D, 0xE4D,
945
+ 0xE50, 0xE59,
946
+ 0xE81, 0xE82,
947
+ 0xE84, 0xE84,
948
+ 0xE86, 0xE8A,
949
+ 0xE8C, 0xEA3,
950
+ 0xEA5, 0xEA5,
951
+ 0xEA7, 0xEB9,
952
+ 0xEBB, 0xEBD,
953
+ 0xEC0, 0xEC4,
954
+ 0xEC6, 0xEC6,
955
+ 0xECD, 0xECD,
956
+ 0xED0, 0xED9,
957
+ 0xEDC, 0xEDF,
958
+ 0xF00, 0xF00,
959
+ 0xF20, 0xF29,
960
+ 0xF40, 0xF47,
961
+ 0xF49, 0xF6C,
962
+ 0xF71, 0xF83,
963
+ 0xF88, 0xF97,
964
+ 0xF99, 0xFBC,
965
+ 0x1000, 0x1036,
966
+ 0x1038, 0x1038,
967
+ 0x103B, 0x1049,
968
+ 0x1050, 0x109D,
969
+ 0x10A0, 0x10C5,
970
+ 0x10C7, 0x10C7,
971
+ 0x10CD, 0x10CD,
972
+ 0x10D0, 0x10FA,
973
+ 0x10FC, 0x1248,
974
+ 0x124A, 0x124D,
975
+ 0x1250, 0x1256,
976
+ 0x1258, 0x1258,
977
+ 0x125A, 0x125D,
978
+ 0x1260, 0x1288,
979
+ 0x128A, 0x128D,
980
+ 0x1290, 0x12B0,
981
+ 0x12B2, 0x12B5,
982
+ 0x12B8, 0x12BE,
983
+ 0x12C0, 0x12C0,
984
+ 0x12C2, 0x12C5,
985
+ 0x12C8, 0x12D6,
986
+ 0x12D8, 0x1310,
987
+ 0x1312, 0x1315,
988
+ 0x1318, 0x135A,
989
+ 0x1380, 0x138F,
990
+ 0x13A0, 0x13F5,
991
+ 0x13F8, 0x13FD,
992
+ 0x1401, 0x166C,
993
+ 0x166F, 0x167F,
994
+ 0x1681, 0x169A,
995
+ 0x16A0, 0x16EA,
996
+ 0x16EE, 0x16F8,
997
+ 0x1700, 0x1713,
998
+ 0x171F, 0x1733,
999
+ 0x1740, 0x1753,
1000
+ 0x1760, 0x176C,
1001
+ 0x176E, 0x1770,
1002
+ 0x1772, 0x1773,
1003
+ 0x1780, 0x17B3,
1004
+ 0x17B6, 0x17C8,
1005
+ 0x17D7, 0x17D7,
1006
+ 0x17DC, 0x17DC,
1007
+ 0x17E0, 0x17E9,
1008
+ 0x1810, 0x1819,
1009
+ 0x1820, 0x1878,
1010
+ 0x1880, 0x18AA,
1011
+ 0x18B0, 0x18F5,
1012
+ 0x1900, 0x191E,
1013
+ 0x1920, 0x192B,
1014
+ 0x1930, 0x1938,
1015
+ 0x1946, 0x196D,
1016
+ 0x1970, 0x1974,
1017
+ 0x1980, 0x19AB,
1018
+ 0x19B0, 0x19C9,
1019
+ 0x19D0, 0x19D9,
1020
+ 0x1A00, 0x1A1B,
1021
+ 0x1A20, 0x1A5E,
1022
+ 0x1A61, 0x1A74,
1023
+ 0x1A80, 0x1A89,
1024
+ 0x1A90, 0x1A99,
1025
+ 0x1AA7, 0x1AA7,
1026
+ 0x1ABF, 0x1AC0,
1027
+ 0x1ACC, 0x1ACE,
1028
+ 0x1B00, 0x1B33,
1029
+ 0x1B35, 0x1B43,
1030
+ 0x1B45, 0x1B4C,
1031
+ 0x1B50, 0x1B59,
1032
+ 0x1B80, 0x1BA9,
1033
+ 0x1BAC, 0x1BE5,
1034
+ 0x1BE7, 0x1BF1,
1035
+ 0x1C00, 0x1C36,
1036
+ 0x1C40, 0x1C49,
1037
+ 0x1C4D, 0x1C7D,
1038
+ 0x1C80, 0x1C88,
1039
+ 0x1C90, 0x1CBA,
1040
+ 0x1CBD, 0x1CBF,
1041
+ 0x1CE9, 0x1CEC,
1042
+ 0x1CEE, 0x1CF3,
1043
+ 0x1CF5, 0x1CF6,
1044
+ 0x1CFA, 0x1CFA,
1045
+ 0x1D00, 0x1DBF,
1046
+ 0x1DE7, 0x1DF4,
1047
+ 0x1E00, 0x1F15,
1048
+ 0x1F18, 0x1F1D,
1049
+ 0x1F20, 0x1F45,
1050
+ 0x1F48, 0x1F4D,
1051
+ 0x1F50, 0x1F57,
1052
+ 0x1F59, 0x1F59,
1053
+ 0x1F5B, 0x1F5B,
1054
+ 0x1F5D, 0x1F5D,
1055
+ 0x1F5F, 0x1F7D,
1056
+ 0x1F80, 0x1FB4,
1057
+ 0x1FB6, 0x1FBC,
1058
+ 0x1FBE, 0x1FBE,
1059
+ 0x1FC2, 0x1FC4,
1060
+ 0x1FC6, 0x1FCC,
1061
+ 0x1FD0, 0x1FD3,
1062
+ 0x1FD6, 0x1FDB,
1063
+ 0x1FE0, 0x1FEC,
1064
+ 0x1FF2, 0x1FF4,
1065
+ 0x1FF6, 0x1FFC,
1066
+ 0x2071, 0x2071,
1067
+ 0x207F, 0x207F,
1068
+ 0x2090, 0x209C,
1069
+ 0x2102, 0x2102,
1070
+ 0x2107, 0x2107,
1071
+ 0x210A, 0x2113,
1072
+ 0x2115, 0x2115,
1073
+ 0x2119, 0x211D,
1074
+ 0x2124, 0x2124,
1075
+ 0x2126, 0x2126,
1076
+ 0x2128, 0x2128,
1077
+ 0x212A, 0x212D,
1078
+ 0x212F, 0x2139,
1079
+ 0x213C, 0x213F,
1080
+ 0x2145, 0x2149,
1081
+ 0x214E, 0x214E,
1082
+ 0x2160, 0x2188,
1083
+ 0x24B6, 0x24E9,
1084
+ 0x2C00, 0x2CE4,
1085
+ 0x2CEB, 0x2CEE,
1086
+ 0x2CF2, 0x2CF3,
1087
+ 0x2D00, 0x2D25,
1088
+ 0x2D27, 0x2D27,
1089
+ 0x2D2D, 0x2D2D,
1090
+ 0x2D30, 0x2D67,
1091
+ 0x2D6F, 0x2D6F,
1092
+ 0x2D80, 0x2D96,
1093
+ 0x2DA0, 0x2DA6,
1094
+ 0x2DA8, 0x2DAE,
1095
+ 0x2DB0, 0x2DB6,
1096
+ 0x2DB8, 0x2DBE,
1097
+ 0x2DC0, 0x2DC6,
1098
+ 0x2DC8, 0x2DCE,
1099
+ 0x2DD0, 0x2DD6,
1100
+ 0x2DD8, 0x2DDE,
1101
+ 0x2DE0, 0x2DFF,
1102
+ 0x2E2F, 0x2E2F,
1103
+ 0x3005, 0x3007,
1104
+ 0x3021, 0x3029,
1105
+ 0x3031, 0x3035,
1106
+ 0x3038, 0x303C,
1107
+ 0x3041, 0x3096,
1108
+ 0x309D, 0x309F,
1109
+ 0x30A1, 0x30FA,
1110
+ 0x30FC, 0x30FF,
1111
+ 0x3105, 0x312F,
1112
+ 0x3131, 0x318E,
1113
+ 0x31A0, 0x31BF,
1114
+ 0x31F0, 0x31FF,
1115
+ 0x3400, 0x4DBF,
1116
+ 0x4E00, 0xA48C,
1117
+ 0xA4D0, 0xA4FD,
1118
+ 0xA500, 0xA60C,
1119
+ 0xA610, 0xA62B,
1120
+ 0xA640, 0xA66E,
1121
+ 0xA674, 0xA67B,
1122
+ 0xA67F, 0xA6EF,
1123
+ 0xA717, 0xA71F,
1124
+ 0xA722, 0xA788,
1125
+ 0xA78B, 0xA7CA,
1126
+ 0xA7D0, 0xA7D1,
1127
+ 0xA7D3, 0xA7D3,
1128
+ 0xA7D5, 0xA7D9,
1129
+ 0xA7F2, 0xA805,
1130
+ 0xA807, 0xA827,
1131
+ 0xA840, 0xA873,
1132
+ 0xA880, 0xA8C3,
1133
+ 0xA8C5, 0xA8C5,
1134
+ 0xA8D0, 0xA8D9,
1135
+ 0xA8F2, 0xA8F7,
1136
+ 0xA8FB, 0xA8FB,
1137
+ 0xA8FD, 0xA92A,
1138
+ 0xA930, 0xA952,
1139
+ 0xA960, 0xA97C,
1140
+ 0xA980, 0xA9B2,
1141
+ 0xA9B4, 0xA9BF,
1142
+ 0xA9CF, 0xA9D9,
1143
+ 0xA9E0, 0xA9FE,
1144
+ 0xAA00, 0xAA36,
1145
+ 0xAA40, 0xAA4D,
1146
+ 0xAA50, 0xAA59,
1147
+ 0xAA60, 0xAA76,
1148
+ 0xAA7A, 0xAABE,
1149
+ 0xAAC0, 0xAAC0,
1150
+ 0xAAC2, 0xAAC2,
1151
+ 0xAADB, 0xAADD,
1152
+ 0xAAE0, 0xAAEF,
1153
+ 0xAAF2, 0xAAF5,
1154
+ 0xAB01, 0xAB06,
1155
+ 0xAB09, 0xAB0E,
1156
+ 0xAB11, 0xAB16,
1157
+ 0xAB20, 0xAB26,
1158
+ 0xAB28, 0xAB2E,
1159
+ 0xAB30, 0xAB5A,
1160
+ 0xAB5C, 0xAB69,
1161
+ 0xAB70, 0xABEA,
1162
+ 0xABF0, 0xABF9,
1163
+ 0xAC00, 0xD7A3,
1164
+ 0xD7B0, 0xD7C6,
1165
+ 0xD7CB, 0xD7FB,
1166
+ 0xF900, 0xFA6D,
1167
+ 0xFA70, 0xFAD9,
1168
+ 0xFB00, 0xFB06,
1169
+ 0xFB13, 0xFB17,
1170
+ 0xFB1D, 0xFB28,
1171
+ 0xFB2A, 0xFB36,
1172
+ 0xFB38, 0xFB3C,
1173
+ 0xFB3E, 0xFB3E,
1174
+ 0xFB40, 0xFB41,
1175
+ 0xFB43, 0xFB44,
1176
+ 0xFB46, 0xFBB1,
1177
+ 0xFBD3, 0xFD3D,
1178
+ 0xFD50, 0xFD8F,
1179
+ 0xFD92, 0xFDC7,
1180
+ 0xFDF0, 0xFDFB,
1181
+ 0xFE70, 0xFE74,
1182
+ 0xFE76, 0xFEFC,
1183
+ 0xFF10, 0xFF19,
1184
+ 0xFF21, 0xFF3A,
1185
+ 0xFF41, 0xFF5A,
1186
+ 0xFF66, 0xFFBE,
1187
+ 0xFFC2, 0xFFC7,
1188
+ 0xFFCA, 0xFFCF,
1189
+ 0xFFD2, 0xFFD7,
1190
+ 0xFFDA, 0xFFDC,
1191
+ 0x10000, 0x1000B,
1192
+ 0x1000D, 0x10026,
1193
+ 0x10028, 0x1003A,
1194
+ 0x1003C, 0x1003D,
1195
+ 0x1003F, 0x1004D,
1196
+ 0x10050, 0x1005D,
1197
+ 0x10080, 0x100FA,
1198
+ 0x10140, 0x10174,
1199
+ 0x10280, 0x1029C,
1200
+ 0x102A0, 0x102D0,
1201
+ 0x10300, 0x1031F,
1202
+ 0x1032D, 0x1034A,
1203
+ 0x10350, 0x1037A,
1204
+ 0x10380, 0x1039D,
1205
+ 0x103A0, 0x103C3,
1206
+ 0x103C8, 0x103CF,
1207
+ 0x103D1, 0x103D5,
1208
+ 0x10400, 0x1049D,
1209
+ 0x104A0, 0x104A9,
1210
+ 0x104B0, 0x104D3,
1211
+ 0x104D8, 0x104FB,
1212
+ 0x10500, 0x10527,
1213
+ 0x10530, 0x10563,
1214
+ 0x10570, 0x1057A,
1215
+ 0x1057C, 0x1058A,
1216
+ 0x1058C, 0x10592,
1217
+ 0x10594, 0x10595,
1218
+ 0x10597, 0x105A1,
1219
+ 0x105A3, 0x105B1,
1220
+ 0x105B3, 0x105B9,
1221
+ 0x105BB, 0x105BC,
1222
+ 0x10600, 0x10736,
1223
+ 0x10740, 0x10755,
1224
+ 0x10760, 0x10767,
1225
+ 0x10780, 0x10785,
1226
+ 0x10787, 0x107B0,
1227
+ 0x107B2, 0x107BA,
1228
+ 0x10800, 0x10805,
1229
+ 0x10808, 0x10808,
1230
+ 0x1080A, 0x10835,
1231
+ 0x10837, 0x10838,
1232
+ 0x1083C, 0x1083C,
1233
+ 0x1083F, 0x10855,
1234
+ 0x10860, 0x10876,
1235
+ 0x10880, 0x1089E,
1236
+ 0x108E0, 0x108F2,
1237
+ 0x108F4, 0x108F5,
1238
+ 0x10900, 0x10915,
1239
+ 0x10920, 0x10939,
1240
+ 0x10980, 0x109B7,
1241
+ 0x109BE, 0x109BF,
1242
+ 0x10A00, 0x10A03,
1243
+ 0x10A05, 0x10A06,
1244
+ 0x10A0C, 0x10A13,
1245
+ 0x10A15, 0x10A17,
1246
+ 0x10A19, 0x10A35,
1247
+ 0x10A60, 0x10A7C,
1248
+ 0x10A80, 0x10A9C,
1249
+ 0x10AC0, 0x10AC7,
1250
+ 0x10AC9, 0x10AE4,
1251
+ 0x10B00, 0x10B35,
1252
+ 0x10B40, 0x10B55,
1253
+ 0x10B60, 0x10B72,
1254
+ 0x10B80, 0x10B91,
1255
+ 0x10C00, 0x10C48,
1256
+ 0x10C80, 0x10CB2,
1257
+ 0x10CC0, 0x10CF2,
1258
+ 0x10D00, 0x10D27,
1259
+ 0x10D30, 0x10D39,
1260
+ 0x10E80, 0x10EA9,
1261
+ 0x10EAB, 0x10EAC,
1262
+ 0x10EB0, 0x10EB1,
1263
+ 0x10F00, 0x10F1C,
1264
+ 0x10F27, 0x10F27,
1265
+ 0x10F30, 0x10F45,
1266
+ 0x10F70, 0x10F81,
1267
+ 0x10FB0, 0x10FC4,
1268
+ 0x10FE0, 0x10FF6,
1269
+ 0x11000, 0x11045,
1270
+ 0x11066, 0x1106F,
1271
+ 0x11071, 0x11075,
1272
+ 0x11080, 0x110B8,
1273
+ 0x110C2, 0x110C2,
1274
+ 0x110D0, 0x110E8,
1275
+ 0x110F0, 0x110F9,
1276
+ 0x11100, 0x11132,
1277
+ 0x11136, 0x1113F,
1278
+ 0x11144, 0x11147,
1279
+ 0x11150, 0x11172,
1280
+ 0x11176, 0x11176,
1281
+ 0x11180, 0x111BF,
1282
+ 0x111C1, 0x111C4,
1283
+ 0x111CE, 0x111DA,
1284
+ 0x111DC, 0x111DC,
1285
+ 0x11200, 0x11211,
1286
+ 0x11213, 0x11234,
1287
+ 0x11237, 0x11237,
1288
+ 0x1123E, 0x11241,
1289
+ 0x11280, 0x11286,
1290
+ 0x11288, 0x11288,
1291
+ 0x1128A, 0x1128D,
1292
+ 0x1128F, 0x1129D,
1293
+ 0x1129F, 0x112A8,
1294
+ 0x112B0, 0x112E8,
1295
+ 0x112F0, 0x112F9,
1296
+ 0x11300, 0x11303,
1297
+ 0x11305, 0x1130C,
1298
+ 0x1130F, 0x11310,
1299
+ 0x11313, 0x11328,
1300
+ 0x1132A, 0x11330,
1301
+ 0x11332, 0x11333,
1302
+ 0x11335, 0x11339,
1303
+ 0x1133D, 0x11344,
1304
+ 0x11347, 0x11348,
1305
+ 0x1134B, 0x1134C,
1306
+ 0x11350, 0x11350,
1307
+ 0x11357, 0x11357,
1308
+ 0x1135D, 0x11363,
1309
+ 0x11400, 0x11441,
1310
+ 0x11443, 0x11445,
1311
+ 0x11447, 0x1144A,
1312
+ 0x11450, 0x11459,
1313
+ 0x1145F, 0x11461,
1314
+ 0x11480, 0x114C1,
1315
+ 0x114C4, 0x114C5,
1316
+ 0x114C7, 0x114C7,
1317
+ 0x114D0, 0x114D9,
1318
+ 0x11580, 0x115B5,
1319
+ 0x115B8, 0x115BE,
1320
+ 0x115D8, 0x115DD,
1321
+ 0x11600, 0x1163E,
1322
+ 0x11640, 0x11640,
1323
+ 0x11644, 0x11644,
1324
+ 0x11650, 0x11659,
1325
+ 0x11680, 0x116B5,
1326
+ 0x116B8, 0x116B8,
1327
+ 0x116C0, 0x116C9,
1328
+ 0x11700, 0x1171A,
1329
+ 0x1171D, 0x1172A,
1330
+ 0x11730, 0x11739,
1331
+ 0x11740, 0x11746,
1332
+ 0x11800, 0x11838,
1333
+ 0x118A0, 0x118E9,
1334
+ 0x118FF, 0x11906,
1335
+ 0x11909, 0x11909,
1336
+ 0x1190C, 0x11913,
1337
+ 0x11915, 0x11916,
1338
+ 0x11918, 0x11935,
1339
+ 0x11937, 0x11938,
1340
+ 0x1193B, 0x1193C,
1341
+ 0x1193F, 0x11942,
1342
+ 0x11950, 0x11959,
1343
+ 0x119A0, 0x119A7,
1344
+ 0x119AA, 0x119D7,
1345
+ 0x119DA, 0x119DF,
1346
+ 0x119E1, 0x119E1,
1347
+ 0x119E3, 0x119E4,
1348
+ 0x11A00, 0x11A32,
1349
+ 0x11A35, 0x11A3E,
1350
+ 0x11A50, 0x11A97,
1351
+ 0x11A9D, 0x11A9D,
1352
+ 0x11AB0, 0x11AF8,
1353
+ 0x11C00, 0x11C08,
1354
+ 0x11C0A, 0x11C36,
1355
+ 0x11C38, 0x11C3E,
1356
+ 0x11C40, 0x11C40,
1357
+ 0x11C50, 0x11C59,
1358
+ 0x11C72, 0x11C8F,
1359
+ 0x11C92, 0x11CA7,
1360
+ 0x11CA9, 0x11CB6,
1361
+ 0x11D00, 0x11D06,
1362
+ 0x11D08, 0x11D09,
1363
+ 0x11D0B, 0x11D36,
1364
+ 0x11D3A, 0x11D3A,
1365
+ 0x11D3C, 0x11D3D,
1366
+ 0x11D3F, 0x11D41,
1367
+ 0x11D43, 0x11D43,
1368
+ 0x11D46, 0x11D47,
1369
+ 0x11D50, 0x11D59,
1370
+ 0x11D60, 0x11D65,
1371
+ 0x11D67, 0x11D68,
1372
+ 0x11D6A, 0x11D8E,
1373
+ 0x11D90, 0x11D91,
1374
+ 0x11D93, 0x11D96,
1375
+ 0x11D98, 0x11D98,
1376
+ 0x11DA0, 0x11DA9,
1377
+ 0x11EE0, 0x11EF6,
1378
+ 0x11F00, 0x11F10,
1379
+ 0x11F12, 0x11F3A,
1380
+ 0x11F3E, 0x11F40,
1381
+ 0x11F50, 0x11F59,
1382
+ 0x11FB0, 0x11FB0,
1383
+ 0x12000, 0x12399,
1384
+ 0x12400, 0x1246E,
1385
+ 0x12480, 0x12543,
1386
+ 0x12F90, 0x12FF0,
1387
+ 0x13000, 0x1342F,
1388
+ 0x13441, 0x13446,
1389
+ 0x14400, 0x14646,
1390
+ 0x16800, 0x16A38,
1391
+ 0x16A40, 0x16A5E,
1392
+ 0x16A60, 0x16A69,
1393
+ 0x16A70, 0x16ABE,
1394
+ 0x16AC0, 0x16AC9,
1395
+ 0x16AD0, 0x16AED,
1396
+ 0x16B00, 0x16B2F,
1397
+ 0x16B40, 0x16B43,
1398
+ 0x16B50, 0x16B59,
1399
+ 0x16B63, 0x16B77,
1400
+ 0x16B7D, 0x16B8F,
1401
+ 0x16E40, 0x16E7F,
1402
+ 0x16F00, 0x16F4A,
1403
+ 0x16F4F, 0x16F87,
1404
+ 0x16F8F, 0x16F9F,
1405
+ 0x16FE0, 0x16FE1,
1406
+ 0x16FE3, 0x16FE3,
1407
+ 0x16FF0, 0x16FF1,
1408
+ 0x17000, 0x187F7,
1409
+ 0x18800, 0x18CD5,
1410
+ 0x18D00, 0x18D08,
1411
+ 0x1AFF0, 0x1AFF3,
1412
+ 0x1AFF5, 0x1AFFB,
1413
+ 0x1AFFD, 0x1AFFE,
1414
+ 0x1B000, 0x1B122,
1415
+ 0x1B132, 0x1B132,
1416
+ 0x1B150, 0x1B152,
1417
+ 0x1B155, 0x1B155,
1418
+ 0x1B164, 0x1B167,
1419
+ 0x1B170, 0x1B2FB,
1420
+ 0x1BC00, 0x1BC6A,
1421
+ 0x1BC70, 0x1BC7C,
1422
+ 0x1BC80, 0x1BC88,
1423
+ 0x1BC90, 0x1BC99,
1424
+ 0x1BC9E, 0x1BC9E,
1425
+ 0x1D400, 0x1D454,
1426
+ 0x1D456, 0x1D49C,
1427
+ 0x1D49E, 0x1D49F,
1428
+ 0x1D4A2, 0x1D4A2,
1429
+ 0x1D4A5, 0x1D4A6,
1430
+ 0x1D4A9, 0x1D4AC,
1431
+ 0x1D4AE, 0x1D4B9,
1432
+ 0x1D4BB, 0x1D4BB,
1433
+ 0x1D4BD, 0x1D4C3,
1434
+ 0x1D4C5, 0x1D505,
1435
+ 0x1D507, 0x1D50A,
1436
+ 0x1D50D, 0x1D514,
1437
+ 0x1D516, 0x1D51C,
1438
+ 0x1D51E, 0x1D539,
1439
+ 0x1D53B, 0x1D53E,
1440
+ 0x1D540, 0x1D544,
1441
+ 0x1D546, 0x1D546,
1442
+ 0x1D54A, 0x1D550,
1443
+ 0x1D552, 0x1D6A5,
1444
+ 0x1D6A8, 0x1D6C0,
1445
+ 0x1D6C2, 0x1D6DA,
1446
+ 0x1D6DC, 0x1D6FA,
1447
+ 0x1D6FC, 0x1D714,
1448
+ 0x1D716, 0x1D734,
1449
+ 0x1D736, 0x1D74E,
1450
+ 0x1D750, 0x1D76E,
1451
+ 0x1D770, 0x1D788,
1452
+ 0x1D78A, 0x1D7A8,
1453
+ 0x1D7AA, 0x1D7C2,
1454
+ 0x1D7C4, 0x1D7CB,
1455
+ 0x1D7CE, 0x1D7FF,
1456
+ 0x1DF00, 0x1DF1E,
1457
+ 0x1DF25, 0x1DF2A,
1458
+ 0x1E000, 0x1E006,
1459
+ 0x1E008, 0x1E018,
1460
+ 0x1E01B, 0x1E021,
1461
+ 0x1E023, 0x1E024,
1462
+ 0x1E026, 0x1E02A,
1463
+ 0x1E030, 0x1E06D,
1464
+ 0x1E08F, 0x1E08F,
1465
+ 0x1E100, 0x1E12C,
1466
+ 0x1E137, 0x1E13D,
1467
+ 0x1E140, 0x1E149,
1468
+ 0x1E14E, 0x1E14E,
1469
+ 0x1E290, 0x1E2AD,
1470
+ 0x1E2C0, 0x1E2EB,
1471
+ 0x1E2F0, 0x1E2F9,
1472
+ 0x1E4D0, 0x1E4EB,
1473
+ 0x1E4F0, 0x1E4F9,
1474
+ 0x1E7E0, 0x1E7E6,
1475
+ 0x1E7E8, 0x1E7EB,
1476
+ 0x1E7ED, 0x1E7EE,
1477
+ 0x1E7F0, 0x1E7FE,
1478
+ 0x1E800, 0x1E8C4,
1479
+ 0x1E900, 0x1E943,
1480
+ 0x1E947, 0x1E947,
1481
+ 0x1E94B, 0x1E94B,
1482
+ 0x1E950, 0x1E959,
1483
+ 0x1EE00, 0x1EE03,
1484
+ 0x1EE05, 0x1EE1F,
1485
+ 0x1EE21, 0x1EE22,
1486
+ 0x1EE24, 0x1EE24,
1487
+ 0x1EE27, 0x1EE27,
1488
+ 0x1EE29, 0x1EE32,
1489
+ 0x1EE34, 0x1EE37,
1490
+ 0x1EE39, 0x1EE39,
1491
+ 0x1EE3B, 0x1EE3B,
1492
+ 0x1EE42, 0x1EE42,
1493
+ 0x1EE47, 0x1EE47,
1494
+ 0x1EE49, 0x1EE49,
1495
+ 0x1EE4B, 0x1EE4B,
1496
+ 0x1EE4D, 0x1EE4F,
1497
+ 0x1EE51, 0x1EE52,
1498
+ 0x1EE54, 0x1EE54,
1499
+ 0x1EE57, 0x1EE57,
1500
+ 0x1EE59, 0x1EE59,
1501
+ 0x1EE5B, 0x1EE5B,
1502
+ 0x1EE5D, 0x1EE5D,
1503
+ 0x1EE5F, 0x1EE5F,
1504
+ 0x1EE61, 0x1EE62,
1505
+ 0x1EE64, 0x1EE64,
1506
+ 0x1EE67, 0x1EE6A,
1507
+ 0x1EE6C, 0x1EE72,
1508
+ 0x1EE74, 0x1EE77,
1509
+ 0x1EE79, 0x1EE7C,
1510
+ 0x1EE7E, 0x1EE7E,
1511
+ 0x1EE80, 0x1EE89,
1512
+ 0x1EE8B, 0x1EE9B,
1513
+ 0x1EEA1, 0x1EEA3,
1514
+ 0x1EEA5, 0x1EEA9,
1515
+ 0x1EEAB, 0x1EEBB,
1516
+ 0x1F130, 0x1F149,
1517
+ 0x1F150, 0x1F169,
1518
+ 0x1F170, 0x1F189,
1519
+ 0x1FBF0, 0x1FBF9,
1520
+ 0x20000, 0x2A6DF,
1521
+ 0x2A700, 0x2B739,
1522
+ 0x2B740, 0x2B81D,
1523
+ 0x2B820, 0x2CEA1,
1524
+ 0x2CEB0, 0x2EBE0,
1525
+ 0x2F800, 0x2FA1D,
1526
+ 0x30000, 0x3134A,
1527
+ 0x31350, 0x323AF,
1528
+ };
1529
+
1530
+ #define UNICODE_ISUPPER_CODEPOINTS_LENGTH 1296
1531
+ static const pm_unicode_codepoint_t unicode_isupper_codepoints[UNICODE_ISUPPER_CODEPOINTS_LENGTH] = {
1532
+ 0x100, 0x100,
1533
+ 0x102, 0x102,
1534
+ 0x104, 0x104,
1535
+ 0x106, 0x106,
1536
+ 0x108, 0x108,
1537
+ 0x10A, 0x10A,
1538
+ 0x10C, 0x10C,
1539
+ 0x10E, 0x10E,
1540
+ 0x110, 0x110,
1541
+ 0x112, 0x112,
1542
+ 0x114, 0x114,
1543
+ 0x116, 0x116,
1544
+ 0x118, 0x118,
1545
+ 0x11A, 0x11A,
1546
+ 0x11C, 0x11C,
1547
+ 0x11E, 0x11E,
1548
+ 0x120, 0x120,
1549
+ 0x122, 0x122,
1550
+ 0x124, 0x124,
1551
+ 0x126, 0x126,
1552
+ 0x128, 0x128,
1553
+ 0x12A, 0x12A,
1554
+ 0x12C, 0x12C,
1555
+ 0x12E, 0x12E,
1556
+ 0x130, 0x130,
1557
+ 0x132, 0x132,
1558
+ 0x134, 0x134,
1559
+ 0x136, 0x136,
1560
+ 0x139, 0x139,
1561
+ 0x13B, 0x13B,
1562
+ 0x13D, 0x13D,
1563
+ 0x13F, 0x13F,
1564
+ 0x141, 0x141,
1565
+ 0x143, 0x143,
1566
+ 0x145, 0x145,
1567
+ 0x147, 0x147,
1568
+ 0x14A, 0x14A,
1569
+ 0x14C, 0x14C,
1570
+ 0x14E, 0x14E,
1571
+ 0x150, 0x150,
1572
+ 0x152, 0x152,
1573
+ 0x154, 0x154,
1574
+ 0x156, 0x156,
1575
+ 0x158, 0x158,
1576
+ 0x15A, 0x15A,
1577
+ 0x15C, 0x15C,
1578
+ 0x15E, 0x15E,
1579
+ 0x160, 0x160,
1580
+ 0x162, 0x162,
1581
+ 0x164, 0x164,
1582
+ 0x166, 0x166,
1583
+ 0x168, 0x168,
1584
+ 0x16A, 0x16A,
1585
+ 0x16C, 0x16C,
1586
+ 0x16E, 0x16E,
1587
+ 0x170, 0x170,
1588
+ 0x172, 0x172,
1589
+ 0x174, 0x174,
1590
+ 0x176, 0x176,
1591
+ 0x178, 0x179,
1592
+ 0x17B, 0x17B,
1593
+ 0x17D, 0x17D,
1594
+ 0x181, 0x182,
1595
+ 0x184, 0x184,
1596
+ 0x186, 0x187,
1597
+ 0x189, 0x18B,
1598
+ 0x18E, 0x191,
1599
+ 0x193, 0x194,
1600
+ 0x196, 0x198,
1601
+ 0x19C, 0x19D,
1602
+ 0x19F, 0x1A0,
1603
+ 0x1A2, 0x1A2,
1604
+ 0x1A4, 0x1A4,
1605
+ 0x1A6, 0x1A7,
1606
+ 0x1A9, 0x1A9,
1607
+ 0x1AC, 0x1AC,
1608
+ 0x1AE, 0x1AF,
1609
+ 0x1B1, 0x1B3,
1610
+ 0x1B5, 0x1B5,
1611
+ 0x1B7, 0x1B8,
1612
+ 0x1BC, 0x1BC,
1613
+ 0x1C4, 0x1C4,
1614
+ 0x1C7, 0x1C7,
1615
+ 0x1CA, 0x1CA,
1616
+ 0x1CD, 0x1CD,
1617
+ 0x1CF, 0x1CF,
1618
+ 0x1D1, 0x1D1,
1619
+ 0x1D3, 0x1D3,
1620
+ 0x1D5, 0x1D5,
1621
+ 0x1D7, 0x1D7,
1622
+ 0x1D9, 0x1D9,
1623
+ 0x1DB, 0x1DB,
1624
+ 0x1DE, 0x1DE,
1625
+ 0x1E0, 0x1E0,
1626
+ 0x1E2, 0x1E2,
1627
+ 0x1E4, 0x1E4,
1628
+ 0x1E6, 0x1E6,
1629
+ 0x1E8, 0x1E8,
1630
+ 0x1EA, 0x1EA,
1631
+ 0x1EC, 0x1EC,
1632
+ 0x1EE, 0x1EE,
1633
+ 0x1F1, 0x1F1,
1634
+ 0x1F4, 0x1F4,
1635
+ 0x1F6, 0x1F8,
1636
+ 0x1FA, 0x1FA,
1637
+ 0x1FC, 0x1FC,
1638
+ 0x1FE, 0x1FE,
1639
+ 0x200, 0x200,
1640
+ 0x202, 0x202,
1641
+ 0x204, 0x204,
1642
+ 0x206, 0x206,
1643
+ 0x208, 0x208,
1644
+ 0x20A, 0x20A,
1645
+ 0x20C, 0x20C,
1646
+ 0x20E, 0x20E,
1647
+ 0x210, 0x210,
1648
+ 0x212, 0x212,
1649
+ 0x214, 0x214,
1650
+ 0x216, 0x216,
1651
+ 0x218, 0x218,
1652
+ 0x21A, 0x21A,
1653
+ 0x21C, 0x21C,
1654
+ 0x21E, 0x21E,
1655
+ 0x220, 0x220,
1656
+ 0x222, 0x222,
1657
+ 0x224, 0x224,
1658
+ 0x226, 0x226,
1659
+ 0x228, 0x228,
1660
+ 0x22A, 0x22A,
1661
+ 0x22C, 0x22C,
1662
+ 0x22E, 0x22E,
1663
+ 0x230, 0x230,
1664
+ 0x232, 0x232,
1665
+ 0x23A, 0x23B,
1666
+ 0x23D, 0x23E,
1667
+ 0x241, 0x241,
1668
+ 0x243, 0x246,
1669
+ 0x248, 0x248,
1670
+ 0x24A, 0x24A,
1671
+ 0x24C, 0x24C,
1672
+ 0x24E, 0x24E,
1673
+ 0x370, 0x370,
1674
+ 0x372, 0x372,
1675
+ 0x376, 0x376,
1676
+ 0x37F, 0x37F,
1677
+ 0x386, 0x386,
1678
+ 0x388, 0x38A,
1679
+ 0x38C, 0x38C,
1680
+ 0x38E, 0x38F,
1681
+ 0x391, 0x3A1,
1682
+ 0x3A3, 0x3AB,
1683
+ 0x3CF, 0x3CF,
1684
+ 0x3D2, 0x3D4,
1685
+ 0x3D8, 0x3D8,
1686
+ 0x3DA, 0x3DA,
1687
+ 0x3DC, 0x3DC,
1688
+ 0x3DE, 0x3DE,
1689
+ 0x3E0, 0x3E0,
1690
+ 0x3E2, 0x3E2,
1691
+ 0x3E4, 0x3E4,
1692
+ 0x3E6, 0x3E6,
1693
+ 0x3E8, 0x3E8,
1694
+ 0x3EA, 0x3EA,
1695
+ 0x3EC, 0x3EC,
1696
+ 0x3EE, 0x3EE,
1697
+ 0x3F4, 0x3F4,
1698
+ 0x3F7, 0x3F7,
1699
+ 0x3F9, 0x3FA,
1700
+ 0x3FD, 0x42F,
1701
+ 0x460, 0x460,
1702
+ 0x462, 0x462,
1703
+ 0x464, 0x464,
1704
+ 0x466, 0x466,
1705
+ 0x468, 0x468,
1706
+ 0x46A, 0x46A,
1707
+ 0x46C, 0x46C,
1708
+ 0x46E, 0x46E,
1709
+ 0x470, 0x470,
1710
+ 0x472, 0x472,
1711
+ 0x474, 0x474,
1712
+ 0x476, 0x476,
1713
+ 0x478, 0x478,
1714
+ 0x47A, 0x47A,
1715
+ 0x47C, 0x47C,
1716
+ 0x47E, 0x47E,
1717
+ 0x480, 0x480,
1718
+ 0x48A, 0x48A,
1719
+ 0x48C, 0x48C,
1720
+ 0x48E, 0x48E,
1721
+ 0x490, 0x490,
1722
+ 0x492, 0x492,
1723
+ 0x494, 0x494,
1724
+ 0x496, 0x496,
1725
+ 0x498, 0x498,
1726
+ 0x49A, 0x49A,
1727
+ 0x49C, 0x49C,
1728
+ 0x49E, 0x49E,
1729
+ 0x4A0, 0x4A0,
1730
+ 0x4A2, 0x4A2,
1731
+ 0x4A4, 0x4A4,
1732
+ 0x4A6, 0x4A6,
1733
+ 0x4A8, 0x4A8,
1734
+ 0x4AA, 0x4AA,
1735
+ 0x4AC, 0x4AC,
1736
+ 0x4AE, 0x4AE,
1737
+ 0x4B0, 0x4B0,
1738
+ 0x4B2, 0x4B2,
1739
+ 0x4B4, 0x4B4,
1740
+ 0x4B6, 0x4B6,
1741
+ 0x4B8, 0x4B8,
1742
+ 0x4BA, 0x4BA,
1743
+ 0x4BC, 0x4BC,
1744
+ 0x4BE, 0x4BE,
1745
+ 0x4C0, 0x4C1,
1746
+ 0x4C3, 0x4C3,
1747
+ 0x4C5, 0x4C5,
1748
+ 0x4C7, 0x4C7,
1749
+ 0x4C9, 0x4C9,
1750
+ 0x4CB, 0x4CB,
1751
+ 0x4CD, 0x4CD,
1752
+ 0x4D0, 0x4D0,
1753
+ 0x4D2, 0x4D2,
1754
+ 0x4D4, 0x4D4,
1755
+ 0x4D6, 0x4D6,
1756
+ 0x4D8, 0x4D8,
1757
+ 0x4DA, 0x4DA,
1758
+ 0x4DC, 0x4DC,
1759
+ 0x4DE, 0x4DE,
1760
+ 0x4E0, 0x4E0,
1761
+ 0x4E2, 0x4E2,
1762
+ 0x4E4, 0x4E4,
1763
+ 0x4E6, 0x4E6,
1764
+ 0x4E8, 0x4E8,
1765
+ 0x4EA, 0x4EA,
1766
+ 0x4EC, 0x4EC,
1767
+ 0x4EE, 0x4EE,
1768
+ 0x4F0, 0x4F0,
1769
+ 0x4F2, 0x4F2,
1770
+ 0x4F4, 0x4F4,
1771
+ 0x4F6, 0x4F6,
1772
+ 0x4F8, 0x4F8,
1773
+ 0x4FA, 0x4FA,
1774
+ 0x4FC, 0x4FC,
1775
+ 0x4FE, 0x4FE,
1776
+ 0x500, 0x500,
1777
+ 0x502, 0x502,
1778
+ 0x504, 0x504,
1779
+ 0x506, 0x506,
1780
+ 0x508, 0x508,
1781
+ 0x50A, 0x50A,
1782
+ 0x50C, 0x50C,
1783
+ 0x50E, 0x50E,
1784
+ 0x510, 0x510,
1785
+ 0x512, 0x512,
1786
+ 0x514, 0x514,
1787
+ 0x516, 0x516,
1788
+ 0x518, 0x518,
1789
+ 0x51A, 0x51A,
1790
+ 0x51C, 0x51C,
1791
+ 0x51E, 0x51E,
1792
+ 0x520, 0x520,
1793
+ 0x522, 0x522,
1794
+ 0x524, 0x524,
1795
+ 0x526, 0x526,
1796
+ 0x528, 0x528,
1797
+ 0x52A, 0x52A,
1798
+ 0x52C, 0x52C,
1799
+ 0x52E, 0x52E,
1800
+ 0x531, 0x556,
1801
+ 0x10A0, 0x10C5,
1802
+ 0x10C7, 0x10C7,
1803
+ 0x10CD, 0x10CD,
1804
+ 0x13A0, 0x13F5,
1805
+ 0x1C90, 0x1CBA,
1806
+ 0x1CBD, 0x1CBF,
1807
+ 0x1E00, 0x1E00,
1808
+ 0x1E02, 0x1E02,
1809
+ 0x1E04, 0x1E04,
1810
+ 0x1E06, 0x1E06,
1811
+ 0x1E08, 0x1E08,
1812
+ 0x1E0A, 0x1E0A,
1813
+ 0x1E0C, 0x1E0C,
1814
+ 0x1E0E, 0x1E0E,
1815
+ 0x1E10, 0x1E10,
1816
+ 0x1E12, 0x1E12,
1817
+ 0x1E14, 0x1E14,
1818
+ 0x1E16, 0x1E16,
1819
+ 0x1E18, 0x1E18,
1820
+ 0x1E1A, 0x1E1A,
1821
+ 0x1E1C, 0x1E1C,
1822
+ 0x1E1E, 0x1E1E,
1823
+ 0x1E20, 0x1E20,
1824
+ 0x1E22, 0x1E22,
1825
+ 0x1E24, 0x1E24,
1826
+ 0x1E26, 0x1E26,
1827
+ 0x1E28, 0x1E28,
1828
+ 0x1E2A, 0x1E2A,
1829
+ 0x1E2C, 0x1E2C,
1830
+ 0x1E2E, 0x1E2E,
1831
+ 0x1E30, 0x1E30,
1832
+ 0x1E32, 0x1E32,
1833
+ 0x1E34, 0x1E34,
1834
+ 0x1E36, 0x1E36,
1835
+ 0x1E38, 0x1E38,
1836
+ 0x1E3A, 0x1E3A,
1837
+ 0x1E3C, 0x1E3C,
1838
+ 0x1E3E, 0x1E3E,
1839
+ 0x1E40, 0x1E40,
1840
+ 0x1E42, 0x1E42,
1841
+ 0x1E44, 0x1E44,
1842
+ 0x1E46, 0x1E46,
1843
+ 0x1E48, 0x1E48,
1844
+ 0x1E4A, 0x1E4A,
1845
+ 0x1E4C, 0x1E4C,
1846
+ 0x1E4E, 0x1E4E,
1847
+ 0x1E50, 0x1E50,
1848
+ 0x1E52, 0x1E52,
1849
+ 0x1E54, 0x1E54,
1850
+ 0x1E56, 0x1E56,
1851
+ 0x1E58, 0x1E58,
1852
+ 0x1E5A, 0x1E5A,
1853
+ 0x1E5C, 0x1E5C,
1854
+ 0x1E5E, 0x1E5E,
1855
+ 0x1E60, 0x1E60,
1856
+ 0x1E62, 0x1E62,
1857
+ 0x1E64, 0x1E64,
1858
+ 0x1E66, 0x1E66,
1859
+ 0x1E68, 0x1E68,
1860
+ 0x1E6A, 0x1E6A,
1861
+ 0x1E6C, 0x1E6C,
1862
+ 0x1E6E, 0x1E6E,
1863
+ 0x1E70, 0x1E70,
1864
+ 0x1E72, 0x1E72,
1865
+ 0x1E74, 0x1E74,
1866
+ 0x1E76, 0x1E76,
1867
+ 0x1E78, 0x1E78,
1868
+ 0x1E7A, 0x1E7A,
1869
+ 0x1E7C, 0x1E7C,
1870
+ 0x1E7E, 0x1E7E,
1871
+ 0x1E80, 0x1E80,
1872
+ 0x1E82, 0x1E82,
1873
+ 0x1E84, 0x1E84,
1874
+ 0x1E86, 0x1E86,
1875
+ 0x1E88, 0x1E88,
1876
+ 0x1E8A, 0x1E8A,
1877
+ 0x1E8C, 0x1E8C,
1878
+ 0x1E8E, 0x1E8E,
1879
+ 0x1E90, 0x1E90,
1880
+ 0x1E92, 0x1E92,
1881
+ 0x1E94, 0x1E94,
1882
+ 0x1E9E, 0x1E9E,
1883
+ 0x1EA0, 0x1EA0,
1884
+ 0x1EA2, 0x1EA2,
1885
+ 0x1EA4, 0x1EA4,
1886
+ 0x1EA6, 0x1EA6,
1887
+ 0x1EA8, 0x1EA8,
1888
+ 0x1EAA, 0x1EAA,
1889
+ 0x1EAC, 0x1EAC,
1890
+ 0x1EAE, 0x1EAE,
1891
+ 0x1EB0, 0x1EB0,
1892
+ 0x1EB2, 0x1EB2,
1893
+ 0x1EB4, 0x1EB4,
1894
+ 0x1EB6, 0x1EB6,
1895
+ 0x1EB8, 0x1EB8,
1896
+ 0x1EBA, 0x1EBA,
1897
+ 0x1EBC, 0x1EBC,
1898
+ 0x1EBE, 0x1EBE,
1899
+ 0x1EC0, 0x1EC0,
1900
+ 0x1EC2, 0x1EC2,
1901
+ 0x1EC4, 0x1EC4,
1902
+ 0x1EC6, 0x1EC6,
1903
+ 0x1EC8, 0x1EC8,
1904
+ 0x1ECA, 0x1ECA,
1905
+ 0x1ECC, 0x1ECC,
1906
+ 0x1ECE, 0x1ECE,
1907
+ 0x1ED0, 0x1ED0,
1908
+ 0x1ED2, 0x1ED2,
1909
+ 0x1ED4, 0x1ED4,
1910
+ 0x1ED6, 0x1ED6,
1911
+ 0x1ED8, 0x1ED8,
1912
+ 0x1EDA, 0x1EDA,
1913
+ 0x1EDC, 0x1EDC,
1914
+ 0x1EDE, 0x1EDE,
1915
+ 0x1EE0, 0x1EE0,
1916
+ 0x1EE2, 0x1EE2,
1917
+ 0x1EE4, 0x1EE4,
1918
+ 0x1EE6, 0x1EE6,
1919
+ 0x1EE8, 0x1EE8,
1920
+ 0x1EEA, 0x1EEA,
1921
+ 0x1EEC, 0x1EEC,
1922
+ 0x1EEE, 0x1EEE,
1923
+ 0x1EF0, 0x1EF0,
1924
+ 0x1EF2, 0x1EF2,
1925
+ 0x1EF4, 0x1EF4,
1926
+ 0x1EF6, 0x1EF6,
1927
+ 0x1EF8, 0x1EF8,
1928
+ 0x1EFA, 0x1EFA,
1929
+ 0x1EFC, 0x1EFC,
1930
+ 0x1EFE, 0x1EFE,
1931
+ 0x1F08, 0x1F0F,
1932
+ 0x1F18, 0x1F1D,
1933
+ 0x1F28, 0x1F2F,
1934
+ 0x1F38, 0x1F3F,
1935
+ 0x1F48, 0x1F4D,
1936
+ 0x1F59, 0x1F59,
1937
+ 0x1F5B, 0x1F5B,
1938
+ 0x1F5D, 0x1F5D,
1939
+ 0x1F5F, 0x1F5F,
1940
+ 0x1F68, 0x1F6F,
1941
+ 0x1FB8, 0x1FBB,
1942
+ 0x1FC8, 0x1FCB,
1943
+ 0x1FD8, 0x1FDB,
1944
+ 0x1FE8, 0x1FEC,
1945
+ 0x1FF8, 0x1FFB,
1946
+ 0x2102, 0x2102,
1947
+ 0x2107, 0x2107,
1948
+ 0x210B, 0x210D,
1949
+ 0x2110, 0x2112,
1950
+ 0x2115, 0x2115,
1951
+ 0x2119, 0x211D,
1952
+ 0x2124, 0x2124,
1953
+ 0x2126, 0x2126,
1954
+ 0x2128, 0x2128,
1955
+ 0x212A, 0x212D,
1956
+ 0x2130, 0x2133,
1957
+ 0x213E, 0x213F,
1958
+ 0x2145, 0x2145,
1959
+ 0x2160, 0x216F,
1960
+ 0x2183, 0x2183,
1961
+ 0x24B6, 0x24CF,
1962
+ 0x2C00, 0x2C2F,
1963
+ 0x2C60, 0x2C60,
1964
+ 0x2C62, 0x2C64,
1965
+ 0x2C67, 0x2C67,
1966
+ 0x2C69, 0x2C69,
1967
+ 0x2C6B, 0x2C6B,
1968
+ 0x2C6D, 0x2C70,
1969
+ 0x2C72, 0x2C72,
1970
+ 0x2C75, 0x2C75,
1971
+ 0x2C7E, 0x2C80,
1972
+ 0x2C82, 0x2C82,
1973
+ 0x2C84, 0x2C84,
1974
+ 0x2C86, 0x2C86,
1975
+ 0x2C88, 0x2C88,
1976
+ 0x2C8A, 0x2C8A,
1977
+ 0x2C8C, 0x2C8C,
1978
+ 0x2C8E, 0x2C8E,
1979
+ 0x2C90, 0x2C90,
1980
+ 0x2C92, 0x2C92,
1981
+ 0x2C94, 0x2C94,
1982
+ 0x2C96, 0x2C96,
1983
+ 0x2C98, 0x2C98,
1984
+ 0x2C9A, 0x2C9A,
1985
+ 0x2C9C, 0x2C9C,
1986
+ 0x2C9E, 0x2C9E,
1987
+ 0x2CA0, 0x2CA0,
1988
+ 0x2CA2, 0x2CA2,
1989
+ 0x2CA4, 0x2CA4,
1990
+ 0x2CA6, 0x2CA6,
1991
+ 0x2CA8, 0x2CA8,
1992
+ 0x2CAA, 0x2CAA,
1993
+ 0x2CAC, 0x2CAC,
1994
+ 0x2CAE, 0x2CAE,
1995
+ 0x2CB0, 0x2CB0,
1996
+ 0x2CB2, 0x2CB2,
1997
+ 0x2CB4, 0x2CB4,
1998
+ 0x2CB6, 0x2CB6,
1999
+ 0x2CB8, 0x2CB8,
2000
+ 0x2CBA, 0x2CBA,
2001
+ 0x2CBC, 0x2CBC,
2002
+ 0x2CBE, 0x2CBE,
2003
+ 0x2CC0, 0x2CC0,
2004
+ 0x2CC2, 0x2CC2,
2005
+ 0x2CC4, 0x2CC4,
2006
+ 0x2CC6, 0x2CC6,
2007
+ 0x2CC8, 0x2CC8,
2008
+ 0x2CCA, 0x2CCA,
2009
+ 0x2CCC, 0x2CCC,
2010
+ 0x2CCE, 0x2CCE,
2011
+ 0x2CD0, 0x2CD0,
2012
+ 0x2CD2, 0x2CD2,
2013
+ 0x2CD4, 0x2CD4,
2014
+ 0x2CD6, 0x2CD6,
2015
+ 0x2CD8, 0x2CD8,
2016
+ 0x2CDA, 0x2CDA,
2017
+ 0x2CDC, 0x2CDC,
2018
+ 0x2CDE, 0x2CDE,
2019
+ 0x2CE0, 0x2CE0,
2020
+ 0x2CE2, 0x2CE2,
2021
+ 0x2CEB, 0x2CEB,
2022
+ 0x2CED, 0x2CED,
2023
+ 0x2CF2, 0x2CF2,
2024
+ 0xA640, 0xA640,
2025
+ 0xA642, 0xA642,
2026
+ 0xA644, 0xA644,
2027
+ 0xA646, 0xA646,
2028
+ 0xA648, 0xA648,
2029
+ 0xA64A, 0xA64A,
2030
+ 0xA64C, 0xA64C,
2031
+ 0xA64E, 0xA64E,
2032
+ 0xA650, 0xA650,
2033
+ 0xA652, 0xA652,
2034
+ 0xA654, 0xA654,
2035
+ 0xA656, 0xA656,
2036
+ 0xA658, 0xA658,
2037
+ 0xA65A, 0xA65A,
2038
+ 0xA65C, 0xA65C,
2039
+ 0xA65E, 0xA65E,
2040
+ 0xA660, 0xA660,
2041
+ 0xA662, 0xA662,
2042
+ 0xA664, 0xA664,
2043
+ 0xA666, 0xA666,
2044
+ 0xA668, 0xA668,
2045
+ 0xA66A, 0xA66A,
2046
+ 0xA66C, 0xA66C,
2047
+ 0xA680, 0xA680,
2048
+ 0xA682, 0xA682,
2049
+ 0xA684, 0xA684,
2050
+ 0xA686, 0xA686,
2051
+ 0xA688, 0xA688,
2052
+ 0xA68A, 0xA68A,
2053
+ 0xA68C, 0xA68C,
2054
+ 0xA68E, 0xA68E,
2055
+ 0xA690, 0xA690,
2056
+ 0xA692, 0xA692,
2057
+ 0xA694, 0xA694,
2058
+ 0xA696, 0xA696,
2059
+ 0xA698, 0xA698,
2060
+ 0xA69A, 0xA69A,
2061
+ 0xA722, 0xA722,
2062
+ 0xA724, 0xA724,
2063
+ 0xA726, 0xA726,
2064
+ 0xA728, 0xA728,
2065
+ 0xA72A, 0xA72A,
2066
+ 0xA72C, 0xA72C,
2067
+ 0xA72E, 0xA72E,
2068
+ 0xA732, 0xA732,
2069
+ 0xA734, 0xA734,
2070
+ 0xA736, 0xA736,
2071
+ 0xA738, 0xA738,
2072
+ 0xA73A, 0xA73A,
2073
+ 0xA73C, 0xA73C,
2074
+ 0xA73E, 0xA73E,
2075
+ 0xA740, 0xA740,
2076
+ 0xA742, 0xA742,
2077
+ 0xA744, 0xA744,
2078
+ 0xA746, 0xA746,
2079
+ 0xA748, 0xA748,
2080
+ 0xA74A, 0xA74A,
2081
+ 0xA74C, 0xA74C,
2082
+ 0xA74E, 0xA74E,
2083
+ 0xA750, 0xA750,
2084
+ 0xA752, 0xA752,
2085
+ 0xA754, 0xA754,
2086
+ 0xA756, 0xA756,
2087
+ 0xA758, 0xA758,
2088
+ 0xA75A, 0xA75A,
2089
+ 0xA75C, 0xA75C,
2090
+ 0xA75E, 0xA75E,
2091
+ 0xA760, 0xA760,
2092
+ 0xA762, 0xA762,
2093
+ 0xA764, 0xA764,
2094
+ 0xA766, 0xA766,
2095
+ 0xA768, 0xA768,
2096
+ 0xA76A, 0xA76A,
2097
+ 0xA76C, 0xA76C,
2098
+ 0xA76E, 0xA76E,
2099
+ 0xA779, 0xA779,
2100
+ 0xA77B, 0xA77B,
2101
+ 0xA77D, 0xA77E,
2102
+ 0xA780, 0xA780,
2103
+ 0xA782, 0xA782,
2104
+ 0xA784, 0xA784,
2105
+ 0xA786, 0xA786,
2106
+ 0xA78B, 0xA78B,
2107
+ 0xA78D, 0xA78D,
2108
+ 0xA790, 0xA790,
2109
+ 0xA792, 0xA792,
2110
+ 0xA796, 0xA796,
2111
+ 0xA798, 0xA798,
2112
+ 0xA79A, 0xA79A,
2113
+ 0xA79C, 0xA79C,
2114
+ 0xA79E, 0xA79E,
2115
+ 0xA7A0, 0xA7A0,
2116
+ 0xA7A2, 0xA7A2,
2117
+ 0xA7A4, 0xA7A4,
2118
+ 0xA7A6, 0xA7A6,
2119
+ 0xA7A8, 0xA7A8,
2120
+ 0xA7AA, 0xA7AE,
2121
+ 0xA7B0, 0xA7B4,
2122
+ 0xA7B6, 0xA7B6,
2123
+ 0xA7B8, 0xA7B8,
2124
+ 0xA7BA, 0xA7BA,
2125
+ 0xA7BC, 0xA7BC,
2126
+ 0xA7BE, 0xA7BE,
2127
+ 0xA7C0, 0xA7C0,
2128
+ 0xA7C2, 0xA7C2,
2129
+ 0xA7C4, 0xA7C7,
2130
+ 0xA7C9, 0xA7C9,
2131
+ 0xA7D0, 0xA7D0,
2132
+ 0xA7D6, 0xA7D6,
2133
+ 0xA7D8, 0xA7D8,
2134
+ 0xA7F5, 0xA7F5,
2135
+ 0xFF21, 0xFF3A,
2136
+ 0x10400, 0x10427,
2137
+ 0x104B0, 0x104D3,
2138
+ 0x10570, 0x1057A,
2139
+ 0x1057C, 0x1058A,
2140
+ 0x1058C, 0x10592,
2141
+ 0x10594, 0x10595,
2142
+ 0x10C80, 0x10CB2,
2143
+ 0x118A0, 0x118BF,
2144
+ 0x16E40, 0x16E5F,
2145
+ 0x1D400, 0x1D419,
2146
+ 0x1D434, 0x1D44D,
2147
+ 0x1D468, 0x1D481,
2148
+ 0x1D49C, 0x1D49C,
2149
+ 0x1D49E, 0x1D49F,
2150
+ 0x1D4A2, 0x1D4A2,
2151
+ 0x1D4A5, 0x1D4A6,
2152
+ 0x1D4A9, 0x1D4AC,
2153
+ 0x1D4AE, 0x1D4B5,
2154
+ 0x1D4D0, 0x1D4E9,
2155
+ 0x1D504, 0x1D505,
2156
+ 0x1D507, 0x1D50A,
2157
+ 0x1D50D, 0x1D514,
2158
+ 0x1D516, 0x1D51C,
2159
+ 0x1D538, 0x1D539,
2160
+ 0x1D53B, 0x1D53E,
2161
+ 0x1D540, 0x1D544,
2162
+ 0x1D546, 0x1D546,
2163
+ 0x1D54A, 0x1D550,
2164
+ 0x1D56C, 0x1D585,
2165
+ 0x1D5A0, 0x1D5B9,
2166
+ 0x1D5D4, 0x1D5ED,
2167
+ 0x1D608, 0x1D621,
2168
+ 0x1D63C, 0x1D655,
2169
+ 0x1D670, 0x1D689,
2170
+ 0x1D6A8, 0x1D6C0,
2171
+ 0x1D6E2, 0x1D6FA,
2172
+ 0x1D71C, 0x1D734,
2173
+ 0x1D756, 0x1D76E,
2174
+ 0x1D790, 0x1D7A8,
2175
+ 0x1D7CA, 0x1D7CA,
2176
+ 0x1E900, 0x1E921,
2177
+ 0x1F130, 0x1F149,
2178
+ 0x1F150, 0x1F169,
2179
+ 0x1F170, 0x1F189,
2180
+ };
2181
+
2182
+ static bool
2183
+ pm_unicode_codepoint_match(pm_unicode_codepoint_t codepoint, const pm_unicode_codepoint_t *codepoints, size_t size) {
2184
+ size_t start = 0;
2185
+ size_t end = size;
2186
+
2187
+ while (start < end) {
2188
+ size_t middle = start + (end - start) / 2;
2189
+ if ((middle % 2) != 0) middle--;
2190
+
2191
+ if (codepoint >= codepoints[middle] && codepoint <= codepoints[middle + 1]) {
2192
+ return true;
2193
+ }
2194
+
2195
+ if (codepoint < codepoints[middle]) {
2196
+ end = middle;
2197
+ } else {
2198
+ start = middle + 2;
2199
+ }
2200
+ }
2201
+
2202
+ return false;
2203
+ }
2204
+
2205
+ static const uint8_t pm_utf_8_dfa[] = {
2206
+ 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0, // 00..1f
2207
+ 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0, // 20..3f
2208
+ 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0, // 40..5f
2209
+ 0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0, // 60..7f
2210
+ 1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,9,9,9,9,9,9,9,9,9,9,9,9,9,9,9,9, // 80..9f
2211
+ 7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7,7, // a0..bf
2212
+ 8,8,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2,2, // c0..df
2213
+ 0xa,0x3,0x3,0x3,0x3,0x3,0x3,0x3,0x3,0x3,0x3,0x3,0x3,0x4,0x3,0x3, // e0..ef
2214
+ 0xb,0x6,0x6,0x6,0x5,0x8,0x8,0x8,0x8,0x8,0x8,0x8,0x8,0x8,0x8,0x8, // f0..ff
2215
+ 0x0,0x1,0x2,0x3,0x5,0x8,0x7,0x1,0x1,0x1,0x4,0x6,0x1,0x1,0x1,0x1, // s0..s0
2216
+ 1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,1,0,1,1,1,1,1,0,1,0,1,1,1,1,1,1, // s1..s2
2217
+ 1,2,1,1,1,1,1,2,1,2,1,1,1,1,1,1,1,1,1,1,1,1,1,2,1,1,1,1,1,1,1,1, // s3..s4
2218
+ 1,2,1,1,1,1,1,1,1,2,1,1,1,1,1,1,1,1,1,1,1,1,1,3,1,3,1,1,1,1,1,1, // s5..s6
2219
+ 1,3,1,1,1,1,1,3,1,3,1,1,1,1,1,1,1,3,1,1,1,1,1,1,1,1,1,1,1,1,1,1, // s7..s8
2220
+ };
2221
+
2222
+ static pm_unicode_codepoint_t
2223
+ pm_utf_8_codepoint(const uint8_t *b, ptrdiff_t n, size_t *width) {
2224
+ assert(n >= 1);
2225
+ size_t maximum = (size_t) n;
2226
+
2227
+ uint32_t codepoint;
2228
+ uint32_t state = 0;
2229
+
2230
+ for (size_t index = 0; index < 4 && index < maximum; index++) {
2231
+ uint32_t byte = b[index];
2232
+ uint32_t type = pm_utf_8_dfa[byte];
2233
+
2234
+ codepoint = (state != 0) ?
2235
+ (byte & 0x3fu) | (codepoint << 6) :
2236
+ (0xffu >> type) & (byte);
2237
+
2238
+ state = pm_utf_8_dfa[256 + (state * 16) + type];
2239
+ if (!state) {
2240
+ *width = index + 1;
2241
+ return (pm_unicode_codepoint_t) codepoint;
2242
+ }
2243
+ }
2244
+
2245
+ *width = 0;
2246
+ return 0;
2247
+ }
2248
+
2249
+ static size_t
2250
+ pm_encoding_utf_8_char_width(const uint8_t *b, ptrdiff_t n) {
2251
+ size_t width;
2252
+ pm_utf_8_codepoint(b, n, &width);
2253
+ return width;
2254
+ }
2255
+
2256
+ size_t
2257
+ pm_encoding_utf_8_alpha_char(const uint8_t *b, ptrdiff_t n) {
2258
+ if (*b < 0x80) {
2259
+ return (pm_encoding_unicode_table[*b] & PRISM_ENCODING_ALPHABETIC_BIT) ? 1 : 0;
2260
+ }
2261
+
2262
+ size_t width;
2263
+ pm_unicode_codepoint_t codepoint = pm_utf_8_codepoint(b, n, &width);
2264
+
2265
+ if (codepoint <= 0xFF) {
2266
+ return (pm_encoding_unicode_table[(uint8_t) codepoint] & PRISM_ENCODING_ALPHABETIC_BIT) ? width : 0;
2267
+ } else {
2268
+ return pm_unicode_codepoint_match(codepoint, unicode_alpha_codepoints, UNICODE_ALPHA_CODEPOINTS_LENGTH) ? width : 0;
2269
+ }
2270
+ }
2271
+
2272
+ size_t
2273
+ pm_encoding_utf_8_alnum_char(const uint8_t *b, ptrdiff_t n) {
2274
+ if (*b < 0x80) {
2275
+ return (pm_encoding_unicode_table[*b] & (PRISM_ENCODING_ALPHANUMERIC_BIT)) ? 1 : 0;
2276
+ }
2277
+
2278
+ size_t width;
2279
+ pm_unicode_codepoint_t codepoint = pm_utf_8_codepoint(b, n, &width);
2280
+
2281
+ if (codepoint <= 0xFF) {
2282
+ return (pm_encoding_unicode_table[(uint8_t) codepoint] & (PRISM_ENCODING_ALPHANUMERIC_BIT)) ? width : 0;
2283
+ } else {
2284
+ return pm_unicode_codepoint_match(codepoint, unicode_alnum_codepoints, UNICODE_ALNUM_CODEPOINTS_LENGTH) ? width : 0;
2285
+ }
2286
+ }
2287
+
2288
+ static bool
2289
+ pm_encoding_utf_8_isupper_char(const uint8_t *b, ptrdiff_t n) {
2290
+ if (*b < 0x80) {
2291
+ return (pm_encoding_unicode_table[*b] & PRISM_ENCODING_UPPERCASE_BIT) ? true : false;
2292
+ }
2293
+
2294
+ size_t width;
2295
+ pm_unicode_codepoint_t codepoint = pm_utf_8_codepoint(b, n, &width);
2296
+
2297
+ if (codepoint <= 0xFF) {
2298
+ return (pm_encoding_unicode_table[(uint8_t) codepoint] & PRISM_ENCODING_UPPERCASE_BIT) ? true : false;
2299
+ } else {
2300
+ return pm_unicode_codepoint_match(codepoint, unicode_isupper_codepoints, UNICODE_ISUPPER_CODEPOINTS_LENGTH) ? true : false;
2301
+ }
2302
+ }
2303
+
2304
+ #undef UNICODE_ALPHA_CODEPOINTS_LENGTH
2305
+ #undef UNICODE_ALNUM_CODEPOINTS_LENGTH
2306
+ #undef UNICODE_ISUPPER_CODEPOINTS_LENGTH
2307
+
2308
+ pm_encoding_t pm_encoding_utf_8 = {
2309
+ .name = "utf-8",
2310
+ .char_width = pm_encoding_utf_8_char_width,
2311
+ .alnum_char = pm_encoding_utf_8_alnum_char,
2312
+ .alpha_char = pm_encoding_utf_8_alpha_char,
2313
+ .isupper_char = pm_encoding_utf_8_isupper_char,
2314
+ .multibyte = true
2315
+ };
2316
+
2317
+ pm_encoding_t pm_encoding_utf8_mac = {
2318
+ .name = "utf8-mac",
2319
+ .char_width = pm_encoding_utf_8_char_width,
2320
+ .alnum_char = pm_encoding_utf_8_alnum_char,
2321
+ .alpha_char = pm_encoding_utf_8_alpha_char,
2322
+ .isupper_char = pm_encoding_utf_8_isupper_char,
2323
+ .multibyte = true
2324
+ };