regex_syntax/unicode_tables/
word_break.rs

1// DO NOT EDIT THIS FILE. IT WAS AUTOMATICALLY GENERATED BY:
2//
3//  ucd-generate word-break /tmp/ucd/12.1.0/ --chars
4//
5// ucd-generate is available on crates.io.
6
7pub const BY_NAME: &'static [(&'static str, &'static [(char, char)])] = &[
8    ("ALetter", ALETTER),
9    ("CR", CR),
10    ("Double_Quote", DOUBLE_QUOTE),
11    ("Extend", EXTEND),
12    ("ExtendNumLet", EXTENDNUMLET),
13    ("Format", FORMAT),
14    ("Hebrew_Letter", HEBREW_LETTER),
15    ("Katakana", KATAKANA),
16    ("LF", LF),
17    ("MidLetter", MIDLETTER),
18    ("MidNum", MIDNUM),
19    ("MidNumLet", MIDNUMLET),
20    ("Newline", NEWLINE),
21    ("Numeric", NUMERIC),
22    ("Regional_Indicator", REGIONAL_INDICATOR),
23    ("Single_Quote", SINGLE_QUOTE),
24    ("WSegSpace", WSEGSPACE),
25    ("ZWJ", ZWJ),
26];
27
28pub const ALETTER: &'static [(char, char)] = &[
29    ('A', 'Z'),
30    ('a', 'z'),
31    ('ª', 'ª'),
32    ('µ', 'µ'),
33    ('º', 'º'),
34    ('À', 'Ö'),
35    ('Ø', 'ö'),
36    ('ø', '˗'),
37    ('˞', 'ˤ'),
38    ('ˬ', '˿'),
39    ('Ͱ', 'ʹ'),
40    ('Ͷ', 'ͷ'),
41    ('ͺ', 'ͽ'),
42    ('Ϳ', 'Ϳ'),
43    ('Ά', 'Ά'),
44    ('Έ', 'Ί'),
45    ('Ό', 'Ό'),
46    ('Ύ', 'Ρ'),
47    ('Σ', 'ϵ'),
48    ('Ϸ', 'ҁ'),
49    ('Ҋ', 'ԯ'),
50    ('Ա', 'Ֆ'),
51    ('ՙ', 'ՙ'),
52    ('՛', '՜'),
53    ('՞', '՞'),
54    ('ՠ', 'ֈ'),
55    ('׳', '׳'),
56    ('ؠ', 'ي'),
57    ('ٮ', 'ٯ'),
58    ('ٱ', 'ۓ'),
59    ('ە', 'ە'),
60    ('ۥ', 'ۦ'),
61    ('ۮ', 'ۯ'),
62    ('ۺ', 'ۼ'),
63    ('ۿ', 'ۿ'),
64    ('ܐ', 'ܐ'),
65    ('ܒ', 'ܯ'),
66    ('ݍ', 'ޥ'),
67    ('ޱ', 'ޱ'),
68    ('ߊ', 'ߪ'),
69    ('ߴ', 'ߵ'),
70    ('ߺ', 'ߺ'),
71    ('ࠀ', 'ࠕ'),
72    ('ࠚ', 'ࠚ'),
73    ('ࠤ', 'ࠤ'),
74    ('ࠨ', 'ࠨ'),
75    ('ࡀ', 'ࡘ'),
76    ('ࡠ', 'ࡪ'),
77    ('ࢠ', 'ࢴ'),
78    ('ࢶ', 'ࢽ'),
79    ('ऄ', 'ह'),
80    ('ऽ', 'ऽ'),
81    ('ॐ', 'ॐ'),
82    ('क़', 'ॡ'),
83    ('ॱ', 'ঀ'),
84    ('অ', 'ঌ'),
85    ('এ', 'ঐ'),
86    ('ও', 'ন'),
87    ('প', 'র'),
88    ('ল', 'ল'),
89    ('শ', 'হ'),
90    ('ঽ', 'ঽ'),
91    ('ৎ', 'ৎ'),
92    ('ড়', 'ঢ়'),
93    ('য়', 'ৡ'),
94    ('ৰ', 'ৱ'),
95    ('ৼ', 'ৼ'),
96    ('ਅ', 'ਊ'),
97    ('ਏ', 'ਐ'),
98    ('ਓ', 'ਨ'),
99    ('ਪ', 'ਰ'),
100    ('ਲ', 'ਲ਼'),
101    ('ਵ', 'ਸ਼'),
102    ('ਸ', 'ਹ'),
103    ('ਖ਼', 'ੜ'),
104    ('ਫ਼', 'ਫ਼'),
105    ('ੲ', 'ੴ'),
106    ('અ', 'ઍ'),
107    ('એ', 'ઑ'),
108    ('ઓ', 'ન'),
109    ('પ', 'ર'),
110    ('લ', 'ળ'),
111    ('વ', 'હ'),
112    ('ઽ', 'ઽ'),
113    ('ૐ', 'ૐ'),
114    ('ૠ', 'ૡ'),
115    ('ૹ', 'ૹ'),
116    ('ଅ', 'ଌ'),
117    ('ଏ', 'ଐ'),
118    ('ଓ', 'ନ'),
119    ('ପ', 'ର'),
120    ('ଲ', 'ଳ'),
121    ('ଵ', 'ହ'),
122    ('ଽ', 'ଽ'),
123    ('ଡ଼', 'ଢ଼'),
124    ('ୟ', 'ୡ'),
125    ('ୱ', 'ୱ'),
126    ('ஃ', 'ஃ'),
127    ('அ', 'ஊ'),
128    ('எ', 'ஐ'),
129    ('ஒ', 'க'),
130    ('ங', 'ச'),
131    ('ஜ', 'ஜ'),
132    ('ஞ', 'ட'),
133    ('ண', 'த'),
134    ('ந', 'ப'),
135    ('ம', 'ஹ'),
136    ('ௐ', 'ௐ'),
137    ('అ', 'ఌ'),
138    ('ఎ', 'ఐ'),
139    ('ఒ', 'న'),
140    ('ప', 'హ'),
141    ('ఽ', 'ఽ'),
142    ('ౘ', 'ౚ'),
143    ('ౠ', 'ౡ'),
144    ('ಀ', 'ಀ'),
145    ('ಅ', 'ಌ'),
146    ('ಎ', 'ಐ'),
147    ('ಒ', 'ನ'),
148    ('ಪ', 'ಳ'),
149    ('ವ', 'ಹ'),
150    ('ಽ', 'ಽ'),
151    ('ೞ', 'ೞ'),
152    ('ೠ', 'ೡ'),
153    ('ೱ', 'ೲ'),
154    ('അ', 'ഌ'),
155    ('എ', 'ഐ'),
156    ('ഒ', 'ഺ'),
157    ('ഽ', 'ഽ'),
158    ('ൎ', 'ൎ'),
159    ('ൔ', 'ൖ'),
160    ('ൟ', 'ൡ'),
161    ('ൺ', 'ൿ'),
162    ('අ', 'ඖ'),
163    ('ක', 'න'),
164    ('ඳ', 'ර'),
165    ('ල', 'ල'),
166    ('ව', 'ෆ'),
167    ('ༀ', 'ༀ'),
168    ('ཀ', 'ཇ'),
169    ('ཉ', 'ཬ'),
170    ('ྈ', 'ྌ'),
171    ('Ⴀ', 'Ⴥ'),
172    ('Ⴧ', 'Ⴧ'),
173    ('Ⴭ', 'Ⴭ'),
174    ('ა', 'ჺ'),
175    ('ჼ', 'ቈ'),
176    ('ቊ', 'ቍ'),
177    ('ቐ', 'ቖ'),
178    ('ቘ', 'ቘ'),
179    ('ቚ', 'ቝ'),
180    ('በ', 'ኈ'),
181    ('ኊ', 'ኍ'),
182    ('ነ', 'ኰ'),
183    ('ኲ', 'ኵ'),
184    ('ኸ', 'ኾ'),
185    ('ዀ', 'ዀ'),
186    ('ዂ', 'ዅ'),
187    ('ወ', 'ዖ'),
188    ('ዘ', 'ጐ'),
189    ('ጒ', 'ጕ'),
190    ('ጘ', 'ፚ'),
191    ('ᎀ', 'ᎏ'),
192    ('Ꭰ', 'Ᏽ'),
193    ('ᏸ', 'ᏽ'),
194    ('ᐁ', 'ᙬ'),
195    ('ᙯ', 'ᙿ'),
196    ('ᚁ', 'ᚚ'),
197    ('ᚠ', 'ᛪ'),
198    ('ᛮ', 'ᛸ'),
199    ('ᜀ', 'ᜌ'),
200    ('ᜎ', 'ᜑ'),
201    ('ᜠ', 'ᜱ'),
202    ('ᝀ', 'ᝑ'),
203    ('ᝠ', 'ᝬ'),
204    ('ᝮ', 'ᝰ'),
205    ('ᠠ', 'ᡸ'),
206    ('ᢀ', 'ᢄ'),
207    ('ᢇ', 'ᢨ'),
208    ('ᢪ', 'ᢪ'),
209    ('ᢰ', 'ᣵ'),
210    ('ᤀ', 'ᤞ'),
211    ('ᨀ', 'ᨖ'),
212    ('ᬅ', 'ᬳ'),
213    ('ᭅ', 'ᭋ'),
214    ('ᮃ', 'ᮠ'),
215    ('ᮮ', 'ᮯ'),
216    ('ᮺ', 'ᯥ'),
217    ('ᰀ', 'ᰣ'),
218    ('ᱍ', 'ᱏ'),
219    ('ᱚ', 'ᱽ'),
220    ('ᲀ', 'ᲈ'),
221    ('Ა', 'Ჺ'),
222    ('Ჽ', 'Ჿ'),
223    ('ᳩ', 'ᳬ'),
224    ('ᳮ', 'ᳳ'),
225    ('ᳵ', 'ᳶ'),
226    ('\u{1cfa}', '\u{1cfa}'),
227    ('ᴀ', 'ᶿ'),
228    ('Ḁ', 'ἕ'),
229    ('Ἐ', 'Ἕ'),
230    ('ἠ', 'ὅ'),
231    ('Ὀ', 'Ὅ'),
232    ('ὐ', 'ὗ'),
233    ('Ὑ', 'Ὑ'),
234    ('Ὓ', 'Ὓ'),
235    ('Ὕ', 'Ὕ'),
236    ('Ὗ', 'ώ'),
237    ('ᾀ', 'ᾴ'),
238    ('ᾶ', 'ᾼ'),
239    ('ι', 'ι'),
240    ('ῂ', 'ῄ'),
241    ('ῆ', 'ῌ'),
242    ('ῐ', 'ΐ'),
243    ('ῖ', 'Ί'),
244    ('ῠ', 'Ῥ'),
245    ('ῲ', 'ῴ'),
246    ('ῶ', 'ῼ'),
247    ('ⁱ', 'ⁱ'),
248    ('ⁿ', 'ⁿ'),
249    ('ₐ', 'ₜ'),
250    ('ℂ', 'ℂ'),
251    ('ℇ', 'ℇ'),
252    ('ℊ', 'ℓ'),
253    ('ℕ', 'ℕ'),
254    ('ℙ', 'ℝ'),
255    ('ℤ', 'ℤ'),
256    ('Ω', 'Ω'),
257    ('ℨ', 'ℨ'),
258    ('K', 'ℭ'),
259    ('ℯ', 'ℹ'),
260    ('ℼ', 'ℿ'),
261    ('ⅅ', 'ⅉ'),
262    ('ⅎ', 'ⅎ'),
263    ('Ⅰ', 'ↈ'),
264    ('Ⓐ', 'ⓩ'),
265    ('Ⰰ', 'Ⱞ'),
266    ('ⰰ', 'ⱞ'),
267    ('Ⱡ', 'ⳤ'),
268    ('Ⳬ', 'ⳮ'),
269    ('Ⳳ', 'ⳳ'),
270    ('ⴀ', 'ⴥ'),
271    ('ⴧ', 'ⴧ'),
272    ('ⴭ', 'ⴭ'),
273    ('ⴰ', 'ⵧ'),
274    ('ⵯ', 'ⵯ'),
275    ('ⶀ', 'ⶖ'),
276    ('ⶠ', 'ⶦ'),
277    ('ⶨ', 'ⶮ'),
278    ('ⶰ', 'ⶶ'),
279    ('ⶸ', 'ⶾ'),
280    ('ⷀ', 'ⷆ'),
281    ('ⷈ', 'ⷎ'),
282    ('ⷐ', 'ⷖ'),
283    ('ⷘ', 'ⷞ'),
284    ('ⸯ', 'ⸯ'),
285    ('々', '々'),
286    ('〻', '〼'),
287    ('ㄅ', 'ㄯ'),
288    ('ㄱ', 'ㆎ'),
289    ('ㆠ', 'ㆺ'),
290    ('ꀀ', 'ꒌ'),
291    ('ꓐ', 'ꓽ'),
292    ('ꔀ', 'ꘌ'),
293    ('ꘐ', 'ꘟ'),
294    ('ꘪ', 'ꘫ'),
295    ('Ꙁ', 'ꙮ'),
296    ('ꙿ', 'ꚝ'),
297    ('ꚠ', 'ꛯ'),
298    ('ꜗ', '\u{a7bf}'),
299    ('\u{a7c2}', '\u{a7c6}'),
300    ('ꟷ', 'ꠁ'),
301    ('ꠃ', 'ꠅ'),
302    ('ꠇ', 'ꠊ'),
303    ('ꠌ', 'ꠢ'),
304    ('ꡀ', 'ꡳ'),
305    ('ꢂ', 'ꢳ'),
306    ('ꣲ', 'ꣷ'),
307    ('ꣻ', 'ꣻ'),
308    ('ꣽ', 'ꣾ'),
309    ('ꤊ', 'ꤥ'),
310    ('ꤰ', 'ꥆ'),
311    ('ꥠ', 'ꥼ'),
312    ('ꦄ', 'ꦲ'),
313    ('ꧏ', 'ꧏ'),
314    ('ꨀ', 'ꨨ'),
315    ('ꩀ', 'ꩂ'),
316    ('ꩄ', 'ꩋ'),
317    ('ꫠ', 'ꫪ'),
318    ('ꫲ', 'ꫴ'),
319    ('ꬁ', 'ꬆ'),
320    ('ꬉ', 'ꬎ'),
321    ('ꬑ', 'ꬖ'),
322    ('ꬠ', 'ꬦ'),
323    ('ꬨ', 'ꬮ'),
324    ('ꬰ', '\u{ab67}'),
325    ('ꭰ', 'ꯢ'),
326    ('가', '힣'),
327    ('ힰ', 'ퟆ'),
328    ('ퟋ', 'ퟻ'),
329    ('ff', 'st'),
330    ('ﬓ', 'ﬗ'),
331    ('ﭐ', 'ﮱ'),
332    ('ﯓ', 'ﴽ'),
333    ('ﵐ', 'ﶏ'),
334    ('ﶒ', 'ﷇ'),
335    ('ﷰ', 'ﷻ'),
336    ('ﹰ', 'ﹴ'),
337    ('ﹶ', 'ﻼ'),
338    ('A', 'Z'),
339    ('a', 'z'),
340    ('ᅠ', 'ᄒ'),
341    ('ᅡ', 'ᅦ'),
342    ('ᅧ', 'ᅬ'),
343    ('ᅭ', 'ᅲ'),
344    ('ᅳ', 'ᅵ'),
345    ('𐀀', '𐀋'),
346    ('𐀍', '𐀦'),
347    ('𐀨', '𐀺'),
348    ('𐀼', '𐀽'),
349    ('𐀿', '𐁍'),
350    ('𐁐', '𐁝'),
351    ('𐂀', '𐃺'),
352    ('𐅀', '𐅴'),
353    ('𐊀', '𐊜'),
354    ('𐊠', '𐋐'),
355    ('𐌀', '𐌟'),
356    ('𐌭', '𐍊'),
357    ('𐍐', '𐍵'),
358    ('𐎀', '𐎝'),
359    ('𐎠', '𐏃'),
360    ('𐏈', '𐏏'),
361    ('𐏑', '𐏕'),
362    ('𐐀', '𐒝'),
363    ('𐒰', '𐓓'),
364    ('𐓘', '𐓻'),
365    ('𐔀', '𐔧'),
366    ('𐔰', '𐕣'),
367    ('𐘀', '𐜶'),
368    ('𐝀', '𐝕'),
369    ('𐝠', '𐝧'),
370    ('𐠀', '𐠅'),
371    ('𐠈', '𐠈'),
372    ('𐠊', '𐠵'),
373    ('𐠷', '𐠸'),
374    ('𐠼', '𐠼'),
375    ('𐠿', '𐡕'),
376    ('𐡠', '𐡶'),
377    ('𐢀', '𐢞'),
378    ('𐣠', '𐣲'),
379    ('𐣴', '𐣵'),
380    ('𐤀', '𐤕'),
381    ('𐤠', '𐤹'),
382    ('𐦀', '𐦷'),
383    ('𐦾', '𐦿'),
384    ('𐨀', '𐨀'),
385    ('𐨐', '𐨓'),
386    ('𐨕', '𐨗'),
387    ('𐨙', '𐨵'),
388    ('𐩠', '𐩼'),
389    ('𐪀', '𐪜'),
390    ('𐫀', '𐫇'),
391    ('𐫉', '𐫤'),
392    ('𐬀', '𐬵'),
393    ('𐭀', '𐭕'),
394    ('𐭠', '𐭲'),
395    ('𐮀', '𐮑'),
396    ('𐰀', '𐱈'),
397    ('𐲀', '𐲲'),
398    ('𐳀', '𐳲'),
399    ('𐴀', '𐴣'),
400    ('𐼀', '𐼜'),
401    ('𐼧', '𐼧'),
402    ('𐼰', '𐽅'),
403    ('\u{10fe0}', '\u{10ff6}'),
404    ('𑀃', '𑀷'),
405    ('𑂃', '𑂯'),
406    ('𑃐', '𑃨'),
407    ('𑄃', '𑄦'),
408    ('𑅄', '𑅄'),
409    ('𑅐', '𑅲'),
410    ('𑅶', '𑅶'),
411    ('𑆃', '𑆲'),
412    ('𑇁', '𑇄'),
413    ('𑇚', '𑇚'),
414    ('𑇜', '𑇜'),
415    ('𑈀', '𑈑'),
416    ('𑈓', '𑈫'),
417    ('𑊀', '𑊆'),
418    ('𑊈', '𑊈'),
419    ('𑊊', '𑊍'),
420    ('𑊏', '𑊝'),
421    ('𑊟', '𑊨'),
422    ('𑊰', '𑋞'),
423    ('𑌅', '𑌌'),
424    ('𑌏', '𑌐'),
425    ('𑌓', '𑌨'),
426    ('𑌪', '𑌰'),
427    ('𑌲', '𑌳'),
428    ('𑌵', '𑌹'),
429    ('𑌽', '𑌽'),
430    ('𑍐', '𑍐'),
431    ('𑍝', '𑍡'),
432    ('𑐀', '𑐴'),
433    ('𑑇', '𑑊'),
434    ('\u{1145f}', '\u{1145f}'),
435    ('𑒀', '𑒯'),
436    ('𑓄', '𑓅'),
437    ('𑓇', '𑓇'),
438    ('𑖀', '𑖮'),
439    ('𑗘', '𑗛'),
440    ('𑘀', '𑘯'),
441    ('𑙄', '𑙄'),
442    ('𑚀', '𑚪'),
443    ('\u{116b8}', '\u{116b8}'),
444    ('𑠀', '𑠫'),
445    ('𑢠', '𑣟'),
446    ('𑣿', '𑣿'),
447    ('\u{119a0}', '\u{119a7}'),
448    ('\u{119aa}', '\u{119d0}'),
449    ('\u{119e1}', '\u{119e1}'),
450    ('\u{119e3}', '\u{119e3}'),
451    ('𑨀', '𑨀'),
452    ('𑨋', '𑨲'),
453    ('𑨺', '𑨺'),
454    ('𑩐', '𑩐'),
455    ('𑩜', '𑪉'),
456    ('𑪝', '𑪝'),
457    ('𑫀', '𑫸'),
458    ('𑰀', '𑰈'),
459    ('𑰊', '𑰮'),
460    ('𑱀', '𑱀'),
461    ('𑱲', '𑲏'),
462    ('𑴀', '𑴆'),
463    ('𑴈', '𑴉'),
464    ('𑴋', '𑴰'),
465    ('𑵆', '𑵆'),
466    ('𑵠', '𑵥'),
467    ('𑵧', '𑵨'),
468    ('𑵪', '𑶉'),
469    ('𑶘', '𑶘'),
470    ('𑻠', '𑻲'),
471    ('𒀀', '𒎙'),
472    ('𒐀', '𒑮'),
473    ('𒒀', '𒕃'),
474    ('𓀀', '𓐮'),
475    ('𔐀', '𔙆'),
476    ('𖠀', '𖨸'),
477    ('𖩀', '𖩞'),
478    ('𖫐', '𖫭'),
479    ('𖬀', '𖬯'),
480    ('𖭀', '𖭃'),
481    ('𖭣', '𖭷'),
482    ('𖭽', '𖮏'),
483    ('𖹀', '𖹿'),
484    ('𖼀', '\u{16f4a}'),
485    ('𖽐', '𖽐'),
486    ('𖾓', '𖾟'),
487    ('𖿠', '𖿡'),
488    ('\u{16fe3}', '\u{16fe3}'),
489    ('𛰀', '𛱪'),
490    ('𛱰', '𛱼'),
491    ('𛲀', '𛲈'),
492    ('𛲐', '𛲙'),
493    ('𝐀', '𝑔'),
494    ('𝑖', '𝒜'),
495    ('𝒞', '𝒟'),
496    ('𝒢', '𝒢'),
497    ('𝒥', '𝒦'),
498    ('𝒩', '𝒬'),
499    ('𝒮', '𝒹'),
500    ('𝒻', '𝒻'),
501    ('𝒽', '𝓃'),
502    ('𝓅', '𝔅'),
503    ('𝔇', '𝔊'),
504    ('𝔍', '𝔔'),
505    ('𝔖', '𝔜'),
506    ('𝔞', '𝔹'),
507    ('𝔻', '𝔾'),
508    ('𝕀', '𝕄'),
509    ('𝕆', '𝕆'),
510    ('𝕊', '𝕐'),
511    ('𝕒', '𝚥'),
512    ('𝚨', '𝛀'),
513    ('𝛂', '𝛚'),
514    ('𝛜', '𝛺'),
515    ('𝛼', '𝜔'),
516    ('𝜖', '𝜴'),
517    ('𝜶', '𝝎'),
518    ('𝝐', '𝝮'),
519    ('𝝰', '𝞈'),
520    ('𝞊', '𝞨'),
521    ('𝞪', '𝟂'),
522    ('𝟄', '𝟋'),
523    ('\u{1e100}', '\u{1e12c}'),
524    ('\u{1e137}', '\u{1e13d}'),
525    ('\u{1e14e}', '\u{1e14e}'),
526    ('\u{1e2c0}', '\u{1e2eb}'),
527    ('𞠀', '𞣄'),
528    ('𞤀', '𞥃'),
529    ('\u{1e94b}', '\u{1e94b}'),
530    ('𞸀', '𞸃'),
531    ('𞸅', '𞸟'),
532    ('𞸡', '𞸢'),
533    ('𞸤', '𞸤'),
534    ('𞸧', '𞸧'),
535    ('𞸩', '𞸲'),
536    ('𞸴', '𞸷'),
537    ('𞸹', '𞸹'),
538    ('𞸻', '𞸻'),
539    ('𞹂', '𞹂'),
540    ('𞹇', '𞹇'),
541    ('𞹉', '𞹉'),
542    ('𞹋', '𞹋'),
543    ('𞹍', '𞹏'),
544    ('𞹑', '𞹒'),
545    ('𞹔', '𞹔'),
546    ('𞹗', '𞹗'),
547    ('𞹙', '𞹙'),
548    ('𞹛', '𞹛'),
549    ('𞹝', '𞹝'),
550    ('𞹟', '𞹟'),
551    ('𞹡', '𞹢'),
552    ('𞹤', '𞹤'),
553    ('𞹧', '𞹪'),
554    ('𞹬', '𞹲'),
555    ('𞹴', '𞹷'),
556    ('𞹹', '𞹼'),
557    ('𞹾', '𞹾'),
558    ('𞺀', '𞺉'),
559    ('𞺋', '𞺛'),
560    ('𞺡', '𞺣'),
561    ('𞺥', '𞺩'),
562    ('𞺫', '𞺻'),
563    ('🄰', '🅉'),
564    ('🅐', '🅩'),
565    ('🅰', '🆉'),
566];
567
568pub const CR: &'static [(char, char)] = &[('\r', '\r')];
569
570pub const DOUBLE_QUOTE: &'static [(char, char)] = &[('\"', '\"')];
571
572pub const EXTEND: &'static [(char, char)] = &[
573    ('\u{300}', '\u{36f}'),
574    ('\u{483}', '\u{489}'),
575    ('\u{591}', '\u{5bd}'),
576    ('\u{5bf}', '\u{5bf}'),
577    ('\u{5c1}', '\u{5c2}'),
578    ('\u{5c4}', '\u{5c5}'),
579    ('\u{5c7}', '\u{5c7}'),
580    ('\u{610}', '\u{61a}'),
581    ('\u{64b}', '\u{65f}'),
582    ('\u{670}', '\u{670}'),
583    ('\u{6d6}', '\u{6dc}'),
584    ('\u{6df}', '\u{6e4}'),
585    ('\u{6e7}', '\u{6e8}'),
586    ('\u{6ea}', '\u{6ed}'),
587    ('\u{711}', '\u{711}'),
588    ('\u{730}', '\u{74a}'),
589    ('\u{7a6}', '\u{7b0}'),
590    ('\u{7eb}', '\u{7f3}'),
591    ('\u{7fd}', '\u{7fd}'),
592    ('\u{816}', '\u{819}'),
593    ('\u{81b}', '\u{823}'),
594    ('\u{825}', '\u{827}'),
595    ('\u{829}', '\u{82d}'),
596    ('\u{859}', '\u{85b}'),
597    ('\u{8d3}', '\u{8e1}'),
598    ('\u{8e3}', 'ः'),
599    ('\u{93a}', '\u{93c}'),
600    ('ा', 'ॏ'),
601    ('\u{951}', '\u{957}'),
602    ('\u{962}', '\u{963}'),
603    ('\u{981}', 'ঃ'),
604    ('\u{9bc}', '\u{9bc}'),
605    ('\u{9be}', '\u{9c4}'),
606    ('ে', 'ৈ'),
607    ('ো', '\u{9cd}'),
608    ('\u{9d7}', '\u{9d7}'),
609    ('\u{9e2}', '\u{9e3}'),
610    ('\u{9fe}', '\u{9fe}'),
611    ('\u{a01}', 'ਃ'),
612    ('\u{a3c}', '\u{a3c}'),
613    ('ਾ', '\u{a42}'),
614    ('\u{a47}', '\u{a48}'),
615    ('\u{a4b}', '\u{a4d}'),
616    ('\u{a51}', '\u{a51}'),
617    ('\u{a70}', '\u{a71}'),
618    ('\u{a75}', '\u{a75}'),
619    ('\u{a81}', 'ઃ'),
620    ('\u{abc}', '\u{abc}'),
621    ('ા', '\u{ac5}'),
622    ('\u{ac7}', 'ૉ'),
623    ('ો', '\u{acd}'),
624    ('\u{ae2}', '\u{ae3}'),
625    ('\u{afa}', '\u{aff}'),
626    ('\u{b01}', 'ଃ'),
627    ('\u{b3c}', '\u{b3c}'),
628    ('\u{b3e}', '\u{b44}'),
629    ('େ', 'ୈ'),
630    ('ୋ', '\u{b4d}'),
631    ('\u{b56}', '\u{b57}'),
632    ('\u{b62}', '\u{b63}'),
633    ('\u{b82}', '\u{b82}'),
634    ('\u{bbe}', 'ூ'),
635    ('ெ', 'ை'),
636    ('ொ', '\u{bcd}'),
637    ('\u{bd7}', '\u{bd7}'),
638    ('\u{c00}', '\u{c04}'),
639    ('\u{c3e}', 'ౄ'),
640    ('\u{c46}', '\u{c48}'),
641    ('\u{c4a}', '\u{c4d}'),
642    ('\u{c55}', '\u{c56}'),
643    ('\u{c62}', '\u{c63}'),
644    ('\u{c81}', 'ಃ'),
645    ('\u{cbc}', '\u{cbc}'),
646    ('ಾ', 'ೄ'),
647    ('\u{cc6}', 'ೈ'),
648    ('ೊ', '\u{ccd}'),
649    ('\u{cd5}', '\u{cd6}'),
650    ('\u{ce2}', '\u{ce3}'),
651    ('\u{d00}', 'ഃ'),
652    ('\u{d3b}', '\u{d3c}'),
653    ('\u{d3e}', '\u{d44}'),
654    ('െ', 'ൈ'),
655    ('ൊ', '\u{d4d}'),
656    ('\u{d57}', '\u{d57}'),
657    ('\u{d62}', '\u{d63}'),
658    ('ං', 'ඃ'),
659    ('\u{dca}', '\u{dca}'),
660    ('\u{dcf}', '\u{dd4}'),
661    ('\u{dd6}', '\u{dd6}'),
662    ('ෘ', '\u{ddf}'),
663    ('ෲ', 'ෳ'),
664    ('\u{e31}', '\u{e31}'),
665    ('\u{e34}', '\u{e3a}'),
666    ('\u{e47}', '\u{e4e}'),
667    ('\u{eb1}', '\u{eb1}'),
668    ('\u{eb4}', '\u{ebc}'),
669    ('\u{ec8}', '\u{ecd}'),
670    ('\u{f18}', '\u{f19}'),
671    ('\u{f35}', '\u{f35}'),
672    ('\u{f37}', '\u{f37}'),
673    ('\u{f39}', '\u{f39}'),
674    ('༾', '༿'),
675    ('\u{f71}', '\u{f84}'),
676    ('\u{f86}', '\u{f87}'),
677    ('\u{f8d}', '\u{f97}'),
678    ('\u{f99}', '\u{fbc}'),
679    ('\u{fc6}', '\u{fc6}'),
680    ('ါ', '\u{103e}'),
681    ('ၖ', '\u{1059}'),
682    ('\u{105e}', '\u{1060}'),
683    ('ၢ', 'ၤ'),
684    ('ၧ', 'ၭ'),
685    ('\u{1071}', '\u{1074}'),
686    ('\u{1082}', '\u{108d}'),
687    ('ႏ', 'ႏ'),
688    ('ႚ', '\u{109d}'),
689    ('\u{135d}', '\u{135f}'),
690    ('\u{1712}', '\u{1714}'),
691    ('\u{1732}', '\u{1734}'),
692    ('\u{1752}', '\u{1753}'),
693    ('\u{1772}', '\u{1773}'),
694    ('\u{17b4}', '\u{17d3}'),
695    ('\u{17dd}', '\u{17dd}'),
696    ('\u{180b}', '\u{180d}'),
697    ('\u{1885}', '\u{1886}'),
698    ('\u{18a9}', '\u{18a9}'),
699    ('\u{1920}', 'ᤫ'),
700    ('ᤰ', '\u{193b}'),
701    ('\u{1a17}', '\u{1a1b}'),
702    ('ᩕ', '\u{1a5e}'),
703    ('\u{1a60}', '\u{1a7c}'),
704    ('\u{1a7f}', '\u{1a7f}'),
705    ('\u{1ab0}', '\u{1abe}'),
706    ('\u{1b00}', 'ᬄ'),
707    ('\u{1b34}', '᭄'),
708    ('\u{1b6b}', '\u{1b73}'),
709    ('\u{1b80}', 'ᮂ'),
710    ('ᮡ', '\u{1bad}'),
711    ('\u{1be6}', '᯳'),
712    ('ᰤ', '\u{1c37}'),
713    ('\u{1cd0}', '\u{1cd2}'),
714    ('\u{1cd4}', '\u{1ce8}'),
715    ('\u{1ced}', '\u{1ced}'),
716    ('\u{1cf4}', '\u{1cf4}'),
717    ('᳷', '\u{1cf9}'),
718    ('\u{1dc0}', '\u{1df9}'),
719    ('\u{1dfb}', '\u{1dff}'),
720    ('\u{200c}', '\u{200c}'),
721    ('\u{20d0}', '\u{20f0}'),
722    ('\u{2cef}', '\u{2cf1}'),
723    ('\u{2d7f}', '\u{2d7f}'),
724    ('\u{2de0}', '\u{2dff}'),
725    ('\u{302a}', '\u{302f}'),
726    ('\u{3099}', '\u{309a}'),
727    ('\u{a66f}', '\u{a672}'),
728    ('\u{a674}', '\u{a67d}'),
729    ('\u{a69e}', '\u{a69f}'),
730    ('\u{a6f0}', '\u{a6f1}'),
731    ('\u{a802}', '\u{a802}'),
732    ('\u{a806}', '\u{a806}'),
733    ('\u{a80b}', '\u{a80b}'),
734    ('ꠣ', 'ꠧ'),
735    ('ꢀ', 'ꢁ'),
736    ('ꢴ', '\u{a8c5}'),
737    ('\u{a8e0}', '\u{a8f1}'),
738    ('\u{a8ff}', '\u{a8ff}'),
739    ('\u{a926}', '\u{a92d}'),
740    ('\u{a947}', '꥓'),
741    ('\u{a980}', 'ꦃ'),
742    ('\u{a9b3}', '꧀'),
743    ('\u{a9e5}', '\u{a9e5}'),
744    ('\u{aa29}', '\u{aa36}'),
745    ('\u{aa43}', '\u{aa43}'),
746    ('\u{aa4c}', 'ꩍ'),
747    ('ꩻ', 'ꩽ'),
748    ('\u{aab0}', '\u{aab0}'),
749    ('\u{aab2}', '\u{aab4}'),
750    ('\u{aab7}', '\u{aab8}'),
751    ('\u{aabe}', '\u{aabf}'),
752    ('\u{aac1}', '\u{aac1}'),
753    ('ꫫ', 'ꫯ'),
754    ('ꫵ', '\u{aaf6}'),
755    ('ꯣ', 'ꯪ'),
756    ('꯬', '\u{abed}'),
757    ('\u{fb1e}', '\u{fb1e}'),
758    ('\u{fe00}', '\u{fe0f}'),
759    ('\u{fe20}', '\u{fe2f}'),
760    ('\u{ff9e}', '\u{ff9f}'),
761    ('\u{101fd}', '\u{101fd}'),
762    ('\u{102e0}', '\u{102e0}'),
763    ('\u{10376}', '\u{1037a}'),
764    ('\u{10a01}', '\u{10a03}'),
765    ('\u{10a05}', '\u{10a06}'),
766    ('\u{10a0c}', '\u{10a0f}'),
767    ('\u{10a38}', '\u{10a3a}'),
768    ('\u{10a3f}', '\u{10a3f}'),
769    ('\u{10ae5}', '\u{10ae6}'),
770    ('\u{10d24}', '\u{10d27}'),
771    ('\u{10f46}', '\u{10f50}'),
772    ('𑀀', '𑀂'),
773    ('\u{11038}', '\u{11046}'),
774    ('\u{1107f}', '𑂂'),
775    ('𑂰', '\u{110ba}'),
776    ('\u{11100}', '\u{11102}'),
777    ('\u{11127}', '\u{11134}'),
778    ('𑅅', '𑅆'),
779    ('\u{11173}', '\u{11173}'),
780    ('\u{11180}', '𑆂'),
781    ('𑆳', '𑇀'),
782    ('\u{111c9}', '\u{111cc}'),
783    ('𑈬', '\u{11237}'),
784    ('\u{1123e}', '\u{1123e}'),
785    ('\u{112df}', '\u{112ea}'),
786    ('\u{11300}', '𑌃'),
787    ('\u{1133b}', '\u{1133c}'),
788    ('\u{1133e}', '𑍄'),
789    ('𑍇', '𑍈'),
790    ('𑍋', '𑍍'),
791    ('\u{11357}', '\u{11357}'),
792    ('𑍢', '𑍣'),
793    ('\u{11366}', '\u{1136c}'),
794    ('\u{11370}', '\u{11374}'),
795    ('𑐵', '\u{11446}'),
796    ('\u{1145e}', '\u{1145e}'),
797    ('\u{114b0}', '\u{114c3}'),
798    ('\u{115af}', '\u{115b5}'),
799    ('𑖸', '\u{115c0}'),
800    ('\u{115dc}', '\u{115dd}'),
801    ('𑘰', '\u{11640}'),
802    ('\u{116ab}', '\u{116b7}'),
803    ('\u{1171d}', '\u{1172b}'),
804    ('𑠬', '\u{1183a}'),
805    ('\u{119d1}', '\u{119d7}'),
806    ('\u{119da}', '\u{119e0}'),
807    ('\u{119e4}', '\u{119e4}'),
808    ('\u{11a01}', '\u{11a0a}'),
809    ('\u{11a33}', '𑨹'),
810    ('\u{11a3b}', '\u{11a3e}'),
811    ('\u{11a47}', '\u{11a47}'),
812    ('\u{11a51}', '\u{11a5b}'),
813    ('\u{11a8a}', '\u{11a99}'),
814    ('𑰯', '\u{11c36}'),
815    ('\u{11c38}', '\u{11c3f}'),
816    ('\u{11c92}', '\u{11ca7}'),
817    ('𑲩', '\u{11cb6}'),
818    ('\u{11d31}', '\u{11d36}'),
819    ('\u{11d3a}', '\u{11d3a}'),
820    ('\u{11d3c}', '\u{11d3d}'),
821    ('\u{11d3f}', '\u{11d45}'),
822    ('\u{11d47}', '\u{11d47}'),
823    ('𑶊', '𑶎'),
824    ('\u{11d90}', '\u{11d91}'),
825    ('𑶓', '\u{11d97}'),
826    ('\u{11ef3}', '𑻶'),
827    ('\u{16af0}', '\u{16af4}'),
828    ('\u{16b30}', '\u{16b36}'),
829    ('\u{16f4f}', '\u{16f4f}'),
830    ('𖽑', '\u{16f87}'),
831    ('\u{16f8f}', '\u{16f92}'),
832    ('\u{1bc9d}', '\u{1bc9e}'),
833    ('\u{1d165}', '\u{1d169}'),
834    ('𝅭', '\u{1d172}'),
835    ('\u{1d17b}', '\u{1d182}'),
836    ('\u{1d185}', '\u{1d18b}'),
837    ('\u{1d1aa}', '\u{1d1ad}'),
838    ('\u{1d242}', '\u{1d244}'),
839    ('\u{1da00}', '\u{1da36}'),
840    ('\u{1da3b}', '\u{1da6c}'),
841    ('\u{1da75}', '\u{1da75}'),
842    ('\u{1da84}', '\u{1da84}'),
843    ('\u{1da9b}', '\u{1da9f}'),
844    ('\u{1daa1}', '\u{1daaf}'),
845    ('\u{1e000}', '\u{1e006}'),
846    ('\u{1e008}', '\u{1e018}'),
847    ('\u{1e01b}', '\u{1e021}'),
848    ('\u{1e023}', '\u{1e024}'),
849    ('\u{1e026}', '\u{1e02a}'),
850    ('\u{1e130}', '\u{1e136}'),
851    ('\u{1e2ec}', '\u{1e2ef}'),
852    ('\u{1e8d0}', '\u{1e8d6}'),
853    ('\u{1e944}', '\u{1e94a}'),
854    ('🏻', '🏿'),
855    ('\u{e0020}', '\u{e007f}'),
856    ('\u{e0100}', '\u{e01ef}'),
857];
858
859pub const EXTENDNUMLET: &'static [(char, char)] = &[
860    ('_', '_'),
861    ('\u{202f}', '\u{202f}'),
862    ('‿', '⁀'),
863    ('⁔', '⁔'),
864    ('︳', '︴'),
865    ('﹍', '﹏'),
866    ('_', '_'),
867];
868
869pub const FORMAT: &'static [(char, char)] = &[
870    ('\u{ad}', '\u{ad}'),
871    ('\u{600}', '\u{605}'),
872    ('\u{61c}', '\u{61c}'),
873    ('\u{6dd}', '\u{6dd}'),
874    ('\u{70f}', '\u{70f}'),
875    ('\u{8e2}', '\u{8e2}'),
876    ('\u{180e}', '\u{180e}'),
877    ('\u{200e}', '\u{200f}'),
878    ('\u{202a}', '\u{202e}'),
879    ('\u{2060}', '\u{2064}'),
880    ('\u{2066}', '\u{206f}'),
881    ('\u{feff}', '\u{feff}'),
882    ('\u{fff9}', '\u{fffb}'),
883    ('\u{110bd}', '\u{110bd}'),
884    ('\u{110cd}', '\u{110cd}'),
885    ('\u{13430}', '\u{13438}'),
886    ('\u{1bca0}', '\u{1bca3}'),
887    ('\u{1d173}', '\u{1d17a}'),
888    ('\u{e0001}', '\u{e0001}'),
889];
890
891pub const HEBREW_LETTER: &'static [(char, char)] = &[
892    ('א', 'ת'),
893    ('ׯ', 'ײ'),
894    ('יִ', 'יִ'),
895    ('ײַ', 'ﬨ'),
896    ('שׁ', 'זּ'),
897    ('טּ', 'לּ'),
898    ('מּ', 'מּ'),
899    ('נּ', 'סּ'),
900    ('ףּ', 'פּ'),
901    ('צּ', 'ﭏ'),
902];
903
904pub const KATAKANA: &'static [(char, char)] = &[
905    ('〱', '〵'),
906    ('゛', '゜'),
907    ('゠', 'ヺ'),
908    ('ー', 'ヿ'),
909    ('ㇰ', 'ㇿ'),
910    ('㋐', '㋾'),
911    ('㌀', '㍗'),
912    ('ヲ', 'ン'),
913    ('𛀀', '𛀀'),
914    ('\u{1b164}', '\u{1b167}'),
915];
916
917pub const LF: &'static [(char, char)] = &[('\n', '\n')];
918
919pub const MIDLETTER: &'static [(char, char)] = &[
920    (':', ':'),
921    ('·', '·'),
922    ('·', '·'),
923    ('״', '״'),
924    ('‧', '‧'),
925    ('︓', '︓'),
926    ('﹕', '﹕'),
927    (':', ':'),
928];
929
930pub const MIDNUM: &'static [(char, char)] = &[
931    (',', ','),
932    (';', ';'),
933    (';', ';'),
934    ('։', '։'),
935    ('،', '؍'),
936    ('٬', '٬'),
937    ('߸', '߸'),
938    ('⁄', '⁄'),
939    ('︐', '︐'),
940    ('︔', '︔'),
941    ('﹐', '﹐'),
942    ('﹔', '﹔'),
943    (',', ','),
944    (';', ';'),
945];
946
947pub const MIDNUMLET: &'static [(char, char)] = &[
948    ('.', '.'),
949    ('‘', '’'),
950    ('․', '․'),
951    ('﹒', '﹒'),
952    (''', '''),
953    ('.', '.'),
954];
955
956pub const NEWLINE: &'static [(char, char)] =
957    &[('\u{b}', '\u{c}'), ('\u{85}', '\u{85}'), ('\u{2028}', '\u{2029}')];
958
959pub const NUMERIC: &'static [(char, char)] = &[
960    ('0', '9'),
961    ('٠', '٩'),
962    ('٫', '٫'),
963    ('۰', '۹'),
964    ('߀', '߉'),
965    ('०', '९'),
966    ('০', '৯'),
967    ('੦', '੯'),
968    ('૦', '૯'),
969    ('୦', '୯'),
970    ('௦', '௯'),
971    ('౦', '౯'),
972    ('೦', '೯'),
973    ('൦', '൯'),
974    ('෦', '෯'),
975    ('๐', '๙'),
976    ('໐', '໙'),
977    ('༠', '༩'),
978    ('၀', '၉'),
979    ('႐', '႙'),
980    ('០', '៩'),
981    ('᠐', '᠙'),
982    ('᥆', '᥏'),
983    ('᧐', '᧙'),
984    ('᪀', '᪉'),
985    ('᪐', '᪙'),
986    ('᭐', '᭙'),
987    ('᮰', '᮹'),
988    ('᱀', '᱉'),
989    ('᱐', '᱙'),
990    ('꘠', '꘩'),
991    ('꣐', '꣙'),
992    ('꤀', '꤉'),
993    ('꧐', '꧙'),
994    ('꧰', '꧹'),
995    ('꩐', '꩙'),
996    ('꯰', '꯹'),
997    ('0', '9'),
998    ('𐒠', '𐒩'),
999    ('𐴰', '𐴹'),
1000    ('𑁦', '𑁯'),
1001    ('𑃰', '𑃹'),
1002    ('𑄶', '𑄿'),
1003    ('𑇐', '𑇙'),
1004    ('𑋰', '𑋹'),
1005    ('𑑐', '𑑙'),
1006    ('𑓐', '𑓙'),
1007    ('𑙐', '𑙙'),
1008    ('𑛀', '𑛉'),
1009    ('𑜰', '𑜹'),
1010    ('𑣠', '𑣩'),
1011    ('𑱐', '𑱙'),
1012    ('𑵐', '𑵙'),
1013    ('𑶠', '𑶩'),
1014    ('𖩠', '𖩩'),
1015    ('𖭐', '𖭙'),
1016    ('𝟎', '𝟿'),
1017    ('\u{1e140}', '\u{1e149}'),
1018    ('\u{1e2f0}', '\u{1e2f9}'),
1019    ('𞥐', '𞥙'),
1020];
1021
1022pub const REGIONAL_INDICATOR: &'static [(char, char)] = &[('🇦', '🇿')];
1023
1024pub const SINGLE_QUOTE: &'static [(char, char)] = &[('\'', '\'')];
1025
1026pub const WSEGSPACE: &'static [(char, char)] = &[
1027    (' ', ' '),
1028    ('\u{1680}', '\u{1680}'),
1029    ('\u{2000}', '\u{2006}'),
1030    ('\u{2008}', '\u{200a}'),
1031    ('\u{205f}', '\u{205f}'),
1032    ('\u{3000}', '\u{3000}'),
1033];
1034
1035pub const ZWJ: &'static [(char, char)] = &[('\u{200d}', '\u{200d}')];