xref: /openbsd/gnu/usr.bin/perl/t/re/anyof.t (revision 73471bf0)
1#!./perl
2
3use strict;
4use warnings;
5use utf8;
6
7# This tests that the ANYOF nodes generated by bracketed character classes are
8# as expected.  The representation of these is not guaranteed, and this test
9# may need to be updated if it changes.  But it is here to make sure that no
10# unexpected changes occur.  These could come from faulty generation of the
11# node, or faulty display of them (or both).  Because these causes come from
12# very different parts of the regex compiler, it is unlikely that a commit
13# would change both of them, so this test will adequately serve to test both.
14
# Compile-time setup for this test file:
#   * run from the 't' directory when one exists below the current directory;
#   * load the shared helpers from ./test.pl (this is where set_up_inc() and
#     skip_all() come from);
#   * hand the library directories to set_up_inc();
#   * load Config and call its import method;
#   * skip every test, with the reason 'no re module', when
#     DynaLoader::boot_DynaLoader is not defined.
BEGIN {
    chdir 't' if -d 't';
    require './test.pl';
    set_up_inc('../lib','.','../ext/re');
    require Config;
    Config->import;     # direct method call rather than indirect-object syntax
    skip_all('no re module') unless defined &DynaLoader::boot_DynaLoader;
}
22
23# An array is used instead of a hash, so that the tests are carried out in the
24# order given by this file.  Even-numbered indices are the regexes to compile.
25# The next higher element is the expected compilation result.
26#
# It is painful to port some of these to EBCDIC, as not only do the code point
# numbers change (for those < 256), but the order changes, as the compiled
# version is sorted by native code point order.  On EBCDIC, \r comes before
# \n, and 'k' before 'K', for example.  So, the tests where there are
# differences are skipped on EBCDIC.  They are all at the beginning of the
# array, and a special marker entry is used to delimit the boundary between
# skipped and not skipped.
34#
35# NOTE:  If the pattern contains (?8) it will be upgraded to UTF-8 after
36#        stripping that
37
38use Unicode::UCD;
# $Unicode::UCD::MAX_CP and its upper-case hexadecimal spelling.  The hex
# string is what gets substituted for the {HIGHEST_CP} placeholder in the
# test patterns and mapped back to 'HIGHEST_CP' in the compiled output.
my $highest_cp = $Unicode::UCD::MAX_CP;
my $highest_cp_string = sprintf "%X", $highest_cp;

# Same hex string, but with a leading '7' (if any) turned into 'F'.  It stands
# in for the {INFTY} placeholder / 'INFTY' output in the same way.
my $infinity = $highest_cp_string;
$infinity =~ s/^7/F/;  # Make infinity larger than the largest legal one, and
                       # at the time of this writing, we really internally
                       # allow UV_MAX to be infinity.
47
# get_compiled($pattern)
#
# Compile $pattern in a fresh perl running under 'use re qw(Debug COMPILE)'
# and return the text of the first node of the compiled program, expressed
# with platform-independent names.
#
# Before compiling:
#   * every '{INFTY}' and '{HIGHEST_CP}' in $pattern is replaced by a \x{...}
#     escape built from $infinity and $highest_cp_string respectively;
#   * the first '(?8)' marker is stripped and, if one was present, the child
#     program calls utf8::upgrade() on the pattern string before qr// sees it.
#
# After compiling, the line that follows the one containing "Final program"
# in the child's output is taken; its parenthesized number and its leading
# "N:" node number are removed; and occurrences of the $infinity and
# $highest_cp_string hex strings (in any case) become 'INFTY' and
# 'HIGHEST_CP'.
#
# Returns:
#   * that cleaned-up string;
#   * undef when there is no line after "Final program" in the output;
#   * nothing (bare return) when $? is non-zero after the child ran.  In that
#     case fail() is called and the child is run again with
#     { stderr => 0, verbose => 1 }.
#
# The global $_ is left untouched; all work is done on lexicals.
sub  get_compiled ($) {
    my $pattern = shift;

    # Convert platform-independent values to what is suitable for the
    # platform
    $pattern =~ s/\{INFTY\}/\\x{$infinity}/g;
    $pattern =~ s/\{HIGHEST_CP\}/\\x{$highest_cp_string}/g;
    my $use_utf8 = ($pattern =~ s/\Q(?8)//);

    # Build the program text that the child perl will run.
    $pattern = "my \$a = '$pattern';";
    $pattern .= "utf8::upgrade(\$a);" if $use_utf8;
    $pattern .= "qr/\$a/";
    my $actual_pattern = "use re qw(Debug COMPILE); $pattern";

    my $result = fresh_perl($actual_pattern);
    if ($? != 0) {  # Re-run so as to display STDERR.
        fail($pattern, "Until this is fixed, the planned number of tests will be wrong");
        fresh_perl($actual_pattern, { stderr => 0, verbose => 1 });
        return;
    }

    # The Debug output will come back as a bunch of lines.  We are
    # interested only in the line after /Final program/
    my @lines = split /\n/, $result;
    while (defined(my $skipped = shift @lines)) {
        last if $skipped =~ /Final program/;
    }

    my $node = shift @lines;

    # Nothing followed "Final program" (or it never appeared): hand back
    # undef without running the substitutions below on an undefined value.
    return $node unless defined $node;

    $node =~ s/ \s* \( \d+ \) \s* //x;   # Get rid of the node branch
    $node =~ s/ ^ \s* \d+ : \s* //x;     # ... And the node number

    # Use platform-independent values
    $node =~ s/\Q$infinity\E/INFTY/ig;
    $node =~ s/\Q$highest_cp_string\E/HIGHEST_CP/ig;

    return $node;
}
88
89# Note: EXACTish lowercases the hex; ANYOF uppercases, without braces
90
91my @tests = (
92    '[\xe0\xc0]' => 'EXACTFU <\\x{e0}>',
93    '[\xe1\xc1]' => 'EXACTFU <\\x{e1}>',
94    '[\xe2\xc2]' => 'EXACTFU <\\x{e2}>',
95    '[\xe3\xc3]' => 'EXACTFU <\\x{e3}>',
96    '[\xe4\xc4]' => 'EXACTFU <\\x{e4}>',
97    '[\xc5\xe5]' => 'ANYOF[\\xC5\\xE5]',
98    '[\xe6\xc6]' => 'EXACTFU <\\x{e6}>',
99    '[\xe7\xc7]' => 'EXACTFU <\\x{e7}>',
100    '[\xe8\xc8]' => 'EXACTFU <\\x{e8}>',
101    '[\xe9\xc9]' => 'EXACTFU <\\x{e9}>',
102    '[\xea\xca]' => 'EXACTFU <\\x{ea}>',
103    '[\xeb\xcb]' => 'EXACTFU <\\x{eb}>',
104    '[\xec\xcc]' => 'EXACTFU <\\x{ec}>',
105    '[\xee\xce]' => 'EXACTFU <\\x{ee}>',
106    '[\xef\xcf]' => 'EXACTFU <\\x{ef}>',
107    '[\xf0\xd0]' => 'EXACTFU <\\x{f0}>',
108    '[\xf1\xd1]' => 'EXACTFU <\\x{f1}>',
109    '[\xf2\xd2]' => 'EXACTFU <\\x{f2}>',
110    '[\xf3\xd3]' => 'EXACTFU <\\x{f3}>',
111    '[\xf4\xd4]' => 'EXACTFU <\\x{f4}>',
112    '[\xf5\xd5]' => 'EXACTFU <\\x{f5}>',
113    '[\xf6\xd6]' => 'EXACTFU <\\x{f6}>',
114    '[\xf8\xd8]' => 'EXACTFU <\\x{f8}>',
115    '[\xf9\xd9]' => 'EXACTFU <\\x{f9}>',
116    '[\xfa\xda]' => 'EXACTFU <\\x{fa}>',
117    '[\xfb\xdb]' => 'EXACTFU <\\x{fb}>',
118    '[\xfc\xdc]' => 'EXACTFU <\\x{fc}>',
119    '[\xfd\xdd]' => 'EXACTFU <\\x{fd}>',
120    '[\xfe\xde]' => 'EXACTFU <\\x{fe}>',
121
122    '[[{]' => 'ANYOFM[\[\{]',
123    '[^\S ]' => 'ANYOFD[\t\n\x0B\f\r{utf8}\x85\xA0][1680 2000-200A 2028-2029 202F 205F 3000]',
124    '[^\n\r]' => 'ANYOF[^\n\r][0100-INFTY]',
125    '[^\/\|,\$\%%\@\ \%"\<\>\:\#\&\*\{\}\[\]\(\)]' => 'ANYOF[^ "#$%&()*,/:<>@\[\]\{|\}][0100-INFTY]',
126    '[[:ascii:]]' => 'ANYOFM[\x00-\x7F]',
127    '[[:^ascii:]]' => 'NANYOFM[\x00-\x7F]',
128    '[[:^ascii:]\x{2C2}]' => 'NANYOFM[\x00-\x7F]',
129    '(?u)[[:ascii:]]' => 'ANYOFM[\x00-\x7F]',
130    '(?u)[[:^ascii:]]' => 'NANYOFM[\x00-\x7F]',
131    '(?a)[[:ascii:]]' => 'ANYOFM[\x00-\x7F]',
132    '(?a)[[:^ascii:]]' => 'NANYOFM[\x00-\x7F]',
133    '(?a)[[:^ascii:]\x{2C2}]' => 'NANYOFM[\x00-\x7F]',
134    '[[:cntrl:]]' => 'POSIXD[:cntrl:]',
135    '[^[:^print:][:^ascii:]]' => 'POSIXA[:print:]',
136    '[[:blank:]]' => 'POSIXD[:blank:]',
137    '[ [:blank:]]' => 'POSIXD[:blank:]',
138    '[_[:blank:]]' => 'ANYOFD[\t _{utf8}\xA0][1680 2000-200A 202F 205F 3000]',
139    '[_[:^blank:]]' => 'NPOSIXD[:blank:]',
140    '[\xA0[:^blank:]]' => 'ANYOF[^\t ][0100-167F 1681-1FFF 200B-202E 2030-205E 2060-2FFF 3001-INFTY]',
141    '(?d:[_[:^blank:]])' => 'NPOSIXD[:blank:]',
142    '[\x{07}-\x{0B}]' => 'ANYOFR[\a\b\t\n\x0B]',
143    '(?l)[\x{2029}]' => 'EXACTL <\x{2029}>',
144    '(?l)(?[\x{2029}])' => 'ANYOFL{utf8-locale-reqd}[2029]', # regex sets requires utf8 locale for /l
145    '(?il)[\x{212A}]' => 'EXACTFL <\\x{212a}>',
146    '(?il)(?[\x{212A}])' => 'ANYOFL{utf8-locale-reqd}[Kk][212A]',
147
148    '(?i)b[s]\xe0' => 'ANYOFM[Bb]',    # The s goes into a 2nd node
149
150    '[aA]' => 'ANYOFM[Aa]',
151    '[bB]' => 'ANYOFM[Bb]',
152    '[kK]' => 'ANYOFM[Kk]',
153
154    'ebcdic_ok_below_this_marker',
155
156    '(?i:[^:])' => 'NANYOFM[:]',
157
158    '[^\n]' => 'REG_ANY',
159
160    '[[:alpha:]]' => 'POSIXD[:alpha:]',
161    '[[:^alpha:]]' => 'NPOSIXD[:alpha:]',
162    '[[:^alpha:]\x{2C2}]' => 'NPOSIXU[:alpha:]',
163    '(?l)[[:alpha:]]' => 'POSIXL[:alpha:]',
164    '(?l)[[:^alpha:]]' => 'NPOSIXL[:alpha:]',
165    '(?l)[[:^alpha:]\x{2C2}]' => 'NPOSIXL[:alpha:]',
166    '(?u)[[:alpha:]]' => 'POSIXU[:alpha:]',
167    '(?u)[[:^alpha:]]' => 'NPOSIXU[:alpha:]',
168    '(?a)[[:alpha:]]' => 'POSIXA[:alpha:]',
169    '(?a)[[:^alpha:]]' => 'NPOSIXA[:alpha:]',
170    '(?a)[[:^alpha:]\x{2C2}]' => 'NPOSIXA[:alpha:]',
171    '[[:alpha:][:^alpha:]]' => 'SANY',
172    '[^[:alpha:][:^alpha:]]' => 'OPFAIL',
173    '(?l)[[:alpha:][:^alpha:]]' => 'SANY',
174    '(?l)[^[:alpha:][:^alpha:]]' => 'OPFAIL',
175    '(?u)[[:alpha:][:^alpha:]]' => 'SANY',
176    '(?u)[^[:alpha:][:^alpha:]]' => 'OPFAIL',
177    '(?a)[[:alpha:][:^alpha:]]' => 'SANY',
178    '(?a)[^[:alpha:][:^alpha:]]' => 'OPFAIL',
179    '[[:alnum:]]' => 'POSIXD[:alnum:]',
180    '[[:^alnum:]]' => 'NPOSIXD[:alnum:]',
181    '[[:^alnum:]\x{2C2}]' => 'NPOSIXU[:alnum:]',
182    '(?l)[[:alnum:]]' => 'POSIXL[:alnum:]',
183    '(?l)[[:^alnum:]]' => 'NPOSIXL[:alnum:]',
184    '(?l)[[:^alnum:]\x{2C2}]' => 'NPOSIXL[:alnum:]',
185    '(?u)[[:alnum:]]' => 'POSIXU[:alnum:]',
186    '(?u)[[:^alnum:]]' => 'NPOSIXU[:alnum:]',
187    '(?a)[[:alnum:]]' => 'POSIXA[:alnum:]',
188    '(?a)[[:^alnum:]]' => 'NPOSIXA[:alnum:]',
189    '(?a)[[:^alnum:]\x{2C2}]' => 'NPOSIXA[:alnum:]',
190    '[[:alnum:][:^alnum:]]' => 'SANY',
191    '[^[:alnum:][:^alnum:]]' => 'OPFAIL',
192    '(?l)[[:alnum:][:^alnum:]]' => 'SANY',
193    '(?l)[^[:alnum:][:^alnum:]]' => 'OPFAIL',
194    '(?u)[[:alnum:][:^alnum:]]' => 'SANY',
195    '(?u)[^[:alnum:][:^alnum:]]' => 'OPFAIL',
196    '(?a)[[:alnum:][:^alnum:]]' => 'SANY',
197    '(?a)[^[:alnum:][:^alnum:]]' => 'OPFAIL',
198    '(?l)[[:ascii:]]' => 'POSIXL[:ascii:]',
199    '(?l)[[:^ascii:]]' => 'NPOSIXL[:ascii:]',
200    '(?l)[[:^ascii:]\x{2C2}]' => 'NPOSIXL[:ascii:]',
201    '[[:ascii:][:^ascii:]]' => 'SANY',
202    '[^[:ascii:][:^ascii:]]' => 'OPFAIL',
203    '(?l)[[:ascii:][:^ascii:]]' => 'SANY',
204    '(?l)[^[:ascii:][:^ascii:]]' => 'OPFAIL',
205    '(?u)[[:ascii:][:^ascii:]]' => 'SANY',
206    '(?u)[^[:ascii:][:^ascii:]]' => 'OPFAIL',
207    '(?a)[[:ascii:][:^ascii:]]' => 'SANY',
208    '(?a)[^[:ascii:][:^ascii:]]' => 'OPFAIL',
209    '[[:^blank:]]' => 'NPOSIXD[:blank:]',
210    '[[:^blank:]\x{2C2}]' => 'NPOSIXU[:blank:]',
211    '(?l)[[:blank:]]' => 'POSIXL[:blank:]',
212    '(?l)[[:^blank:]]' => 'NPOSIXL[:blank:]',
213    '(?l)[[:^blank:]\x{2C2}]' => 'NPOSIXL[:blank:]',
214    '(?u)[[:blank:]]' => 'POSIXU[:blank:]',
215    '(?u)[[:^blank:]]' => 'NPOSIXU[:blank:]',
216    '(?a)[[:blank:]]' => 'POSIXA[:blank:]',
217    '(?a)[[:^blank:]]' => 'NPOSIXA[:blank:]',
218    '(?a)[[:^blank:]\x{2C2}]' => 'NPOSIXA[:blank:]',
219    '[[:blank:]]' => 'POSIXD[:blank:]',
220    '[[:blank:][:^blank:]]' => 'SANY',
221    '[^[:blank:][:^blank:]]' => 'OPFAIL',
222    '(?l)[[:blank:][:^blank:]]' => 'SANY',
223    '(?l)[^[:blank:][:^blank:]]' => 'OPFAIL',
224    '(?u)[[:blank:][:^blank:]]' => 'SANY',
225    '(?u)[^[:blank:][:^blank:]]' => 'OPFAIL',
226    '(?a)[[:blank:][:^blank:]]' => 'SANY',
227    '(?a)[^[:blank:][:^blank:]]' => 'OPFAIL',
228    '[[:^cntrl:]]' => 'NPOSIXD[:cntrl:]',
229    '[[:^cntrl:]\x{2C2}]' => 'NPOSIXU[:cntrl:]',
230    '(?l)[[:cntrl:]]' => 'POSIXL[:cntrl:]',
231    '(?l)[[:^cntrl:]]' => 'NPOSIXL[:cntrl:]',
232    '(?l)[[:^cntrl:]\x{2C2}]' => 'NPOSIXL[:cntrl:]',
233    '(?u)[[:cntrl:]]' => 'POSIXU[:cntrl:]',
234    '(?u)[[:^cntrl:]]' => 'NPOSIXU[:cntrl:]',
235    '(?a)[[:cntrl:]]' => 'POSIXA[:cntrl:]',
236    '(?a)[[:^cntrl:]]' => 'NPOSIXA[:cntrl:]',
237    '(?a)[[:^cntrl:]\x{2C2}]' => 'NPOSIXA[:cntrl:]',
238    '[[:cntrl:][:^cntrl:]]' => 'SANY',
239    '[^[:cntrl:][:^cntrl:]]' => 'OPFAIL',
240    '(?l)[[:cntrl:][:^cntrl:]]' => 'SANY',
241    '(?l)[^[:cntrl:][:^cntrl:]]' => 'OPFAIL',
242    '(?u)[[:cntrl:][:^cntrl:]]' => 'SANY',
243    '(?u)[^[:cntrl:][:^cntrl:]]' => 'OPFAIL',
244    '(?a)[[:cntrl:][:^cntrl:]]' => 'SANY',
245    '(?a)[^[:cntrl:][:^cntrl:]]' => 'OPFAIL',
246    '[[:digit:]]' => 'POSIXU[\d]',
247    '[[:^digit:]]' => 'NPOSIXU[\d]',
248    '[[:^digit:]\x{2C2}]' => 'NPOSIXU[\d]',
249    '(?l)[[:digit:]]' => 'POSIXL[\d]',
250    '(?l)[[:^digit:]]' => 'NPOSIXL[\d]',
251    '(?l)[[:^digit:]\x{2C2}]' => 'NPOSIXL[\d]',
252    '(?u)[[:digit:]]' => 'POSIXU[\d]',
253    '(?u)[[:^digit:]]' => 'NPOSIXU[\d]',
254    '(?a)[[:digit:]]' => 'POSIXA[\d]',
255    '(?a)[[:^digit:]]' => 'NPOSIXA[\d]',
256    '(?a)[[:^digit:]\x{2C2}]' => 'NPOSIXA[\d]',
257    '[[:digit:][:^digit:]]' => 'SANY',
258    '[^[:digit:][:^digit:]]' => 'OPFAIL',
259    '(?l)[[:digit:][:^digit:]]' => 'SANY',
260    '(?l)[^[:digit:][:^digit:]]' => 'OPFAIL',
261    '(?u)[[:digit:][:^digit:]]' => 'SANY',
262    '(?u)[^[:digit:][:^digit:]]' => 'OPFAIL',
263    '(?a)[[:digit:][:^digit:]]' => 'SANY',
264    '(?a)[^[:digit:][:^digit:]]' => 'OPFAIL',
265    '[[:graph:]]' => 'POSIXD[:graph:]',
266    '[[:^graph:]]' => 'NPOSIXD[:graph:]',
267    '[[:^graph:]\x{FFFF}]' => 'NPOSIXU[:graph:]',
268    '(?l)[[:graph:]]' => 'POSIXL[:graph:]',
269    '(?l)[[:^graph:]]' => 'NPOSIXL[:graph:]',
270    '(?l)[[:^graph:]\x{FFFF}]' => 'NPOSIXL[:graph:]',
271    '(?u)[[:graph:]]' => 'POSIXU[:graph:]',
272    '(?u)[[:^graph:]]' => 'NPOSIXU[:graph:]',
273    '(?a)[[:graph:]]' => 'POSIXA[:graph:]',
274    '(?a)[[:^graph:]]' => 'NPOSIXA[:graph:]',
275    '(?a)[[:^graph:]\x{FFFF}]' => 'NPOSIXA[:graph:]',
276    '[[:graph:][:^graph:]]' => 'SANY',
277    '[^[:graph:][:^graph:]]' => 'OPFAIL',
278    '(?l)[[:graph:][:^graph:]]' => 'SANY',
279    '(?l)[^[:graph:][:^graph:]]' => 'OPFAIL',
280    '(?u)[[:graph:][:^graph:]]' => 'SANY',
281    '(?u)[^[:graph:][:^graph:]]' => 'OPFAIL',
282    '(?a)[[:graph:][:^graph:]]' => 'SANY',
283    '(?a)[^[:graph:][:^graph:]]' => 'OPFAIL',
284    '[[:lower:]]' => 'POSIXD[:lower:]',
285    '[[:^lower:]]' => 'NPOSIXD[:lower:]',
286    '[[:^lower:]\x{2C2}]' => 'NPOSIXU[:lower:]',
287    '(?l)[[:lower:]]' => 'POSIXL[:lower:]',
288    '(?l)[[:^lower:]]' => 'NPOSIXL[:lower:]',
289    '(?l)[[:^lower:]\x{2C2}]' => 'NPOSIXL[:lower:]',
290    '(?u)[[:lower:]]' => 'POSIXU[:lower:]',
291    '(?u)[[:^lower:]]' => 'NPOSIXU[:lower:]',
292    '(?a)[[:lower:]]' => 'POSIXA[:lower:]',
293    '(?a)[[:^lower:]]' => 'NPOSIXA[:lower:]',
294    '(?a)[[:^lower:]\x{2C2}]' => 'NPOSIXA[:lower:]',
295    '[[:lower:][:^lower:]]' => 'SANY',
296    '[^[:lower:][:^lower:]]' => 'OPFAIL',
297    '(?l)[[:lower:][:^lower:]]' => 'SANY',
298    '(?l)[^[:lower:][:^lower:]]' => 'OPFAIL',
299    '(?u)[[:lower:][:^lower:]]' => 'SANY',
300    '(?u)[^[:lower:][:^lower:]]' => 'OPFAIL',
301    '(?a)[[:lower:][:^lower:]]' => 'SANY',
302    '(?a)[^[:lower:][:^lower:]]' => 'OPFAIL',
303    '[[:print:]]' => 'POSIXD[:print:]',
304    '[[:^print:]]' => 'NPOSIXD[:print:]',
305    '[[:^print:]\x{FFFF}]' => 'NPOSIXU[:print:]',
306    '(?l)[[:print:]]' => 'POSIXL[:print:]',
307    '(?l)[[:^print:]]' => 'NPOSIXL[:print:]',
308    '(?l)[[:^print:]\x{FFFF}]' => 'NPOSIXL[:print:]',
309    '(?u)[[:print:]]' => 'POSIXU[:print:]',
310    '(?u)[[:^print:]]' => 'NPOSIXU[:print:]',
311    '(?a)[[:print:]]' => 'POSIXA[:print:]',
312    '(?a)[[:^print:]]' => 'NPOSIXA[:print:]',
313    '(?a)[[:^print:]\x{FFFF}]' => 'NPOSIXA[:print:]',
314    '[[:print:][:^print:]]' => 'SANY',
315    '[^[:print:][:^print:]]' => 'OPFAIL',
316    '(?l)[[:print:][:^print:]]' => 'SANY',
317    '(?l)[^[:print:][:^print:]]' => 'OPFAIL',
318    '(?u)[[:print:][:^print:]]' => 'SANY',
319    '(?u)[^[:print:][:^print:]]' => 'OPFAIL',
320    '(?a)[[:print:][:^print:]]' => 'SANY',
321    '(?a)[^[:print:][:^print:]]' => 'OPFAIL',
322    '[[:punct:]]' => 'POSIXD[:punct:]',
323    '[[:^punct:]]' => 'NPOSIXD[:punct:]',
324    '[[:^punct:]\x{2C2}]' => 'NPOSIXU[:punct:]',
325    '(?l)[[:punct:]]' => 'POSIXL[:punct:]',
326    '(?l)[[:^punct:]]' => 'NPOSIXL[:punct:]',
327    '(?l)[[:^punct:]\x{2C2}]' => 'NPOSIXL[:punct:]',
328    '(?u)[[:punct:]]' => 'POSIXU[:punct:]',
329    '(?u)[[:^punct:]]' => 'NPOSIXU[:punct:]',
330    '(?a)[[:punct:]]' => 'POSIXA[:punct:]',
331    '(?a)[[:^punct:]]' => 'NPOSIXA[:punct:]',
332    '(?a)[[:^punct:]\x{2C2}]' => 'NPOSIXA[:punct:]',
333    '[[:punct:][:^punct:]]' => 'SANY',
334    '[^[:punct:][:^punct:]]' => 'OPFAIL',
335    '(?l)[[:punct:][:^punct:]]' => 'SANY',
336    '(?l)[^[:punct:][:^punct:]]' => 'OPFAIL',
337    '(?u)[[:punct:][:^punct:]]' => 'SANY',
338    '(?u)[^[:punct:][:^punct:]]' => 'OPFAIL',
339    '(?a)[[:punct:][:^punct:]]' => 'SANY',
340    '(?a)[^[:punct:][:^punct:]]' => 'OPFAIL',
341    '[[:space:]]' => 'POSIXD[\s]',
342    '[[:^space:]]' => 'NPOSIXD[\s]',
343    '[[:^space:]\x{2C2}]' => 'NPOSIXU[\s]',
344    '(?l)[[:space:]]' => 'POSIXL[\s]',
345    '(?l)[[:^space:]]' => 'NPOSIXL[\s]',
346    '(?l)[[:^space:]\x{2C2}]' => 'NPOSIXL[\s]',
347    '(?u)[[:space:]]' => 'POSIXU[\s]',
348    '(?u)[[:^space:]]' => 'NPOSIXU[\s]',
349    '(?a)[[:space:]]' => 'POSIXA[\s]',
350    '(?a)[[:^space:]]' => 'NPOSIXA[\s]',
351    '(?a)[[:^space:]\x{2C2}]' => 'NPOSIXA[\s]',
352    '[[:space:][:^space:]]' => 'SANY',
353    '[^[:space:][:^space:]]' => 'OPFAIL',
354    '(?l)[[:space:][:^space:]]' => 'SANY',
355    '(?l)[^[:space:][:^space:]]' => 'OPFAIL',
356    '(?u)[[:space:][:^space:]]' => 'SANY',
357    '(?u)[^[:space:][:^space:]]' => 'OPFAIL',
358    '(?a)[[:space:][:^space:]]' => 'SANY',
359    '(?a)[^[:space:][:^space:]]' => 'OPFAIL',
360    '[[:upper:]]' => 'POSIXD[:upper:]',
361    '[[:^upper:]]' => 'NPOSIXD[:upper:]',
362    '[[:^upper:]\x{2C2}]' => 'NPOSIXU[:upper:]',
363    '(?l)[[:upper:]]' => 'POSIXL[:upper:]',
364    '(?l)[[:^upper:]]' => 'NPOSIXL[:upper:]',
365    '(?l)[[:^upper:]\x{2C2}]' => 'NPOSIXL[:upper:]',
366    '(?u)[[:upper:]]' => 'POSIXU[:upper:]',
367    '(?u)[[:^upper:]]' => 'NPOSIXU[:upper:]',
368    '(?a)[[:upper:]]' => 'POSIXA[:upper:]',
369    '(?a)[[:^upper:]]' => 'NPOSIXA[:upper:]',
370    '(?a)[[:^upper:]\x{2C2}]' => 'NPOSIXA[:upper:]',
371    '[[:upper:][:^upper:]]' => 'SANY',
372    '[^[:upper:][:^upper:]]' => 'OPFAIL',
373    '(?l)[[:upper:][:^upper:]]' => 'SANY',
374    '(?l)[^[:upper:][:^upper:]]' => 'OPFAIL',
375    '(?u)[[:upper:][:^upper:]]' => 'SANY',
376    '(?u)[^[:upper:][:^upper:]]' => 'OPFAIL',
377    '(?a)[[:upper:][:^upper:]]' => 'SANY',
378    '(?a)[^[:upper:][:^upper:]]' => 'OPFAIL',
379    '[\v]' => 'POSIXU[\v]',
380    '[^\v]' => 'NPOSIXU[\v]',
381    '[\V\x{2C2}]' => 'NPOSIXU[\v]',
382    '(?l)[\v]' => 'POSIXU[\v]',
383    '(?l)[^\v]' => 'NPOSIXU[\v]',
384    '(?l)[\V\x{2C2}]' => 'NPOSIXU[\v]',
385    '(?u)[\v]' => 'POSIXU[\v]',
386    '(?u)[^\v]' => 'NPOSIXU[\v]',
387    '(?a)[\v]' => 'POSIXU[\v]',
388    '(?a)[^\v]' => 'NPOSIXU[\v]',
389    '(?a)[\V\x{2C2}]' => 'NPOSIXU[\v]',
390    '[\v\V]' => 'SANY',
391    '[^\v\V]' => 'OPFAIL',
392    '(?l)[\v\V]' => 'SANY',
393    '(?l)[^\v\V]' => 'OPFAIL',
394    '(?u)[\v\V]' => 'SANY',
395    '(?u)[^\v\V]' => 'OPFAIL',
396    '(?a)[\v\V]' => 'SANY',
397    '(?a)[^\v\V]' => 'OPFAIL',
398    '[[:word:]]' => 'POSIXD[\w]',
399    '[[:^word:]]' => 'NPOSIXD[\w]',
400    '[[:^word:]\x{2C2}]' => 'NPOSIXU[\w]',
401    '(?l)[[:word:]]' => 'POSIXL[\w]',
402    '(?l)[[:^word:]]' => 'NPOSIXL[\w]',
403    '(?l)[[:^word:]\x{2C2}]' => 'NPOSIXL[\w]',
404    '(?u)[[:word:]]' => 'POSIXU[\w]',
405    '(?u)[[:^word:]]' => 'NPOSIXU[\w]',
406    '(?a)[[:word:]]' => 'POSIXA[\w]',
407    '(?a)[[:^word:]]' => 'NPOSIXA[\w]',
408    '(?a)[[:^word:]\x{2C2}]' => 'NPOSIXA[\w]',
409    '[[:word:][:^word:]]' => 'SANY',
410    '[^[:word:][:^word:]]' => 'OPFAIL',
411    '(?l)[[:word:][:^word:]]' => 'SANY',
412    '(?l)[^[:word:][:^word:]]' => 'OPFAIL',
413    '(?u)[[:word:][:^word:]]' => 'SANY',
414    '(?u)[^[:word:][:^word:]]' => 'OPFAIL',
415    '(?a)[[:word:][:^word:]]' => 'SANY',
416    '(?a)[^[:word:][:^word:]]' => 'OPFAIL',
417    '[[:xdigit:]]' => 'POSIXU[:xdigit:]',
418    '[[:^xdigit:]]' => 'NPOSIXU[:xdigit:]',
419    '[[:^xdigit:]\x{2C2}]' => 'NPOSIXU[:xdigit:]',
420    '(?l)[[:xdigit:]]' => 'POSIXL[:xdigit:]',
421    '(?l)[[:^xdigit:]]' => 'NPOSIXL[:xdigit:]',
422    '(?l)[[:^xdigit:]\x{2C2}]' => 'NPOSIXL[:xdigit:]',
423    '(?u)[[:xdigit:]]' => 'POSIXU[:xdigit:]',
424    '(?u)[[:^xdigit:]]' => 'NPOSIXU[:xdigit:]',
425    '(?a)[[:xdigit:]]' => 'POSIXA[:xdigit:]',
426    '(?a)[[:^xdigit:]]' => 'NPOSIXA[:xdigit:]',
427    '(?a)[[:^xdigit:]\x{2C2}]' => 'NPOSIXA[:xdigit:]',
428    '[[:xdigit:][:^xdigit:]]' => 'SANY',
429    '[^[:xdigit:][:^xdigit:]]' => 'OPFAIL',
430    '(?l)[[:xdigit:][:^xdigit:]]' => 'SANY',
431    '(?l)[^[:xdigit:][:^xdigit:]]' => 'OPFAIL',
432    '(?u)[[:xdigit:][:^xdigit:]]' => 'SANY',
433    '(?u)[^[:xdigit:][:^xdigit:]]' => 'OPFAIL',
434    '(?a)[[:xdigit:][:^xdigit:]]' => 'SANY',
435    '(?a)[^[:xdigit:][:^xdigit:]]' => 'OPFAIL',
436    '(?i)[[:lower:]]' => 'POSIXD[:cased:]',
437    '(?i)[[:^lower:]]' => 'NPOSIXD[:cased:]',
438    '(?i)[[:^lower:]\x{2C2}]' => 'NPOSIXU[:cased:]',
439    '(?i)(?l)[[:lower:]]' => 'POSIXL[:cased:]',
440    '(?i)(?l)[[:^lower:]]' => 'NPOSIXL[:cased:]',
441    '(?i)(?l)[[:^lower:]\x{2C2}]' => 'NPOSIXL[:cased:]',
442    '(?i)(?u)[[:lower:]]' => 'POSIXU[:cased:]',
443    '(?i)(?u)[[:^lower:]]' => 'NPOSIXU[:cased:]',
444    '(?i)(?a)[[:lower:]]' => 'POSIXA[:alpha:]',
445    '(?i)(?a)[[:^lower:]]' => 'NPOSIXA[:alpha:]',
446    '(?i)(?a)[[:^lower:]\x{2C2}]' => 'NPOSIXA[:alpha:]',
447    '(?i)[[:upper:]]' => 'POSIXD[:cased:]',
448    '(?i)[[:^upper:]]' => 'NPOSIXD[:cased:]',
449    '(?i)[[:^upper:]\x{2C2}]' => 'NPOSIXU[:cased:]',
450    '(?i)(?l)[[:upper:]]' => 'POSIXL[:cased:]',
451    '(?i)(?l)[[:^upper:]]' => 'NPOSIXL[:cased:]',
452    '(?i)(?l)[[:^upper:]\x{2C2}]' => 'NPOSIXL[:cased:]',
453    '(?i)(?u)[[:upper:]]' => 'POSIXU[:cased:]',
454    '(?i)(?u)[[:^upper:]]' => 'NPOSIXU[:cased:]',
455    '(?i)(?a)[[:upper:]]' => 'POSIXA[:alpha:]',
456    '(?i)(?a)[[:^upper:]]' => 'NPOSIXA[:alpha:]',
457    '(?i)(?a)[[:^upper:]\x{2C2}]' => 'NPOSIXA[:alpha:]',
458    '(?i)[\d\w]' => 'POSIXD[\w]',
459    '(?i)[\D\w]' => 'SANY',
460    #'(?i)(?l)[\d\w]' => varies depending on Unicode release
461    '(?i)(?l)[\D\w]' => 'ANYOFPOSIXL{i}[\\w\\D][0100-INFTY]',
462    '(?i)(?u)[\d\w]' => 'POSIXU[\w]',
463    '(?i)(?u)[\D\w]' => 'SANY',
464    '(?i)(?a)[\d\w]' => 'POSIXA[\w]',
465    '(?i)(?a)[\D\w]' => 'SANY',
466    '(?l:[\x{212A}])' => 'EXACTL <\x{212a}>',
467    '(?l:[\s\x{212A}])' => 'ANYOFPOSIXL[\s][1680 2000-200A 2028-2029 202F 205F 212A 3000]',
468    '(?l:[^\S\x{202F}])' => 'ANYOFPOSIXL[^\\S][1680 2000-200A 2028-2029 205F 3000]',
469    '(?li:[a-z])' => (($::IS_ASCII)
470                     ? 'ANYOFL{i}[a-z{utf8 locale}\x{017F}\x{212A}]'
471                     : 'ANYOFL{i}[a-ij-rs-z{utf8 locale}\x{017F}\x{212A}]'),
472    '\p{All}' => 'SANY',
473    '\P{All}' => 'OPFAIL',
474    '[\p{Any}]' => 'ANYOF[\x00-\xFF][0100-10FFFF]',
475
476    '[\p{IsMyRuntimeProperty}]' => 'ANYOF[+main::IsMyRuntimeProperty]',
477    '[^\p{IsMyRuntimeProperty}]' => 'ANYOF[^{+main::IsMyRuntimeProperty}]',
478    '[a\p{IsMyRuntimeProperty}]' => 'ANYOF[a][+main::IsMyRuntimeProperty]',
479    '[^a\p{IsMyRuntimeProperty}]' => 'ANYOF[^a{+main::IsMyRuntimeProperty}]',
480    '[^a\x{100}\p{IsMyRuntimeProperty}]' => 'ANYOF[^a{+main::IsMyRuntimeProperty}0100]',
481    '[^\p{All}\p{IsMyRuntimeProperty}]' => 'OPFAIL',
482    '[\p{All}\p{IsMyRuntimeProperty}]' => 'SANY',
483
484    '[\x{00}-{HIGHEST_CP}]' => 'ANYOF[\x00-\xFF][0100-HIGHEST_CP]',
485    '[\x{00}-{INFTY}]' => 'SANY',
486    '[\x{101}-{INFTY}]' => 'ANYOFH[0101-INFTY]',
487    '[\x{101}-{HIGHEST_CP}]' => 'ANYOFH[0101-HIGHEST_CP]',
488    '[\x{102}\x{104}]' => 'ANYOFHb[0102 0104]',
489    '[\x{102}-\x{104}{HIGHEST_CP}]' => 'ANYOFH[0102-0104 HIGHEST_CP]',
490    '[\x{102}-\x{104}\x{101}]' => 'ANYOFRb[0101-0104]',
491    '[\x{102}-\x{104}\x{101}-{INFTY}]' => 'ANYOFH[0101-INFTY]',
492    '[\x{102}-\x{104}\x{101}-{HIGHEST_CP}]' => 'ANYOFH[0101-HIGHEST_CP]',
493    '[\x{102}-\x{104}\x{102}]' => 'ANYOFRb[0102-0104]',
494    '[\x{102}-\x{104}\x{102}-{INFTY}]' => 'ANYOFH[0102-INFTY]',
495    '[\x{102}-\x{104}\x{102}-{HIGHEST_CP}]' => 'ANYOFH[0102-HIGHEST_CP]',
496    '[\x{102}-\x{104}\x{103}]' => 'ANYOFRb[0102-0104]',
497    '[\x{102}-\x{104}\x{103}-{INFTY}]' => 'ANYOFH[0102-INFTY]',
498    '[\x{102}-\x{104}\x{103}-{HIGHEST_CP}]' => 'ANYOFH[0102-HIGHEST_CP]',
499    '[\x{102}-\x{104}\x{104}]' => 'ANYOFRb[0102-0104]',
500    '[\x{102}-\x{104}\x{104}-{INFTY}]' => 'ANYOFH[0102-INFTY]',
501    '[\x{102}-\x{104}\x{104}-{HIGHEST_CP}]' => 'ANYOFH[0102-HIGHEST_CP]',
502    '[\x{102}-\x{104}\x{105}]' => 'ANYOFRb[0102-0105]',
503    '[\x{102}-\x{104}\x{105}-{INFTY}]' => 'ANYOFH[0102-INFTY]',
504    '[\x{102}-\x{104}\x{105}-{HIGHEST_CP}]' => 'ANYOFH[0102-HIGHEST_CP]',
505    '[\x{102}-\x{104}\x{106}]' => 'ANYOFHb[0102-0104 0106]',
506    '[\x{102}-\x{104}\x{106}-{INFTY}]' => 'ANYOFH[0102-0104 0106-INFTY]',
507    '[\x{102}-\x{104}\x{106}-{HIGHEST_CP}]' => 'ANYOFH[0102-0104 0106-HIGHEST_CP]',
508    '[\x{102}-\x{104}\x{108}-\x{10A}{HIGHEST_CP}]' => 'ANYOFH[0102-0104 0108-010A HIGHEST_CP]',
509    '[\x{102}-\x{104}\x{108}-\x{10A}\x{101}]' => 'ANYOFHb[0101-0104 0108-010A]',
510    '[\x{102}-\x{104}\x{108}-\x{10A}\x{101}-{INFTY}]' => 'ANYOFH[0101-INFTY]',
511    '[\x{102}-\x{104}\x{108}-\x{10A}\x{101}-{HIGHEST_CP}]' => 'ANYOFH[0101-HIGHEST_CP]',
512    '[\x{102}-\x{104}\x{108}-\x{10A}\x{101}-\x{102}]' => 'ANYOFHb[0101-0104 0108-010A]',
513    '[\x{102}-\x{104}\x{108}-\x{10A}\x{101}-\x{103}]' => 'ANYOFHb[0101-0104 0108-010A]',
514    '[\x{102}-\x{104}\x{108}-\x{10A}\x{101}-\x{104}]' => 'ANYOFHb[0101-0104 0108-010A]',
515    '[\x{102}-\x{104}\x{108}-\x{10A}\x{101}-\x{105}]' => 'ANYOFHb[0101-0105 0108-010A]',
516    '[\x{102}-\x{104}\x{108}-\x{10A}\x{101}-\x{106}]' => 'ANYOFHb[0101-0106 0108-010A]',
517    '[\x{102}-\x{104}\x{108}-\x{10A}\x{101}-\x{107}]' => 'ANYOFRb[0101-010A]',
518    '[\x{102}-\x{104}\x{108}-\x{10A}\x{101}-\x{108}]' => 'ANYOFRb[0101-010A]',
519    '[\x{102}-\x{104}\x{108}-\x{10A}\x{101}-\x{109}]' => 'ANYOFRb[0101-010A]',
520    '[\x{102}-\x{104}\x{108}-\x{10A}\x{101}-\x{10A}]' => 'ANYOFRb[0101-010A]',
521    '[\x{102}-\x{104}\x{108}-\x{10A}\x{101}-\x{10B}]' => 'ANYOFRb[0101-010B]',
522    '[\x{102}-\x{104}\x{108}-\x{10A}\x{102}]' => 'ANYOFHb[0102-0104 0108-010A]',
523    '[\x{102}-\x{104}\x{108}-\x{10A}\x{102}-{INFTY}]' => 'ANYOFH[0102-INFTY]',
524    '[\x{102}-\x{104}\x{108}-\x{10A}\x{102}-{HIGHEST_CP}]' => 'ANYOFH[0102-HIGHEST_CP]',
525    '[\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{102}]' => 'ANYOFHb[0102-0104 0108-010A]',
526    '[\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{103}]' => 'ANYOFHb[0102-0104 0108-010A]',
527    '[\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{104}]' => 'ANYOFHb[0102-0104 0108-010A]',
528    '[\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{105}]' => 'ANYOFHb[0102-0105 0108-010A]',
529    '[\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{106}]' => 'ANYOFHb[0102-0106 0108-010A]',
530    '[\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{107}]' => 'ANYOFRb[0102-010A]',
531    '[\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{108}]' => 'ANYOFRb[0102-010A]',
532    '[\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{109}]' => 'ANYOFRb[0102-010A]',
533    '[\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{10A}]' => 'ANYOFRb[0102-010A]',
534    '[\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{10B}]' => 'ANYOFRb[0102-010B]',
535    '[\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{10C}]' => 'ANYOFRb[0102-010C]',
536    '[\x{102}-\x{104}\x{108}-\x{10A}\x{103}]' => 'ANYOFHb[0102-0104 0108-010A]',
537    '[\x{102}-\x{104}\x{108}-\x{10A}\x{103}-{INFTY}]' => 'ANYOFH[0102-INFTY]',
538    '[\x{102}-\x{104}\x{108}-\x{10A}\x{103}-{HIGHEST_CP}]' => 'ANYOFH[0102-HIGHEST_CP]',
539    '[\x{102}-\x{104}\x{108}-\x{10A}\x{103}-\x{104}]' => 'ANYOFHb[0102-0104 0108-010A]',
540    '[\x{102}-\x{104}\x{108}-\x{10A}\x{103}-\x{105}]' => 'ANYOFHb[0102-0105 0108-010A]',
541    '[\x{102}-\x{104}\x{108}-\x{10A}\x{103}-\x{106}]' => 'ANYOFHb[0102-0106 0108-010A]',
542    '[\x{102}-\x{104}\x{108}-\x{10A}\x{103}-\x{107}]' => 'ANYOFRb[0102-010A]',
543    '[\x{102}-\x{104}\x{108}-\x{10A}\x{103}-\x{108}]' => 'ANYOFRb[0102-010A]',
544    '[\x{102}-\x{104}\x{108}-\x{10A}\x{103}-\x{109}]' => 'ANYOFRb[0102-010A]',
545    '[\x{102}-\x{104}\x{108}-\x{10A}\x{103}-\x{10A}]' => 'ANYOFRb[0102-010A]',
546    '[\x{102}-\x{104}\x{108}-\x{10A}\x{103}-\x{10B}]' => 'ANYOFRb[0102-010B]',
547    '[\x{102}-\x{104}\x{108}-\x{10A}\x{103}-\x{10C}]' => 'ANYOFRb[0102-010C]',
548    '[\x{102}-\x{104}\x{108}-\x{10A}\x{104}]' => 'ANYOFHb[0102-0104 0108-010A]',
549    '[\x{102}-\x{104}\x{108}-\x{10A}\x{104}-{INFTY}]' => 'ANYOFH[0102-INFTY]',
550    '[\x{102}-\x{104}\x{108}-\x{10A}\x{104}-{HIGHEST_CP}]' => 'ANYOFH[0102-HIGHEST_CP]',
551    '[\x{102}-\x{104}\x{108}-\x{10A}\x{104}-\x{105}]' => 'ANYOFHb[0102-0105 0108-010A]',
552    '[\x{102}-\x{104}\x{108}-\x{10A}\x{104}-\x{106}]' => 'ANYOFHb[0102-0106 0108-010A]',
553    '[\x{102}-\x{104}\x{108}-\x{10A}\x{104}-\x{107}]' => 'ANYOFRb[0102-010A]',
554    '[\x{102}-\x{104}\x{108}-\x{10A}\x{104}-\x{108}]' => 'ANYOFRb[0102-010A]',
555    '[\x{102}-\x{104}\x{108}-\x{10A}\x{104}-\x{109}]' => 'ANYOFRb[0102-010A]',
556    '[\x{102}-\x{104}\x{108}-\x{10A}\x{104}-\x{10A}]' => 'ANYOFRb[0102-010A]',
557    '[\x{102}-\x{104}\x{108}-\x{10A}\x{104}-\x{10B}]' => 'ANYOFRb[0102-010B]',
558    '[\x{102}-\x{104}\x{108}-\x{10A}\x{104}-\x{10C}]' => 'ANYOFRb[0102-010C]',
559    '[\x{102}-\x{104}\x{108}-\x{10A}\x{105}]' => 'ANYOFHb[0102-0105 0108-010A]',
560    '[\x{102}-\x{104}\x{108}-\x{10A}\x{105}-{INFTY}]' => 'ANYOFH[0102-INFTY]',
561    '[\x{102}-\x{104}\x{108}-\x{10A}\x{105}-{HIGHEST_CP}]' => 'ANYOFH[0102-HIGHEST_CP]',
562    '[\x{102}-\x{104}\x{108}-\x{10A}\x{105}-\x{106}]' => 'ANYOFHb[0102-0106 0108-010A]',
563    '[\x{102}-\x{104}\x{108}-\x{10A}\x{105}-\x{107}]' => 'ANYOFRb[0102-010A]',
564    '[\x{102}-\x{104}\x{108}-\x{10A}\x{105}-\x{108}]' => 'ANYOFRb[0102-010A]',
565    '[\x{102}-\x{104}\x{108}-\x{10A}\x{105}-\x{109}]' => 'ANYOFRb[0102-010A]',
566    '[\x{102}-\x{104}\x{108}-\x{10A}\x{105}-\x{10A}]' => 'ANYOFRb[0102-010A]',
567    '[\x{102}-\x{104}\x{108}-\x{10A}\x{105}-\x{10B}]' => 'ANYOFRb[0102-010B]',
568    '[\x{102}-\x{104}\x{108}-\x{10A}\x{105}-\x{10C}]' => 'ANYOFRb[0102-010C]',
569    '[\x{102}-\x{104}\x{108}-\x{10A}\x{106}]' => 'ANYOFHb[0102-0104 0106 0108-010A]',
570    '[\x{102}-\x{104}\x{108}-\x{10A}\x{106}-{INFTY}]' => 'ANYOFH[0102-0104 0106-INFTY]',
571    '[\x{102}-\x{104}\x{108}-\x{10A}\x{106}-{HIGHEST_CP}]' => 'ANYOFH[0102-0104 0106-HIGHEST_CP]',
572    '[\x{102}-\x{104}\x{108}-\x{10A}\x{106}-\x{107}]' => 'ANYOFHb[0102-0104 0106-010A]',
573    '[\x{102}-\x{104}\x{108}-\x{10A}\x{106}-\x{108}]' => 'ANYOFHb[0102-0104 0106-010A]',
574    '[\x{102}-\x{104}\x{108}-\x{10A}\x{106}-\x{109}]' => 'ANYOFHb[0102-0104 0106-010A]',
575    '[\x{102}-\x{104}\x{108}-\x{10A}\x{106}-\x{10A}]' => 'ANYOFHb[0102-0104 0106-010A]',
576    '[\x{102}-\x{104}\x{108}-\x{10A}\x{106}-\x{10B}]' => 'ANYOFHb[0102-0104 0106-010B]',
577    '[\x{102}-\x{104}\x{108}-\x{10A}\x{106}-\x{10C}]' => 'ANYOFHb[0102-0104 0106-010C]',
578    '[\x{102}-\x{104}\x{108}-\x{10A}\x{107}]' => 'ANYOFHb[0102-0104 0107-010A]',
579    '[\x{102}-\x{104}\x{108}-\x{10A}\x{108}]' => 'ANYOFHb[0102-0104 0108-010A]',
580    '[\x{102}-\x{104}\x{108}-\x{10A}\x{109}]' => 'ANYOFHb[0102-0104 0108-010A]',
581    '[\x{102}-\x{104}\x{108}-\x{10A}\x{10A}]' => 'ANYOFHb[0102-0104 0108-010A]',
582    '[\x{102}-\x{104}\x{108}-\x{10A}\x{10B}]' => 'ANYOFHb[0102-0104 0108-010B]',
583    '[\x{103}\x{102}]' => 'EXACTFU_REQ8 <\x{103}>',
584    '[\x{104}\x{102}]' => 'ANYOFHb[0102 0104]',
585    '[\x{104}\x{102}\x{103}]' => 'ANYOFRb[0102-0104]',
586    '[\x{106}-{INFTY}\x{104}]' => 'ANYOFH[0104 0106-INFTY]',
587    '[\x{106}-{INFTY}\x{104}-{INFTY}]' => 'ANYOFH[0104-INFTY]',
588    '[\x{106}-{INFTY}\x{104}-{HIGHEST_CP}]' => 'ANYOFH[0104-INFTY]',
589    '[\x{106}-{INFTY}\x{104}-\x{105}]' => 'ANYOFH[0104-INFTY]',
590    '[\x{106}-{INFTY}\x{104}-\x{106}]' => 'ANYOFH[0104-INFTY]',
591    '[\x{106}-{INFTY}\x{104}-\x{107}]' => 'ANYOFH[0104-INFTY]',
592    '[\x{106}-{INFTY}\x{105}]' => 'ANYOFH[0105-INFTY]',
593    '[\x{106}-{INFTY}\x{105}-{INFTY}]' => 'ANYOFH[0105-INFTY]',
594    '[\x{106}-{INFTY}\x{105}-{HIGHEST_CP}]' => 'ANYOFH[0105-INFTY]',
595    '[\x{106}-{INFTY}\x{105}-\x{106}]' => 'ANYOFH[0105-INFTY]',
596    '[\x{106}-{INFTY}\x{105}-\x{107}]' => 'ANYOFH[0105-INFTY]',
597    '[\x{106}-{INFTY}\x{106}]' => 'ANYOFH[0106-INFTY]',
598    '[\x{106}-{INFTY}\x{106}-{INFTY}]' => 'ANYOFH[0106-INFTY]',
599    '[\x{106}-{INFTY}\x{106}-{HIGHEST_CP}]' => 'ANYOFH[0106-INFTY]',
600    '[\x{106}-{INFTY}\x{106}-\x{107}]' => 'ANYOFH[0106-INFTY]',
601    '[\x{106}-{INFTY}\x{107}]' => 'ANYOFH[0106-INFTY]',
602    '[\x{106}-{INFTY}\x{107}-{INFTY}]' => 'ANYOFH[0106-INFTY]',
603    '[\x{106}-{INFTY}\x{107}-{HIGHEST_CP}]' => 'ANYOFH[0106-INFTY]',
604    '[\x{106}-{INFTY}\x{107}-\x{107}]' => 'ANYOFH[0106-INFTY]',
605    '[\x{10C}-{INFTY}{HIGHEST_CP}]' => 'ANYOFH[010C-INFTY]',
606    '[\x{10C}-{INFTY}\x{00}-{HIGHEST_CP}]' => 'SANY',
607    '[\x{10C}-{INFTY}\x{00}-{INFTY}]' => 'SANY',
608    '[\x{10C}-{INFTY}\x{101}-{INFTY}]' => 'ANYOFH[0101-INFTY]',
609    '[\x{10C}-{INFTY}\x{101}-{HIGHEST_CP}]' => 'ANYOFH[0101-INFTY]',
610    '[\x{10C}-{INFTY}\x{102}\x{104}]' => 'ANYOFH[0102 0104 010C-INFTY]',
611    '[\x{10C}-{INFTY}\x{102}-\x{104}{HIGHEST_CP}]' => 'ANYOFH[0102-0104 010C-INFTY]',
612    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{100}]' => 'ANYOFH[0100 0102-0104 010C-INFTY]',
613    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{101}]' => 'ANYOFH[0101-0104 010C-INFTY]',
614    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{101}-{INFTY}]' => 'ANYOFH[0101-INFTY]',
615    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{101}-{HIGHEST_CP}]' => 'ANYOFH[0101-INFTY]',
616    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{102}]' => 'ANYOFH[0102-0104 010C-INFTY]',
617    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{102}-{INFTY}]' => 'ANYOFH[0102-INFTY]',
618    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{102}-{HIGHEST_CP}]' => 'ANYOFH[0102-INFTY]',
619    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{103}]' => 'ANYOFH[0102-0104 010C-INFTY]',
620    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{103}-{INFTY}]' => 'ANYOFH[0102-INFTY]',
621    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{103}-{HIGHEST_CP}]' => 'ANYOFH[0102-INFTY]',
622    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{104}]' => 'ANYOFH[0102-0104 010C-INFTY]',
623    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{104}-{INFTY}]' => 'ANYOFH[0102-INFTY]',
624    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{104}-{HIGHEST_CP}]' => 'ANYOFH[0102-INFTY]',
625    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{105}]' => 'ANYOFH[0102-0105 010C-INFTY]',
626    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{105}-{INFTY}]' => 'ANYOFH[0102-INFTY]',
627    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{105}-{HIGHEST_CP}]' => 'ANYOFH[0102-INFTY]',
628    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{106}]' => 'ANYOFH[0102-0104 0106 010C-INFTY]',
629    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{106}-{INFTY}]' => 'ANYOFH[0102-0104 0106-INFTY]',
630    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{106}-{HIGHEST_CP}]' => 'ANYOFH[0102-0104 0106-INFTY]',
631    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}{HIGHEST_CP}]' => 'ANYOFH[0102-0104 0108-010A 010C-INFTY]',
632    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{101}]' => 'ANYOFH[0101-0104 0108-010A 010C-INFTY]',
633    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{101}-{INFTY}]' => 'ANYOFH[0101-INFTY]',
634    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{101}-{HIGHEST_CP}]' => 'ANYOFH[0101-INFTY]',
635    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{101}-\x{102}]' => 'ANYOFH[0101-0104 0108-010A 010C-INFTY]',
636    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{101}-\x{103}]' => 'ANYOFH[0101-0104 0108-010A 010C-INFTY]',
637    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{101}-\x{104}]' => 'ANYOFH[0101-0104 0108-010A 010C-INFTY]',
638    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{101}-\x{105}]' => 'ANYOFH[0101-0105 0108-010A 010C-INFTY]',
639    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{101}-\x{106}]' => 'ANYOFH[0101-0106 0108-010A 010C-INFTY]',
640    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{101}-\x{107}]' => 'ANYOFH[0101-010A 010C-INFTY]',
641    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{101}-\x{108}]' => 'ANYOFH[0101-010A 010C-INFTY]',
642    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{101}-\x{109}]' => 'ANYOFH[0101-010A 010C-INFTY]',
643    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{101}-\x{10A}]' => 'ANYOFH[0101-010A 010C-INFTY]',
644    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{101}-\x{10B}]' => 'ANYOFH[0101-INFTY]',
645    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{102}]' => 'ANYOFH[0102-0104 0108-010A 010C-INFTY]',
646    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{102}-{INFTY}]' => 'ANYOFH[0102-INFTY]',
647    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{102}-{HIGHEST_CP}]' => 'ANYOFH[0102-INFTY]',
648    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{102}]' => 'ANYOFH[0102-0104 0108-010A 010C-INFTY]',
649    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{103}]' => 'ANYOFH[0102-0104 0108-010A 010C-INFTY]',
650    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{104}]' => 'ANYOFH[0102-0104 0108-010A 010C-INFTY]',
651    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{105}]' => 'ANYOFH[0102-0105 0108-010A 010C-INFTY]',
652    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{106}]' => 'ANYOFH[0102-0106 0108-010A 010C-INFTY]',
653    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{107}]' => 'ANYOFH[0102-010A 010C-INFTY]',
654    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{108}]' => 'ANYOFH[0102-010A 010C-INFTY]',
655    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{109}]' => 'ANYOFH[0102-010A 010C-INFTY]',
656    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{10A}]' => 'ANYOFH[0102-010A 010C-INFTY]',
657    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{10B}]' => 'ANYOFH[0102-INFTY]',
658    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{10C}]' => 'ANYOFH[0102-INFTY]',
659    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{103}]' => 'ANYOFH[0102-0104 0108-010A 010C-INFTY]',
660    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{103}-{INFTY}]' => 'ANYOFH[0102-INFTY]',
661    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{103}-{HIGHEST_CP}]' => 'ANYOFH[0102-INFTY]',
662    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{103}-\x{104}]' => 'ANYOFH[0102-0104 0108-010A 010C-INFTY]',
663    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{103}-\x{105}]' => 'ANYOFH[0102-0105 0108-010A 010C-INFTY]',
664    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{103}-\x{106}]' => 'ANYOFH[0102-0106 0108-010A 010C-INFTY]',
665    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{103}-\x{107}]' => 'ANYOFH[0102-010A 010C-INFTY]',
666    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{103}-\x{108}]' => 'ANYOFH[0102-010A 010C-INFTY]',
667    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{103}-\x{109}]' => 'ANYOFH[0102-010A 010C-INFTY]',
668    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{103}-\x{10A}]' => 'ANYOFH[0102-010A 010C-INFTY]',
669    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{103}-\x{10B}]' => 'ANYOFH[0102-INFTY]',
670    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{103}-\x{10C}]' => 'ANYOFH[0102-INFTY]',
671    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{104}]' => 'ANYOFH[0102-0104 0108-010A 010C-INFTY]',
672    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{104}-{INFTY}]' => 'ANYOFH[0102-INFTY]',
673    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{104}-{HIGHEST_CP}]' => 'ANYOFH[0102-INFTY]',
674    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{104}-\x{105}]' => 'ANYOFH[0102-0105 0108-010A 010C-INFTY]',
675    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{104}-\x{106}]' => 'ANYOFH[0102-0106 0108-010A 010C-INFTY]',
676    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{104}-\x{107}]' => 'ANYOFH[0102-010A 010C-INFTY]',
677    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{104}-\x{108}]' => 'ANYOFH[0102-010A 010C-INFTY]',
678    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{104}-\x{109}]' => 'ANYOFH[0102-010A 010C-INFTY]',
679    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{104}-\x{10A}]' => 'ANYOFH[0102-010A 010C-INFTY]',
680    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{104}-\x{10B}]' => 'ANYOFH[0102-INFTY]',
681    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{104}-\x{10C}]' => 'ANYOFH[0102-INFTY]',
682    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{105}]' => 'ANYOFH[0102-0105 0108-010A 010C-INFTY]',
683    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{105}-{INFTY}]' => 'ANYOFH[0102-INFTY]',
684    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{105}-{HIGHEST_CP}]' => 'ANYOFH[0102-INFTY]',
685    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{105}-\x{106}]' => 'ANYOFH[0102-0106 0108-010A 010C-INFTY]',
686    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{105}-\x{107}]' => 'ANYOFH[0102-010A 010C-INFTY]',
687    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{105}-\x{108}]' => 'ANYOFH[0102-010A 010C-INFTY]',
688    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{105}-\x{109}]' => 'ANYOFH[0102-010A 010C-INFTY]',
689    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{105}-\x{10A}]' => 'ANYOFH[0102-010A 010C-INFTY]',
690    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{105}-\x{10B}]' => 'ANYOFH[0102-INFTY]',
691    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{105}-\x{10C}]' => 'ANYOFH[0102-INFTY]',
692    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{106}]' => 'ANYOFH[0102-0104 0106 0108-010A 010C-INFTY]',
693    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{106}-{INFTY}]' => 'ANYOFH[0102-0104 0106-INFTY]',
694    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{106}-{HIGHEST_CP}]' => 'ANYOFH[0102-0104 0106-INFTY]',
695    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{106}-\x{107}]' => 'ANYOFH[0102-0104 0106-010A 010C-INFTY]',
696    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{106}-\x{108}]' => 'ANYOFH[0102-0104 0106-010A 010C-INFTY]',
697    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{106}-\x{109}]' => 'ANYOFH[0102-0104 0106-010A 010C-INFTY]',
698    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{106}-\x{10A}]' => 'ANYOFH[0102-0104 0106-010A 010C-INFTY]',
699    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{106}-\x{10B}]' => 'ANYOFH[0102-0104 0106-INFTY]',
700    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{106}-\x{10C}]' => 'ANYOFH[0102-0104 0106-INFTY]',
701    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{107}]' => 'ANYOFH[0102-0104 0107-010A 010C-INFTY]',
702    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{108}]' => 'ANYOFH[0102-0104 0108-010A 010C-INFTY]',
703    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{109}]' => 'ANYOFH[0102-0104 0108-010A 010C-INFTY]',
704    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{10A}]' => 'ANYOFH[0102-0104 0108-010A 010C-INFTY]',
705    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{10B}]' => 'ANYOFH[0102-0104 0108-INFTY]',
706    '[\x{10C}-{INFTY}\x{103}\x{102}]' => 'ANYOFH[0102-0103 010C-INFTY]',
707    '[\x{10C}-{INFTY}\x{104}\x{102}]' => 'ANYOFH[0102 0104 010C-INFTY]',
708    '[\x{10C}-{INFTY}\x{104}\x{102}\x{103}]' => 'ANYOFH[0102-0104 010C-INFTY]',
709    '[{HIGHEST_CP}]' => 'EXACT_REQ8 <\x{HIGHEST_CP}>',
710
711    '(?8)(?i)[\x{410}]' => 'EXACTFU_REQ8 <\x{430}>',
712    '(?8)(?i)[\x{399}]' => 'EXACTFU_REQ8 <\x{3b9}>',
713    '(?8)(?i)[\x{345}\x{399}\x{3B9}\x{1FBE}]' => 'EXACTFU_REQ8 <\x{3b9}>',
714    '(?i)[\x{2b9}]' => 'EXACT_REQ8 <\x{2b9}>',           # Doesn't participate in a fold
715    '(?8)(?i)[\x{2b9}]' => 'EXACT_REQ8 <\x{2b9}>',
716    '(?i)[\x{2bc}]' => 'EXACTFU_REQ8 <\x{2bc}>', # Part of a multi-char fold, ASCII component
717    '(?i)[\x{390}]' => 'EXACTFU_REQ8 <\x{3b9}\x{308}\x{301}>', # Part of a multi-char fold, no ASCII component
718
719    '(?i)[\x{1E9E}]' => 'EXACTFU <ss>',
720    '(?iaa)[\x{1E9E}]' => 'EXACTFAA <\x{17f}\x{17f}>',
721    '(?i)[\x{FB00}]' => 'EXACTFU <ff>',
722    '(?iaa)[\x{FB00}]' => 'EXACT_REQ8 <\x{fb00}>',
723    '(?i)[\x{FB00}]' => 'EXACTFU <ff>',
724    '(?i)[\x{FB01}]' => 'EXACTFU <fi>',
725    '(?i)[\x{FB02}]' => 'EXACTFU <fl>',
726    '(?i)[\x{FB03}]' => 'EXACTFU <ffi>',
727    '(?i)[\x{FB04}]' => 'EXACTFU <ffl>',
728    '(?i)[\x{FB05}]' => 'EXACTFU <st>',
729    '(?i)[\x{FB06}]' => 'EXACTFU <st>',
730
731    '[a][b]' => 'EXACT <ab>',
732    '[a]\x{100}' => 'EXACT_REQ8 <a\x{100}>',
733    '(?8)[\x{100}]a' => 'EXACT_REQ8 <\x{100}a>',
734    '(?i)[b][c]' => 'EXACTFU <bc>',
735    '(?i)[b]\x{100}' => 'EXACTFU_REQ8 <b\x{101}>',
736    '(?8)(?i)[\x{100}]b' => 'EXACTFU_REQ8 <\x{101}b>',
737    '(?i)b[s]' => 'EXACTFU <bs>',
738    '(?i)b[s]c' => 'EXACTFU <bsc>',
739    '(?i)bs[s]c' => 'EXACTF <bss>',  # The c goes into a 2nd node
740    '(?iu)bs[s]c' => 'EXACTFUP <bssc>',
741    '(?i)b[s]sc' => 'EXACTF <bssc>',
742    '(?iu)b[s]sc' => 'EXACTFUP <bssc>',
743    '(?i)[b]st' => 'EXACTFU <bst>',
744    '(?i)[b]st[s]' => 'EXACTFU <bsts>',
745    '(?i)[b]st[s]st' => 'EXACTF <bstsst>',
746    '(?iu)[b]st[s]st' => 'EXACTFUP <bstsst>',
747    '(?i)[s][s]' => 'EXACTF <ss>',
748    '(?iu)[s][s]' => 'EXACTFUP <ss>',
749);
750
# The characters that each get their own single-element bracketed character
# class test.  The tests are generated in the order given here, so the order
# of this list is significant.
my @single_chars_to_test = (

    # ASCII-range controls, plus a digit and a punctuation character
    "\x00",     # Always potentially problematic
    "\x01",     # A control that has no name
    "\b",       # A control that has a name
    "\n",       # Potentially special
    "\r",       # Potentially special
    "\cK",      # Potentially special
    "0",        # Digit
    ":",        # Not in any fold

    # ASCII letters, in capital/small pairs
    "A",        # Capital; participates in multi-char fold
    "a",        # Small; participates in multi-char fold
    "B",        # Capital; participates only in case-pair fold
    "b",        # Small; participates only in case-pair fold
    "K",        # Capital; folded to from above Latin1
    "k",        # Small; folded to from above Latin1

    "\c?",      # Potentially special

    # The upper half of Latin1
    "\x80",     # Latin1 control
    "\xB5",     # Micro sign, folds to above Latin1
    "\xC0",     # Capital; participates only in case-pair fold
    "\xE0",     # Small; participates only in case-pair fold
    "\xC5",     # Capital; folded to from above Latin1
    "\xE5",     # Small; folded to from above Latin1
    "\xDF",     # Small sharp S. folds to 'ss'
    "\xF7",     # Doesn't participate in any fold
    "\xFF",     # Folded to by above Latin1

    # The first few characters above Latin1
    "\x{100}",
    "\x{101}",
    "\x{102}",
    "\x{103}",
    "\x{104}",
    "\x{105}",
    "\x{106}",
    "\x{107}",
    "\x{108}",

    "\x{2029}",
);
788
# Generate a (pattern, expected display) pair for each character in
# @single_chars_to_test, under every combination of case folding, charset
# modifier, and the '(?8)' upgrade marker.  The pattern is always the
# character by itself inside a bracketed character class.
my @single_tests;
for my $char (@single_chars_to_test) {
    my $cp  = ord $char;
    my $hex = sprintf "%02x", $cp;

    for my $fold ("", "i") {
        for my $charset ("", "u", "l", "aa") {

            # Combine into a single '(?...)' group; nothing at all is emitted
            # when neither modifier is present.
            my $modifiers = $fold . $charset;
            $modifiers = "(?$modifiers)" if $modifiers;

            for my $upgrade ("", "(?8)") {

                # The pattern to compile
                push @single_tests, "$upgrade$modifiers\[\\x{$hex}\]";

                if ($cp < 256 || $upgrade) {

                    # The expected result is whatever the same character
                    # compiles to when it isn't inside a bracketed class.
                    push @single_tests,
                         get_compiled("$upgrade$modifiers\\x{$hex}");
                }
                else {

                    # Here the code point is above 255 and no upgrade was
                    # requested; the expected display is constructed by hand.
                    use feature 'fc';

                    # Count how many of the case-changing functions yield
                    # something whose first code point differs from the
                    # original.  This only matters under /i.
                    my $case_changes = 0;
                    if ($fold) {
                        $case_changes = grep { ord($_) != $cp }
                                             fc($char), lc($char), uc($char);
                    }

                    my $op;
                    my $mod_cp = $cp;

                    if (! $case_changes) {

                        # Not folding, or nothing to fold to: an exact match
                        # of the code point itself
                        $op = ($charset eq 'l') ? 'EXACTL' : 'EXACT_REQ8';
                    }
                    else {

                        # A folding node, displayed with the fold of the
                        # character
                        $op = ($charset eq 'aa') ? 'EXACTFAA'
                            : ($charset eq 'l')  ? 'EXACTFLU8'
                            :                      'EXACTFU_REQ8';
                        $mod_cp = ord fc($char);
                    }

                    push @single_tests, sprintf "$op <\\x{%X}>", $mod_cp;
                }
            }
        }
    }
}
861
# The generated single-character tests are run ahead of the ones listed
# explicitly in @tests.
unshift @tests, @single_tests;

# @tests is a flat list of (pattern, expected) pairs plus one extra element,
# the marker; discount the marker and halve to get the number of tests.
plan((scalar(@tests) - 1) / 2);
865
# Run the tests.  @tests is consumed pairwise: a pattern followed by the
# expected display of its compiled form.  The single element
# 'ebcdic_ok_below_this_marker' is not part of any pair; once it has been
# seen, tests are no longer skipped on EBCDIC platforms.
my $skip_ebcdic = $::IS_EBCDIC;
while (defined (my $test = shift @tests)) {

    if ($test eq 'ebcdic_ok_below_this_marker') {
        $skip_ebcdic = 0;
        next;
    }

    my $expected = shift @tests;

    SKIP: {
        skip("test not ported to EBCDIC", 1) if $skip_ebcdic;

        # The test name shows the platform's actual highest code point rather
        # than the placeholder used in the test table.
        my $display_expected = $expected
                                        =~ s/ HIGHEST_CP /$highest_cp_string/xgr;
        my $test_name = "Verify compilation of $test displays as"
                      . " $display_expected";

        my $result = get_compiled($test);
        if ($expected =~ / ^ ANYOF[HR] /x) {

            # For these nodes, the result is allowed to have an optional
            # trailing '(First UTF-8 byte=\xNN' after the expected text.
            like($result, qr/ ^ \Q$expected\E (?:\Q (First UTF-8 byte=\x\E
                              [[:xdigit:]]{2} )? /x, $test_name);
        }
        else {
            is($result, $expected, $test_name);
        }
    }
}
894