xref: /openbsd/gnu/usr.bin/perl/t/re/anyof.t (revision 4bdff4be)
1#!./perl
2
3use strict;
4use warnings;
5use utf8;
6
7# This tests that the ANYOF nodes generated by bracketed character classes are
8# as expected.  The representation of these is not guaranteed, and this test
9# may need to be updated if it changes.  But it is here to make sure that no
10# unexpected changes occur.  These could come from faulty generation of the
11# node, or faulty display of them (or both).  Because these causes come from
12# very different parts of the regex compiler, it is unlikely that a commit
13# would change both of them, so this test will adequately serve to test both.
14
BEGIN {
    # Compile-time setup; the order of these statements matters.

    # Work from inside the 't' directory when one exists in the current
    # directory, so the relative paths below resolve.
    chdir 't' if -d 't';

    # Load the shared test helpers; set_up_inc() and skip_all() used below
    # are presumably defined there (they are not defined in this file).
    require './test.pl';
    set_up_inc('../lib','.','../ext/re');

    # Explicit method call rather than the indirect-object form
    # 'import Config', which would be parsed differently if a sub named
    # import() were ever in scope.
    require Config;
    Config->import;

    # Skip every test, giving 'no re module' as the reason, unless
    # DynaLoader::boot_DynaLoader is defined.
    skip_all('no re module') unless defined &DynaLoader::boot_DynaLoader;
}
22
23# An array is used instead of a hash, so that the tests are carried out in the
24# order given by this file.  Even-numbered indices are the regexes to compile.
25# The next higher element is the expected compilation result.
26#
27# It is painful to port some of these to EBCDIC, as not only do the code point
28# numbers change (for those < 256), but the order changes, as the compiled
29# version is sorted by native code point order.  On EBCDIC, \r comes before
30# \n, and 'k' before 'K', for example.  So, the tests where there are
31# differences are skipped on EBCDIC.  They are all at the beginning of the
32# array, and a special marker entry is used to delimit the boundary between
33# skipped and not skipped.
34#
35# NOTE:  If the pattern contains (?8) it will be upgraded to UTF-8 after
36#        stripping that
37
38use Unicode::UCD;
# The value of $Unicode::UCD::MAX_CP, and the same value rendered as uppercase
# hexadecimal digits with no prefix.
my $highest_cp = $Unicode::UCD::MAX_CP;
my $highest_cp_string = sprintf "%X", $highest_cp;

# Same digits as $highest_cp_string, but with a leading '7' (if any) turned
# into 'F'.
my $infinity = $highest_cp_string;
$infinity =~ s/^7/F/;  # Make infinity larger than the largest legal one, and
                       # at the time of this writing, we really internally
                       # allow UV_MAX to be infinity.
47
sub  get_compiled ($) {
    # Compile a pattern in a fresh perl with 'use re qw(Debug COMPILE)' in
    # effect, and return a normalized form of the line that follows
    # "Final program" in the debugging output.
    #
    # Argument: the pattern text.  The placeholders {INFTY} and {HIGHEST_CP}
    # are expanded to \x{...} escapes holding this platform's values.  A
    # '(?8)' marker, if present, is removed and causes the pattern to be
    # upgraded to UTF-8 before it is compiled.
    #
    # Returns that line with the leading node number and the parenthesized
    # "(N)" number removed, and with the platform's values mapped back to
    # INFTY and HIGHEST_CP.  Returns nothing, after recording a test failure,
    # if the child perl left $? non-zero.  Dies if there is no line after
    # "Final program".
    #
    # The line is processed in a lexical rather than in $_, so the caller's
    # $_ is left untouched.

    my $pattern = shift;

    # Convert platform-independent values to what is suitable for the
    # platform
    $pattern =~ s/\{INFTY\}/\\x{$infinity}/g;
    $pattern =~ s/\{HIGHEST_CP\}/\\x{$highest_cp_string}/g;
    my $use_utf8 = ($pattern =~ s/\Q(?8)//);

    # Build the program for the child: assign the pattern to a variable,
    # optionally upgrade it, then compile it with qr//.
    $pattern = "my \$a = '$pattern';";
    $pattern .= "utf8::upgrade(\$a);" if $use_utf8;
    $pattern .= "qr/\$a/";
    my $actual_pattern = "use re qw(Debug COMPILE); $pattern";

    my $result = fresh_perl($actual_pattern);
    if ($? != 0) {  # Re-run so as to display STDERR.
        fail($pattern, "Until this is fixed, the planned number of tests will be wrong");
        fresh_perl($actual_pattern, { stderr => 0, verbose => 1 });
        return;
    }

    # The Debug output will come back as a bunch of lines.  We are
    # interested only in the line after /Final program/
    my @lines = split /\n/, $result;
    my $line;
    while (defined ($line = shift @lines)) {
        last if $line =~ /Final program/;
    }

    $line = shift @lines;
    unless (defined $line) {
        die "Unexpected compilation result: '$result'\n"
          . " Compiled from '$actual_pattern'";
    }

    $line =~ s/ \s* \( \d+ \) \s* //x;   # Get rid of the node branch
    $line =~ s/ ^ \s* \d+ : \s* //x;     # ... And the node number

    # Use platform-independent values.  $infinity must be handled first, as
    # it differs from $highest_cp_string only in its leading digit.
    $line =~ s/\Q$infinity\E/INFTY/ig;
    $line =~ s/\Q$highest_cp_string\E/HIGHEST_CP/ig;

    return $line;
}
92
93# Note: EXACTish lowercases the hex; ANYOF uppercases, without braces
94
95my @tests = (
96    '[\xe0\xc0]' => 'EXACTFU <\\x{e0}>',
97    '[\xe1\xc1]' => 'EXACTFU <\\x{e1}>',
98    '[\xe2\xc2]' => 'EXACTFU <\\x{e2}>',
99    '[\xe3\xc3]' => 'EXACTFU <\\x{e3}>',
100    '[\xe4\xc4]' => 'EXACTFU <\\x{e4}>',
101    '[\xc5\xe5]' => 'ANYOF[\\xC5\\xE5]',
102    '[\xe6\xc6]' => 'EXACTFU <\\x{e6}>',
103    '[\xe7\xc7]' => 'EXACTFU <\\x{e7}>',
104    '[\xe8\xc8]' => 'EXACTFU <\\x{e8}>',
105    '[\xe9\xc9]' => 'EXACTFU <\\x{e9}>',
106    '[\xea\xca]' => 'EXACTFU <\\x{ea}>',
107    '[\xeb\xcb]' => 'EXACTFU <\\x{eb}>',
108    '[\xec\xcc]' => 'EXACTFU <\\x{ec}>',
109    '[\xee\xce]' => 'EXACTFU <\\x{ee}>',
110    '[\xef\xcf]' => 'EXACTFU <\\x{ef}>',
111    '[\xf0\xd0]' => 'EXACTFU <\\x{f0}>',
112    '[\xf1\xd1]' => 'EXACTFU <\\x{f1}>',
113    '[\xf2\xd2]' => 'EXACTFU <\\x{f2}>',
114    '[\xf3\xd3]' => 'EXACTFU <\\x{f3}>',
115    '[\xf4\xd4]' => 'EXACTFU <\\x{f4}>',
116    '[\xf5\xd5]' => 'EXACTFU <\\x{f5}>',
117    '[\xf6\xd6]' => 'EXACTFU <\\x{f6}>',
118    '[\xf8\xd8]' => 'EXACTFU <\\x{f8}>',
119    '[\xf9\xd9]' => 'EXACTFU <\\x{f9}>',
120    '[\xfa\xda]' => 'EXACTFU <\\x{fa}>',
121    '[\xfb\xdb]' => 'EXACTFU <\\x{fb}>',
122    '[\xfc\xdc]' => 'EXACTFU <\\x{fc}>',
123    '[\xfd\xdd]' => 'EXACTFU <\\x{fd}>',
124    '[\xfe\xde]' => 'EXACTFU <\\x{fe}>',
125
126    '[[{]' => 'ANYOFM[\[\{]',
127    '[^\S ]' => 'ANYOFD[\t\n\x0B\f\r{utf8}\x85\xA0][1680 2000-200A 2028-2029 202F 205F 3000]',
128    '[^\n\r]' => 'ANYOF[^\n\r][0100-INFTY]',
129    '[^\/\|,\$\%%\@\ \%"\<\>\:\#\&\*\{\}\[\]\(\)]' => 'ANYOF[^ "#$%&()*,/:<>@\[\]\{|\}][0100-INFTY]',
130    '[[:ascii:]]' => 'ANYOFM[\x00-\x7F]',
131    '[[:^ascii:]]' => 'NANYOFM[\x00-\x7F]',
132    '[[:^ascii:]\x{2C2}]' => 'NANYOFM[\x00-\x7F]',
133    '(?u)[[:ascii:]]' => 'ANYOFM[\x00-\x7F]',
134    '(?u)[[:^ascii:]]' => 'NANYOFM[\x00-\x7F]',
135    '(?a)[[:ascii:]]' => 'ANYOFM[\x00-\x7F]',
136    '(?a)[[:^ascii:]]' => 'NANYOFM[\x00-\x7F]',
137    '(?a)[[:^ascii:]\x{2C2}]' => 'NANYOFM[\x00-\x7F]',
138    '[[:cntrl:]]' => 'POSIXD[:cntrl:]',
139    '[^[:^print:][:^ascii:]]' => 'POSIXA[:print:]',
140    '[[:blank:]]' => 'POSIXD[:blank:]',
141    '[ [:blank:]]' => 'POSIXD[:blank:]',
142    '[_[:blank:]]' => 'ANYOFD[\t _{utf8}\xA0][1680 2000-200A 202F 205F 3000]',
143    '[_[:^blank:]]' => 'NPOSIXD[:blank:]',
144    '[\xA0[:^blank:]]' => 'ANYOF[^\t ][0100-167F 1681-1FFF 200B-202E 2030-205E 2060-2FFF 3001-INFTY]',
145    '(?d:[_[:^blank:]])' => 'NPOSIXD[:blank:]',
146    '[\x{07}-\x{0B}]' => 'ANYOFR[\a\b\t\n\x0B]',
147    '(?l)[\x{2029}]' => 'EXACTL <\x{2029}>',
148    '(?l)(?[\x{2029}])' => 'ANYOFL{utf8-locale-reqd}[2029]', # regex sets requires utf8 locale for /l
149    '(?il)[\x{212A}]' => 'EXACTFL <\\x{212a}>',
150    '(?il)(?[\x{212A}])' => 'ANYOFL{utf8-locale-reqd}[Kk][212A]',
151
152    '(?i)b[s]\xe0' => 'ANYOFM[Bb]',    # The s goes into a 2nd node
153
154    '[aA]' => 'ANYOFM[Aa]',
155    '[bB]' => 'ANYOFM[Bb]',
156    '[kK]' => 'ANYOFM[Kk]',
157
158    'ebcdic_ok_below_this_marker',
159
160    '(?i:[^:])' => 'NANYOFM[:]',
161
162    '[^\n]' => 'REG_ANY',
163
164    '[[:alpha:]]' => 'POSIXD[:alpha:]',
165    '[[:^alpha:]]' => 'NPOSIXD[:alpha:]',
166    '[[:^alpha:]\x{2C2}]' => 'NPOSIXU[:alpha:]',
167    '(?l)[[:alpha:]]' => 'POSIXL[:alpha:]',
168    '(?l)[[:^alpha:]]' => 'NPOSIXL[:alpha:]',
169    '(?l)[[:^alpha:]\x{2C2}]' => 'NPOSIXL[:alpha:]',
170    '(?u)[[:alpha:]]' => 'POSIXU[:alpha:]',
171    '(?u)[[:^alpha:]]' => 'NPOSIXU[:alpha:]',
172    '(?a)[[:alpha:]]' => 'POSIXA[:alpha:]',
173    '(?a)[[:^alpha:]]' => 'NPOSIXA[:alpha:]',
174    '(?a)[[:^alpha:]\x{2C2}]' => 'NPOSIXA[:alpha:]',
175    '[[:alpha:][:^alpha:]]' => 'SANY',
176    '[^[:alpha:][:^alpha:]]' => 'OPFAIL',
177    '(?l)[[:alpha:][:^alpha:]]' => 'SANY',
178    '(?l)[^[:alpha:][:^alpha:]]' => 'OPFAIL',
179    '(?u)[[:alpha:][:^alpha:]]' => 'SANY',
180    '(?u)[^[:alpha:][:^alpha:]]' => 'OPFAIL',
181    '(?a)[[:alpha:][:^alpha:]]' => 'SANY',
182    '(?a)[^[:alpha:][:^alpha:]]' => 'OPFAIL',
183    '[[:alnum:]]' => 'POSIXD[:alnum:]',
184    '[[:^alnum:]]' => 'NPOSIXD[:alnum:]',
185    '[[:^alnum:]\x{2C2}]' => 'NPOSIXU[:alnum:]',
186    '(?l)[[:alnum:]]' => 'POSIXL[:alnum:]',
187    '(?l)[[:^alnum:]]' => 'NPOSIXL[:alnum:]',
188    '(?l)[[:^alnum:]\x{2C2}]' => 'NPOSIXL[:alnum:]',
189    '(?u)[[:alnum:]]' => 'POSIXU[:alnum:]',
190    '(?u)[[:^alnum:]]' => 'NPOSIXU[:alnum:]',
191    '(?a)[[:alnum:]]' => 'POSIXA[:alnum:]',
192    '(?a)[[:^alnum:]]' => 'NPOSIXA[:alnum:]',
193    '(?a)[[:^alnum:]\x{2C2}]' => 'NPOSIXA[:alnum:]',
194    '[[:alnum:][:^alnum:]]' => 'SANY',
195    '[^[:alnum:][:^alnum:]]' => 'OPFAIL',
196    '(?l)[[:alnum:][:^alnum:]]' => 'SANY',
197    '(?l)[^[:alnum:][:^alnum:]]' => 'OPFAIL',
198    '(?u)[[:alnum:][:^alnum:]]' => 'SANY',
199    '(?u)[^[:alnum:][:^alnum:]]' => 'OPFAIL',
200    '(?a)[[:alnum:][:^alnum:]]' => 'SANY',
201    '(?a)[^[:alnum:][:^alnum:]]' => 'OPFAIL',
202    '(?l)[[:ascii:]]' => 'POSIXL[:ascii:]',
203    '(?l)[[:^ascii:]]' => 'NPOSIXL[:ascii:]',
204    '(?l)[[:^ascii:]\x{2C2}]' => 'NPOSIXL[:ascii:]',
205    '[[:ascii:][:^ascii:]]' => 'SANY',
206    '[^[:ascii:][:^ascii:]]' => 'OPFAIL',
207    '(?l)[[:ascii:][:^ascii:]]' => 'SANY',
208    '(?l)[^[:ascii:][:^ascii:]]' => 'OPFAIL',
209    '(?u)[[:ascii:][:^ascii:]]' => 'SANY',
210    '(?u)[^[:ascii:][:^ascii:]]' => 'OPFAIL',
211    '(?a)[[:ascii:][:^ascii:]]' => 'SANY',
212    '(?a)[^[:ascii:][:^ascii:]]' => 'OPFAIL',
213    '[[:^blank:]]' => 'NPOSIXD[:blank:]',
214    '[[:^blank:]\x{2C2}]' => 'NPOSIXU[:blank:]',
215    '(?l)[[:blank:]]' => 'POSIXL[:blank:]',
216    '(?l)[[:^blank:]]' => 'NPOSIXL[:blank:]',
217    '(?l)[[:^blank:]\x{2C2}]' => 'NPOSIXL[:blank:]',
218    '(?u)[[:blank:]]' => 'POSIXU[:blank:]',
219    '(?u)[[:^blank:]]' => 'NPOSIXU[:blank:]',
220    '(?a)[[:blank:]]' => 'POSIXA[:blank:]',
221    '(?a)[[:^blank:]]' => 'NPOSIXA[:blank:]',
222    '(?a)[[:^blank:]\x{2C2}]' => 'NPOSIXA[:blank:]',
223    '[[:blank:]]' => 'POSIXD[:blank:]',
224    '[[:blank:][:^blank:]]' => 'SANY',
225    '[^[:blank:][:^blank:]]' => 'OPFAIL',
226    '(?l)[[:blank:][:^blank:]]' => 'SANY',
227    '(?l)[^[:blank:][:^blank:]]' => 'OPFAIL',
228    '(?u)[[:blank:][:^blank:]]' => 'SANY',
229    '(?u)[^[:blank:][:^blank:]]' => 'OPFAIL',
230    '(?a)[[:blank:][:^blank:]]' => 'SANY',
231    '(?a)[^[:blank:][:^blank:]]' => 'OPFAIL',
232    '[[:^cntrl:]]' => 'NPOSIXD[:cntrl:]',
233    '[[:^cntrl:]\x{2C2}]' => 'NPOSIXU[:cntrl:]',
234    '(?l)[[:cntrl:]]' => 'POSIXL[:cntrl:]',
235    '(?l)[[:^cntrl:]]' => 'NPOSIXL[:cntrl:]',
236    '(?l)[[:^cntrl:]\x{2C2}]' => 'NPOSIXL[:cntrl:]',
237    '(?u)[[:cntrl:]]' => 'POSIXU[:cntrl:]',
238    '(?u)[[:^cntrl:]]' => 'NPOSIXU[:cntrl:]',
239    '(?a)[[:cntrl:]]' => 'POSIXA[:cntrl:]',
240    '(?a)[[:^cntrl:]]' => 'NPOSIXA[:cntrl:]',
241    '(?a)[[:^cntrl:]\x{2C2}]' => 'NPOSIXA[:cntrl:]',
242    '[[:cntrl:][:^cntrl:]]' => 'SANY',
243    '[^[:cntrl:][:^cntrl:]]' => 'OPFAIL',
244    '(?l)[[:cntrl:][:^cntrl:]]' => 'SANY',
245    '(?l)[^[:cntrl:][:^cntrl:]]' => 'OPFAIL',
246    '(?u)[[:cntrl:][:^cntrl:]]' => 'SANY',
247    '(?u)[^[:cntrl:][:^cntrl:]]' => 'OPFAIL',
248    '(?a)[[:cntrl:][:^cntrl:]]' => 'SANY',
249    '(?a)[^[:cntrl:][:^cntrl:]]' => 'OPFAIL',
250    '[[:digit:]]' => 'POSIXU[\d]',
251    '[[:^digit:]]' => 'NPOSIXU[\d]',
252    '[[:^digit:]\x{2C2}]' => 'NPOSIXU[\d]',
253    '(?l)[[:digit:]]' => 'POSIXL[\d]',
254    '(?l)[[:^digit:]]' => 'NPOSIXL[\d]',
255    '(?l)[[:^digit:]\x{2C2}]' => 'NPOSIXL[\d]',
256    '(?u)[[:digit:]]' => 'POSIXU[\d]',
257    '(?u)[[:^digit:]]' => 'NPOSIXU[\d]',
258    '(?a)[[:digit:]]' => 'POSIXA[\d]',
259    '(?a)[[:^digit:]]' => 'NPOSIXA[\d]',
260    '(?a)[[:^digit:]\x{2C2}]' => 'NPOSIXA[\d]',
261    '[[:digit:][:^digit:]]' => 'SANY',
262    '[^[:digit:][:^digit:]]' => 'OPFAIL',
263    '(?l)[[:digit:][:^digit:]]' => 'SANY',
264    '(?l)[^[:digit:][:^digit:]]' => 'OPFAIL',
265    '(?u)[[:digit:][:^digit:]]' => 'SANY',
266    '(?u)[^[:digit:][:^digit:]]' => 'OPFAIL',
267    '(?a)[[:digit:][:^digit:]]' => 'SANY',
268    '(?a)[^[:digit:][:^digit:]]' => 'OPFAIL',
269    '[[:graph:]]' => 'POSIXD[:graph:]',
270    '[[:^graph:]]' => 'NPOSIXD[:graph:]',
271    '[[:^graph:]\x{FFFF}]' => 'NPOSIXU[:graph:]',
272    '(?l)[[:graph:]]' => 'POSIXL[:graph:]',
273    '(?l)[[:^graph:]]' => 'NPOSIXL[:graph:]',
274    '(?l)[[:^graph:]\x{FFFF}]' => 'NPOSIXL[:graph:]',
275    '(?u)[[:graph:]]' => 'POSIXU[:graph:]',
276    '(?u)[[:^graph:]]' => 'NPOSIXU[:graph:]',
277    '(?a)[[:graph:]]' => 'POSIXA[:graph:]',
278    '(?a)[[:^graph:]]' => 'NPOSIXA[:graph:]',
279    '(?a)[[:^graph:]\x{FFFF}]' => 'NPOSIXA[:graph:]',
280    '[[:graph:][:^graph:]]' => 'SANY',
281    '[^[:graph:][:^graph:]]' => 'OPFAIL',
282    '(?l)[[:graph:][:^graph:]]' => 'SANY',
283    '(?l)[^[:graph:][:^graph:]]' => 'OPFAIL',
284    '(?u)[[:graph:][:^graph:]]' => 'SANY',
285    '(?u)[^[:graph:][:^graph:]]' => 'OPFAIL',
286    '(?a)[[:graph:][:^graph:]]' => 'SANY',
287    '(?a)[^[:graph:][:^graph:]]' => 'OPFAIL',
288    '[[:lower:]]' => 'POSIXD[:lower:]',
289    '[[:^lower:]]' => 'NPOSIXD[:lower:]',
290    '[[:^lower:]\x{2C2}]' => 'NPOSIXU[:lower:]',
291    '(?l)[[:lower:]]' => 'POSIXL[:lower:]',
292    '(?l)[[:^lower:]]' => 'NPOSIXL[:lower:]',
293    '(?l)[[:^lower:]\x{2C2}]' => 'NPOSIXL[:lower:]',
294    '(?u)[[:lower:]]' => 'POSIXU[:lower:]',
295    '(?u)[[:^lower:]]' => 'NPOSIXU[:lower:]',
296    '(?a)[[:lower:]]' => 'POSIXA[:lower:]',
297    '(?a)[[:^lower:]]' => 'NPOSIXA[:lower:]',
298    '(?a)[[:^lower:]\x{2C2}]' => 'NPOSIXA[:lower:]',
299    '[[:lower:][:^lower:]]' => 'SANY',
300    '[^[:lower:][:^lower:]]' => 'OPFAIL',
301    '(?l)[[:lower:][:^lower:]]' => 'SANY',
302    '(?l)[^[:lower:][:^lower:]]' => 'OPFAIL',
303    '(?u)[[:lower:][:^lower:]]' => 'SANY',
304    '(?u)[^[:lower:][:^lower:]]' => 'OPFAIL',
305    '(?a)[[:lower:][:^lower:]]' => 'SANY',
306    '(?a)[^[:lower:][:^lower:]]' => 'OPFAIL',
307    '[[:print:]]' => 'POSIXD[:print:]',
308    '[[:^print:]]' => 'NPOSIXD[:print:]',
309    '[[:^print:]\x{FFFF}]' => 'NPOSIXU[:print:]',
310    '(?l)[[:print:]]' => 'POSIXL[:print:]',
311    '(?l)[[:^print:]]' => 'NPOSIXL[:print:]',
312    '(?l)[[:^print:]\x{FFFF}]' => 'NPOSIXL[:print:]',
313    '(?u)[[:print:]]' => 'POSIXU[:print:]',
314    '(?u)[[:^print:]]' => 'NPOSIXU[:print:]',
315    '(?a)[[:print:]]' => 'POSIXA[:print:]',
316    '(?a)[[:^print:]]' => 'NPOSIXA[:print:]',
317    '(?a)[[:^print:]\x{FFFF}]' => 'NPOSIXA[:print:]',
318    '[[:print:][:^print:]]' => 'SANY',
319    '[^[:print:][:^print:]]' => 'OPFAIL',
320    '(?l)[[:print:][:^print:]]' => 'SANY',
321    '(?l)[^[:print:][:^print:]]' => 'OPFAIL',
322    '(?u)[[:print:][:^print:]]' => 'SANY',
323    '(?u)[^[:print:][:^print:]]' => 'OPFAIL',
324    '(?a)[[:print:][:^print:]]' => 'SANY',
325    '(?a)[^[:print:][:^print:]]' => 'OPFAIL',
326    '[[:punct:]]' => 'POSIXD[:punct:]',
327    '[[:^punct:]]' => 'NPOSIXD[:punct:]',
328    '[[:^punct:]\x{2C2}]' => 'NPOSIXU[:punct:]',
329    '(?l)[[:punct:]]' => 'POSIXL[:punct:]',
330    '(?l)[[:^punct:]]' => 'NPOSIXL[:punct:]',
331    '(?l)[[:^punct:]\x{2C2}]' => 'NPOSIXL[:punct:]',
332    '(?u)[[:punct:]]' => 'POSIXU[:punct:]',
333    '(?u)[[:^punct:]]' => 'NPOSIXU[:punct:]',
334    '(?a)[[:punct:]]' => 'POSIXA[:punct:]',
335    '(?a)[[:^punct:]]' => 'NPOSIXA[:punct:]',
336    '(?a)[[:^punct:]\x{2C2}]' => 'NPOSIXA[:punct:]',
337    '[[:punct:][:^punct:]]' => 'SANY',
338    '[^[:punct:][:^punct:]]' => 'OPFAIL',
339    '(?l)[[:punct:][:^punct:]]' => 'SANY',
340    '(?l)[^[:punct:][:^punct:]]' => 'OPFAIL',
341    '(?u)[[:punct:][:^punct:]]' => 'SANY',
342    '(?u)[^[:punct:][:^punct:]]' => 'OPFAIL',
343    '(?a)[[:punct:][:^punct:]]' => 'SANY',
344    '(?a)[^[:punct:][:^punct:]]' => 'OPFAIL',
345    '[[:space:]]' => 'POSIXD[\s]',
346    '[[:^space:]]' => 'NPOSIXD[\s]',
347    '[[:^space:]\x{2C2}]' => 'NPOSIXU[\s]',
348    '(?l)[[:space:]]' => 'POSIXL[\s]',
349    '(?l)[[:^space:]]' => 'NPOSIXL[\s]',
350    '(?l)[[:^space:]\x{2C2}]' => 'NPOSIXL[\s]',
351    '(?u)[[:space:]]' => 'POSIXU[\s]',
352    '(?u)[[:^space:]]' => 'NPOSIXU[\s]',
353    '(?a)[[:space:]]' => 'POSIXA[\s]',
354    '(?a)[[:^space:]]' => 'NPOSIXA[\s]',
355    '(?a)[[:^space:]\x{2C2}]' => 'NPOSIXA[\s]',
356    '[[:space:][:^space:]]' => 'SANY',
357    '[^[:space:][:^space:]]' => 'OPFAIL',
358    '(?l)[[:space:][:^space:]]' => 'SANY',
359    '(?l)[^[:space:][:^space:]]' => 'OPFAIL',
360    '(?u)[[:space:][:^space:]]' => 'SANY',
361    '(?u)[^[:space:][:^space:]]' => 'OPFAIL',
362    '(?a)[[:space:][:^space:]]' => 'SANY',
363    '(?a)[^[:space:][:^space:]]' => 'OPFAIL',
364    '[[:upper:]]' => 'POSIXD[:upper:]',
365    '[[:^upper:]]' => 'NPOSIXD[:upper:]',
366    '[[:^upper:]\x{2C2}]' => 'NPOSIXU[:upper:]',
367    '(?l)[[:upper:]]' => 'POSIXL[:upper:]',
368    '(?l)[[:^upper:]]' => 'NPOSIXL[:upper:]',
369    '(?l)[[:^upper:]\x{2C2}]' => 'NPOSIXL[:upper:]',
370    '(?u)[[:upper:]]' => 'POSIXU[:upper:]',
371    '(?u)[[:^upper:]]' => 'NPOSIXU[:upper:]',
372    '(?a)[[:upper:]]' => 'POSIXA[:upper:]',
373    '(?a)[[:^upper:]]' => 'NPOSIXA[:upper:]',
374    '(?a)[[:^upper:]\x{2C2}]' => 'NPOSIXA[:upper:]',
375    '[[:upper:][:^upper:]]' => 'SANY',
376    '[^[:upper:][:^upper:]]' => 'OPFAIL',
377    '(?l)[[:upper:][:^upper:]]' => 'SANY',
378    '(?l)[^[:upper:][:^upper:]]' => 'OPFAIL',
379    '(?u)[[:upper:][:^upper:]]' => 'SANY',
380    '(?u)[^[:upper:][:^upper:]]' => 'OPFAIL',
381    '(?a)[[:upper:][:^upper:]]' => 'SANY',
382    '(?a)[^[:upper:][:^upper:]]' => 'OPFAIL',
383    '[\v]' => 'POSIXU[\v]',
384    '[^\v]' => 'NPOSIXU[\v]',
385    '[\V\x{2C2}]' => 'NPOSIXU[\v]',
386    '(?l)[\v]' => 'POSIXU[\v]',
387    '(?l)[^\v]' => 'NPOSIXU[\v]',
388    '(?l)[\V\x{2C2}]' => 'NPOSIXU[\v]',
389    '(?u)[\v]' => 'POSIXU[\v]',
390    '(?u)[^\v]' => 'NPOSIXU[\v]',
391    '(?a)[\v]' => 'POSIXU[\v]',
392    '(?a)[^\v]' => 'NPOSIXU[\v]',
393    '(?a)[\V\x{2C2}]' => 'NPOSIXU[\v]',
394    '[\v\V]' => 'SANY',
395    '[^\v\V]' => 'OPFAIL',
396    '(?l)[\v\V]' => 'SANY',
397    '(?l)[^\v\V]' => 'OPFAIL',
398    '(?u)[\v\V]' => 'SANY',
399    '(?u)[^\v\V]' => 'OPFAIL',
400    '(?a)[\v\V]' => 'SANY',
401    '(?a)[^\v\V]' => 'OPFAIL',
402    '[[:word:]]' => 'POSIXD[\w]',
403    '[[:^word:]]' => 'NPOSIXD[\w]',
404    '[[:^word:]\x{2C2}]' => 'NPOSIXU[\w]',
405    '(?l)[[:word:]]' => 'POSIXL[\w]',
406    '(?l)[[:^word:]]' => 'NPOSIXL[\w]',
407    '(?l)[[:^word:]\x{2C2}]' => 'NPOSIXL[\w]',
408    '(?u)[[:word:]]' => 'POSIXU[\w]',
409    '(?u)[[:^word:]]' => 'NPOSIXU[\w]',
410    '(?a)[[:word:]]' => 'POSIXA[\w]',
411    '(?a)[[:^word:]]' => 'NPOSIXA[\w]',
412    '(?a)[[:^word:]\x{2C2}]' => 'NPOSIXA[\w]',
413    '[[:word:][:^word:]]' => 'SANY',
414    '[^[:word:][:^word:]]' => 'OPFAIL',
415    '(?l)[[:word:][:^word:]]' => 'SANY',
416    '(?l)[^[:word:][:^word:]]' => 'OPFAIL',
417    '(?u)[[:word:][:^word:]]' => 'SANY',
418    '(?u)[^[:word:][:^word:]]' => 'OPFAIL',
419    '(?a)[[:word:][:^word:]]' => 'SANY',
420    '(?a)[^[:word:][:^word:]]' => 'OPFAIL',
421    '[[:xdigit:]]' => 'POSIXU[:xdigit:]',
422    '[[:^xdigit:]]' => 'NPOSIXU[:xdigit:]',
423    '[[:^xdigit:]\x{2C2}]' => 'NPOSIXU[:xdigit:]',
424    '(?l)[[:xdigit:]]' => 'POSIXL[:xdigit:]',
425    '(?l)[[:^xdigit:]]' => 'NPOSIXL[:xdigit:]',
426    '(?l)[[:^xdigit:]\x{2C2}]' => 'NPOSIXL[:xdigit:]',
427    '(?u)[[:xdigit:]]' => 'POSIXU[:xdigit:]',
428    '(?u)[[:^xdigit:]]' => 'NPOSIXU[:xdigit:]',
429    '(?a)[[:xdigit:]]' => 'POSIXA[:xdigit:]',
430    '(?a)[[:^xdigit:]]' => 'NPOSIXA[:xdigit:]',
431    '(?a)[[:^xdigit:]\x{2C2}]' => 'NPOSIXA[:xdigit:]',
432    '[[:xdigit:][:^xdigit:]]' => 'SANY',
433    '[^[:xdigit:][:^xdigit:]]' => 'OPFAIL',
434    '(?l)[[:xdigit:][:^xdigit:]]' => 'SANY',
435    '(?l)[^[:xdigit:][:^xdigit:]]' => 'OPFAIL',
436    '(?u)[[:xdigit:][:^xdigit:]]' => 'SANY',
437    '(?u)[^[:xdigit:][:^xdigit:]]' => 'OPFAIL',
438    '(?a)[[:xdigit:][:^xdigit:]]' => 'SANY',
439    '(?a)[^[:xdigit:][:^xdigit:]]' => 'OPFAIL',
440    '(?i)[[:lower:]]' => 'POSIXD[:cased:]',
441    '(?i)[[:^lower:]]' => 'NPOSIXD[:cased:]',
442    '(?i)[[:^lower:]\x{2C2}]' => 'NPOSIXU[:cased:]',
443    '(?i)(?l)[[:lower:]]' => 'POSIXL[:cased:]',
444    '(?i)(?l)[[:^lower:]]' => 'NPOSIXL[:cased:]',
445    '(?i)(?l)[[:^lower:]\x{2C2}]' => 'NPOSIXL[:cased:]',
446    '(?i)(?u)[[:lower:]]' => 'POSIXU[:cased:]',
447    '(?i)(?u)[[:^lower:]]' => 'NPOSIXU[:cased:]',
448    '(?i)(?a)[[:lower:]]' => 'POSIXA[:alpha:]',
449    '(?i)(?a)[[:^lower:]]' => 'NPOSIXA[:alpha:]',
450    '(?i)(?a)[[:^lower:]\x{2C2}]' => 'NPOSIXA[:alpha:]',
451    '(?i)[[:upper:]]' => 'POSIXD[:cased:]',
452    '(?i)[[:^upper:]]' => 'NPOSIXD[:cased:]',
453    '(?i)[[:^upper:]\x{2C2}]' => 'NPOSIXU[:cased:]',
454    '(?i)(?l)[[:upper:]]' => 'POSIXL[:cased:]',
455    '(?i)(?l)[[:^upper:]]' => 'NPOSIXL[:cased:]',
456    '(?i)(?l)[[:^upper:]\x{2C2}]' => 'NPOSIXL[:cased:]',
457    '(?i)(?u)[[:upper:]]' => 'POSIXU[:cased:]',
458    '(?i)(?u)[[:^upper:]]' => 'NPOSIXU[:cased:]',
459    '(?i)(?a)[[:upper:]]' => 'POSIXA[:alpha:]',
460    '(?i)(?a)[[:^upper:]]' => 'NPOSIXA[:alpha:]',
461    '(?i)(?a)[[:^upper:]\x{2C2}]' => 'NPOSIXA[:alpha:]',
462    '(?i)[\d\w]' => 'POSIXD[\w]',
463    '(?i)[\D\w]' => 'SANY',
464    #'(?i)(?l)[\d\w]' => varies depending on Unicode release
465    '(?i)(?l)[\D\w]' => 'ANYOFPOSIXL{i}[\\w\\D][0100-INFTY]',
466    '(?i)(?u)[\d\w]' => 'POSIXU[\w]',
467    '(?i)(?u)[\D\w]' => 'SANY',
468    '(?i)(?a)[\d\w]' => 'POSIXA[\w]',
469    '(?i)(?a)[\D\w]' => 'SANY',
470    '(?l:[\x{212A}])' => 'EXACTL <\x{212a}>',
471    '(?l:[\s\x{212A}])' => 'ANYOFPOSIXL[\s][1680 2000-200A 2028-2029 202F 205F 212A 3000]',
472    '(?l:[^\S\x{202F}])' => 'ANYOFPOSIXL[^\\S][1680 2000-200A 2028-2029 205F 3000]',
473    '(?li:[a-z])' => (($::IS_ASCII)
474                     ? 'ANYOFL{i}[a-z{utf8 locale}\x{017F}\x{212A}]'
475                     : 'ANYOFL{i}[a-ij-rs-z{utf8 locale}\x{017F}\x{212A}]'),
476    '\p{All}' => 'SANY',
477    '\P{All}' => 'OPFAIL',
478    '[\p{Any}]' => 'ANYOF[\x00-\xFF][0100-10FFFF]',
479
480    '[\p{IsMyRuntimeProperty}]' => 'ANYOF[+main::IsMyRuntimeProperty]',
481    '[^\p{IsMyRuntimeProperty}]' => 'ANYOF[^{+main::IsMyRuntimeProperty}]',
482    '[a\p{IsMyRuntimeProperty}]' => 'ANYOF[a][+main::IsMyRuntimeProperty]',
483    '[^a\p{IsMyRuntimeProperty}]' => 'ANYOF[^a{+main::IsMyRuntimeProperty}]',
484    '[^a\x{100}\p{IsMyRuntimeProperty}]' => 'ANYOF[^a{+main::IsMyRuntimeProperty}0100]',
485    '[^\p{All}\p{IsMyRuntimeProperty}]' => 'OPFAIL',
486    '[\p{All}\p{IsMyRuntimeProperty}]' => 'SANY',
487
488    '[\x{00}-{HIGHEST_CP}]' => 'ANYOF[\x00-\xFF][0100-HIGHEST_CP]',
489    '[\x{00}-{INFTY}]' => 'SANY',
490    '[\x{101}-{INFTY}]' => 'ANYOFH[0101-INFTY]',
491    '[\x{101}-{HIGHEST_CP}]' => 'ANYOFH[0101-HIGHEST_CP]',
492    '[\x{102}\x{104}]' => 'ANYOFHb[0102 0104]',
493    '[\x{102}-\x{104}{HIGHEST_CP}]' => 'ANYOFH[0102-0104 HIGHEST_CP]',
494    '[\x{102}-\x{104}\x{101}]' => 'ANYOFRb[0101-0104]',
495    '[\x{102}-\x{104}\x{101}-{INFTY}]' => 'ANYOFH[0101-INFTY]',
496    '[\x{102}-\x{104}\x{101}-{HIGHEST_CP}]' => 'ANYOFH[0101-HIGHEST_CP]',
497    '[\x{102}-\x{104}\x{102}]' => 'ANYOFRb[0102-0104]',
498    '[\x{102}-\x{104}\x{102}-{INFTY}]' => 'ANYOFH[0102-INFTY]',
499    '[\x{102}-\x{104}\x{102}-{HIGHEST_CP}]' => 'ANYOFH[0102-HIGHEST_CP]',
500    '[\x{102}-\x{104}\x{103}]' => 'ANYOFRb[0102-0104]',
501    '[\x{102}-\x{104}\x{103}-{INFTY}]' => 'ANYOFH[0102-INFTY]',
502    '[\x{102}-\x{104}\x{103}-{HIGHEST_CP}]' => 'ANYOFH[0102-HIGHEST_CP]',
503    '[\x{102}-\x{104}\x{104}]' => 'ANYOFRb[0102-0104]',
504    '[\x{102}-\x{104}\x{104}-{INFTY}]' => 'ANYOFH[0102-INFTY]',
505    '[\x{102}-\x{104}\x{104}-{HIGHEST_CP}]' => 'ANYOFH[0102-HIGHEST_CP]',
506    '[\x{102}-\x{104}\x{105}]' => 'ANYOFRb[0102-0105]',
507    '[\x{102}-\x{104}\x{105}-{INFTY}]' => 'ANYOFH[0102-INFTY]',
508    '[\x{102}-\x{104}\x{105}-{HIGHEST_CP}]' => 'ANYOFH[0102-HIGHEST_CP]',
509    '[\x{102}-\x{104}\x{106}]' => 'ANYOFHb[0102-0104 0106]',
510    '[\x{102}-\x{104}\x{106}-{INFTY}]' => 'ANYOFH[0102-0104 0106-INFTY]',
511    '[\x{102}-\x{104}\x{106}-{HIGHEST_CP}]' => 'ANYOFH[0102-0104 0106-HIGHEST_CP]',
512    '[\x{102}-\x{104}\x{108}-\x{10A}{HIGHEST_CP}]' => 'ANYOFH[0102-0104 0108-010A HIGHEST_CP]',
513    '[\x{102}-\x{104}\x{108}-\x{10A}\x{101}]' => 'ANYOFHb[0101-0104 0108-010A]',
514    '[\x{102}-\x{104}\x{108}-\x{10A}\x{101}-{INFTY}]' => 'ANYOFH[0101-INFTY]',
515    '[\x{102}-\x{104}\x{108}-\x{10A}\x{101}-{HIGHEST_CP}]' => 'ANYOFH[0101-HIGHEST_CP]',
516    '[\x{102}-\x{104}\x{108}-\x{10A}\x{101}-\x{102}]' => 'ANYOFHb[0101-0104 0108-010A]',
517    '[\x{102}-\x{104}\x{108}-\x{10A}\x{101}-\x{103}]' => 'ANYOFHb[0101-0104 0108-010A]',
518    '[\x{102}-\x{104}\x{108}-\x{10A}\x{101}-\x{104}]' => 'ANYOFHb[0101-0104 0108-010A]',
519    '[\x{102}-\x{104}\x{108}-\x{10A}\x{101}-\x{105}]' => 'ANYOFHb[0101-0105 0108-010A]',
520    '[\x{102}-\x{104}\x{108}-\x{10A}\x{101}-\x{106}]' => 'ANYOFHb[0101-0106 0108-010A]',
521    '[\x{102}-\x{104}\x{108}-\x{10A}\x{101}-\x{107}]' => 'ANYOFRb[0101-010A]',
522    '[\x{102}-\x{104}\x{108}-\x{10A}\x{101}-\x{108}]' => 'ANYOFRb[0101-010A]',
523    '[\x{102}-\x{104}\x{108}-\x{10A}\x{101}-\x{109}]' => 'ANYOFRb[0101-010A]',
524    '[\x{102}-\x{104}\x{108}-\x{10A}\x{101}-\x{10A}]' => 'ANYOFRb[0101-010A]',
525    '[\x{102}-\x{104}\x{108}-\x{10A}\x{101}-\x{10B}]' => 'ANYOFRb[0101-010B]',
526    '[\x{102}-\x{104}\x{108}-\x{10A}\x{102}]' => 'ANYOFHb[0102-0104 0108-010A]',
527    '[\x{102}-\x{104}\x{108}-\x{10A}\x{102}-{INFTY}]' => 'ANYOFH[0102-INFTY]',
528    '[\x{102}-\x{104}\x{108}-\x{10A}\x{102}-{HIGHEST_CP}]' => 'ANYOFH[0102-HIGHEST_CP]',
529    '[\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{102}]' => 'ANYOFHb[0102-0104 0108-010A]',
530    '[\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{103}]' => 'ANYOFHb[0102-0104 0108-010A]',
531    '[\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{104}]' => 'ANYOFHb[0102-0104 0108-010A]',
532    '[\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{105}]' => 'ANYOFHb[0102-0105 0108-010A]',
533    '[\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{106}]' => 'ANYOFHb[0102-0106 0108-010A]',
534    '[\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{107}]' => 'ANYOFRb[0102-010A]',
535    '[\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{108}]' => 'ANYOFRb[0102-010A]',
536    '[\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{109}]' => 'ANYOFRb[0102-010A]',
537    '[\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{10A}]' => 'ANYOFRb[0102-010A]',
538    '[\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{10B}]' => 'ANYOFRb[0102-010B]',
539    '[\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{10C}]' => 'ANYOFRb[0102-010C]',
540    '[\x{102}-\x{104}\x{108}-\x{10A}\x{103}]' => 'ANYOFHb[0102-0104 0108-010A]',
541    '[\x{102}-\x{104}\x{108}-\x{10A}\x{103}-{INFTY}]' => 'ANYOFH[0102-INFTY]',
542    '[\x{102}-\x{104}\x{108}-\x{10A}\x{103}-{HIGHEST_CP}]' => 'ANYOFH[0102-HIGHEST_CP]',
543    '[\x{102}-\x{104}\x{108}-\x{10A}\x{103}-\x{104}]' => 'ANYOFHb[0102-0104 0108-010A]',
544    '[\x{102}-\x{104}\x{108}-\x{10A}\x{103}-\x{105}]' => 'ANYOFHb[0102-0105 0108-010A]',
545    '[\x{102}-\x{104}\x{108}-\x{10A}\x{103}-\x{106}]' => 'ANYOFHb[0102-0106 0108-010A]',
546    '[\x{102}-\x{104}\x{108}-\x{10A}\x{103}-\x{107}]' => 'ANYOFRb[0102-010A]',
547    '[\x{102}-\x{104}\x{108}-\x{10A}\x{103}-\x{108}]' => 'ANYOFRb[0102-010A]',
548    '[\x{102}-\x{104}\x{108}-\x{10A}\x{103}-\x{109}]' => 'ANYOFRb[0102-010A]',
549    '[\x{102}-\x{104}\x{108}-\x{10A}\x{103}-\x{10A}]' => 'ANYOFRb[0102-010A]',
550    '[\x{102}-\x{104}\x{108}-\x{10A}\x{103}-\x{10B}]' => 'ANYOFRb[0102-010B]',
551    '[\x{102}-\x{104}\x{108}-\x{10A}\x{103}-\x{10C}]' => 'ANYOFRb[0102-010C]',
552    '[\x{102}-\x{104}\x{108}-\x{10A}\x{104}]' => 'ANYOFHb[0102-0104 0108-010A]',
553    '[\x{102}-\x{104}\x{108}-\x{10A}\x{104}-{INFTY}]' => 'ANYOFH[0102-INFTY]',
554    '[\x{102}-\x{104}\x{108}-\x{10A}\x{104}-{HIGHEST_CP}]' => 'ANYOFH[0102-HIGHEST_CP]',
555    '[\x{102}-\x{104}\x{108}-\x{10A}\x{104}-\x{105}]' => 'ANYOFHb[0102-0105 0108-010A]',
556    '[\x{102}-\x{104}\x{108}-\x{10A}\x{104}-\x{106}]' => 'ANYOFHb[0102-0106 0108-010A]',
557    '[\x{102}-\x{104}\x{108}-\x{10A}\x{104}-\x{107}]' => 'ANYOFRb[0102-010A]',
558    '[\x{102}-\x{104}\x{108}-\x{10A}\x{104}-\x{108}]' => 'ANYOFRb[0102-010A]',
559    '[\x{102}-\x{104}\x{108}-\x{10A}\x{104}-\x{109}]' => 'ANYOFRb[0102-010A]',
560    '[\x{102}-\x{104}\x{108}-\x{10A}\x{104}-\x{10A}]' => 'ANYOFRb[0102-010A]',
561    '[\x{102}-\x{104}\x{108}-\x{10A}\x{104}-\x{10B}]' => 'ANYOFRb[0102-010B]',
562    '[\x{102}-\x{104}\x{108}-\x{10A}\x{104}-\x{10C}]' => 'ANYOFRb[0102-010C]',
563    '[\x{102}-\x{104}\x{108}-\x{10A}\x{105}]' => 'ANYOFHb[0102-0105 0108-010A]',
564    '[\x{102}-\x{104}\x{108}-\x{10A}\x{105}-{INFTY}]' => 'ANYOFH[0102-INFTY]',
565    '[\x{102}-\x{104}\x{108}-\x{10A}\x{105}-{HIGHEST_CP}]' => 'ANYOFH[0102-HIGHEST_CP]',
566    '[\x{102}-\x{104}\x{108}-\x{10A}\x{105}-\x{106}]' => 'ANYOFHb[0102-0106 0108-010A]',
567    '[\x{102}-\x{104}\x{108}-\x{10A}\x{105}-\x{107}]' => 'ANYOFRb[0102-010A]',
568    '[\x{102}-\x{104}\x{108}-\x{10A}\x{105}-\x{108}]' => 'ANYOFRb[0102-010A]',
569    '[\x{102}-\x{104}\x{108}-\x{10A}\x{105}-\x{109}]' => 'ANYOFRb[0102-010A]',
570    '[\x{102}-\x{104}\x{108}-\x{10A}\x{105}-\x{10A}]' => 'ANYOFRb[0102-010A]',
571    '[\x{102}-\x{104}\x{108}-\x{10A}\x{105}-\x{10B}]' => 'ANYOFRb[0102-010B]',
572    '[\x{102}-\x{104}\x{108}-\x{10A}\x{105}-\x{10C}]' => 'ANYOFRb[0102-010C]',
573    '[\x{102}-\x{104}\x{108}-\x{10A}\x{106}]' => 'ANYOFHb[0102-0104 0106 0108-010A]',
574    '[\x{102}-\x{104}\x{108}-\x{10A}\x{106}-{INFTY}]' => 'ANYOFH[0102-0104 0106-INFTY]',
575    '[\x{102}-\x{104}\x{108}-\x{10A}\x{106}-{HIGHEST_CP}]' => 'ANYOFH[0102-0104 0106-HIGHEST_CP]',
576    '[\x{102}-\x{104}\x{108}-\x{10A}\x{106}-\x{107}]' => 'ANYOFHb[0102-0104 0106-010A]',
577    '[\x{102}-\x{104}\x{108}-\x{10A}\x{106}-\x{108}]' => 'ANYOFHb[0102-0104 0106-010A]',
578    '[\x{102}-\x{104}\x{108}-\x{10A}\x{106}-\x{109}]' => 'ANYOFHb[0102-0104 0106-010A]',
579    '[\x{102}-\x{104}\x{108}-\x{10A}\x{106}-\x{10A}]' => 'ANYOFHb[0102-0104 0106-010A]',
580    '[\x{102}-\x{104}\x{108}-\x{10A}\x{106}-\x{10B}]' => 'ANYOFHb[0102-0104 0106-010B]',
581    '[\x{102}-\x{104}\x{108}-\x{10A}\x{106}-\x{10C}]' => 'ANYOFHb[0102-0104 0106-010C]',
582    '[\x{102}-\x{104}\x{108}-\x{10A}\x{107}]' => 'ANYOFHb[0102-0104 0107-010A]',
583    '[\x{102}-\x{104}\x{108}-\x{10A}\x{108}]' => 'ANYOFHb[0102-0104 0108-010A]',
584    '[\x{102}-\x{104}\x{108}-\x{10A}\x{109}]' => 'ANYOFHb[0102-0104 0108-010A]',
585    '[\x{102}-\x{104}\x{108}-\x{10A}\x{10A}]' => 'ANYOFHb[0102-0104 0108-010A]',
586    '[\x{102}-\x{104}\x{108}-\x{10A}\x{10B}]' => 'ANYOFHb[0102-0104 0108-010B]',
587    '[\x{103}\x{102}]' => 'EXACTFU_REQ8 <\x{103}>',
588    '[\x{104}\x{102}]' => 'ANYOFHb[0102 0104]',
589    '[\x{104}\x{102}\x{103}]' => 'ANYOFRb[0102-0104]',
590    '[\x{106}-{INFTY}\x{104}]' => 'ANYOFH[0104 0106-INFTY]',
591    '[\x{106}-{INFTY}\x{104}-{INFTY}]' => 'ANYOFH[0104-INFTY]',
592    '[\x{106}-{INFTY}\x{104}-{HIGHEST_CP}]' => 'ANYOFH[0104-INFTY]',
593    '[\x{106}-{INFTY}\x{104}-\x{105}]' => 'ANYOFH[0104-INFTY]',
594    '[\x{106}-{INFTY}\x{104}-\x{106}]' => 'ANYOFH[0104-INFTY]',
595    '[\x{106}-{INFTY}\x{104}-\x{107}]' => 'ANYOFH[0104-INFTY]',
596    '[\x{106}-{INFTY}\x{105}]' => 'ANYOFH[0105-INFTY]',
597    '[\x{106}-{INFTY}\x{105}-{INFTY}]' => 'ANYOFH[0105-INFTY]',
598    '[\x{106}-{INFTY}\x{105}-{HIGHEST_CP}]' => 'ANYOFH[0105-INFTY]',
599    '[\x{106}-{INFTY}\x{105}-\x{106}]' => 'ANYOFH[0105-INFTY]',
600    '[\x{106}-{INFTY}\x{105}-\x{107}]' => 'ANYOFH[0105-INFTY]',
601    '[\x{106}-{INFTY}\x{106}]' => 'ANYOFH[0106-INFTY]',
602    '[\x{106}-{INFTY}\x{106}-{INFTY}]' => 'ANYOFH[0106-INFTY]',
603    '[\x{106}-{INFTY}\x{106}-{HIGHEST_CP}]' => 'ANYOFH[0106-INFTY]',
604    '[\x{106}-{INFTY}\x{106}-\x{107}]' => 'ANYOFH[0106-INFTY]',
605    '[\x{106}-{INFTY}\x{107}]' => 'ANYOFH[0106-INFTY]',
606    '[\x{106}-{INFTY}\x{107}-{INFTY}]' => 'ANYOFH[0106-INFTY]',
607    '[\x{106}-{INFTY}\x{107}-{HIGHEST_CP}]' => 'ANYOFH[0106-INFTY]',
608    '[\x{106}-{INFTY}\x{107}-\x{107}]' => 'ANYOFH[0106-INFTY]',
609    '[\x{10C}-{INFTY}{HIGHEST_CP}]' => 'ANYOFH[010C-INFTY]',
610    '[\x{10C}-{INFTY}\x{00}-{HIGHEST_CP}]' => 'SANY',
611    '[\x{10C}-{INFTY}\x{00}-{INFTY}]' => 'SANY',
612    '[\x{10C}-{INFTY}\x{101}-{INFTY}]' => 'ANYOFH[0101-INFTY]',
613    '[\x{10C}-{INFTY}\x{101}-{HIGHEST_CP}]' => 'ANYOFH[0101-INFTY]',
614    '[\x{10C}-{INFTY}\x{102}\x{104}]' => 'ANYOFH[0102 0104 010C-INFTY]',
615    '[\x{10C}-{INFTY}\x{102}-\x{104}{HIGHEST_CP}]' => 'ANYOFH[0102-0104 010C-INFTY]',
616    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{100}]' => 'ANYOFH[0100 0102-0104 010C-INFTY]',
617    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{101}]' => 'ANYOFH[0101-0104 010C-INFTY]',
618    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{101}-{INFTY}]' => 'ANYOFH[0101-INFTY]',
619    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{101}-{HIGHEST_CP}]' => 'ANYOFH[0101-INFTY]',
620    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{102}]' => 'ANYOFH[0102-0104 010C-INFTY]',
621    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{102}-{INFTY}]' => 'ANYOFH[0102-INFTY]',
622    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{102}-{HIGHEST_CP}]' => 'ANYOFH[0102-INFTY]',
623    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{103}]' => 'ANYOFH[0102-0104 010C-INFTY]',
624    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{103}-{INFTY}]' => 'ANYOFH[0102-INFTY]',
625    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{103}-{HIGHEST_CP}]' => 'ANYOFH[0102-INFTY]',
626    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{104}]' => 'ANYOFH[0102-0104 010C-INFTY]',
627    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{104}-{INFTY}]' => 'ANYOFH[0102-INFTY]',
628    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{104}-{HIGHEST_CP}]' => 'ANYOFH[0102-INFTY]',
629    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{105}]' => 'ANYOFH[0102-0105 010C-INFTY]',
630    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{105}-{INFTY}]' => 'ANYOFH[0102-INFTY]',
631    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{105}-{HIGHEST_CP}]' => 'ANYOFH[0102-INFTY]',
632    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{106}]' => 'ANYOFH[0102-0104 0106 010C-INFTY]',
633    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{106}-{INFTY}]' => 'ANYOFH[0102-0104 0106-INFTY]',
634    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{106}-{HIGHEST_CP}]' => 'ANYOFH[0102-0104 0106-INFTY]',
635    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}{HIGHEST_CP}]' => 'ANYOFH[0102-0104 0108-010A 010C-INFTY]',
636    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{101}]' => 'ANYOFH[0101-0104 0108-010A 010C-INFTY]',
637    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{101}-{INFTY}]' => 'ANYOFH[0101-INFTY]',
638    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{101}-{HIGHEST_CP}]' => 'ANYOFH[0101-INFTY]',
639    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{101}-\x{102}]' => 'ANYOFH[0101-0104 0108-010A 010C-INFTY]',
640    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{101}-\x{103}]' => 'ANYOFH[0101-0104 0108-010A 010C-INFTY]',
641    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{101}-\x{104}]' => 'ANYOFH[0101-0104 0108-010A 010C-INFTY]',
642    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{101}-\x{105}]' => 'ANYOFH[0101-0105 0108-010A 010C-INFTY]',
643    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{101}-\x{106}]' => 'ANYOFH[0101-0106 0108-010A 010C-INFTY]',
644    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{101}-\x{107}]' => 'ANYOFH[0101-010A 010C-INFTY]',
645    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{101}-\x{108}]' => 'ANYOFH[0101-010A 010C-INFTY]',
646    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{101}-\x{109}]' => 'ANYOFH[0101-010A 010C-INFTY]',
647    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{101}-\x{10A}]' => 'ANYOFH[0101-010A 010C-INFTY]',
648    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{101}-\x{10B}]' => 'ANYOFH[0101-INFTY]',
649    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{102}]' => 'ANYOFH[0102-0104 0108-010A 010C-INFTY]',
650    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{102}-{INFTY}]' => 'ANYOFH[0102-INFTY]',
651    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{102}-{HIGHEST_CP}]' => 'ANYOFH[0102-INFTY]',
652    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{102}]' => 'ANYOFH[0102-0104 0108-010A 010C-INFTY]',
653    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{103}]' => 'ANYOFH[0102-0104 0108-010A 010C-INFTY]',
654    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{104}]' => 'ANYOFH[0102-0104 0108-010A 010C-INFTY]',
655    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{105}]' => 'ANYOFH[0102-0105 0108-010A 010C-INFTY]',
656    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{106}]' => 'ANYOFH[0102-0106 0108-010A 010C-INFTY]',
657    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{107}]' => 'ANYOFH[0102-010A 010C-INFTY]',
658    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{108}]' => 'ANYOFH[0102-010A 010C-INFTY]',
659    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{109}]' => 'ANYOFH[0102-010A 010C-INFTY]',
660    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{10A}]' => 'ANYOFH[0102-010A 010C-INFTY]',
661    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{10B}]' => 'ANYOFH[0102-INFTY]',
662    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{10C}]' => 'ANYOFH[0102-INFTY]',
663    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{103}]' => 'ANYOFH[0102-0104 0108-010A 010C-INFTY]',
664    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{103}-{INFTY}]' => 'ANYOFH[0102-INFTY]',
665    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{103}-{HIGHEST_CP}]' => 'ANYOFH[0102-INFTY]',
666    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{103}-\x{104}]' => 'ANYOFH[0102-0104 0108-010A 010C-INFTY]',
667    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{103}-\x{105}]' => 'ANYOFH[0102-0105 0108-010A 010C-INFTY]',
668    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{103}-\x{106}]' => 'ANYOFH[0102-0106 0108-010A 010C-INFTY]',
669    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{103}-\x{107}]' => 'ANYOFH[0102-010A 010C-INFTY]',
670    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{103}-\x{108}]' => 'ANYOFH[0102-010A 010C-INFTY]',
671    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{103}-\x{109}]' => 'ANYOFH[0102-010A 010C-INFTY]',
672    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{103}-\x{10A}]' => 'ANYOFH[0102-010A 010C-INFTY]',
673    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{103}-\x{10B}]' => 'ANYOFH[0102-INFTY]',
674    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{103}-\x{10C}]' => 'ANYOFH[0102-INFTY]',
675    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{104}]' => 'ANYOFH[0102-0104 0108-010A 010C-INFTY]',
676    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{104}-{INFTY}]' => 'ANYOFH[0102-INFTY]',
677    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{104}-{HIGHEST_CP}]' => 'ANYOFH[0102-INFTY]',
678    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{104}-\x{105}]' => 'ANYOFH[0102-0105 0108-010A 010C-INFTY]',
679    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{104}-\x{106}]' => 'ANYOFH[0102-0106 0108-010A 010C-INFTY]',
680    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{104}-\x{107}]' => 'ANYOFH[0102-010A 010C-INFTY]',
681    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{104}-\x{108}]' => 'ANYOFH[0102-010A 010C-INFTY]',
682    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{104}-\x{109}]' => 'ANYOFH[0102-010A 010C-INFTY]',
683    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{104}-\x{10A}]' => 'ANYOFH[0102-010A 010C-INFTY]',
684    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{104}-\x{10B}]' => 'ANYOFH[0102-INFTY]',
685    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{104}-\x{10C}]' => 'ANYOFH[0102-INFTY]',
686    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{105}]' => 'ANYOFH[0102-0105 0108-010A 010C-INFTY]',
687    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{105}-{INFTY}]' => 'ANYOFH[0102-INFTY]',
688    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{105}-{HIGHEST_CP}]' => 'ANYOFH[0102-INFTY]',
689    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{105}-\x{106}]' => 'ANYOFH[0102-0106 0108-010A 010C-INFTY]',
690    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{105}-\x{107}]' => 'ANYOFH[0102-010A 010C-INFTY]',
691    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{105}-\x{108}]' => 'ANYOFH[0102-010A 010C-INFTY]',
692    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{105}-\x{109}]' => 'ANYOFH[0102-010A 010C-INFTY]',
693    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{105}-\x{10A}]' => 'ANYOFH[0102-010A 010C-INFTY]',
694    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{105}-\x{10B}]' => 'ANYOFH[0102-INFTY]',
695    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{105}-\x{10C}]' => 'ANYOFH[0102-INFTY]',
696    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{106}]' => 'ANYOFH[0102-0104 0106 0108-010A 010C-INFTY]',
697    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{106}-{INFTY}]' => 'ANYOFH[0102-0104 0106-INFTY]',
698    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{106}-{HIGHEST_CP}]' => 'ANYOFH[0102-0104 0106-INFTY]',
699    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{106}-\x{107}]' => 'ANYOFH[0102-0104 0106-010A 010C-INFTY]',
700    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{106}-\x{108}]' => 'ANYOFH[0102-0104 0106-010A 010C-INFTY]',
701    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{106}-\x{109}]' => 'ANYOFH[0102-0104 0106-010A 010C-INFTY]',
702    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{106}-\x{10A}]' => 'ANYOFH[0102-0104 0106-010A 010C-INFTY]',
703    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{106}-\x{10B}]' => 'ANYOFH[0102-0104 0106-INFTY]',
704    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{106}-\x{10C}]' => 'ANYOFH[0102-0104 0106-INFTY]',
705    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{107}]' => 'ANYOFH[0102-0104 0107-010A 010C-INFTY]',
706    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{108}]' => 'ANYOFH[0102-0104 0108-010A 010C-INFTY]',
707    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{109}]' => 'ANYOFH[0102-0104 0108-010A 010C-INFTY]',
708    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{10A}]' => 'ANYOFH[0102-0104 0108-010A 010C-INFTY]',
709    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{10B}]' => 'ANYOFH[0102-0104 0108-INFTY]',
710    '[\x{10C}-{INFTY}\x{103}\x{102}]' => 'ANYOFH[0102-0103 010C-INFTY]',
711    '[\x{10C}-{INFTY}\x{104}\x{102}]' => 'ANYOFH[0102 0104 010C-INFTY]',
712    '[\x{10C}-{INFTY}\x{104}\x{102}\x{103}]' => 'ANYOFH[0102-0104 010C-INFTY]',
713    '[{HIGHEST_CP}]' => 'EXACT_REQ8 <\x{HIGHEST_CP}>',
714
715    '(?8)(?i)[\x{410}]' => 'EXACTFU_REQ8 <\x{430}>',
716    '(?8)(?i)[\x{399}]' => 'EXACTFU_REQ8 <\x{3b9}>',
717    '(?8)(?i)[\x{345}\x{399}\x{3B9}\x{1FBE}]' => 'EXACTFU_REQ8 <\x{3b9}>',
718    '(?i)[\x{2b9}]' => 'EXACT_REQ8 <\x{2b9}>',           # Doesn't participate in a fold
719    '(?8)(?i)[\x{2b9}]' => 'EXACT_REQ8 <\x{2b9}>',
720    '(?i)[\x{2bc}]' => 'EXACTFU_REQ8 <\x{2bc}>', # Part of a multi-char fold, ASCII component
721    '(?i)[\x{390}]' => 'EXACTFU_REQ8 <\x{3b9}\x{308}\x{301}>', # Part of a multi-char fold, no ASCII component
722
723    '(?i)[\x{1E9E}]' => 'EXACTFU <ss>',
724    '(?iaa)[\x{1E9E}]' => 'EXACTFAA <\x{17f}\x{17f}>',
725    '(?i)[\x{FB00}]' => 'EXACTFU <ff>',
726    '(?iaa)[\x{FB00}]' => 'EXACT_REQ8 <\x{fb00}>',
727    '(?i)[\x{FB00}]' => 'EXACTFU <ff>',
728    '(?i)[\x{FB01}]' => 'EXACTFU <fi>',
729    '(?i)[\x{FB02}]' => 'EXACTFU <fl>',
730    '(?i)[\x{FB03}]' => 'EXACTFU <ffi>',
731    '(?i)[\x{FB04}]' => 'EXACTFU <ffl>',
732    '(?i)[\x{FB05}]' => 'EXACTFU <st>',
733    '(?i)[\x{FB06}]' => 'EXACTFU <st>',
734
735    '[a][b]' => 'EXACT <ab>',
736    '[a]\x{100}' => 'EXACT_REQ8 <a\x{100}>',
737    '(?8)[\x{100}]a' => 'EXACT_REQ8 <\x{100}a>',
738    '(?i)[b][c]' => 'EXACTFU <bc>',
739    '(?i)[b]\x{100}' => 'EXACTFU_REQ8 <b\x{101}>',
740    '(?8)(?i)[\x{100}]b' => 'EXACTFU_REQ8 <\x{101}b>',
741    '(?i)b[s]' => 'EXACTFU <bs>',
742    '(?i)b[s]c' => 'EXACTFU <bsc>',
743    '(?i)bs[s]c' => 'EXACTF <bss>',  # The c goes into a 2nd node
744    '(?iu)bs[s]c' => 'EXACTFUP <bssc>',
745    '(?i)b[s]sc' => 'EXACTF <bssc>',
746    '(?iu)b[s]sc' => 'EXACTFUP <bssc>',
747    '(?i)[b]st' => 'EXACTFU <bst>',
748    '(?i)[b]st[s]' => 'EXACTFU <bsts>',
749    '(?i)[b]st[s]st' => 'EXACTF <bstsst>',
750    '(?iu)[b]st[s]st' => 'EXACTFUP <bstsst>',
751    '(?i)[s][s]' => 'EXACTF <ss>',
752    '(?iu)[s][s]' => 'EXACTFUP <ss>',
753);
754
# Characters for which single-element bracketed classes are generated and
# tested below.  The order of this list fixes the order of the generated
# tests.
my @single_chars_to_test = (

    # Controls and other characters that tend to need special handling
    "\x00",     # Always potentially problematic
    "\x01",     # A control without a name
    "\b",       # A control with a name
    "\n",       # Potentially special
    "\r",       # Potentially special
    "\cK",      # Potentially special

    # ASCII printables
    "0",        # A digit
    ":",        # Takes part in no fold
    "A",        # Capital that participates in a multi-char fold
    "a",        # Small letter that participates in a multi-char fold
    "B",        # Capital whose only fold is its case pair
    "b",        # Small letter whose only fold is its case pair
    "K",        # Capital that something above Latin1 folds to
    "k",        # Small letter that something above Latin1 folds to
    "\c?",      # Potentially special

    # Upper half of Latin1
    "\x80",     # Latin1 control
    "\xB5",     # Micro sign; its fold is above Latin1
    "\xC0",     # Capital whose only fold is its case pair
    "\xE0",     # Small letter whose only fold is its case pair
    "\xC5",     # Capital that something above Latin1 folds to
    "\xE5",     # Small letter that something above Latin1 folds to
    "\xDF",     # Small sharp S; folds to 'ss'
    "\xF7",     # Takes part in no fold
    "\xFF",     # Something above Latin1 folds to this

    # The first few characters above Latin1
    "\x{100}",
    "\x{101}",
    "\x{102}",
    "\x{103}",
    "\x{104}",
    "\x{105}",
    "\x{106}",
    "\x{107}",
    "\x{108}",

    "\x{2029}",
);
792
# Generate (pattern, expected display) pairs for each character in
# @single_chars_to_test.  Every character is placed alone in a bracketed
# class and tried under each combination of case folding ("" or "i"),
# charset modifier ("", "u", "l", "aa"), and forced UTF-8 upgrade ("" or
# "(?8)").  The pairs are pushed in the same two-elements-per-test layout
# that @tests uses.
my @single_tests;
for my $char (@single_chars_to_test) {
    my $cp = ord $char;
    my $hex = sprintf "%02x", $cp;

    for my $fold ("", "i") {
        #next unless $fold;              # (debugging aid)
        for my $charset ("", "u", "l", "aa") {
            #next if $charset eq "aa" && ! $fold;    # (debugging aid)

            my $modifiers = $fold . $charset;
            $modifiers = "(?$modifiers)" if $modifiers;

            for my $upgrade ("", "(?8)") {

                # The pattern under test: the character alone in a class.
                push @single_tests, "$upgrade$modifiers\[\\x{$hex}\]";

                if ($cp < 256 || $upgrade) {

                    # The expectation is whatever get_compiled() reports
                    # for the same character written without the brackets.
                    push @single_tests, get_compiled("$upgrade$modifiers\\x{$hex}");
                }
                else {
                    use feature 'fc';

                    # From here on $cp is always above 255 and the pattern
                    # has not been force-upgraded, so the expected node is
                    # worked out by hand.

                    # Collect the distinct code points the character maps
                    # to under folding and case changing.  Only the first
                    # character of each result is considered.
                    my %related_cps = ( $cp => 1 );
                    if ($fold) {
                        for my $variant (fc($char), lc($char), uc($char)) {
                            $related_cps{ ord($variant) } = 1;
                        }
                    }

                    my $mod_cp = $cp;
                    my $op;

                    if (! $fold || keys(%related_cps) == 1) {

                        # Not folding, or the character has no other case
                        # form: a plain exact-match node is expected.
                        $op = ($charset eq 'l') ? 'EXACTL' : 'EXACT_REQ8';
                    }
                    else {

                        # A folding node is expected, displayed with the
                        # folded form of the character.
                        $op = ($charset eq 'aa') ? 'EXACTFAA'
                            : ($charset eq 'l')  ? 'EXACTFLU8'
                            :                      'EXACTFU_REQ8';
                        $mod_cp = ord fc $char;
                    }

                    # EXACT-type nodes are displayed with lowercase hex
                    # digits (compare '<\x{3b9}>' and '<\x{fb00}>' in
                    # @tests), hence %x rather than %X.
                    push @single_tests, sprintf "%s <\\x{%x}>", $op, $mod_cp;
                }
            }
        }
    }
}
865
# The generated single-character tests run ahead of the hand-written ones.
unshift @tests, @single_tests;

# @tests holds two elements per test (pattern, expected display) plus the
# single EBCDIC marker element, which is not itself a test.
plan((scalar(@tests) - 1) / 2);  # -1 because of the marker.

# Everything ahead of the marker is skipped on EBCDIC platforms; the marker
# turns skipping off for the remainder of the list.
my $skip_ebcdic = $::IS_EBCDIC;
while (defined (my $test = shift @tests)) {

    if ($test eq 'ebcdic_ok_below_this_marker') {
        $skip_ebcdic = 0;
        next;
    }

    my $expected = shift @tests;

    SKIP: {
        skip("test not ported to EBCDIC", 1) if $skip_ebcdic;

        # For the test name only, show the platform's actual highest code
        # point in place of the HIGHEST_CP placeholder.  The comparison
        # below deliberately keeps using the unsubstituted $expected.
        my $display_expected = $expected
                                        =~ s/ HIGHEST_CP /$highest_cp_string/xgr;
        my $test_name = "Verify compilation of $test displays as"
                      . " $display_expected";

        my $result = get_compiled($test);
        if ($expected =~ / ^ ANYOF[HR] /x) {

            # These node types may be displayed with a trailing note about
            # the first UTF-8 byte; accept the result with or without it.
            like($result, qr/ ^ \Q$expected\E (?:\Q (First UTF-8 byte=\x\E
                              [[:xdigit:]]{2} )? /x, $test_name);
        }
        else {
            is($result, $expected, $test_name);
        }
    }
}
898