xref: /openbsd-src/gnu/usr.bin/perl/t/re/anyof.t (revision 5486feefcc8cb79b19e014ab332cc5dfd05b3b33)
1#!./perl
2
3use strict;
4use warnings;
5use utf8;
6
7# This tests that the ANYOF nodes generated by bracketed character classes are
8# as expected.  The representation of these is not guaranteed, and this test
9# may need to be updated if it changes.  But it is here to make sure that no
10# unexpected changes occur.  These could come from faulty generation of the
11# node, or faulty display of them (or both).  Because these causes come from
12# very different parts of the regex compiler, it is unlikely that a commit
13# would change both of them, so this test will adequately serve to test both.
14
# Compile-time bootstrap for this test: move into the 't' directory when it
# exists, load the shared test helpers, set up @INC through them, import
# Config, and skip the whole file when DynaLoader's boot routine is not
# defined (the re module cannot be loaded then).
BEGIN {
    if (-d 't') {
        chdir 't';
    }

    require './test.pl';
    set_up_inc('../lib', '.', '../ext/re');

    require Config;
    Config->import;

    unless (defined &DynaLoader::boot_DynaLoader) {
        skip_all('no re module');
    }
}
22
23# An array is used instead of a hash, so that the tests are carried out in the
24# order given by this file.  Even-numbered indices are the regexes to compile.
25# The next higher element is the expected compilation result.
26#
27# It is painful to port some of these to EBCDIC, as not only do the code point
28# numbers change (for those < 256), but the order changes, as the compiled
29# version is sorted by native code point order.  On EBCDIC, \r comes before
30# \n, and 'k' before 'K', for example.  So, the tests where there are
31# differences are skipped on EBCDIC.  They are all at the beginning of the
32# array, and a special marker entry is used to delimit the boundary between
33# skipped and not skipped.
34#
35# NOTE:  If the pattern contains (?8) it will be upgraded to UTF-8 after
36#        stripping that
37
38use Unicode::UCD;
# The highest code point as reported by Unicode::UCD, plus its upper-case hex
# spelling, which is what gets substituted for {HIGHEST_CP} in the tests.
my $highest_cp = $Unicode::UCD::MAX_CP;
my $highest_cp_string = sprintf("%X", $highest_cp);

# Make infinity larger than the largest legal one by turning a leading '7'
# into 'F'.  At the time of this writing, we really internally allow UV_MAX
# to be infinity.
(my $infinity = $highest_cp_string) =~ s/^7/F/;
47
# get_compiled($pattern)
#
# Compiles $pattern under 'use re qw(Debug COMPILE)' via fresh_perl() and
# returns the line that follows "Final program" in the debug output, with the
# node number and node branch stripped and the platform-specific hex values
# replaced by the platform-independent names INFTY and HIGHEST_CP.
#
# In $pattern, '{INFTY}' and '{HIGHEST_CP}' are expanded to \x{...} escapes
# for this platform, and a '(?8)' marker is stripped and causes the pattern
# to be utf8::upgrade()d before compilation.
#
# Returns nothing (after recording a test failure) if $? is non-zero after
# the fresh_perl() call; dies if no line follows "Final program".
#
# The caller's $_ is left untouched: all work is done on a lexical.
sub  get_compiled ($) {
    my $pattern = shift;

    # Convert platform-independent values to what is suitable for the
    # platform
    $pattern =~ s/\{INFTY\}/\\x{$infinity}/g;
    $pattern =~ s/\{HIGHEST_CP\}/\\x{$highest_cp_string}/g;
    my $use_utf8 = ($pattern =~ s/\Q(?8)\E//);

    # Build the program text: assign the pattern to a variable, optionally
    # upgrade it, then compile it with qr//.
    $pattern = "my \$a = '$pattern';";
    $pattern .= "utf8::upgrade(\$a);" if $use_utf8;
    $pattern .= "qr/\$a/";
    my $actual_pattern = "use re qw(Debug COMPILE); $pattern";

    my $result = fresh_perl($actual_pattern);
    if ($? != 0) {  # Re-run so as to display STDERR.
        fail($pattern, "Until this is fixed, the planned number of tests will be wrong");
        fresh_perl($actual_pattern, { stderr => 0, verbose => 1 });
        return;
    }

    # The Debug output will come back as a bunch of lines.  We are
    # interested only in the line after the first /Final program/
    my @lines = split /\n/, $result;
    my $node;
    while (defined (my $line = shift @lines)) {
        next unless $line =~ /Final program/;
        $node = shift @lines;
        last;
    }

    unless (defined $node) {
        die "Unexpected compilation result: '$result'\n"
          . " Compiled from '$actual_pattern'";
    }

    $node =~ s/ \s* \( \d+ \) \s* //x;   # Get rid of the node branch
    $node =~ s/ ^ \s* \d+ : \s* //x;     # ... And the node number

    # Use platform-independent values.  The interpolated strings are quoted
    # so they can only ever match literally.
    $node =~ s/\Q$infinity\E/INFTY/ig;
    $node =~ s/\Q$highest_cp_string\E/HIGHEST_CP/ig;

    return $node;
}
92
93# Note: EXACTish lowercases the hex; ANYOF uppercases, without braces
94
95my @tests = (
96    '[\xe0\xc0]' => 'EXACTFU <\\x{e0}>',
97    '[\xe1\xc1]' => 'EXACTFU <\\x{e1}>',
98    '[\xe2\xc2]' => 'EXACTFU <\\x{e2}>',
99    '[\xe3\xc3]' => 'EXACTFU <\\x{e3}>',
100    '[\xe4\xc4]' => 'EXACTFU <\\x{e4}>',
101    '[\xc5\xe5]' => 'ANYOF[\\xC5\\xE5]',
102    '[\xe6\xc6]' => 'EXACTFU <\\x{e6}>',
103    '[\xe7\xc7]' => 'EXACTFU <\\x{e7}>',
104    '[\xe8\xc8]' => 'EXACTFU <\\x{e8}>',
105    '[\xe9\xc9]' => 'EXACTFU <\\x{e9}>',
106    '[\xea\xca]' => 'EXACTFU <\\x{ea}>',
107    '[\xeb\xcb]' => 'EXACTFU <\\x{eb}>',
108    '[\xec\xcc]' => 'EXACTFU <\\x{ec}>',
109    '[\xee\xce]' => 'EXACTFU <\\x{ee}>',
110    '[\xef\xcf]' => 'EXACTFU <\\x{ef}>',
111    '[\xf0\xd0]' => 'EXACTFU <\\x{f0}>',
112    '[\xf1\xd1]' => 'EXACTFU <\\x{f1}>',
113    '[\xf2\xd2]' => 'EXACTFU <\\x{f2}>',
114    '[\xf3\xd3]' => 'EXACTFU <\\x{f3}>',
115    '[\xf4\xd4]' => 'EXACTFU <\\x{f4}>',
116    '[\xf5\xd5]' => 'EXACTFU <\\x{f5}>',
117    '[\xf6\xd6]' => 'EXACTFU <\\x{f6}>',
118    '[\xf8\xd8]' => 'EXACTFU <\\x{f8}>',
119    '[\xf9\xd9]' => 'EXACTFU <\\x{f9}>',
120    '[\xfa\xda]' => 'EXACTFU <\\x{fa}>',
121    '[\xfb\xdb]' => 'EXACTFU <\\x{fb}>',
122    '[\xfc\xdc]' => 'EXACTFU <\\x{fc}>',
123    '[\xfd\xdd]' => 'EXACTFU <\\x{fd}>',
124    '[\xfe\xde]' => 'EXACTFU <\\x{fe}>',
125
126    '[[{]' => 'ANYOFM[\[\{]',
127    '[^\S ]' => 'ANYOFD[\t\n\x0B\f\r{utf8}\x85\xA0][1680 2000-200A 2028-2029 202F 205F 3000]',
128    '[^\n\r]' => 'ANYOF[^\n\r][0100-INFTY]',
129    '[^\/\|,\$\%%\@\ \%"\<\>\:\#\&\*\{\}\[\]\(\)]' => 'ANYOF[^ "#$%&()*,/:<>@\[\]\{|\}][0100-INFTY]',
130    '[[:ascii:]]' => 'ANYOFM[\x00-\x7F]',
131    '[[:^ascii:]]' => 'NANYOFM[\x00-\x7F]',
132    '[[:^ascii:]\x{2C2}]' => 'NANYOFM[\x00-\x7F]',
133    '(?u)[[:ascii:]]' => 'ANYOFM[\x00-\x7F]',
134    '(?u)[[:^ascii:]]' => 'NANYOFM[\x00-\x7F]',
135    '(?a)[[:ascii:]]' => 'ANYOFM[\x00-\x7F]',
136    '(?a)[[:^ascii:]]' => 'NANYOFM[\x00-\x7F]',
137    '(?a)[[:^ascii:]\x{2C2}]' => 'NANYOFM[\x00-\x7F]',
138    '[[:cntrl:]]' => 'POSIXD[:cntrl:]',
139    '[^[:^print:][:^ascii:]]' => 'POSIXA[:print:]',
140    '[^[:^print:][:^ascii:]b]' => 'ANYOF[^\x00-\x1Fb\x7F-\xFF][0100-INFTY]',
141    '[^[:^print:][:^ascii:]b\p{Is_unresolved}]' => 'ANYOF[^\x00-\x1Fb\x7F-\xFF{+main::Is_unresolved}0100-INFTY]',
142    '[[:blank:]]' => 'POSIXD[:blank:]',
143    '[ [:blank:]]' => 'POSIXD[:blank:]',
144    '[_[:blank:]]' => 'ANYOFD[\t _{utf8}\xA0][1680 2000-200A 202F 205F 3000]',
145    '[_[:^blank:]]' => 'NPOSIXD[:blank:]',
146    '[\xA0[:^blank:]]' => 'ANYOF[^\t ][0100-167F 1681-1FFF 200B-202E 2030-205E 2060-2FFF 3001-INFTY]',
147    '(?d:[_[:^blank:]])' => 'NPOSIXD[:blank:]',
148    '[\x{07}-\x{0B}]' => 'ANYOFR[\a\b\t\n\x0B]',
149    '(?l)[\x{2029}]' => 'EXACTL <\x{2029}>',
150    '(?l)(?[\x{2029}])' => 'ANYOFL{utf8-locale-reqd}[2029]', # regex sets requires utf8 locale for /l
151    '(?il)[\x{212A}]' => 'EXACTFL <\\x{212a}>',
152    '(?il)(?[\x{212A}])' => 'ANYOFL{utf8-locale-reqd}[Kk][212A]',
153
154    '(?i)b[s]\xe0' => 'ANYOFM[Bb]',    # The s goes into a 2nd node
155
156    '[aA]' => 'ANYOFM[Aa]',
157    '[bB]' => 'ANYOFM[Bb]',
158    '[kK]' => 'ANYOFM[Kk]',
159
160    'ebcdic_ok_below_this_marker',
161
162    '(?i:[^:])' => 'NANYOFM[:]',
163
164    '[^\n]' => 'REG_ANY',
165
166    '[[:alpha:]]' => 'POSIXD[:alpha:]',
167    '[[:^alpha:]]' => 'NPOSIXD[:alpha:]',
168    '[[:^alpha:]\x{2C2}]' => 'NPOSIXU[:alpha:]',
169    '(?l)[[:alpha:]]' => 'POSIXL[:alpha:]',
170    '(?l)[[:^alpha:]]' => 'NPOSIXL[:alpha:]',
171    '(?l)[[:^alpha:]\x{2C2}]' => 'NPOSIXL[:alpha:]',
172    '(?u)[[:alpha:]]' => 'POSIXU[:alpha:]',
173    '(?u)[[:^alpha:]]' => 'NPOSIXU[:alpha:]',
174    '(?a)[[:alpha:]]' => 'POSIXA[:alpha:]',
175    '(?a)[[:^alpha:]]' => 'NPOSIXA[:alpha:]',
176    '(?a)[[:^alpha:]\x{2C2}]' => 'NPOSIXA[:alpha:]',
177    '[[:alpha:][:^alpha:]]' => 'SANY',
178    '[^[:alpha:][:^alpha:]]' => 'OPFAIL',
179    '(?l)[[:alpha:][:^alpha:]]' => 'SANY',
180    '(?l)[^[:alpha:][:^alpha:]]' => 'OPFAIL',
181    '(?u)[[:alpha:][:^alpha:]]' => 'SANY',
182    '(?u)[^[:alpha:][:^alpha:]]' => 'OPFAIL',
183    '(?a)[[:alpha:][:^alpha:]]' => 'SANY',
184    '(?a)[^[:alpha:][:^alpha:]]' => 'OPFAIL',
185    '[[:alnum:]]' => 'POSIXD[:alnum:]',
186    '[[:^alnum:]]' => 'NPOSIXD[:alnum:]',
187    '[[:^alnum:]\x{2C2}]' => 'NPOSIXU[:alnum:]',
188    '(?l)[[:alnum:]]' => 'POSIXL[:alnum:]',
189    '(?l)[[:^alnum:]]' => 'NPOSIXL[:alnum:]',
190    '(?l)[[:^alnum:]\x{2C2}]' => 'NPOSIXL[:alnum:]',
191    '(?u)[[:alnum:]]' => 'POSIXU[:alnum:]',
192    '(?u)[[:^alnum:]]' => 'NPOSIXU[:alnum:]',
193    '(?a)[[:alnum:]]' => 'POSIXA[:alnum:]',
194    '(?a)[[:^alnum:]]' => 'NPOSIXA[:alnum:]',
195    '(?a)[[:^alnum:]\x{2C2}]' => 'NPOSIXA[:alnum:]',
196    '[[:alnum:][:^alnum:]]' => 'SANY',
197    '[^[:alnum:][:^alnum:]]' => 'OPFAIL',
198    '(?l)[[:alnum:][:^alnum:]]' => 'SANY',
199    '(?l)[^[:alnum:][:^alnum:]]' => 'OPFAIL',
200    '(?u)[[:alnum:][:^alnum:]]' => 'SANY',
201    '(?u)[^[:alnum:][:^alnum:]]' => 'OPFAIL',
202    '(?a)[[:alnum:][:^alnum:]]' => 'SANY',
203    '(?a)[^[:alnum:][:^alnum:]]' => 'OPFAIL',
204    '(?l)[[:ascii:]]' => 'POSIXL[:ascii:]',
205    '(?l)[[:^ascii:]]' => 'NPOSIXL[:ascii:]',
206    '(?l)[[:^ascii:]\x{2C2}]' => 'NPOSIXL[:ascii:]',
207    '[[:ascii:][:^ascii:]]' => 'SANY',
208    '[^[:ascii:][:^ascii:]]' => 'OPFAIL',
209    '(?l)[[:ascii:][:^ascii:]]' => 'SANY',
210    '(?l)[^[:ascii:][:^ascii:]]' => 'OPFAIL',
211    '(?u)[[:ascii:][:^ascii:]]' => 'SANY',
212    '(?u)[^[:ascii:][:^ascii:]]' => 'OPFAIL',
213    '(?a)[[:ascii:][:^ascii:]]' => 'SANY',
214    '(?a)[^[:ascii:][:^ascii:]]' => 'OPFAIL',
215    '[[:^blank:]]' => 'NPOSIXD[:blank:]',
216    '[[:^blank:]\x{2C2}]' => 'NPOSIXU[:blank:]',
217    '(?l)[[:blank:]]' => 'POSIXL[:blank:]',
218    '(?l)[[:^blank:]]' => 'NPOSIXL[:blank:]',
219    '(?l)[[:^blank:]\x{2C2}]' => 'NPOSIXL[:blank:]',
220    '(?u)[[:blank:]]' => 'POSIXU[:blank:]',
221    '(?u)[[:^blank:]]' => 'NPOSIXU[:blank:]',
222    '(?a)[[:blank:]]' => 'POSIXA[:blank:]',
223    '(?a)[[:^blank:]]' => 'NPOSIXA[:blank:]',
224    '(?a)[[:^blank:]\x{2C2}]' => 'NPOSIXA[:blank:]',
225    '[[:blank:]]' => 'POSIXD[:blank:]',
226    '[[:blank:][:^blank:]]' => 'SANY',
227    '[^[:blank:][:^blank:]]' => 'OPFAIL',
228    '(?l)[[:blank:][:^blank:]]' => 'SANY',
229    '(?l)[^[:blank:][:^blank:]]' => 'OPFAIL',
230    '(?u)[[:blank:][:^blank:]]' => 'SANY',
231    '(?u)[^[:blank:][:^blank:]]' => 'OPFAIL',
232    '(?a)[[:blank:][:^blank:]]' => 'SANY',
233    '(?a)[^[:blank:][:^blank:]]' => 'OPFAIL',
234    '[[:^cntrl:]]' => 'NPOSIXD[:cntrl:]',
235    '[[:^cntrl:]\x{2C2}]' => 'NPOSIXU[:cntrl:]',
236    '(?l)[[:cntrl:]]' => 'POSIXL[:cntrl:]',
237    '(?l)[[:^cntrl:]]' => 'NPOSIXL[:cntrl:]',
238    '(?l)[[:^cntrl:]\x{2C2}]' => 'NPOSIXL[:cntrl:]',
239    '(?u)[[:cntrl:]]' => 'POSIXU[:cntrl:]',
240    '(?u)[[:^cntrl:]]' => 'NPOSIXU[:cntrl:]',
241    '(?a)[[:cntrl:]]' => 'POSIXA[:cntrl:]',
242    '(?a)[[:^cntrl:]]' => 'NPOSIXA[:cntrl:]',
243    '(?a)[[:^cntrl:]\x{2C2}]' => 'NPOSIXA[:cntrl:]',
244    '[[:cntrl:][:^cntrl:]]' => 'SANY',
245    '[^[:cntrl:][:^cntrl:]]' => 'OPFAIL',
246    '(?l)[[:cntrl:][:^cntrl:]]' => 'SANY',
247    '(?l)[^[:cntrl:][:^cntrl:]]' => 'OPFAIL',
248    '(?u)[[:cntrl:][:^cntrl:]]' => 'SANY',
249    '(?u)[^[:cntrl:][:^cntrl:]]' => 'OPFAIL',
250    '(?a)[[:cntrl:][:^cntrl:]]' => 'SANY',
251    '(?a)[^[:cntrl:][:^cntrl:]]' => 'OPFAIL',
252    '[[:digit:]]' => 'POSIXU[\d]',
253    '[[:^digit:]]' => 'NPOSIXU[\d]',
254    '[[:^digit:]\x{2C2}]' => 'NPOSIXU[\d]',
255    '(?l)[[:digit:]]' => 'POSIXL[\d]',
256    '(?l)[[:^digit:]]' => 'NPOSIXL[\d]',
257    '(?l)[[:^digit:]\x{2C2}]' => 'NPOSIXL[\d]',
258    '(?u)[[:digit:]]' => 'POSIXU[\d]',
259    '(?u)[[:^digit:]]' => 'NPOSIXU[\d]',
260    '(?a)[[:digit:]]' => 'POSIXA[\d]',
261    '(?a)[[:^digit:]]' => 'NPOSIXA[\d]',
262    '(?a)[[:^digit:]\x{2C2}]' => 'NPOSIXA[\d]',
263    '[[:digit:][:^digit:]]' => 'SANY',
264    '[^[:digit:][:^digit:]]' => 'OPFAIL',
265    '(?l)[[:digit:][:^digit:]]' => 'SANY',
266    '(?l)[^[:digit:][:^digit:]]' => 'OPFAIL',
267    '(?u)[[:digit:][:^digit:]]' => 'SANY',
268    '(?u)[^[:digit:][:^digit:]]' => 'OPFAIL',
269    '(?a)[[:digit:][:^digit:]]' => 'SANY',
270    '(?a)[^[:digit:][:^digit:]]' => 'OPFAIL',
271    '[[:graph:]]' => 'POSIXD[:graph:]',
272    '[[:^graph:]]' => 'NPOSIXD[:graph:]',
273    '[[:^graph:]\x{FFFF}]' => 'NPOSIXU[:graph:]',
274    '(?l)[[:graph:]]' => 'POSIXL[:graph:]',
275    '(?l)[[:^graph:]]' => 'NPOSIXL[:graph:]',
276    '(?l)[[:^graph:]\x{FFFF}]' => 'NPOSIXL[:graph:]',
277    '(?u)[[:graph:]]' => 'POSIXU[:graph:]',
278    '(?u)[[:^graph:]]' => 'NPOSIXU[:graph:]',
279    '(?a)[[:graph:]]' => 'POSIXA[:graph:]',
280    '(?a)[[:^graph:]]' => 'NPOSIXA[:graph:]',
281    '(?a)[[:^graph:]\x{FFFF}]' => 'NPOSIXA[:graph:]',
282    '[[:graph:][:^graph:]]' => 'SANY',
283    '[^[:graph:][:^graph:]]' => 'OPFAIL',
284    '(?l)[[:graph:][:^graph:]]' => 'SANY',
285    '(?l)[^[:graph:][:^graph:]]' => 'OPFAIL',
286    '(?u)[[:graph:][:^graph:]]' => 'SANY',
287    '(?u)[^[:graph:][:^graph:]]' => 'OPFAIL',
288    '(?a)[[:graph:][:^graph:]]' => 'SANY',
289    '(?a)[^[:graph:][:^graph:]]' => 'OPFAIL',
290    '[[:lower:]]' => 'POSIXD[:lower:]',
291    '[[:^lower:]]' => 'NPOSIXD[:lower:]',
292    '[[:^lower:]\x{2C2}]' => 'NPOSIXU[:lower:]',
293    '(?l)[[:lower:]]' => 'POSIXL[:lower:]',
294    '(?l)[[:^lower:]]' => 'NPOSIXL[:lower:]',
295    '(?l)[[:^lower:]\x{2C2}]' => 'NPOSIXL[:lower:]',
296    '(?u)[[:lower:]]' => 'POSIXU[:lower:]',
297    '(?u)[[:^lower:]]' => 'NPOSIXU[:lower:]',
298    '(?a)[[:lower:]]' => 'POSIXA[:lower:]',
299    '(?a)[[:^lower:]]' => 'NPOSIXA[:lower:]',
300    '(?a)[[:^lower:]\x{2C2}]' => 'NPOSIXA[:lower:]',
301    '[[:lower:][:^lower:]]' => 'SANY',
302    '[^[:lower:][:^lower:]]' => 'OPFAIL',
303    '(?l)[[:lower:][:^lower:]]' => 'SANY',
304    '(?l)[^[:lower:][:^lower:]]' => 'OPFAIL',
305    '(?u)[[:lower:][:^lower:]]' => 'SANY',
306    '(?u)[^[:lower:][:^lower:]]' => 'OPFAIL',
307    '(?a)[[:lower:][:^lower:]]' => 'SANY',
308    '(?a)[^[:lower:][:^lower:]]' => 'OPFAIL',
309    '[[:print:]]' => 'POSIXD[:print:]',
310    '[[:^print:]]' => 'NPOSIXD[:print:]',
311    '[[:^print:]\x{FFFF}]' => 'NPOSIXU[:print:]',
312    '(?l)[[:print:]]' => 'POSIXL[:print:]',
313    '(?l)[[:^print:]]' => 'NPOSIXL[:print:]',
314    '(?l)[[:^print:]\x{FFFF}]' => 'NPOSIXL[:print:]',
315    '(?u)[[:print:]]' => 'POSIXU[:print:]',
316    '(?u)[[:^print:]]' => 'NPOSIXU[:print:]',
317    '(?a)[[:print:]]' => 'POSIXA[:print:]',
318    '(?a)[[:^print:]]' => 'NPOSIXA[:print:]',
319    '(?a)[[:^print:]\x{FFFF}]' => 'NPOSIXA[:print:]',
320    '[[:print:][:^print:]]' => 'SANY',
321    '[^[:print:][:^print:]]' => 'OPFAIL',
322    '(?l)[[:print:][:^print:]]' => 'SANY',
323    '(?l)[^[:print:][:^print:]]' => 'OPFAIL',
324    '(?u)[[:print:][:^print:]]' => 'SANY',
325    '(?u)[^[:print:][:^print:]]' => 'OPFAIL',
326    '(?a)[[:print:][:^print:]]' => 'SANY',
327    '(?a)[^[:print:][:^print:]]' => 'OPFAIL',
328    '[[:punct:]]' => 'POSIXD[:punct:]',
329    '[[:^punct:]]' => 'NPOSIXD[:punct:]',
330    '[[:^punct:]\x{2C2}]' => 'NPOSIXU[:punct:]',
331    '(?l)[[:punct:]]' => 'POSIXL[:punct:]',
332    '(?l)[[:^punct:]]' => 'NPOSIXL[:punct:]',
333    '(?l)[[:^punct:]\x{2C2}]' => 'NPOSIXL[:punct:]',
334    '(?u)[[:punct:]]' => 'POSIXU[:punct:]',
335    '(?u)[[:^punct:]]' => 'NPOSIXU[:punct:]',
336    '(?a)[[:punct:]]' => 'POSIXA[:punct:]',
337    '(?a)[[:^punct:]]' => 'NPOSIXA[:punct:]',
338    '(?a)[[:^punct:]\x{2C2}]' => 'NPOSIXA[:punct:]',
339    '[[:punct:][:^punct:]]' => 'SANY',
340    '[^[:punct:][:^punct:]]' => 'OPFAIL',
341    '(?l)[[:punct:][:^punct:]]' => 'SANY',
342    '(?l)[^[:punct:][:^punct:]]' => 'OPFAIL',
343    '(?u)[[:punct:][:^punct:]]' => 'SANY',
344    '(?u)[^[:punct:][:^punct:]]' => 'OPFAIL',
345    '(?a)[[:punct:][:^punct:]]' => 'SANY',
346    '(?a)[^[:punct:][:^punct:]]' => 'OPFAIL',
347    '[[:space:]]' => 'POSIXD[\s]',
348    '[[:^space:]]' => 'NPOSIXD[\s]',
349    '[[:^space:]\x{2C2}]' => 'NPOSIXU[\s]',
350    '(?l)[[:space:]]' => 'POSIXL[\s]',
351    '(?l)[[:^space:]]' => 'NPOSIXL[\s]',
352    '(?l)[[:^space:]\x{2C2}]' => 'NPOSIXL[\s]',
353    '(?u)[[:space:]]' => 'POSIXU[\s]',
354    '(?u)[[:^space:]]' => 'NPOSIXU[\s]',
355    '(?a)[[:space:]]' => 'POSIXA[\s]',
356    '(?a)[[:^space:]]' => 'NPOSIXA[\s]',
357    '(?a)[[:^space:]\x{2C2}]' => 'NPOSIXA[\s]',
358    '[[:space:][:^space:]]' => 'SANY',
359    '[^[:space:][:^space:]]' => 'OPFAIL',
360    '(?l)[[:space:][:^space:]]' => 'SANY',
361    '(?l)[^[:space:][:^space:]]' => 'OPFAIL',
362    '(?u)[[:space:][:^space:]]' => 'SANY',
363    '(?u)[^[:space:][:^space:]]' => 'OPFAIL',
364    '(?a)[[:space:][:^space:]]' => 'SANY',
365    '(?a)[^[:space:][:^space:]]' => 'OPFAIL',
366    '[[:upper:]]' => 'POSIXD[:upper:]',
367    '[[:^upper:]]' => 'NPOSIXD[:upper:]',
368    '[[:^upper:]\x{2C2}]' => 'NPOSIXU[:upper:]',
369    '(?l)[[:upper:]]' => 'POSIXL[:upper:]',
370    '(?l)[[:^upper:]]' => 'NPOSIXL[:upper:]',
371    '(?l)[[:^upper:]\x{2C2}]' => 'NPOSIXL[:upper:]',
372    '(?u)[[:upper:]]' => 'POSIXU[:upper:]',
373    '(?u)[[:^upper:]]' => 'NPOSIXU[:upper:]',
374    '(?a)[[:upper:]]' => 'POSIXA[:upper:]',
375    '(?a)[[:^upper:]]' => 'NPOSIXA[:upper:]',
376    '(?a)[[:^upper:]\x{2C2}]' => 'NPOSIXA[:upper:]',
377    '[[:upper:][:^upper:]]' => 'SANY',
378    '[^[:upper:][:^upper:]]' => 'OPFAIL',
379    '(?l)[[:upper:][:^upper:]]' => 'SANY',
380    '(?l)[^[:upper:][:^upper:]]' => 'OPFAIL',
381    '(?u)[[:upper:][:^upper:]]' => 'SANY',
382    '(?u)[^[:upper:][:^upper:]]' => 'OPFAIL',
383    '(?a)[[:upper:][:^upper:]]' => 'SANY',
384    '(?a)[^[:upper:][:^upper:]]' => 'OPFAIL',
385    '[\v]' => 'POSIXU[\v]',
386    '[^\v]' => 'NPOSIXU[\v]',
387    '[\V\x{2C2}]' => 'NPOSIXU[\v]',
388    '(?l)[\v]' => 'POSIXU[\v]',
389    '(?l)[^\v]' => 'NPOSIXU[\v]',
390    '(?l)[\V\x{2C2}]' => 'NPOSIXU[\v]',
391    '(?u)[\v]' => 'POSIXU[\v]',
392    '(?u)[^\v]' => 'NPOSIXU[\v]',
393    '(?a)[\v]' => 'POSIXU[\v]',
394    '(?a)[^\v]' => 'NPOSIXU[\v]',
395    '(?a)[\V\x{2C2}]' => 'NPOSIXU[\v]',
396    '[\v\V]' => 'SANY',
397    '[^\v\V]' => 'OPFAIL',
398    '(?l)[\v\V]' => 'SANY',
399    '(?l)[^\v\V]' => 'OPFAIL',
400    '(?u)[\v\V]' => 'SANY',
401    '(?u)[^\v\V]' => 'OPFAIL',
402    '(?a)[\v\V]' => 'SANY',
403    '(?a)[^\v\V]' => 'OPFAIL',
404    '[[:word:]]' => 'POSIXD[\w]',
405    '[[:^word:]]' => 'NPOSIXD[\w]',
406    '[[:^word:]\x{2C2}]' => 'NPOSIXU[\w]',
407    '(?l)[[:word:]]' => 'POSIXL[\w]',
408    '(?l)[[:^word:]]' => 'NPOSIXL[\w]',
409    '(?l)[[:^word:]\x{2C2}]' => 'NPOSIXL[\w]',
410    '(?u)[[:word:]]' => 'POSIXU[\w]',
411    '(?u)[[:^word:]]' => 'NPOSIXU[\w]',
412    '(?a)[[:word:]]' => 'POSIXA[\w]',
413    '(?a)[[:^word:]]' => 'NPOSIXA[\w]',
414    '(?a)[[:^word:]\x{2C2}]' => 'NPOSIXA[\w]',
415    '[[:word:][:^word:]]' => 'SANY',
416    '[^[:word:][:^word:]]' => 'OPFAIL',
417    '(?l)[[:word:][:^word:]]' => 'SANY',
418    '(?l)[^[:word:][:^word:]]' => 'OPFAIL',
419    '(?u)[[:word:][:^word:]]' => 'SANY',
420    '(?u)[^[:word:][:^word:]]' => 'OPFAIL',
421    '(?a)[[:word:][:^word:]]' => 'SANY',
422    '(?a)[^[:word:][:^word:]]' => 'OPFAIL',
423    '[[:xdigit:]]' => 'POSIXU[:xdigit:]',
424    '[[:^xdigit:]]' => 'NPOSIXU[:xdigit:]',
425    '[[:^xdigit:]\x{2C2}]' => 'NPOSIXU[:xdigit:]',
426    '(?l)[[:xdigit:]]' => 'POSIXL[:xdigit:]',
427    '(?l)[[:^xdigit:]]' => 'NPOSIXL[:xdigit:]',
428    '(?l)[[:^xdigit:]\x{2C2}]' => 'NPOSIXL[:xdigit:]',
429    '(?u)[[:xdigit:]]' => 'POSIXU[:xdigit:]',
430    '(?u)[[:^xdigit:]]' => 'NPOSIXU[:xdigit:]',
431    '(?a)[[:xdigit:]]' => 'POSIXA[:xdigit:]',
432    '(?a)[[:^xdigit:]]' => 'NPOSIXA[:xdigit:]',
433    '(?a)[[:^xdigit:]\x{2C2}]' => 'NPOSIXA[:xdigit:]',
434    '[[:xdigit:][:^xdigit:]]' => 'SANY',
435    '[^[:xdigit:][:^xdigit:]]' => 'OPFAIL',
436    '(?l)[[:xdigit:][:^xdigit:]]' => 'SANY',
437    '(?l)[^[:xdigit:][:^xdigit:]]' => 'OPFAIL',
438    '(?u)[[:xdigit:][:^xdigit:]]' => 'SANY',
439    '(?u)[^[:xdigit:][:^xdigit:]]' => 'OPFAIL',
440    '(?a)[[:xdigit:][:^xdigit:]]' => 'SANY',
441    '(?a)[^[:xdigit:][:^xdigit:]]' => 'OPFAIL',
442    '(?i)[[:lower:]]' => 'POSIXD[:cased:]',
443    '(?i)[[:^lower:]]' => 'NPOSIXD[:cased:]',
444    '(?i)[[:^lower:]\x{2C2}]' => 'NPOSIXU[:cased:]',
445    '(?i)(?l)[[:lower:]]' => 'POSIXL[:cased:]',
446    '(?i)(?l)[[:^lower:]]' => 'NPOSIXL[:cased:]',
447    '(?i)(?l)[[:^lower:]\x{2C2}]' => 'NPOSIXL[:cased:]',
448    '(?i)(?u)[[:lower:]]' => 'POSIXU[:cased:]',
449    '(?i)(?u)[[:^lower:]]' => 'NPOSIXU[:cased:]',
450    '(?i)(?a)[[:lower:]]' => 'POSIXA[:alpha:]',
451    '(?i)(?a)[[:^lower:]]' => 'NPOSIXA[:alpha:]',
452    '(?i)(?a)[[:^lower:]\x{2C2}]' => 'NPOSIXA[:alpha:]',
453    '(?i)[[:upper:]]' => 'POSIXD[:cased:]',
454    '(?i)[[:^upper:]]' => 'NPOSIXD[:cased:]',
455    '(?i)[[:^upper:]\x{2C2}]' => 'NPOSIXU[:cased:]',
456    '(?i)(?l)[[:upper:]]' => 'POSIXL[:cased:]',
457    '(?i)(?l)[[:^upper:]]' => 'NPOSIXL[:cased:]',
458    '(?i)(?l)[[:^upper:]\x{2C2}]' => 'NPOSIXL[:cased:]',
459    '(?i)(?u)[[:upper:]]' => 'POSIXU[:cased:]',
460    '(?i)(?u)[[:^upper:]]' => 'NPOSIXU[:cased:]',
461    '(?i)(?a)[[:upper:]]' => 'POSIXA[:alpha:]',
462    '(?i)(?a)[[:^upper:]]' => 'NPOSIXA[:alpha:]',
463    '(?i)(?a)[[:^upper:]\x{2C2}]' => 'NPOSIXA[:alpha:]',
464    '(?i)[\d\w]' => 'POSIXD[\w]',
465    '(?i)[\D\w]' => 'SANY',
466    #'(?i)(?l)[\d\w]' => varies depending on Unicode release
467    '(?i)(?l)[\D\w]' => 'ANYOFPOSIXL{i}[\\w\\D][0100-INFTY]',
468    '(?i)(?u)[\d\w]' => 'POSIXU[\w]',
469    '(?i)(?u)[\D\w]' => 'SANY',
470    '(?i)(?a)[\d\w]' => 'POSIXA[\w]',
471    '(?i)(?a)[\D\w]' => 'SANY',
472    '(?l:[\x{212A}])' => 'EXACTL <\x{212a}>',
473    '(?l:[\s\x{212A}])' => 'ANYOFPOSIXL[\s][1680 2000-200A 2028-2029 202F 205F 212A 3000]',
474    '(?l:[^\S\x{202F}])' => 'ANYOFPOSIXL[^\\S][1680 2000-200A 2028-2029 205F 3000]',
475    '(?li:[a-z])' => (($::IS_ASCII)
476                     ? 'ANYOFL{i}[a-z{utf8 locale}\x{017F}\x{212A}]'
477                     : 'ANYOFL{i}[a-ij-rs-z{utf8 locale}\x{017F}\x{212A}]'),
478    '\p{All}' => 'SANY',
479    '\P{All}' => 'OPFAIL',
480    '[\p{Any}]' => 'ANYOF[\x00-\xFF][0100-10FFFF]',
481
482    '[\p{IsMyRuntimeProperty}]' => 'ANYOF[+main::IsMyRuntimeProperty]',
483    '[^\p{IsMyRuntimeProperty}]' => 'ANYOF[^{+main::IsMyRuntimeProperty}]',
484    '[a\p{IsMyRuntimeProperty}]' => 'ANYOF[a][+main::IsMyRuntimeProperty]',
485    '[^a\p{IsMyRuntimeProperty}]' => 'ANYOF[^a{+main::IsMyRuntimeProperty}]',
486    '[^a\x{100}\p{IsMyRuntimeProperty}]' => 'ANYOF[^a{+main::IsMyRuntimeProperty}0100]',
487    '[^\p{All}\p{IsMyRuntimeProperty}]' => 'OPFAIL',
488    '[\p{All}\p{IsMyRuntimeProperty}]' => 'SANY',
489
490    '[\x{00}-{HIGHEST_CP}]' => 'ANYOF[\x00-\xFF][0100-HIGHEST_CP]',
491    '[\x{00}-{INFTY}]' => 'SANY',
492    '[\x{101}-{INFTY}]' => 'ANYOFH[0101-INFTY]',
493    '[\x{101}-{HIGHEST_CP}]' => 'ANYOFH[0101-HIGHEST_CP]',
494    '[\x{102}\x{104}]' => 'ANYOFHbbm[0102 0104]',
495    '[\x{102}-\x{104}{HIGHEST_CP}]' => 'ANYOFH[0102-0104 HIGHEST_CP]',
496    '[\x{102}-\x{104}\x{101}]' => 'ANYOFRb[0101-0104]',
497    '[\x{102}-\x{104}\x{101}-{INFTY}]' => 'ANYOFH[0101-INFTY]',
498    '[\x{102}-\x{104}\x{101}-{HIGHEST_CP}]' => 'ANYOFH[0101-HIGHEST_CP]',
499    '[\x{102}-\x{104}\x{102}]' => 'ANYOFRb[0102-0104]',
500    '[\x{102}-\x{104}\x{102}-{INFTY}]' => 'ANYOFH[0102-INFTY]',
501    '[\x{102}-\x{104}\x{102}-{HIGHEST_CP}]' => 'ANYOFH[0102-HIGHEST_CP]',
502    '[\x{102}-\x{104}\x{103}]' => 'ANYOFRb[0102-0104]',
503    '[\x{102}-\x{104}\x{103}-{INFTY}]' => 'ANYOFH[0102-INFTY]',
504    '[\x{102}-\x{104}\x{103}-{HIGHEST_CP}]' => 'ANYOFH[0102-HIGHEST_CP]',
505    '[\x{102}-\x{104}\x{104}]' => 'ANYOFRb[0102-0104]',
506    '[\x{102}-\x{104}\x{104}-{INFTY}]' => 'ANYOFH[0102-INFTY]',
507    '[\x{102}-\x{104}\x{104}-{HIGHEST_CP}]' => 'ANYOFH[0102-HIGHEST_CP]',
508    '[\x{102}-\x{104}\x{105}]' => 'ANYOFRb[0102-0105]',
509    '[\x{102}-\x{104}\x{105}-{INFTY}]' => 'ANYOFH[0102-INFTY]',
510    '[\x{102}-\x{104}\x{105}-{HIGHEST_CP}]' => 'ANYOFH[0102-HIGHEST_CP]',
511    '[\x{102}-\x{104}\x{106}]' => 'ANYOFHbbm[0102-0104 0106]',
512    '[\x{102}-\x{104}\x{106}-{INFTY}]' => 'ANYOFH[0102-0104 0106-INFTY]',
513    '[\x{102}-\x{104}\x{106}-{HIGHEST_CP}]' => 'ANYOFH[0102-0104 0106-HIGHEST_CP]',
514    '[\x{102}-\x{104}\x{108}-\x{10A}{HIGHEST_CP}]' => 'ANYOFH[0102-0104 0108-010A HIGHEST_CP]',
515    '[\x{102}-\x{104}\x{108}-\x{10A}\x{101}]' => 'ANYOFHbbm[0101-0104 0108-010A]',
516    '[\x{102}-\x{104}\x{108}-\x{10A}\x{101}-{INFTY}]' => 'ANYOFH[0101-INFTY]',
517    '[\x{102}-\x{104}\x{108}-\x{10A}\x{101}-{HIGHEST_CP}]' => 'ANYOFH[0101-HIGHEST_CP]',
518    '[\x{102}-\x{104}\x{108}-\x{10A}\x{101}-\x{102}]' => 'ANYOFHbbm[0101-0104 0108-010A]',
519    '[\x{102}-\x{104}\x{108}-\x{10A}\x{101}-\x{103}]' => 'ANYOFHbbm[0101-0104 0108-010A]',
520    '[\x{102}-\x{104}\x{108}-\x{10A}\x{101}-\x{104}]' => 'ANYOFHbbm[0101-0104 0108-010A]',
521    '[\x{102}-\x{104}\x{108}-\x{10A}\x{101}-\x{105}]' => 'ANYOFHbbm[0101-0105 0108-010A]',
522    '[\x{102}-\x{104}\x{108}-\x{10A}\x{101}-\x{106}]' => 'ANYOFHbbm[0101-0106 0108-010A]',
523    '[\x{102}-\x{104}\x{108}-\x{10A}\x{101}-\x{107}]' => 'ANYOFRb[0101-010A]',
524    '[\x{102}-\x{104}\x{108}-\x{10A}\x{101}-\x{108}]' => 'ANYOFRb[0101-010A]',
525    '[\x{102}-\x{104}\x{108}-\x{10A}\x{101}-\x{109}]' => 'ANYOFRb[0101-010A]',
526    '[\x{102}-\x{104}\x{108}-\x{10A}\x{101}-\x{10A}]' => 'ANYOFRb[0101-010A]',
527    '[\x{102}-\x{104}\x{108}-\x{10A}\x{101}-\x{10B}]' => 'ANYOFRb[0101-010B]',
528    '[\x{102}-\x{104}\x{108}-\x{10A}\x{102}]' => 'ANYOFHbbm[0102-0104 0108-010A]',
529    '[\x{102}-\x{104}\x{108}-\x{10A}\x{102}-{INFTY}]' => 'ANYOFH[0102-INFTY]',
530    '[\x{102}-\x{104}\x{108}-\x{10A}\x{102}-{HIGHEST_CP}]' => 'ANYOFH[0102-HIGHEST_CP]',
531    '[\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{102}]' => 'ANYOFHbbm[0102-0104 0108-010A]',
532    '[\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{103}]' => 'ANYOFHbbm[0102-0104 0108-010A]',
533    '[\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{104}]' => 'ANYOFHbbm[0102-0104 0108-010A]',
534    '[\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{105}]' => 'ANYOFHbbm[0102-0105 0108-010A]',
535    '[\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{106}]' => 'ANYOFHbbm[0102-0106 0108-010A]',
536    '[\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{107}]' => 'ANYOFRb[0102-010A]',
537    '[\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{108}]' => 'ANYOFRb[0102-010A]',
538    '[\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{109}]' => 'ANYOFRb[0102-010A]',
539    '[\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{10A}]' => 'ANYOFRb[0102-010A]',
540    '[\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{10B}]' => 'ANYOFRb[0102-010B]',
541    '[\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{10C}]' => 'ANYOFRb[0102-010C]',
542    '[\x{102}-\x{104}\x{108}-\x{10A}\x{103}]' => 'ANYOFHbbm[0102-0104 0108-010A]',
543    '[\x{102}-\x{104}\x{108}-\x{10A}\x{103}-{INFTY}]' => 'ANYOFH[0102-INFTY]',
544    '[\x{102}-\x{104}\x{108}-\x{10A}\x{103}-{HIGHEST_CP}]' => 'ANYOFH[0102-HIGHEST_CP]',
545    '[\x{102}-\x{104}\x{108}-\x{10A}\x{103}-\x{104}]' => 'ANYOFHbbm[0102-0104 0108-010A]',
546    '[\x{102}-\x{104}\x{108}-\x{10A}\x{103}-\x{105}]' => 'ANYOFHbbm[0102-0105 0108-010A]',
547    '[\x{102}-\x{104}\x{108}-\x{10A}\x{103}-\x{106}]' => 'ANYOFHbbm[0102-0106 0108-010A]',
548    '[\x{102}-\x{104}\x{108}-\x{10A}\x{103}-\x{107}]' => 'ANYOFRb[0102-010A]',
549    '[\x{102}-\x{104}\x{108}-\x{10A}\x{103}-\x{108}]' => 'ANYOFRb[0102-010A]',
550    '[\x{102}-\x{104}\x{108}-\x{10A}\x{103}-\x{109}]' => 'ANYOFRb[0102-010A]',
551    '[\x{102}-\x{104}\x{108}-\x{10A}\x{103}-\x{10A}]' => 'ANYOFRb[0102-010A]',
552    '[\x{102}-\x{104}\x{108}-\x{10A}\x{103}-\x{10B}]' => 'ANYOFRb[0102-010B]',
553    '[\x{102}-\x{104}\x{108}-\x{10A}\x{103}-\x{10C}]' => 'ANYOFRb[0102-010C]',
554    '[\x{102}-\x{104}\x{108}-\x{10A}\x{104}]' => 'ANYOFHbbm[0102-0104 0108-010A]',
555    '[\x{102}-\x{104}\x{108}-\x{10A}\x{104}-{INFTY}]' => 'ANYOFH[0102-INFTY]',
556    '[\x{102}-\x{104}\x{108}-\x{10A}\x{104}-{HIGHEST_CP}]' => 'ANYOFH[0102-HIGHEST_CP]',
557    '[\x{102}-\x{104}\x{108}-\x{10A}\x{104}-\x{105}]' => 'ANYOFHbbm[0102-0105 0108-010A]',
558    '[\x{102}-\x{104}\x{108}-\x{10A}\x{104}-\x{106}]' => 'ANYOFHbbm[0102-0106 0108-010A]',
559    '[\x{102}-\x{104}\x{108}-\x{10A}\x{104}-\x{107}]' => 'ANYOFRb[0102-010A]',
560    '[\x{102}-\x{104}\x{108}-\x{10A}\x{104}-\x{108}]' => 'ANYOFRb[0102-010A]',
561    '[\x{102}-\x{104}\x{108}-\x{10A}\x{104}-\x{109}]' => 'ANYOFRb[0102-010A]',
562    '[\x{102}-\x{104}\x{108}-\x{10A}\x{104}-\x{10A}]' => 'ANYOFRb[0102-010A]',
563    '[\x{102}-\x{104}\x{108}-\x{10A}\x{104}-\x{10B}]' => 'ANYOFRb[0102-010B]',
564    '[\x{102}-\x{104}\x{108}-\x{10A}\x{104}-\x{10C}]' => 'ANYOFRb[0102-010C]',
565    '[\x{102}-\x{104}\x{108}-\x{10A}\x{105}]' => 'ANYOFHbbm[0102-0105 0108-010A]',
566    '[\x{102}-\x{104}\x{108}-\x{10A}\x{105}-{INFTY}]' => 'ANYOFH[0102-INFTY]',
567    '[\x{102}-\x{104}\x{108}-\x{10A}\x{105}-{HIGHEST_CP}]' => 'ANYOFH[0102-HIGHEST_CP]',
568    '[\x{102}-\x{104}\x{108}-\x{10A}\x{105}-\x{106}]' => 'ANYOFHbbm[0102-0106 0108-010A]',
569    '[\x{102}-\x{104}\x{108}-\x{10A}\x{105}-\x{107}]' => 'ANYOFRb[0102-010A]',
570    '[\x{102}-\x{104}\x{108}-\x{10A}\x{105}-\x{108}]' => 'ANYOFRb[0102-010A]',
571    '[\x{102}-\x{104}\x{108}-\x{10A}\x{105}-\x{109}]' => 'ANYOFRb[0102-010A]',
572    '[\x{102}-\x{104}\x{108}-\x{10A}\x{105}-\x{10A}]' => 'ANYOFRb[0102-010A]',
573    '[\x{102}-\x{104}\x{108}-\x{10A}\x{105}-\x{10B}]' => 'ANYOFRb[0102-010B]',
574    '[\x{102}-\x{104}\x{108}-\x{10A}\x{105}-\x{10C}]' => 'ANYOFRb[0102-010C]',
575    '[\x{102}-\x{104}\x{108}-\x{10A}\x{106}]' => 'ANYOFHbbm[0102-0104 0106 0108-010A]',
576    '[\x{102}-\x{104}\x{108}-\x{10A}\x{106}-{INFTY}]' => 'ANYOFH[0102-0104 0106-INFTY]',
577    '[\x{102}-\x{104}\x{108}-\x{10A}\x{106}-{HIGHEST_CP}]' => 'ANYOFH[0102-0104 0106-HIGHEST_CP]',
578    '[\x{102}-\x{104}\x{108}-\x{10A}\x{106}-\x{107}]' => 'ANYOFHbbm[0102-0104 0106-010A]',
579    '[\x{102}-\x{104}\x{108}-\x{10A}\x{106}-\x{108}]' => 'ANYOFHbbm[0102-0104 0106-010A]',
580    '[\x{102}-\x{104}\x{108}-\x{10A}\x{106}-\x{109}]' => 'ANYOFHbbm[0102-0104 0106-010A]',
581    '[\x{102}-\x{104}\x{108}-\x{10A}\x{106}-\x{10A}]' => 'ANYOFHbbm[0102-0104 0106-010A]',
582    '[\x{102}-\x{104}\x{108}-\x{10A}\x{106}-\x{10B}]' => 'ANYOFHbbm[0102-0104 0106-010B]',
583    '[\x{102}-\x{104}\x{108}-\x{10A}\x{106}-\x{10C}]' => 'ANYOFHbbm[0102-0104 0106-010C]',
584    '[\x{102}-\x{104}\x{108}-\x{10A}\x{107}]' => 'ANYOFHbbm[0102-0104 0107-010A]',
585    '[\x{102}-\x{104}\x{108}-\x{10A}\x{108}]' => 'ANYOFHbbm[0102-0104 0108-010A]',
586    '[\x{102}-\x{104}\x{108}-\x{10A}\x{109}]' => 'ANYOFHbbm[0102-0104 0108-010A]',
587    '[\x{102}-\x{104}\x{108}-\x{10A}\x{10A}]' => 'ANYOFHbbm[0102-0104 0108-010A]',
588    '[\x{102}-\x{104}\x{108}-\x{10A}\x{10B}]' => 'ANYOFHbbm[0102-0104 0108-010B]',
589    '[\x{103}\x{102}]' => 'EXACTFU_REQ8 <\x{103}>',
590    '[\x{104}\x{102}]' => 'ANYOFHbbm[0102 0104]',
591    '[\x{104}\x{102}\x{103}]' => 'ANYOFRb[0102-0104]',
592    '[\x{106}-{INFTY}\x{104}]' => 'ANYOFH[0104 0106-INFTY]',
593    '[\x{106}-{INFTY}\x{104}-{INFTY}]' => 'ANYOFH[0104-INFTY]',
594    '[\x{106}-{INFTY}\x{104}-{HIGHEST_CP}]' => 'ANYOFH[0104-INFTY]',
595    '[\x{106}-{INFTY}\x{104}-\x{105}]' => 'ANYOFH[0104-INFTY]',
596    '[\x{106}-{INFTY}\x{104}-\x{106}]' => 'ANYOFH[0104-INFTY]',
597    '[\x{106}-{INFTY}\x{104}-\x{107}]' => 'ANYOFH[0104-INFTY]',
598    '[\x{106}-{INFTY}\x{105}]' => 'ANYOFH[0105-INFTY]',
599    '[\x{106}-{INFTY}\x{105}-{INFTY}]' => 'ANYOFH[0105-INFTY]',
600    '[\x{106}-{INFTY}\x{105}-{HIGHEST_CP}]' => 'ANYOFH[0105-INFTY]',
601    '[\x{106}-{INFTY}\x{105}-\x{106}]' => 'ANYOFH[0105-INFTY]',
602    '[\x{106}-{INFTY}\x{105}-\x{107}]' => 'ANYOFH[0105-INFTY]',
603    '[\x{106}-{INFTY}\x{106}]' => 'ANYOFH[0106-INFTY]',
604    '[\x{106}-{INFTY}\x{106}-{INFTY}]' => 'ANYOFH[0106-INFTY]',
605    '[\x{106}-{INFTY}\x{106}-{HIGHEST_CP}]' => 'ANYOFH[0106-INFTY]',
606    '[\x{106}-{INFTY}\x{106}-\x{107}]' => 'ANYOFH[0106-INFTY]',
607    '[\x{106}-{INFTY}\x{107}]' => 'ANYOFH[0106-INFTY]',
608    '[\x{106}-{INFTY}\x{107}-{INFTY}]' => 'ANYOFH[0106-INFTY]',
609    '[\x{106}-{INFTY}\x{107}-{HIGHEST_CP}]' => 'ANYOFH[0106-INFTY]',
610    '[\x{106}-{INFTY}\x{107}-\x{107}]' => 'ANYOFH[0106-INFTY]',
611    '[\x{10C}-{INFTY}{HIGHEST_CP}]' => 'ANYOFH[010C-INFTY]',
612    '[\x{10C}-{INFTY}\x{00}-{HIGHEST_CP}]' => 'SANY',
613    '[\x{10C}-{INFTY}\x{00}-{INFTY}]' => 'SANY',
614    '[\x{10C}-{INFTY}\x{101}-{INFTY}]' => 'ANYOFH[0101-INFTY]',
615    '[\x{10C}-{INFTY}\x{101}-{HIGHEST_CP}]' => 'ANYOFH[0101-INFTY]',
616    '[\x{10C}-{INFTY}\x{102}\x{104}]' => 'ANYOFH[0102 0104 010C-INFTY]',
617    '[\x{10C}-{INFTY}\x{102}-\x{104}{HIGHEST_CP}]' => 'ANYOFH[0102-0104 010C-INFTY]',
618    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{100}]' => 'ANYOFH[0100 0102-0104 010C-INFTY]',
619    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{101}]' => 'ANYOFH[0101-0104 010C-INFTY]',
620    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{101}-{INFTY}]' => 'ANYOFH[0101-INFTY]',
621    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{101}-{HIGHEST_CP}]' => 'ANYOFH[0101-INFTY]',
622    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{102}]' => 'ANYOFH[0102-0104 010C-INFTY]',
623    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{102}-{INFTY}]' => 'ANYOFH[0102-INFTY]',
624    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{102}-{HIGHEST_CP}]' => 'ANYOFH[0102-INFTY]',
625    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{103}]' => 'ANYOFH[0102-0104 010C-INFTY]',
626    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{103}-{INFTY}]' => 'ANYOFH[0102-INFTY]',
627    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{103}-{HIGHEST_CP}]' => 'ANYOFH[0102-INFTY]',
628    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{104}]' => 'ANYOFH[0102-0104 010C-INFTY]',
629    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{104}-{INFTY}]' => 'ANYOFH[0102-INFTY]',
630    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{104}-{HIGHEST_CP}]' => 'ANYOFH[0102-INFTY]',
631    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{105}]' => 'ANYOFH[0102-0105 010C-INFTY]',
632    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{105}-{INFTY}]' => 'ANYOFH[0102-INFTY]',
633    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{105}-{HIGHEST_CP}]' => 'ANYOFH[0102-INFTY]',
634    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{106}]' => 'ANYOFH[0102-0104 0106 010C-INFTY]',
635    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{106}-{INFTY}]' => 'ANYOFH[0102-0104 0106-INFTY]',
636    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{106}-{HIGHEST_CP}]' => 'ANYOFH[0102-0104 0106-INFTY]',
637    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}{HIGHEST_CP}]' => 'ANYOFH[0102-0104 0108-010A 010C-INFTY]',
638    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{101}]' => 'ANYOFH[0101-0104 0108-010A 010C-INFTY]',
639    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{101}-{INFTY}]' => 'ANYOFH[0101-INFTY]',
640    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{101}-{HIGHEST_CP}]' => 'ANYOFH[0101-INFTY]',
641    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{101}-\x{102}]' => 'ANYOFH[0101-0104 0108-010A 010C-INFTY]',
642    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{101}-\x{103}]' => 'ANYOFH[0101-0104 0108-010A 010C-INFTY]',
643    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{101}-\x{104}]' => 'ANYOFH[0101-0104 0108-010A 010C-INFTY]',
644    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{101}-\x{105}]' => 'ANYOFH[0101-0105 0108-010A 010C-INFTY]',
645    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{101}-\x{106}]' => 'ANYOFH[0101-0106 0108-010A 010C-INFTY]',
646    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{101}-\x{107}]' => 'ANYOFH[0101-010A 010C-INFTY]',
647    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{101}-\x{108}]' => 'ANYOFH[0101-010A 010C-INFTY]',
648    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{101}-\x{109}]' => 'ANYOFH[0101-010A 010C-INFTY]',
649    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{101}-\x{10A}]' => 'ANYOFH[0101-010A 010C-INFTY]',
650    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{101}-\x{10B}]' => 'ANYOFH[0101-INFTY]',
651    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{102}]' => 'ANYOFH[0102-0104 0108-010A 010C-INFTY]',
652    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{102}-{INFTY}]' => 'ANYOFH[0102-INFTY]',
653    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{102}-{HIGHEST_CP}]' => 'ANYOFH[0102-INFTY]',
654    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{102}]' => 'ANYOFH[0102-0104 0108-010A 010C-INFTY]',
655    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{103}]' => 'ANYOFH[0102-0104 0108-010A 010C-INFTY]',
656    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{104}]' => 'ANYOFH[0102-0104 0108-010A 010C-INFTY]',
657    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{105}]' => 'ANYOFH[0102-0105 0108-010A 010C-INFTY]',
658    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{106}]' => 'ANYOFH[0102-0106 0108-010A 010C-INFTY]',
659    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{107}]' => 'ANYOFH[0102-010A 010C-INFTY]',
660    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{108}]' => 'ANYOFH[0102-010A 010C-INFTY]',
661    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{109}]' => 'ANYOFH[0102-010A 010C-INFTY]',
662    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{10A}]' => 'ANYOFH[0102-010A 010C-INFTY]',
663    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{10B}]' => 'ANYOFH[0102-INFTY]',
664    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{10C}]' => 'ANYOFH[0102-INFTY]',
665    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{103}]' => 'ANYOFH[0102-0104 0108-010A 010C-INFTY]',
666    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{103}-{INFTY}]' => 'ANYOFH[0102-INFTY]',
667    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{103}-{HIGHEST_CP}]' => 'ANYOFH[0102-INFTY]',
668    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{103}-\x{104}]' => 'ANYOFH[0102-0104 0108-010A 010C-INFTY]',
669    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{103}-\x{105}]' => 'ANYOFH[0102-0105 0108-010A 010C-INFTY]',
670    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{103}-\x{106}]' => 'ANYOFH[0102-0106 0108-010A 010C-INFTY]',
671    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{103}-\x{107}]' => 'ANYOFH[0102-010A 010C-INFTY]',
672    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{103}-\x{108}]' => 'ANYOFH[0102-010A 010C-INFTY]',
673    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{103}-\x{109}]' => 'ANYOFH[0102-010A 010C-INFTY]',
674    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{103}-\x{10A}]' => 'ANYOFH[0102-010A 010C-INFTY]',
675    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{103}-\x{10B}]' => 'ANYOFH[0102-INFTY]',
676    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{103}-\x{10C}]' => 'ANYOFH[0102-INFTY]',
677    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{104}]' => 'ANYOFH[0102-0104 0108-010A 010C-INFTY]',
678    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{104}-{INFTY}]' => 'ANYOFH[0102-INFTY]',
679    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{104}-{HIGHEST_CP}]' => 'ANYOFH[0102-INFTY]',
680    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{104}-\x{105}]' => 'ANYOFH[0102-0105 0108-010A 010C-INFTY]',
681    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{104}-\x{106}]' => 'ANYOFH[0102-0106 0108-010A 010C-INFTY]',
682    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{104}-\x{107}]' => 'ANYOFH[0102-010A 010C-INFTY]',
683    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{104}-\x{108}]' => 'ANYOFH[0102-010A 010C-INFTY]',
684    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{104}-\x{109}]' => 'ANYOFH[0102-010A 010C-INFTY]',
685    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{104}-\x{10A}]' => 'ANYOFH[0102-010A 010C-INFTY]',
686    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{104}-\x{10B}]' => 'ANYOFH[0102-INFTY]',
687    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{104}-\x{10C}]' => 'ANYOFH[0102-INFTY]',
688    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{105}]' => 'ANYOFH[0102-0105 0108-010A 010C-INFTY]',
689    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{105}-{INFTY}]' => 'ANYOFH[0102-INFTY]',
690    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{105}-{HIGHEST_CP}]' => 'ANYOFH[0102-INFTY]',
691    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{105}-\x{106}]' => 'ANYOFH[0102-0106 0108-010A 010C-INFTY]',
692    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{105}-\x{107}]' => 'ANYOFH[0102-010A 010C-INFTY]',
693    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{105}-\x{108}]' => 'ANYOFH[0102-010A 010C-INFTY]',
694    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{105}-\x{109}]' => 'ANYOFH[0102-010A 010C-INFTY]',
695    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{105}-\x{10A}]' => 'ANYOFH[0102-010A 010C-INFTY]',
696    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{105}-\x{10B}]' => 'ANYOFH[0102-INFTY]',
697    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{105}-\x{10C}]' => 'ANYOFH[0102-INFTY]',
698    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{106}]' => 'ANYOFH[0102-0104 0106 0108-010A 010C-INFTY]',
699    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{106}-{INFTY}]' => 'ANYOFH[0102-0104 0106-INFTY]',
700    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{106}-{HIGHEST_CP}]' => 'ANYOFH[0102-0104 0106-INFTY]',
701    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{106}-\x{107}]' => 'ANYOFH[0102-0104 0106-010A 010C-INFTY]',
702    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{106}-\x{108}]' => 'ANYOFH[0102-0104 0106-010A 010C-INFTY]',
703    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{106}-\x{109}]' => 'ANYOFH[0102-0104 0106-010A 010C-INFTY]',
704    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{106}-\x{10A}]' => 'ANYOFH[0102-0104 0106-010A 010C-INFTY]',
705    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{106}-\x{10B}]' => 'ANYOFH[0102-0104 0106-INFTY]',
706    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{106}-\x{10C}]' => 'ANYOFH[0102-0104 0106-INFTY]',
707    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{107}]' => 'ANYOFH[0102-0104 0107-010A 010C-INFTY]',
708    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{108}]' => 'ANYOFH[0102-0104 0108-010A 010C-INFTY]',
709    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{109}]' => 'ANYOFH[0102-0104 0108-010A 010C-INFTY]',
710    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{10A}]' => 'ANYOFH[0102-0104 0108-010A 010C-INFTY]',
711    '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{10B}]' => 'ANYOFH[0102-0104 0108-INFTY]',
712    '[\x{10C}-{INFTY}\x{103}\x{102}]' => 'ANYOFH[0102-0103 010C-INFTY]',
713    '[\x{10C}-{INFTY}\x{104}\x{102}]' => 'ANYOFH[0102 0104 010C-INFTY]',
714    '[\x{10C}-{INFTY}\x{104}\x{102}\x{103}]' => 'ANYOFH[0102-0104 010C-INFTY]',
715    '[{HIGHEST_CP}]' => 'EXACT_REQ8 <\x{HIGHEST_CP}>',
716
717    '(?8)(?i)[\x{410}]' => 'EXACTFU_REQ8 <\x{430}>',
718    '(?8)(?i)[\x{399}]' => 'EXACTFU_REQ8 <\x{3b9}>',
719    '(?8)(?i)[\x{345}\x{399}\x{3B9}\x{1FBE}]' => 'EXACTFU_REQ8 <\x{3b9}>',
720    '(?i)[\x{2b9}]' => 'EXACT_REQ8 <\x{2b9}>',           # Doesn't participate in a fold
721    '(?8)(?i)[\x{2b9}]' => 'EXACT_REQ8 <\x{2b9}>',
722    '(?i)[\x{2bc}]' => 'EXACTFU_REQ8 <\x{2bc}>', # Part of a multi-char fold, ASCII component
723    '(?i)[\x{390}]' => 'EXACTFU_REQ8 <\x{3b9}\x{308}\x{301}>', # Part of a multi-char fold, no ASCII component
724
725    '(?i)[\x{1E9E}]' => 'EXACTFU <ss>',
726    '(?iaa)[\x{1E9E}]' => 'EXACTFAA <\x{17f}\x{17f}>',
727    '(?i)[\x{FB00}]' => 'EXACTFU <ff>',
728    '(?iaa)[\x{FB00}]' => 'EXACT_REQ8 <\x{fb00}>',
729    '(?i)[\x{FB00}]' => 'EXACTFU <ff>',
730    '(?i)[\x{FB01}]' => 'EXACTFU <fi>',
731    '(?i)[\x{FB02}]' => 'EXACTFU <fl>',
732    '(?i)[\x{FB03}]' => 'EXACTFU <ffi>',
733    '(?i)[\x{FB04}]' => 'EXACTFU <ffl>',
734    '(?i)[\x{FB05}]' => 'EXACTFU <st>',
735    '(?i)[\x{FB06}]' => 'EXACTFU <st>',
736
737    '[a][b]' => 'EXACT <ab>',
738    '[a]\x{100}' => 'EXACT_REQ8 <a\x{100}>',
739    '(?8)[\x{100}]a' => 'EXACT_REQ8 <\x{100}a>',
740    '(?i)[b][c]' => 'EXACTFU <bc>',
741    '(?i)[b]\x{100}' => 'EXACTFU_REQ8 <b\x{101}>',
742    '(?8)(?i)[\x{100}]b' => 'EXACTFU_REQ8 <\x{101}b>',
743    '(?i)b[s]' => 'EXACTFU <bs>',
744    '(?i)b[s]c' => 'EXACTFU <bsc>',
745    '(?i)bs[s]c' => 'EXACTF <bss>',  # The c goes into a 2nd node
746    '(?iu)bs[s]c' => 'EXACTFUP <bssc>',
747    '(?i)b[s]sc' => 'EXACTF <bssc>',
748    '(?iu)b[s]sc' => 'EXACTFUP <bssc>',
749    '(?i)[b]st' => 'EXACTFU <bst>',
750    '(?i)[b]st[s]' => 'EXACTFU <bsts>',
751    '(?i)[b]st[s]st' => 'EXACTF <bstsst>',
752    '(?iu)[b]st[s]st' => 'EXACTFUP <bstsst>',
753    '(?i)[s][s]' => 'EXACTF <ss>',
754    '(?iu)[s][s]' => 'EXACTFUP <ss>',
755);
756
# Characters that each get compiled on their own, both as a bare escape and
# inside a one-element bracketed class, under every fold/charset/upgrade
# combination generated further down.  The tests are generated in this order.
my @single_chars_to_test = (

    # --- ASCII range: controls and punctuation-like characters ---
    "\x00",     # NUL; always a potential trouble spot
    "\x01",     # A control without a name
    "\b",       # A control that has a name
    "\n",       # Potentially special
    "\r",       # Potentially special
    "\cK",      # Potentially special
    "0",        # A digit
    ":",        # Takes part in no fold

    # --- ASCII range: letters ---
    "A",        # Capital that participates in a multi-char fold
    "a",        # Small letter that participates in a multi-char fold
    "B",        # Capital whose only fold is its case pair
    "b",        # Small letter whose only fold is its case pair
    "K",        # Capital that something above Latin1 folds to
    "k",        # Small letter that something above Latin1 folds to
    "\c?",      # Potentially special

    # --- Upper Latin1 range ---
    "\x80",     # A Latin1 control
    "\xB5",     # Micro sign; its fold is above Latin1
    "\xC0",     # Capital whose only fold is its case pair
    "\xE0",     # Small letter whose only fold is its case pair
    "\xC5",     # Capital that something above Latin1 folds to
    "\xE5",     # Small letter that something above Latin1 folds to
    "\xDF",     # Small sharp S; folds to 'ss'
    "\xF7",     # Takes part in no fold
    "\xFF",     # Something above Latin1 folds to this

    # --- The first few characters above Latin1, then U+2029 ---
    "\x{100}",
    "\x{101}",
    "\x{102}",
    "\x{103}",
    "\x{104}",
    "\x{105}",
    "\x{106}",
    "\x{107}",
    "\x{108}",
    "\x{2029}",
);
794
# Returns the node display this test expects for a single above-Latin1
# character compiled inside a bracketed class without the (?8) upgrade.
#
#   $char     the character itself; callers pass only code points above 0xFF
#   $fold     "i" for case-insensitive compilation, "" otherwise
#   $charset  the charset modifier in effect: "", "u", "l" or "aa"
#
# The result has the form 'NODE <\x{hex}>'.
sub _expected_above_latin1_display {
    use feature 'fc';

    my ($char, $fold, $charset) = @_;
    my $cp = ord $char;

    # A folding node is expected only under /i, and only when at least one of
    # the fold/lower/upper mappings starts with a different code point.
    my $has_other_case
            = $fold && grep { ord($_) != $cp } fc($char), lc($char), uc($char);

    if (! $has_other_case) {
        my $node = ($charset eq 'l') ? 'EXACTL' : 'EXACT_REQ8';
        return sprintf "$node <\\x{%x}>", $cp;
    }

    my $node = ($charset eq 'aa') ? 'EXACTFAA'
             : ($charset eq 'l')  ? 'EXACTFLU8'
             :                      'EXACTFU_REQ8';

    # Folding nodes are displayed with the folded code point.  Lower-case hex
    # matches the exact-compared expectations in the hand-written table (e.g.
    # '\x{3b9}'); none of the current characters produce a hex letter.
    return sprintf "$node <\\x{%x}>", ord fc $char;
}

# Pairs of (pattern, expected display) generated from @single_chars_to_test.
# Each character is tried with and without /i, under each charset modifier,
# and with and without the (?8) UTF-8 upgrade marker.
my @single_tests;
for my $char (@single_chars_to_test) {
    my $cp  = ord $char;
    my $hex = sprintf "%02x", $cp;

    for my $fold ("", "i") {
        for my $charset ("", "u", "l", "aa") {
            my $modifiers = $fold . $charset;
            $modifiers = "(?$modifiers)" if $modifiers;

            for my $upgrade ("", "(?8)") {

                # The pattern under test: the character alone in a class.
                push @single_tests, "$upgrade$modifiers\[\\x{$hex}\]";

                if ($cp < 256 || $upgrade) {

                    # The class is expected to display exactly as the same
                    # character does when written outside of a class.
                    push @single_tests,
                         get_compiled("$upgrade$modifiers\\x{$hex}");
                }
                else {
                    push @single_tests,
                         _expected_above_latin1_display($char, $fold,
                                                        $charset);
                }
            }
        }
    }
}
867
# The generated single-character checks are run first.  Being at the front
# of @tests also puts them in the region that is skipped on EBCDIC.
unshift @tests, @single_tests;

# @tests holds (pattern, expected) pairs plus the one marker entry.
plan(scalar (@tests - 1) / 2);  # -1 because of the marker.

# Walk the table pairwise.  Everything before the marker entry is skipped on
# EBCDIC platforms; everything after it is run everywhere.
my $skip_ebcdic = $::IS_EBCDIC;
while (defined (my $test = shift @tests)) {

    if ($test eq 'ebcdic_ok_below_this_marker') {
        $skip_ebcdic = 0;
        next;
    }

    my $expected = shift @tests;

    SKIP: {
        skip("test not ported to EBCDIC", 1) if $skip_ebcdic;

        # The comparisons below use the platform-independent $expected; the
        # test name shows the actual highest code point instead of the
        # HIGHEST_CP placeholder.
        my $display_expected = $expected
                                        =~ s/ HIGHEST_CP /$highest_cp_string/xgr;
        my $test_name = "Verify compilation of $test displays as"
                      . " $display_expected";

        my $result = get_compiled($test);
        if ($expected =~ / ^ ANYOF[HR] /x) {

            # These displays may be followed by a "(First UTF-8 byte=\xXX"
            # annotation, so only the leading part is matched.
            like($result, qr/ ^ \Q$expected\E (?:\Q (First UTF-8 byte=\x\E
                              [[:xdigit:]]{2} )? /x, $test_name);
        }
        else {
            is($result, $expected, $test_name);
        }
    }
}
900