7 # This tests that the ANYOF nodes generated by bracketed character classes are
8 # as expected. The representation of these is not guaranteed, and this test
9 # may need to be updated if it changes. But it is here to make sure that no
10 # unexpected changes occur. These could come from faulty generation of the
11 # node, or faulty display of them (or both). Because these causes come from
12 # very different parts of the regex compiler, it is unlikely that a commit
13 # would change both of them, so this test will adequately serve to test both.
# Test-environment setup.
# NOTE(review): set_up_inc() and skip_all() are not defined in the visible part
# of this file -- presumably supplied by the core test harness; confirm.
# set_up_inc() is handed the directories this test wants searched for modules.
18 set_up_inc('../lib','.','../ext/re');
# Load Config and invoke its import method.
19 require Config; import Config;
# Skip the whole file, giving 'no re module' as the reason, when
# DynaLoader::boot_DynaLoader is not defined.
20 skip_all('no re module') unless defined &DynaLoader::boot_DynaLoader;
23 # An array is used instead of a hash, so that the tests are carried out in the
24 # order given by this file. Even-numbered indices are the regexes to compile.
25 # The next higher element is the expected compilation result.
27 # It is painful to port some of these to EBCDIC, as not only do the code point
28 # numbers change (for those < 256), but the order changes, as the compiled
29 # version is sorted by native code point order. On EBCDIC, \r comes before
30 # \n, and 'k' before 'K', for example. So, the tests where there are
31 # differences are skipped on EBCDIC. They are all at the beginning of the
32 # array, and a special marker entry is used to delimit the boundary between
33 # skipped and not skipped.
35 # NOTE: If the pattern contains (?8) it will be upgraded to UTF-8 after
# Platform-dependent values that get_compiled() substitutes for the
# {HIGHEST_CP} and {INFTY} placeholders appearing in the test patterns.
39 my $highest_cp = $Unicode::UCD::MAX_CP;
# Upper-case hexadecimal digits only: no "0x" prefix and no zero padding.
40 my $highest_cp_string = sprintf "%X", $highest_cp;
# NOTE(review): interpolating the string into itself leaves its value
# unchanged; this looks like a leftover no-op -- confirm before removing.
41 $highest_cp_string = "$highest_cp_string";
# 'infinity' starts out as a copy of the highest code point's hex string; a
# leading 7, if present, is then turned into F.
43 my $infinity = $highest_cp_string;
44 $infinity =~ s/^7/F/; # Make infinity larger than the largest legal one, and
45 # at the time of this writing, we really internally
46 # allow UV_MAX to be infinity.
# get_compiled(PATTERN)
#
# Compiles PATTERN in a separate perl run with regex debugging enabled and
# post-processes the debug output into a platform-independent form.
#
# The ($) prototype imposes scalar context on the single argument.
# NOTE(review): the lines that initialise $pattern, close the blocks below and
# return the result are not visible in this portion of the file -- confirm
# against the full source before relying on details of the return value.
48 sub get_compiled ($) {
49 # Convert platform-independent values to what is suitable for the
# Expand the {INFTY} and {HIGHEST_CP} placeholders into \x{...} escapes built
# from the file-level hex strings $infinity and $highest_cp_string.
54 $pattern =~ s/{INFTY}/\\x{$infinity}/g;
55 $pattern =~ s/{HIGHEST_CP}/\\x{$highest_cp_string}/g;
# A literal '(?8)' marker is stripped from the pattern; whether it was present
# is remembered so that the generated program upgrades the string to UTF-8.
56 my $use_utf8 = ($pattern =~ s/\Q(?8)//);
# Build the source of a small program: put the pattern into $a as a
# single-quoted string, optionally utf8::upgrade() it, then compile it with
# qr//.
58 $pattern = "my \$a = '$pattern';";
59 $pattern .= "utf8::upgrade(\$a);" if $use_utf8;
60 $pattern .= "qr/\$a/";
# The program is run under 'use re qw(Debug COMPILE)'; the debug output it
# produces is what gets parsed further down.
61 my $actual_pattern = "use re qw(Debug COMPILE); $pattern";
# NOTE(review): fresh_perl() and fail() are not defined in the visible part of
# this file -- presumably test-harness helpers, with fresh_perl() running the
# code in a new perl process and returning its output; confirm.
63 my $result = fresh_perl($actual_pattern);
# A non-zero $? is recorded as a test failure, and the program is run a second
# time with the options { stderr => 0, verbose => 1 }.
64 if ($? != 0) { # Re-run so as to display STDERR.
65 fail($pattern, "Until this is fixed, the planned number of tests will be wrong");
66 fresh_perl($actual_pattern, { stderr => 0, verbose => 1 });
70 # The Debug output will come back as a bunch of lines. We are
71 # interested only in the line after /Final program/
72 my @lines = split /\n/, $result;
# Lines are shifted off the front of @lines until one matching /Final program/
# has been consumed (or @lines is exhausted).
73 while (defined ($_ = shift @lines)) {
74 last if /Final program/;
# NOTE(review): the condition guarding this die is not visible here.
79 die "Unexpected compilation result: '$result'\n"
80 . " Compiled from '$actual_pattern'";
# The substitutions below operate on $_.
83 s/ \s* \( \d+ \) \s* //x; # Get rid of the node branch
84 s/ ^ \s* \d+ : \s* //x; # ... And the node number
86 # Use platform-independent values
# Every occurrence of the platform's highest-code-point hex string is replaced,
# case-insensitively, by the literal text HIGHEST_CP.
88 s/$highest_cp_string/HIGHEST_CP/ig;
93 # Note: EXACTish lowercases the hex; ANYOF uppercases, without braces
96 '[\xe0\xc0]' => 'EXACTFU <\\x{e0}>',
97 '[\xe1\xc1]' => 'EXACTFU <\\x{e1}>',
98 '[\xe2\xc2]' => 'EXACTFU <\\x{e2}>',
99 '[\xe3\xc3]' => 'EXACTFU <\\x{e3}>',
100 '[\xe4\xc4]' => 'EXACTFU <\\x{e4}>',
101 '[\xc5\xe5]' => 'ANYOF[\\xC5\\xE5]',
102 '[\xe6\xc6]' => 'EXACTFU <\\x{e6}>',
103 '[\xe7\xc7]' => 'EXACTFU <\\x{e7}>',
104 '[\xe8\xc8]' => 'EXACTFU <\\x{e8}>',
105 '[\xe9\xc9]' => 'EXACTFU <\\x{e9}>',
106 '[\xea\xca]' => 'EXACTFU <\\x{ea}>',
107 '[\xeb\xcb]' => 'EXACTFU <\\x{eb}>',
108 '[\xec\xcc]' => 'EXACTFU <\\x{ec}>',
109 '[\xee\xce]' => 'EXACTFU <\\x{ee}>',
110 '[\xef\xcf]' => 'EXACTFU <\\x{ef}>',
111 '[\xf0\xd0]' => 'EXACTFU <\\x{f0}>',
112 '[\xf1\xd1]' => 'EXACTFU <\\x{f1}>',
113 '[\xf2\xd2]' => 'EXACTFU <\\x{f2}>',
114 '[\xf3\xd3]' => 'EXACTFU <\\x{f3}>',
115 '[\xf4\xd4]' => 'EXACTFU <\\x{f4}>',
116 '[\xf5\xd5]' => 'EXACTFU <\\x{f5}>',
117 '[\xf6\xd6]' => 'EXACTFU <\\x{f6}>',
118 '[\xf8\xd8]' => 'EXACTFU <\\x{f8}>',
119 '[\xf9\xd9]' => 'EXACTFU <\\x{f9}>',
120 '[\xfa\xda]' => 'EXACTFU <\\x{fa}>',
121 '[\xfb\xdb]' => 'EXACTFU <\\x{fb}>',
122 '[\xfc\xdc]' => 'EXACTFU <\\x{fc}>',
123 '[\xfd\xdd]' => 'EXACTFU <\\x{fd}>',
124 '[\xfe\xde]' => 'EXACTFU <\\x{fe}>',
126 '[[{]' => 'ANYOFM[\[\{]',
127 '[^\S ]' => 'ANYOFD[\t\n\x0B\f\r{utf8}\x85\xA0][1680 2000-200A 2028-2029 202F 205F 3000]',
128 '[^\n\r]' => 'ANYOF[^\n\r][0100-INFTY]',
129 '[^\/\|,\$\%%\@\ \%"\<\>\:\#\&\*\{\}\[\]\(\)]' => 'ANYOF[^ "#$%&()*,/:<>@\[\]\{|\}][0100-INFTY]',
130 '[[:ascii:]]' => 'ANYOFM[\x00-\x7F]',
131 '[[:^ascii:]]' => 'NANYOFM[\x00-\x7F]',
132 '[[:^ascii:]\x{2C2}]' => 'NANYOFM[\x00-\x7F]',
133 '(?u)[[:ascii:]]' => 'ANYOFM[\x00-\x7F]',
134 '(?u)[[:^ascii:]]' => 'NANYOFM[\x00-\x7F]',
135 '(?a)[[:ascii:]]' => 'ANYOFM[\x00-\x7F]',
136 '(?a)[[:^ascii:]]' => 'NANYOFM[\x00-\x7F]',
137 '(?a)[[:^ascii:]\x{2C2}]' => 'NANYOFM[\x00-\x7F]',
138 '[[:cntrl:]]' => 'POSIXD[:cntrl:]',
139 '[^[:^print:][:^ascii:]]' => 'POSIXA[:print:]',
140 '[[:blank:]]' => 'POSIXD[:blank:]',
141 '[ [:blank:]]' => 'POSIXD[:blank:]',
142 '[_[:blank:]]' => 'ANYOFD[\t _{utf8}\xA0][1680 2000-200A 202F 205F 3000]',
143 '[_[:^blank:]]' => 'NPOSIXD[:blank:]',
144 '[\xA0[:^blank:]]' => 'ANYOF[^\t ][0100-167F 1681-1FFF 200B-202E 2030-205E 2060-2FFF 3001-INFTY]',
145 '(?d:[_[:^blank:]])' => 'NPOSIXD[:blank:]',
146 '[\x{07}-\x{0B}]' => 'ANYOFR[\a\b\t\n\x0B]',
147 '(?l)[\x{2029}]' => 'EXACTL <\x{2029}>',
148 '(?l)(?[\x{2029}])' => 'ANYOFL{utf8-locale-reqd}[2029]', # regex sets requires utf8 locale for /l
149 '(?il)[\x{212A}]' => 'EXACTFL <\\x{212a}>',
150 '(?il)(?[\x{212A}])' => 'ANYOFL{utf8-locale-reqd}[Kk][212A]',
152 '(?i)b[s]\xe0' => 'ANYOFM[Bb]', # The s goes into a 2nd node
154 '[aA]' => 'ANYOFM[Aa]',
155 '[bB]' => 'ANYOFM[Bb]',
156 '[kK]' => 'ANYOFM[Kk]',
158 'ebcdic_ok_below_this_marker',
160 '(?i:[^:])' => 'NANYOFM[:]',
162 '[^\n]' => 'REG_ANY',
164 '[[:alpha:]]' => 'POSIXD[:alpha:]',
165 '[[:^alpha:]]' => 'NPOSIXD[:alpha:]',
166 '[[:^alpha:]\x{2C2}]' => 'NPOSIXU[:alpha:]',
167 '(?l)[[:alpha:]]' => 'POSIXL[:alpha:]',
168 '(?l)[[:^alpha:]]' => 'NPOSIXL[:alpha:]',
169 '(?l)[[:^alpha:]\x{2C2}]' => 'NPOSIXL[:alpha:]',
170 '(?u)[[:alpha:]]' => 'POSIXU[:alpha:]',
171 '(?u)[[:^alpha:]]' => 'NPOSIXU[:alpha:]',
172 '(?a)[[:alpha:]]' => 'POSIXA[:alpha:]',
173 '(?a)[[:^alpha:]]' => 'NPOSIXA[:alpha:]',
174 '(?a)[[:^alpha:]\x{2C2}]' => 'NPOSIXA[:alpha:]',
175 '[[:alpha:][:^alpha:]]' => 'SANY',
176 '[^[:alpha:][:^alpha:]]' => 'OPFAIL',
177 '(?l)[[:alpha:][:^alpha:]]' => 'SANY',
178 '(?l)[^[:alpha:][:^alpha:]]' => 'OPFAIL',
179 '(?u)[[:alpha:][:^alpha:]]' => 'SANY',
180 '(?u)[^[:alpha:][:^alpha:]]' => 'OPFAIL',
181 '(?a)[[:alpha:][:^alpha:]]' => 'SANY',
182 '(?a)[^[:alpha:][:^alpha:]]' => 'OPFAIL',
183 '[[:alnum:]]' => 'POSIXD[:alnum:]',
184 '[[:^alnum:]]' => 'NPOSIXD[:alnum:]',
185 '[[:^alnum:]\x{2C2}]' => 'NPOSIXU[:alnum:]',
186 '(?l)[[:alnum:]]' => 'POSIXL[:alnum:]',
187 '(?l)[[:^alnum:]]' => 'NPOSIXL[:alnum:]',
188 '(?l)[[:^alnum:]\x{2C2}]' => 'NPOSIXL[:alnum:]',
189 '(?u)[[:alnum:]]' => 'POSIXU[:alnum:]',
190 '(?u)[[:^alnum:]]' => 'NPOSIXU[:alnum:]',
191 '(?a)[[:alnum:]]' => 'POSIXA[:alnum:]',
192 '(?a)[[:^alnum:]]' => 'NPOSIXA[:alnum:]',
193 '(?a)[[:^alnum:]\x{2C2}]' => 'NPOSIXA[:alnum:]',
194 '[[:alnum:][:^alnum:]]' => 'SANY',
195 '[^[:alnum:][:^alnum:]]' => 'OPFAIL',
196 '(?l)[[:alnum:][:^alnum:]]' => 'SANY',
197 '(?l)[^[:alnum:][:^alnum:]]' => 'OPFAIL',
198 '(?u)[[:alnum:][:^alnum:]]' => 'SANY',
199 '(?u)[^[:alnum:][:^alnum:]]' => 'OPFAIL',
200 '(?a)[[:alnum:][:^alnum:]]' => 'SANY',
201 '(?a)[^[:alnum:][:^alnum:]]' => 'OPFAIL',
202 '(?l)[[:ascii:]]' => 'POSIXL[:ascii:]',
203 '(?l)[[:^ascii:]]' => 'NPOSIXL[:ascii:]',
204 '(?l)[[:^ascii:]\x{2C2}]' => 'NPOSIXL[:ascii:]',
205 '[[:ascii:][:^ascii:]]' => 'SANY',
206 '[^[:ascii:][:^ascii:]]' => 'OPFAIL',
207 '(?l)[[:ascii:][:^ascii:]]' => 'SANY',
208 '(?l)[^[:ascii:][:^ascii:]]' => 'OPFAIL',
209 '(?u)[[:ascii:][:^ascii:]]' => 'SANY',
210 '(?u)[^[:ascii:][:^ascii:]]' => 'OPFAIL',
211 '(?a)[[:ascii:][:^ascii:]]' => 'SANY',
212 '(?a)[^[:ascii:][:^ascii:]]' => 'OPFAIL',
213 '[[:^blank:]]' => 'NPOSIXD[:blank:]',
214 '[[:^blank:]\x{2C2}]' => 'NPOSIXU[:blank:]',
215 '(?l)[[:blank:]]' => 'POSIXL[:blank:]',
216 '(?l)[[:^blank:]]' => 'NPOSIXL[:blank:]',
217 '(?l)[[:^blank:]\x{2C2}]' => 'NPOSIXL[:blank:]',
218 '(?u)[[:blank:]]' => 'POSIXU[:blank:]',
219 '(?u)[[:^blank:]]' => 'NPOSIXU[:blank:]',
220 '(?a)[[:blank:]]' => 'POSIXA[:blank:]',
221 '(?a)[[:^blank:]]' => 'NPOSIXA[:blank:]',
222 '(?a)[[:^blank:]\x{2C2}]' => 'NPOSIXA[:blank:]',
223 '[[:blank:]]' => 'POSIXD[:blank:]',
224 '[[:blank:][:^blank:]]' => 'SANY',
225 '[^[:blank:][:^blank:]]' => 'OPFAIL',
226 '(?l)[[:blank:][:^blank:]]' => 'SANY',
227 '(?l)[^[:blank:][:^blank:]]' => 'OPFAIL',
228 '(?u)[[:blank:][:^blank:]]' => 'SANY',
229 '(?u)[^[:blank:][:^blank:]]' => 'OPFAIL',
230 '(?a)[[:blank:][:^blank:]]' => 'SANY',
231 '(?a)[^[:blank:][:^blank:]]' => 'OPFAIL',
232 '[[:^cntrl:]]' => 'NPOSIXD[:cntrl:]',
233 '[[:^cntrl:]\x{2C2}]' => 'NPOSIXU[:cntrl:]',
234 '(?l)[[:cntrl:]]' => 'POSIXL[:cntrl:]',
235 '(?l)[[:^cntrl:]]' => 'NPOSIXL[:cntrl:]',
236 '(?l)[[:^cntrl:]\x{2C2}]' => 'NPOSIXL[:cntrl:]',
237 '(?u)[[:cntrl:]]' => 'POSIXU[:cntrl:]',
238 '(?u)[[:^cntrl:]]' => 'NPOSIXU[:cntrl:]',
239 '(?a)[[:cntrl:]]' => 'POSIXA[:cntrl:]',
240 '(?a)[[:^cntrl:]]' => 'NPOSIXA[:cntrl:]',
241 '(?a)[[:^cntrl:]\x{2C2}]' => 'NPOSIXA[:cntrl:]',
242 '[[:cntrl:][:^cntrl:]]' => 'SANY',
243 '[^[:cntrl:][:^cntrl:]]' => 'OPFAIL',
244 '(?l)[[:cntrl:][:^cntrl:]]' => 'SANY',
245 '(?l)[^[:cntrl:][:^cntrl:]]' => 'OPFAIL',
246 '(?u)[[:cntrl:][:^cntrl:]]' => 'SANY',
247 '(?u)[^[:cntrl:][:^cntrl:]]' => 'OPFAIL',
248 '(?a)[[:cntrl:][:^cntrl:]]' => 'SANY',
249 '(?a)[^[:cntrl:][:^cntrl:]]' => 'OPFAIL',
250 '[[:digit:]]' => 'POSIXU[\d]',
251 '[[:^digit:]]' => 'NPOSIXU[\d]',
252 '[[:^digit:]\x{2C2}]' => 'NPOSIXU[\d]',
253 '(?l)[[:digit:]]' => 'POSIXL[\d]',
254 '(?l)[[:^digit:]]' => 'NPOSIXL[\d]',
255 '(?l)[[:^digit:]\x{2C2}]' => 'NPOSIXL[\d]',
256 '(?u)[[:digit:]]' => 'POSIXU[\d]',
257 '(?u)[[:^digit:]]' => 'NPOSIXU[\d]',
258 '(?a)[[:digit:]]' => 'POSIXA[\d]',
259 '(?a)[[:^digit:]]' => 'NPOSIXA[\d]',
260 '(?a)[[:^digit:]\x{2C2}]' => 'NPOSIXA[\d]',
261 '[[:digit:][:^digit:]]' => 'SANY',
262 '[^[:digit:][:^digit:]]' => 'OPFAIL',
263 '(?l)[[:digit:][:^digit:]]' => 'SANY',
264 '(?l)[^[:digit:][:^digit:]]' => 'OPFAIL',
265 '(?u)[[:digit:][:^digit:]]' => 'SANY',
266 '(?u)[^[:digit:][:^digit:]]' => 'OPFAIL',
267 '(?a)[[:digit:][:^digit:]]' => 'SANY',
268 '(?a)[^[:digit:][:^digit:]]' => 'OPFAIL',
269 '[[:graph:]]' => 'POSIXD[:graph:]',
270 '[[:^graph:]]' => 'NPOSIXD[:graph:]',
271 '[[:^graph:]\x{FFFF}]' => 'NPOSIXU[:graph:]',
272 '(?l)[[:graph:]]' => 'POSIXL[:graph:]',
273 '(?l)[[:^graph:]]' => 'NPOSIXL[:graph:]',
274 '(?l)[[:^graph:]\x{FFFF}]' => 'NPOSIXL[:graph:]',
275 '(?u)[[:graph:]]' => 'POSIXU[:graph:]',
276 '(?u)[[:^graph:]]' => 'NPOSIXU[:graph:]',
277 '(?a)[[:graph:]]' => 'POSIXA[:graph:]',
278 '(?a)[[:^graph:]]' => 'NPOSIXA[:graph:]',
279 '(?a)[[:^graph:]\x{FFFF}]' => 'NPOSIXA[:graph:]',
280 '[[:graph:][:^graph:]]' => 'SANY',
281 '[^[:graph:][:^graph:]]' => 'OPFAIL',
282 '(?l)[[:graph:][:^graph:]]' => 'SANY',
283 '(?l)[^[:graph:][:^graph:]]' => 'OPFAIL',
284 '(?u)[[:graph:][:^graph:]]' => 'SANY',
285 '(?u)[^[:graph:][:^graph:]]' => 'OPFAIL',
286 '(?a)[[:graph:][:^graph:]]' => 'SANY',
287 '(?a)[^[:graph:][:^graph:]]' => 'OPFAIL',
288 '[[:lower:]]' => 'POSIXD[:lower:]',
289 '[[:^lower:]]' => 'NPOSIXD[:lower:]',
290 '[[:^lower:]\x{2C2}]' => 'NPOSIXU[:lower:]',
291 '(?l)[[:lower:]]' => 'POSIXL[:lower:]',
292 '(?l)[[:^lower:]]' => 'NPOSIXL[:lower:]',
293 '(?l)[[:^lower:]\x{2C2}]' => 'NPOSIXL[:lower:]',
294 '(?u)[[:lower:]]' => 'POSIXU[:lower:]',
295 '(?u)[[:^lower:]]' => 'NPOSIXU[:lower:]',
296 '(?a)[[:lower:]]' => 'POSIXA[:lower:]',
297 '(?a)[[:^lower:]]' => 'NPOSIXA[:lower:]',
298 '(?a)[[:^lower:]\x{2C2}]' => 'NPOSIXA[:lower:]',
299 '[[:lower:][:^lower:]]' => 'SANY',
300 '[^[:lower:][:^lower:]]' => 'OPFAIL',
301 '(?l)[[:lower:][:^lower:]]' => 'SANY',
302 '(?l)[^[:lower:][:^lower:]]' => 'OPFAIL',
303 '(?u)[[:lower:][:^lower:]]' => 'SANY',
304 '(?u)[^[:lower:][:^lower:]]' => 'OPFAIL',
305 '(?a)[[:lower:][:^lower:]]' => 'SANY',
306 '(?a)[^[:lower:][:^lower:]]' => 'OPFAIL',
307 '[[:print:]]' => 'POSIXD[:print:]',
308 '[[:^print:]]' => 'NPOSIXD[:print:]',
309 '[[:^print:]\x{FFFF}]' => 'NPOSIXU[:print:]',
310 '(?l)[[:print:]]' => 'POSIXL[:print:]',
311 '(?l)[[:^print:]]' => 'NPOSIXL[:print:]',
312 '(?l)[[:^print:]\x{FFFF}]' => 'NPOSIXL[:print:]',
313 '(?u)[[:print:]]' => 'POSIXU[:print:]',
314 '(?u)[[:^print:]]' => 'NPOSIXU[:print:]',
315 '(?a)[[:print:]]' => 'POSIXA[:print:]',
316 '(?a)[[:^print:]]' => 'NPOSIXA[:print:]',
317 '(?a)[[:^print:]\x{FFFF}]' => 'NPOSIXA[:print:]',
318 '[[:print:][:^print:]]' => 'SANY',
319 '[^[:print:][:^print:]]' => 'OPFAIL',
320 '(?l)[[:print:][:^print:]]' => 'SANY',
321 '(?l)[^[:print:][:^print:]]' => 'OPFAIL',
322 '(?u)[[:print:][:^print:]]' => 'SANY',
323 '(?u)[^[:print:][:^print:]]' => 'OPFAIL',
324 '(?a)[[:print:][:^print:]]' => 'SANY',
325 '(?a)[^[:print:][:^print:]]' => 'OPFAIL',
326 '[[:punct:]]' => 'POSIXD[:punct:]',
327 '[[:^punct:]]' => 'NPOSIXD[:punct:]',
328 '[[:^punct:]\x{2C2}]' => 'NPOSIXU[:punct:]',
329 '(?l)[[:punct:]]' => 'POSIXL[:punct:]',
330 '(?l)[[:^punct:]]' => 'NPOSIXL[:punct:]',
331 '(?l)[[:^punct:]\x{2C2}]' => 'NPOSIXL[:punct:]',
332 '(?u)[[:punct:]]' => 'POSIXU[:punct:]',
333 '(?u)[[:^punct:]]' => 'NPOSIXU[:punct:]',
334 '(?a)[[:punct:]]' => 'POSIXA[:punct:]',
335 '(?a)[[:^punct:]]' => 'NPOSIXA[:punct:]',
336 '(?a)[[:^punct:]\x{2C2}]' => 'NPOSIXA[:punct:]',
337 '[[:punct:][:^punct:]]' => 'SANY',
338 '[^[:punct:][:^punct:]]' => 'OPFAIL',
339 '(?l)[[:punct:][:^punct:]]' => 'SANY',
340 '(?l)[^[:punct:][:^punct:]]' => 'OPFAIL',
341 '(?u)[[:punct:][:^punct:]]' => 'SANY',
342 '(?u)[^[:punct:][:^punct:]]' => 'OPFAIL',
343 '(?a)[[:punct:][:^punct:]]' => 'SANY',
344 '(?a)[^[:punct:][:^punct:]]' => 'OPFAIL',
345 '[[:space:]]' => 'POSIXD[\s]',
346 '[[:^space:]]' => 'NPOSIXD[\s]',
347 '[[:^space:]\x{2C2}]' => 'NPOSIXU[\s]',
348 '(?l)[[:space:]]' => 'POSIXL[\s]',
349 '(?l)[[:^space:]]' => 'NPOSIXL[\s]',
350 '(?l)[[:^space:]\x{2C2}]' => 'NPOSIXL[\s]',
351 '(?u)[[:space:]]' => 'POSIXU[\s]',
352 '(?u)[[:^space:]]' => 'NPOSIXU[\s]',
353 '(?a)[[:space:]]' => 'POSIXA[\s]',
354 '(?a)[[:^space:]]' => 'NPOSIXA[\s]',
355 '(?a)[[:^space:]\x{2C2}]' => 'NPOSIXA[\s]',
356 '[[:space:][:^space:]]' => 'SANY',
357 '[^[:space:][:^space:]]' => 'OPFAIL',
358 '(?l)[[:space:][:^space:]]' => 'SANY',
359 '(?l)[^[:space:][:^space:]]' => 'OPFAIL',
360 '(?u)[[:space:][:^space:]]' => 'SANY',
361 '(?u)[^[:space:][:^space:]]' => 'OPFAIL',
362 '(?a)[[:space:][:^space:]]' => 'SANY',
363 '(?a)[^[:space:][:^space:]]' => 'OPFAIL',
364 '[[:upper:]]' => 'POSIXD[:upper:]',
365 '[[:^upper:]]' => 'NPOSIXD[:upper:]',
366 '[[:^upper:]\x{2C2}]' => 'NPOSIXU[:upper:]',
367 '(?l)[[:upper:]]' => 'POSIXL[:upper:]',
368 '(?l)[[:^upper:]]' => 'NPOSIXL[:upper:]',
369 '(?l)[[:^upper:]\x{2C2}]' => 'NPOSIXL[:upper:]',
370 '(?u)[[:upper:]]' => 'POSIXU[:upper:]',
371 '(?u)[[:^upper:]]' => 'NPOSIXU[:upper:]',
372 '(?a)[[:upper:]]' => 'POSIXA[:upper:]',
373 '(?a)[[:^upper:]]' => 'NPOSIXA[:upper:]',
374 '(?a)[[:^upper:]\x{2C2}]' => 'NPOSIXA[:upper:]',
375 '[[:upper:][:^upper:]]' => 'SANY',
376 '[^[:upper:][:^upper:]]' => 'OPFAIL',
377 '(?l)[[:upper:][:^upper:]]' => 'SANY',
378 '(?l)[^[:upper:][:^upper:]]' => 'OPFAIL',
379 '(?u)[[:upper:][:^upper:]]' => 'SANY',
380 '(?u)[^[:upper:][:^upper:]]' => 'OPFAIL',
381 '(?a)[[:upper:][:^upper:]]' => 'SANY',
382 '(?a)[^[:upper:][:^upper:]]' => 'OPFAIL',
383 '[\v]' => 'POSIXU[\v]',
384 '[^\v]' => 'NPOSIXU[\v]',
385 '[\V\x{2C2}]' => 'NPOSIXU[\v]',
386 '(?l)[\v]' => 'POSIXU[\v]',
387 '(?l)[^\v]' => 'NPOSIXU[\v]',
388 '(?l)[\V\x{2C2}]' => 'NPOSIXU[\v]',
389 '(?u)[\v]' => 'POSIXU[\v]',
390 '(?u)[^\v]' => 'NPOSIXU[\v]',
391 '(?a)[\v]' => 'POSIXU[\v]',
392 '(?a)[^\v]' => 'NPOSIXU[\v]',
393 '(?a)[\V\x{2C2}]' => 'NPOSIXU[\v]',
395 '[^\v\V]' => 'OPFAIL',
396 '(?l)[\v\V]' => 'SANY',
397 '(?l)[^\v\V]' => 'OPFAIL',
398 '(?u)[\v\V]' => 'SANY',
399 '(?u)[^\v\V]' => 'OPFAIL',
400 '(?a)[\v\V]' => 'SANY',
401 '(?a)[^\v\V]' => 'OPFAIL',
402 '[[:word:]]' => 'POSIXD[\w]',
403 '[[:^word:]]' => 'NPOSIXD[\w]',
404 '[[:^word:]\x{2C2}]' => 'NPOSIXU[\w]',
405 '(?l)[[:word:]]' => 'POSIXL[\w]',
406 '(?l)[[:^word:]]' => 'NPOSIXL[\w]',
407 '(?l)[[:^word:]\x{2C2}]' => 'NPOSIXL[\w]',
408 '(?u)[[:word:]]' => 'POSIXU[\w]',
409 '(?u)[[:^word:]]' => 'NPOSIXU[\w]',
410 '(?a)[[:word:]]' => 'POSIXA[\w]',
411 '(?a)[[:^word:]]' => 'NPOSIXA[\w]',
412 '(?a)[[:^word:]\x{2C2}]' => 'NPOSIXA[\w]',
413 '[[:word:][:^word:]]' => 'SANY',
414 '[^[:word:][:^word:]]' => 'OPFAIL',
415 '(?l)[[:word:][:^word:]]' => 'SANY',
416 '(?l)[^[:word:][:^word:]]' => 'OPFAIL',
417 '(?u)[[:word:][:^word:]]' => 'SANY',
418 '(?u)[^[:word:][:^word:]]' => 'OPFAIL',
419 '(?a)[[:word:][:^word:]]' => 'SANY',
420 '(?a)[^[:word:][:^word:]]' => 'OPFAIL',
421 '[[:xdigit:]]' => 'POSIXU[:xdigit:]',
422 '[[:^xdigit:]]' => 'NPOSIXU[:xdigit:]',
423 '[[:^xdigit:]\x{2C2}]' => 'NPOSIXU[:xdigit:]',
424 '(?l)[[:xdigit:]]' => 'POSIXL[:xdigit:]',
425 '(?l)[[:^xdigit:]]' => 'NPOSIXL[:xdigit:]',
426 '(?l)[[:^xdigit:]\x{2C2}]' => 'NPOSIXL[:xdigit:]',
427 '(?u)[[:xdigit:]]' => 'POSIXU[:xdigit:]',
428 '(?u)[[:^xdigit:]]' => 'NPOSIXU[:xdigit:]',
429 '(?a)[[:xdigit:]]' => 'POSIXA[:xdigit:]',
430 '(?a)[[:^xdigit:]]' => 'NPOSIXA[:xdigit:]',
431 '(?a)[[:^xdigit:]\x{2C2}]' => 'NPOSIXA[:xdigit:]',
432 '[[:xdigit:][:^xdigit:]]' => 'SANY',
433 '[^[:xdigit:][:^xdigit:]]' => 'OPFAIL',
434 '(?l)[[:xdigit:][:^xdigit:]]' => 'SANY',
435 '(?l)[^[:xdigit:][:^xdigit:]]' => 'OPFAIL',
436 '(?u)[[:xdigit:][:^xdigit:]]' => 'SANY',
437 '(?u)[^[:xdigit:][:^xdigit:]]' => 'OPFAIL',
438 '(?a)[[:xdigit:][:^xdigit:]]' => 'SANY',
439 '(?a)[^[:xdigit:][:^xdigit:]]' => 'OPFAIL',
440 '(?i)[[:lower:]]' => 'POSIXD[:cased:]',
441 '(?i)[[:^lower:]]' => 'NPOSIXD[:cased:]',
442 '(?i)[[:^lower:]\x{2C2}]' => 'NPOSIXU[:cased:]',
443 '(?i)(?l)[[:lower:]]' => 'POSIXL[:cased:]',
444 '(?i)(?l)[[:^lower:]]' => 'NPOSIXL[:cased:]',
445 '(?i)(?l)[[:^lower:]\x{2C2}]' => 'NPOSIXL[:cased:]',
446 '(?i)(?u)[[:lower:]]' => 'POSIXU[:cased:]',
447 '(?i)(?u)[[:^lower:]]' => 'NPOSIXU[:cased:]',
448 '(?i)(?a)[[:lower:]]' => 'POSIXA[:alpha:]',
449 '(?i)(?a)[[:^lower:]]' => 'NPOSIXA[:alpha:]',
450 '(?i)(?a)[[:^lower:]\x{2C2}]' => 'NPOSIXA[:alpha:]',
451 '(?i)[[:upper:]]' => 'POSIXD[:cased:]',
452 '(?i)[[:^upper:]]' => 'NPOSIXD[:cased:]',
453 '(?i)[[:^upper:]\x{2C2}]' => 'NPOSIXU[:cased:]',
454 '(?i)(?l)[[:upper:]]' => 'POSIXL[:cased:]',
455 '(?i)(?l)[[:^upper:]]' => 'NPOSIXL[:cased:]',
456 '(?i)(?l)[[:^upper:]\x{2C2}]' => 'NPOSIXL[:cased:]',
457 '(?i)(?u)[[:upper:]]' => 'POSIXU[:cased:]',
458 '(?i)(?u)[[:^upper:]]' => 'NPOSIXU[:cased:]',
459 '(?i)(?a)[[:upper:]]' => 'POSIXA[:alpha:]',
460 '(?i)(?a)[[:^upper:]]' => 'NPOSIXA[:alpha:]',
461 '(?i)(?a)[[:^upper:]\x{2C2}]' => 'NPOSIXA[:alpha:]',
462 '(?i)[\d\w]' => 'POSIXD[\w]',
463 '(?i)[\D\w]' => 'SANY',
464 #'(?i)(?l)[\d\w]' => varies depending on Unicode release
465 '(?i)(?l)[\D\w]' => 'ANYOFPOSIXL{i}[\\w\\D][0100-INFTY]',
466 '(?i)(?u)[\d\w]' => 'POSIXU[\w]',
467 '(?i)(?u)[\D\w]' => 'SANY',
468 '(?i)(?a)[\d\w]' => 'POSIXA[\w]',
469 '(?i)(?a)[\D\w]' => 'SANY',
470 '(?l:[\x{212A}])' => 'EXACTL <\x{212a}>',
471 '(?l:[\s\x{212A}])' => 'ANYOFPOSIXL[\s][1680 2000-200A 2028-2029 202F 205F 212A 3000]',
472 '(?l:[^\S\x{202F}])' => 'ANYOFPOSIXL[^\\S][1680 2000-200A 2028-2029 205F 3000]',
473 '(?li:[a-z])' => (($::IS_ASCII)
474 ? 'ANYOFL{i}[a-z{utf8 locale}\x{017F}\x{212A}]'
475 : 'ANYOFL{i}[a-ij-rs-z{utf8 locale}\x{017F}\x{212A}]'),
477 '\P{All}' => 'OPFAIL',
478 '[\p{Any}]' => 'ANYOF[\x00-\xFF][0100-10FFFF]',
480 '[\p{IsMyRuntimeProperty}]' => 'ANYOF[+main::IsMyRuntimeProperty]',
481 '[^\p{IsMyRuntimeProperty}]' => 'ANYOF[^{+main::IsMyRuntimeProperty}]',
482 '[a\p{IsMyRuntimeProperty}]' => 'ANYOF[a][+main::IsMyRuntimeProperty]',
483 '[^a\p{IsMyRuntimeProperty}]' => 'ANYOF[^a{+main::IsMyRuntimeProperty}]',
484 '[^a\x{100}\p{IsMyRuntimeProperty}]' => 'ANYOF[^a{+main::IsMyRuntimeProperty}0100]',
485 '[^\p{All}\p{IsMyRuntimeProperty}]' => 'OPFAIL',
486 '[\p{All}\p{IsMyRuntimeProperty}]' => 'SANY',
488 '[\x{00}-{HIGHEST_CP}]' => 'ANYOF[\x00-\xFF][0100-HIGHEST_CP]',
489 '[\x{00}-{INFTY}]' => 'SANY',
490 '[\x{101}-{INFTY}]' => 'ANYOFH[0101-INFTY]',
491 '[\x{101}-{HIGHEST_CP}]' => 'ANYOFH[0101-HIGHEST_CP]',
492 '[\x{102}\x{104}]' => 'ANYOFHb[0102 0104]',
493 '[\x{102}-\x{104}{HIGHEST_CP}]' => 'ANYOFH[0102-0104 HIGHEST_CP]',
494 '[\x{102}-\x{104}\x{101}]' => 'ANYOFRb[0101-0104]',
495 '[\x{102}-\x{104}\x{101}-{INFTY}]' => 'ANYOFH[0101-INFTY]',
496 '[\x{102}-\x{104}\x{101}-{HIGHEST_CP}]' => 'ANYOFH[0101-HIGHEST_CP]',
497 '[\x{102}-\x{104}\x{102}]' => 'ANYOFRb[0102-0104]',
498 '[\x{102}-\x{104}\x{102}-{INFTY}]' => 'ANYOFH[0102-INFTY]',
499 '[\x{102}-\x{104}\x{102}-{HIGHEST_CP}]' => 'ANYOFH[0102-HIGHEST_CP]',
500 '[\x{102}-\x{104}\x{103}]' => 'ANYOFRb[0102-0104]',
501 '[\x{102}-\x{104}\x{103}-{INFTY}]' => 'ANYOFH[0102-INFTY]',
502 '[\x{102}-\x{104}\x{103}-{HIGHEST_CP}]' => 'ANYOFH[0102-HIGHEST_CP]',
503 '[\x{102}-\x{104}\x{104}]' => 'ANYOFRb[0102-0104]',
504 '[\x{102}-\x{104}\x{104}-{INFTY}]' => 'ANYOFH[0102-INFTY]',
505 '[\x{102}-\x{104}\x{104}-{HIGHEST_CP}]' => 'ANYOFH[0102-HIGHEST_CP]',
506 '[\x{102}-\x{104}\x{105}]' => 'ANYOFRb[0102-0105]',
507 '[\x{102}-\x{104}\x{105}-{INFTY}]' => 'ANYOFH[0102-INFTY]',
508 '[\x{102}-\x{104}\x{105}-{HIGHEST_CP}]' => 'ANYOFH[0102-HIGHEST_CP]',
509 '[\x{102}-\x{104}\x{106}]' => 'ANYOFHb[0102-0104 0106]',
510 '[\x{102}-\x{104}\x{106}-{INFTY}]' => 'ANYOFH[0102-0104 0106-INFTY]',
511 '[\x{102}-\x{104}\x{106}-{HIGHEST_CP}]' => 'ANYOFH[0102-0104 0106-HIGHEST_CP]',
512 '[\x{102}-\x{104}\x{108}-\x{10A}{HIGHEST_CP}]' => 'ANYOFH[0102-0104 0108-010A HIGHEST_CP]',
513 '[\x{102}-\x{104}\x{108}-\x{10A}\x{101}]' => 'ANYOFHb[0101-0104 0108-010A]',
514 '[\x{102}-\x{104}\x{108}-\x{10A}\x{101}-{INFTY}]' => 'ANYOFH[0101-INFTY]',
515 '[\x{102}-\x{104}\x{108}-\x{10A}\x{101}-{HIGHEST_CP}]' => 'ANYOFH[0101-HIGHEST_CP]',
516 '[\x{102}-\x{104}\x{108}-\x{10A}\x{101}-\x{102}]' => 'ANYOFHb[0101-0104 0108-010A]',
517 '[\x{102}-\x{104}\x{108}-\x{10A}\x{101}-\x{103}]' => 'ANYOFHb[0101-0104 0108-010A]',
518 '[\x{102}-\x{104}\x{108}-\x{10A}\x{101}-\x{104}]' => 'ANYOFHb[0101-0104 0108-010A]',
519 '[\x{102}-\x{104}\x{108}-\x{10A}\x{101}-\x{105}]' => 'ANYOFHb[0101-0105 0108-010A]',
520 '[\x{102}-\x{104}\x{108}-\x{10A}\x{101}-\x{106}]' => 'ANYOFHb[0101-0106 0108-010A]',
521 '[\x{102}-\x{104}\x{108}-\x{10A}\x{101}-\x{107}]' => 'ANYOFRb[0101-010A]',
522 '[\x{102}-\x{104}\x{108}-\x{10A}\x{101}-\x{108}]' => 'ANYOFRb[0101-010A]',
523 '[\x{102}-\x{104}\x{108}-\x{10A}\x{101}-\x{109}]' => 'ANYOFRb[0101-010A]',
524 '[\x{102}-\x{104}\x{108}-\x{10A}\x{101}-\x{10A}]' => 'ANYOFRb[0101-010A]',
525 '[\x{102}-\x{104}\x{108}-\x{10A}\x{101}-\x{10B}]' => 'ANYOFRb[0101-010B]',
526 '[\x{102}-\x{104}\x{108}-\x{10A}\x{102}]' => 'ANYOFHb[0102-0104 0108-010A]',
527 '[\x{102}-\x{104}\x{108}-\x{10A}\x{102}-{INFTY}]' => 'ANYOFH[0102-INFTY]',
528 '[\x{102}-\x{104}\x{108}-\x{10A}\x{102}-{HIGHEST_CP}]' => 'ANYOFH[0102-HIGHEST_CP]',
529 '[\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{102}]' => 'ANYOFHb[0102-0104 0108-010A]',
530 '[\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{103}]' => 'ANYOFHb[0102-0104 0108-010A]',
531 '[\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{104}]' => 'ANYOFHb[0102-0104 0108-010A]',
532 '[\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{105}]' => 'ANYOFHb[0102-0105 0108-010A]',
533 '[\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{106}]' => 'ANYOFHb[0102-0106 0108-010A]',
534 '[\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{107}]' => 'ANYOFRb[0102-010A]',
535 '[\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{108}]' => 'ANYOFRb[0102-010A]',
536 '[\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{109}]' => 'ANYOFRb[0102-010A]',
537 '[\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{10A}]' => 'ANYOFRb[0102-010A]',
538 '[\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{10B}]' => 'ANYOFRb[0102-010B]',
539 '[\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{10C}]' => 'ANYOFRb[0102-010C]',
540 '[\x{102}-\x{104}\x{108}-\x{10A}\x{103}]' => 'ANYOFHb[0102-0104 0108-010A]',
541 '[\x{102}-\x{104}\x{108}-\x{10A}\x{103}-{INFTY}]' => 'ANYOFH[0102-INFTY]',
542 '[\x{102}-\x{104}\x{108}-\x{10A}\x{103}-{HIGHEST_CP}]' => 'ANYOFH[0102-HIGHEST_CP]',
543 '[\x{102}-\x{104}\x{108}-\x{10A}\x{103}-\x{104}]' => 'ANYOFHb[0102-0104 0108-010A]',
544 '[\x{102}-\x{104}\x{108}-\x{10A}\x{103}-\x{105}]' => 'ANYOFHb[0102-0105 0108-010A]',
545 '[\x{102}-\x{104}\x{108}-\x{10A}\x{103}-\x{106}]' => 'ANYOFHb[0102-0106 0108-010A]',
546 '[\x{102}-\x{104}\x{108}-\x{10A}\x{103}-\x{107}]' => 'ANYOFRb[0102-010A]',
547 '[\x{102}-\x{104}\x{108}-\x{10A}\x{103}-\x{108}]' => 'ANYOFRb[0102-010A]',
548 '[\x{102}-\x{104}\x{108}-\x{10A}\x{103}-\x{109}]' => 'ANYOFRb[0102-010A]',
549 '[\x{102}-\x{104}\x{108}-\x{10A}\x{103}-\x{10A}]' => 'ANYOFRb[0102-010A]',
550 '[\x{102}-\x{104}\x{108}-\x{10A}\x{103}-\x{10B}]' => 'ANYOFRb[0102-010B]',
551 '[\x{102}-\x{104}\x{108}-\x{10A}\x{103}-\x{10C}]' => 'ANYOFRb[0102-010C]',
552 '[\x{102}-\x{104}\x{108}-\x{10A}\x{104}]' => 'ANYOFHb[0102-0104 0108-010A]',
553 '[\x{102}-\x{104}\x{108}-\x{10A}\x{104}-{INFTY}]' => 'ANYOFH[0102-INFTY]',
554 '[\x{102}-\x{104}\x{108}-\x{10A}\x{104}-{HIGHEST_CP}]' => 'ANYOFH[0102-HIGHEST_CP]',
555 '[\x{102}-\x{104}\x{108}-\x{10A}\x{104}-\x{105}]' => 'ANYOFHb[0102-0105 0108-010A]',
556 '[\x{102}-\x{104}\x{108}-\x{10A}\x{104}-\x{106}]' => 'ANYOFHb[0102-0106 0108-010A]',
557 '[\x{102}-\x{104}\x{108}-\x{10A}\x{104}-\x{107}]' => 'ANYOFRb[0102-010A]',
558 '[\x{102}-\x{104}\x{108}-\x{10A}\x{104}-\x{108}]' => 'ANYOFRb[0102-010A]',
559 '[\x{102}-\x{104}\x{108}-\x{10A}\x{104}-\x{109}]' => 'ANYOFRb[0102-010A]',
560 '[\x{102}-\x{104}\x{108}-\x{10A}\x{104}-\x{10A}]' => 'ANYOFRb[0102-010A]',
561 '[\x{102}-\x{104}\x{108}-\x{10A}\x{104}-\x{10B}]' => 'ANYOFRb[0102-010B]',
562 '[\x{102}-\x{104}\x{108}-\x{10A}\x{104}-\x{10C}]' => 'ANYOFRb[0102-010C]',
563 '[\x{102}-\x{104}\x{108}-\x{10A}\x{105}]' => 'ANYOFHb[0102-0105 0108-010A]',
564 '[\x{102}-\x{104}\x{108}-\x{10A}\x{105}-{INFTY}]' => 'ANYOFH[0102-INFTY]',
565 '[\x{102}-\x{104}\x{108}-\x{10A}\x{105}-{HIGHEST_CP}]' => 'ANYOFH[0102-HIGHEST_CP]',
566 '[\x{102}-\x{104}\x{108}-\x{10A}\x{105}-\x{106}]' => 'ANYOFHb[0102-0106 0108-010A]',
567 '[\x{102}-\x{104}\x{108}-\x{10A}\x{105}-\x{107}]' => 'ANYOFRb[0102-010A]',
568 '[\x{102}-\x{104}\x{108}-\x{10A}\x{105}-\x{108}]' => 'ANYOFRb[0102-010A]',
569 '[\x{102}-\x{104}\x{108}-\x{10A}\x{105}-\x{109}]' => 'ANYOFRb[0102-010A]',
570 '[\x{102}-\x{104}\x{108}-\x{10A}\x{105}-\x{10A}]' => 'ANYOFRb[0102-010A]',
571 '[\x{102}-\x{104}\x{108}-\x{10A}\x{105}-\x{10B}]' => 'ANYOFRb[0102-010B]',
572 '[\x{102}-\x{104}\x{108}-\x{10A}\x{105}-\x{10C}]' => 'ANYOFRb[0102-010C]',
573 '[\x{102}-\x{104}\x{108}-\x{10A}\x{106}]' => 'ANYOFHb[0102-0104 0106 0108-010A]',
574 '[\x{102}-\x{104}\x{108}-\x{10A}\x{106}-{INFTY}]' => 'ANYOFH[0102-0104 0106-INFTY]',
575 '[\x{102}-\x{104}\x{108}-\x{10A}\x{106}-{HIGHEST_CP}]' => 'ANYOFH[0102-0104 0106-HIGHEST_CP]',
576 '[\x{102}-\x{104}\x{108}-\x{10A}\x{106}-\x{107}]' => 'ANYOFHb[0102-0104 0106-010A]',
577 '[\x{102}-\x{104}\x{108}-\x{10A}\x{106}-\x{108}]' => 'ANYOFHb[0102-0104 0106-010A]',
578 '[\x{102}-\x{104}\x{108}-\x{10A}\x{106}-\x{109}]' => 'ANYOFHb[0102-0104 0106-010A]',
579 '[\x{102}-\x{104}\x{108}-\x{10A}\x{106}-\x{10A}]' => 'ANYOFHb[0102-0104 0106-010A]',
580 '[\x{102}-\x{104}\x{108}-\x{10A}\x{106}-\x{10B}]' => 'ANYOFHb[0102-0104 0106-010B]',
581 '[\x{102}-\x{104}\x{108}-\x{10A}\x{106}-\x{10C}]' => 'ANYOFHb[0102-0104 0106-010C]',
582 '[\x{102}-\x{104}\x{108}-\x{10A}\x{107}]' => 'ANYOFHb[0102-0104 0107-010A]',
583 '[\x{102}-\x{104}\x{108}-\x{10A}\x{108}]' => 'ANYOFHb[0102-0104 0108-010A]',
584 '[\x{102}-\x{104}\x{108}-\x{10A}\x{109}]' => 'ANYOFHb[0102-0104 0108-010A]',
585 '[\x{102}-\x{104}\x{108}-\x{10A}\x{10A}]' => 'ANYOFHb[0102-0104 0108-010A]',
586 '[\x{102}-\x{104}\x{108}-\x{10A}\x{10B}]' => 'ANYOFHb[0102-0104 0108-010B]',
587 '[\x{103}\x{102}]' => 'EXACTFU_REQ8 <\x{103}>',
588 '[\x{104}\x{102}]' => 'ANYOFHb[0102 0104]',
589 '[\x{104}\x{102}\x{103}]' => 'ANYOFRb[0102-0104]',
590 '[\x{106}-{INFTY}\x{104}]' => 'ANYOFH[0104 0106-INFTY]',
591 '[\x{106}-{INFTY}\x{104}-{INFTY}]' => 'ANYOFH[0104-INFTY]',
592 '[\x{106}-{INFTY}\x{104}-{HIGHEST_CP}]' => 'ANYOFH[0104-INFTY]',
593 '[\x{106}-{INFTY}\x{104}-\x{105}]' => 'ANYOFH[0104-INFTY]',
594 '[\x{106}-{INFTY}\x{104}-\x{106}]' => 'ANYOFH[0104-INFTY]',
595 '[\x{106}-{INFTY}\x{104}-\x{107}]' => 'ANYOFH[0104-INFTY]',
596 '[\x{106}-{INFTY}\x{105}]' => 'ANYOFH[0105-INFTY]',
597 '[\x{106}-{INFTY}\x{105}-{INFTY}]' => 'ANYOFH[0105-INFTY]',
598 '[\x{106}-{INFTY}\x{105}-{HIGHEST_CP}]' => 'ANYOFH[0105-INFTY]',
599 '[\x{106}-{INFTY}\x{105}-\x{106}]' => 'ANYOFH[0105-INFTY]',
600 '[\x{106}-{INFTY}\x{105}-\x{107}]' => 'ANYOFH[0105-INFTY]',
601 '[\x{106}-{INFTY}\x{106}]' => 'ANYOFH[0106-INFTY]',
602 '[\x{106}-{INFTY}\x{106}-{INFTY}]' => 'ANYOFH[0106-INFTY]',
603 '[\x{106}-{INFTY}\x{106}-{HIGHEST_CP}]' => 'ANYOFH[0106-INFTY]',
604 '[\x{106}-{INFTY}\x{106}-\x{107}]' => 'ANYOFH[0106-INFTY]',
605 '[\x{106}-{INFTY}\x{107}]' => 'ANYOFH[0106-INFTY]',
606 '[\x{106}-{INFTY}\x{107}-{INFTY}]' => 'ANYOFH[0106-INFTY]',
607 '[\x{106}-{INFTY}\x{107}-{HIGHEST_CP}]' => 'ANYOFH[0106-INFTY]',
608 '[\x{106}-{INFTY}\x{107}-\x{107}]' => 'ANYOFH[0106-INFTY]',
609 '[\x{10C}-{INFTY}{HIGHEST_CP}]' => 'ANYOFH[010C-INFTY]',
610 '[\x{10C}-{INFTY}\x{00}-{HIGHEST_CP}]' => 'SANY',
611 '[\x{10C}-{INFTY}\x{00}-{INFTY}]' => 'SANY',
612 '[\x{10C}-{INFTY}\x{101}-{INFTY}]' => 'ANYOFH[0101-INFTY]',
613 '[\x{10C}-{INFTY}\x{101}-{HIGHEST_CP}]' => 'ANYOFH[0101-INFTY]',
614 '[\x{10C}-{INFTY}\x{102}\x{104}]' => 'ANYOFH[0102 0104 010C-INFTY]',
615 '[\x{10C}-{INFTY}\x{102}-\x{104}{HIGHEST_CP}]' => 'ANYOFH[0102-0104 010C-INFTY]',
616 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{100}]' => 'ANYOFH[0100 0102-0104 010C-INFTY]',
617 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{101}]' => 'ANYOFH[0101-0104 010C-INFTY]',
618 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{101}-{INFTY}]' => 'ANYOFH[0101-INFTY]',
619 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{101}-{HIGHEST_CP}]' => 'ANYOFH[0101-INFTY]',
620 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{102}]' => 'ANYOFH[0102-0104 010C-INFTY]',
621 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{102}-{INFTY}]' => 'ANYOFH[0102-INFTY]',
622 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{102}-{HIGHEST_CP}]' => 'ANYOFH[0102-INFTY]',
623 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{103}]' => 'ANYOFH[0102-0104 010C-INFTY]',
624 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{103}-{INFTY}]' => 'ANYOFH[0102-INFTY]',
625 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{103}-{HIGHEST_CP}]' => 'ANYOFH[0102-INFTY]',
626 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{104}]' => 'ANYOFH[0102-0104 010C-INFTY]',
627 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{104}-{INFTY}]' => 'ANYOFH[0102-INFTY]',
628 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{104}-{HIGHEST_CP}]' => 'ANYOFH[0102-INFTY]',
629 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{105}]' => 'ANYOFH[0102-0105 010C-INFTY]',
630 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{105}-{INFTY}]' => 'ANYOFH[0102-INFTY]',
631 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{105}-{HIGHEST_CP}]' => 'ANYOFH[0102-INFTY]',
632 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{106}]' => 'ANYOFH[0102-0104 0106 010C-INFTY]',
633 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{106}-{INFTY}]' => 'ANYOFH[0102-0104 0106-INFTY]',
634 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{106}-{HIGHEST_CP}]' => 'ANYOFH[0102-0104 0106-INFTY]',
635 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}{HIGHEST_CP}]' => 'ANYOFH[0102-0104 0108-010A 010C-INFTY]',
636 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{101}]' => 'ANYOFH[0101-0104 0108-010A 010C-INFTY]',
637 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{101}-{INFTY}]' => 'ANYOFH[0101-INFTY]',
638 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{101}-{HIGHEST_CP}]' => 'ANYOFH[0101-INFTY]',
639 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{101}-\x{102}]' => 'ANYOFH[0101-0104 0108-010A 010C-INFTY]',
640 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{101}-\x{103}]' => 'ANYOFH[0101-0104 0108-010A 010C-INFTY]',
641 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{101}-\x{104}]' => 'ANYOFH[0101-0104 0108-010A 010C-INFTY]',
642 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{101}-\x{105}]' => 'ANYOFH[0101-0105 0108-010A 010C-INFTY]',
643 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{101}-\x{106}]' => 'ANYOFH[0101-0106 0108-010A 010C-INFTY]',
644 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{101}-\x{107}]' => 'ANYOFH[0101-010A 010C-INFTY]',
645 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{101}-\x{108}]' => 'ANYOFH[0101-010A 010C-INFTY]',
646 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{101}-\x{109}]' => 'ANYOFH[0101-010A 010C-INFTY]',
647 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{101}-\x{10A}]' => 'ANYOFH[0101-010A 010C-INFTY]',
648 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{101}-\x{10B}]' => 'ANYOFH[0101-INFTY]',
649 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{102}]' => 'ANYOFH[0102-0104 0108-010A 010C-INFTY]',
650 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{102}-{INFTY}]' => 'ANYOFH[0102-INFTY]',
651 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{102}-{HIGHEST_CP}]' => 'ANYOFH[0102-INFTY]',
652 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{102}]' => 'ANYOFH[0102-0104 0108-010A 010C-INFTY]',
653 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{103}]' => 'ANYOFH[0102-0104 0108-010A 010C-INFTY]',
654 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{104}]' => 'ANYOFH[0102-0104 0108-010A 010C-INFTY]',
655 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{105}]' => 'ANYOFH[0102-0105 0108-010A 010C-INFTY]',
656 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{106}]' => 'ANYOFH[0102-0106 0108-010A 010C-INFTY]',
657 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{107}]' => 'ANYOFH[0102-010A 010C-INFTY]',
658 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{108}]' => 'ANYOFH[0102-010A 010C-INFTY]',
659 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{109}]' => 'ANYOFH[0102-010A 010C-INFTY]',
660 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{10A}]' => 'ANYOFH[0102-010A 010C-INFTY]',
661 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{10B}]' => 'ANYOFH[0102-INFTY]',
662 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{102}-\x{10C}]' => 'ANYOFH[0102-INFTY]',
663 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{103}]' => 'ANYOFH[0102-0104 0108-010A 010C-INFTY]',
664 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{103}-{INFTY}]' => 'ANYOFH[0102-INFTY]',
665 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{103}-{HIGHEST_CP}]' => 'ANYOFH[0102-INFTY]',
666 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{103}-\x{104}]' => 'ANYOFH[0102-0104 0108-010A 010C-INFTY]',
667 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{103}-\x{105}]' => 'ANYOFH[0102-0105 0108-010A 010C-INFTY]',
668 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{103}-\x{106}]' => 'ANYOFH[0102-0106 0108-010A 010C-INFTY]',
669 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{103}-\x{107}]' => 'ANYOFH[0102-010A 010C-INFTY]',
670 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{103}-\x{108}]' => 'ANYOFH[0102-010A 010C-INFTY]',
671 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{103}-\x{109}]' => 'ANYOFH[0102-010A 010C-INFTY]',
672 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{103}-\x{10A}]' => 'ANYOFH[0102-010A 010C-INFTY]',
673 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{103}-\x{10B}]' => 'ANYOFH[0102-INFTY]',
674 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{103}-\x{10C}]' => 'ANYOFH[0102-INFTY]',
675 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{104}]' => 'ANYOFH[0102-0104 0108-010A 010C-INFTY]',
676 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{104}-{INFTY}]' => 'ANYOFH[0102-INFTY]',
677 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{104}-{HIGHEST_CP}]' => 'ANYOFH[0102-INFTY]',
678 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{104}-\x{105}]' => 'ANYOFH[0102-0105 0108-010A 010C-INFTY]',
679 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{104}-\x{106}]' => 'ANYOFH[0102-0106 0108-010A 010C-INFTY]',
680 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{104}-\x{107}]' => 'ANYOFH[0102-010A 010C-INFTY]',
681 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{104}-\x{108}]' => 'ANYOFH[0102-010A 010C-INFTY]',
682 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{104}-\x{109}]' => 'ANYOFH[0102-010A 010C-INFTY]',
683 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{104}-\x{10A}]' => 'ANYOFH[0102-010A 010C-INFTY]',
684 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{104}-\x{10B}]' => 'ANYOFH[0102-INFTY]',
685 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{104}-\x{10C}]' => 'ANYOFH[0102-INFTY]',
686 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{105}]' => 'ANYOFH[0102-0105 0108-010A 010C-INFTY]',
687 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{105}-{INFTY}]' => 'ANYOFH[0102-INFTY]',
688 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{105}-{HIGHEST_CP}]' => 'ANYOFH[0102-INFTY]',
689 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{105}-\x{106}]' => 'ANYOFH[0102-0106 0108-010A 010C-INFTY]',
690 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{105}-\x{107}]' => 'ANYOFH[0102-010A 010C-INFTY]',
691 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{105}-\x{108}]' => 'ANYOFH[0102-010A 010C-INFTY]',
692 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{105}-\x{109}]' => 'ANYOFH[0102-010A 010C-INFTY]',
693 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{105}-\x{10A}]' => 'ANYOFH[0102-010A 010C-INFTY]',
694 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{105}-\x{10B}]' => 'ANYOFH[0102-INFTY]',
695 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{105}-\x{10C}]' => 'ANYOFH[0102-INFTY]',
696 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{106}]' => 'ANYOFH[0102-0104 0106 0108-010A 010C-INFTY]',
697 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{106}-{INFTY}]' => 'ANYOFH[0102-0104 0106-INFTY]',
698 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{106}-{HIGHEST_CP}]' => 'ANYOFH[0102-0104 0106-INFTY]',
699 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{106}-\x{107}]' => 'ANYOFH[0102-0104 0106-010A 010C-INFTY]',
700 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{106}-\x{108}]' => 'ANYOFH[0102-0104 0106-010A 010C-INFTY]',
701 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{106}-\x{109}]' => 'ANYOFH[0102-0104 0106-010A 010C-INFTY]',
702 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{106}-\x{10A}]' => 'ANYOFH[0102-0104 0106-010A 010C-INFTY]',
703 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{106}-\x{10B}]' => 'ANYOFH[0102-0104 0106-INFTY]',
704 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{106}-\x{10C}]' => 'ANYOFH[0102-0104 0106-INFTY]',
705 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{107}]' => 'ANYOFH[0102-0104 0107-010A 010C-INFTY]',
706 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{108}]' => 'ANYOFH[0102-0104 0108-010A 010C-INFTY]',
707 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{109}]' => 'ANYOFH[0102-0104 0108-010A 010C-INFTY]',
708 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{10A}]' => 'ANYOFH[0102-0104 0108-010A 010C-INFTY]',
709 '[\x{10C}-{INFTY}\x{102}-\x{104}\x{108}-\x{10A}\x{10B}]' => 'ANYOFH[0102-0104 0108-INFTY]',
710 '[\x{10C}-{INFTY}\x{103}\x{102}]' => 'ANYOFH[0102-0103 010C-INFTY]',
711 '[\x{10C}-{INFTY}\x{104}\x{102}]' => 'ANYOFH[0102 0104 010C-INFTY]',
712 '[\x{10C}-{INFTY}\x{104}\x{102}\x{103}]' => 'ANYOFH[0102-0104 010C-INFTY]',
713 '[{HIGHEST_CP}]' => 'EXACT_REQ8 <\x{HIGHEST_CP}>',
715 '(?8)(?i)[\x{410}]' => 'EXACTFU_REQ8 <\x{430}>',
716 '(?8)(?i)[\x{399}]' => 'EXACTFU_REQ8 <\x{3b9}>',
717 '(?8)(?i)[\x{345}\x{399}\x{3B9}\x{1FBE}]' => 'EXACTFU_REQ8 <\x{3b9}>',
718 '(?i)[\x{2b9}]' => 'EXACT_REQ8 <\x{2b9}>', # Doesn't participate in a fold
719 '(?8)(?i)[\x{2b9}]' => 'EXACT_REQ8 <\x{2b9}>',
720 '(?i)[\x{2bc}]' => 'EXACTFU_REQ8 <\x{2bc}>', # Part of a multi-char fold, ASCII component
721 '(?i)[\x{390}]' => 'EXACTFU_REQ8 <\x{3b9}\x{308}\x{301}>', # Part of a multi-char fold, no ASCII component
723 '(?i)[\x{1E9E}]' => 'EXACTFU <ss>',
724 '(?iaa)[\x{1E9E}]' => 'EXACTFAA <\x{17f}\x{17f}>',
725 '(?i)[\x{FB00}]' => 'EXACTFU <ff>',
726 '(?iaa)[\x{FB00}]' => 'EXACT_REQ8 <\x{fb00}>',
727 '(?i)[\x{FB00}]' => 'EXACTFU <ff>',
728 '(?i)[\x{FB01}]' => 'EXACTFU <fi>',
729 '(?i)[\x{FB02}]' => 'EXACTFU <fl>',
730 '(?i)[\x{FB03}]' => 'EXACTFU <ffi>',
731 '(?i)[\x{FB04}]' => 'EXACTFU <ffl>',
732 '(?i)[\x{FB05}]' => 'EXACTFU <st>',
733 '(?i)[\x{FB06}]' => 'EXACTFU <st>',
735 '[a][b]' => 'EXACT <ab>',
736 '[a]\x{100}' => 'EXACT_REQ8 <a\x{100}>',
737 '(?8)[\x{100}]a' => 'EXACT_REQ8 <\x{100}a>',
738 '(?i)[b][c]' => 'EXACTFU <bc>',
739 '(?i)[b]\x{100}' => 'EXACTFU_REQ8 <b\x{101}>',
740 '(?8)(?i)[\x{100}]b' => 'EXACTFU_REQ8 <\x{101}b>',
741 '(?i)b[s]' => 'EXACTFU <bs>',
742 '(?i)b[s]c' => 'EXACTFU <bsc>',
743 '(?i)bs[s]c' => 'EXACTF <bss>', # The c goes into a 2nd node
744 '(?iu)bs[s]c' => 'EXACTFUP <bssc>',
745 '(?i)b[s]sc' => 'EXACTF <bssc>',
746 '(?iu)b[s]sc' => 'EXACTFUP <bssc>',
747 '(?i)[b]st' => 'EXACTFU <bst>',
748 '(?i)[b]st[s]' => 'EXACTFU <bsts>',
749 '(?i)[b]st[s]st' => 'EXACTF <bstsst>',
750 '(?iu)[b]st[s]st' => 'EXACTFUP <bstsst>',
751 '(?i)[s][s]' => 'EXACTF <ss>',
752 '(?iu)[s][s]' => 'EXACTFUP <ss>',
# Characters that are each tested as the sole member of a bracketed character
# class.  The loop over this list wraps every entry as [\x{...}] under the
# various fold/charset modifier combinations.  The trailing comments say why
# each character was chosen.
755 my @single_chars_to_test =
757 "\x00", # NUL; always potentially problematic
758 "\x01", # Unnamed control
759 "\b", # Named control (backspace in a double-quoted string)
760 "\n", # Potentially special
761 "\r", # Potentially special
762 "\cK", # Control-K; potentially special
764 ":", # Not in any fold
765 "A", # ASCII capital, participates in multi-char fold
766 "a", # ASCII small, participates in multi-char fold
767 "B", # ASCII capital, participates only in case-pair fold
768 "b", # ASCII small, participates only in case-pair fold
769 "K", # ASCII capital, folded to from above Latin1
770 "k", # ASCII small, folded to from above Latin1
771 "\c?", # Potentially special
772 "\x80", # Latin1 control
773 "\xB5", # Micro sign, folds to above Latin1
774 "\xC0", # Latin1 capital, participates only in case-pair fold
775 "\xE0", # Latin1 small, participates only in case-pair fold
776 "\xC5", # Latin1 capital, folded to from above Latin1
777 "\xE5", # Latin1 small, folded to from above Latin1
778 "\xDF", # Small sharp S; folds to 'ss'
779 "\xF7", # Doesn't participate in any fold
780 "\xFF", # Folded to by above Latin1
781 "\x{100}", # First few above Latin1 characters
# Generate the pattern/expected-result pairs for every character in
# @single_chars_to_test, appending them to @single_tests in the same
# alternating (pattern, expected) layout that @tests uses.
794 for my $char (@single_chars_to_test) {
# Hex and octal spellings of the character's code point.
# NOTE(review): $cp is assigned on a line not shown here; presumably
# ord($char) -- confirm.
796 my $hex = sprintf "%02x", $cp;
797 my $oct = sprintf "%o", $cp;
# Apply Unicode rules to uc/lc below.
804 use feature 'unicode_strings';
# The character counts as cased if either uc or lc changes it.
805 $cased = uc $char ne $char || lc $char ne $char;
# For a cased character, record the hex of its lowercase form.
# NOTE(review): the alternative arm of this conditional is not shown here.
806 $folded_hex = ($cased)
807 ? sprintf("%02x", ord lc $char)
809 #print STDERR "$hex, $folded_hex\n";
# Try every combination of case-insensitivity (none or /i) ...
812 for my $fold ("", "i") {
# ... and character-set modifier (none, /u, /l, /aa).
814 for my $charset ("", "u", "l", "aa") {
815 #next if $charset eq "aa" && ! $fold;
# Assemble the inline modifier group, e.g. "(?iu)".  It stays empty when
# neither a fold nor a charset modifier is in effect.
817 my $modifiers = $fold . $charset;
818 $modifiers = "(?$modifiers)" if $modifiers;
# Test each pattern both as-is and prefixed with "(?8)", the marker this
# file uses to have the pattern upgraded to UTF-8.
820 for my $upgrade ("", "(?8)") {
# The pattern under test: a bracketed class whose only member is the
# character, spelled as \x{hex}.
821 push @single_tests, "$upgrade$modifiers\[\\x{$hex}\]";
# For code points below 256, or when upgrading, the expected result is
# whatever the same character compiles to outside a bracketed class.
822 if ($cp < 256 || $upgrade) {
823 push @single_tests, get_compiled("$upgrade$modifiers\\x{$hex}");
# Collect the distinct code points (as upper-case hex keys) among the
# character itself and the first characters of its fc, lc and uc forms.
# NOTE(review): presumably this is the alternative to the branch above;
# the intervening lines are not shown -- confirm.
828 my %list = ( sprintf("%X", $cp) => 1 );
830 for my $op (qw(fc lc uc)) {
# String eval so the operator named in $op can be applied to the character.
831 my $result = eval "$op(\"$char\")";
832 $list{sprintf "%X", ord $result} = 1;
# Without /i, or when the character has no distinct case variants (a single
# key in %list), the node type is chosen according to whether /l is in effect.
# NOTE(review): the values selected are not shown here.
839 if (! $fold || scalar keys %list == 1) {
840 $op = ($charset eq 'l')
# Here the node type is chosen according to whether /aa is in effect.
# NOTE(review): presumably the folding case; the selected values and the
# enclosing branch are not shown -- confirm.
847 $op = ($charset eq 'aa')
# Code point of (the first character of) the character's fc() fold.
856 $mod_cp = ord fc $char;
# Expected result: "<node type> <\x{HEX}>".
859 push @single_tests, sprintf "$op <\\x{%X}>", $mod_cp;
# Put the generated single-character tests at the front of the test list, so
# they run first (and precede the EBCDIC marker entry).
866 unshift @tests, @single_tests;
# Each test is a (pattern, expected) pair, so the number of tests is half the
# element count once the lone marker entry is discounted.
868 plan(scalar (@tests - 1) / 2); # -1 because of the marker.
# On EBCDIC platforms, start out skipping tests.
# NOTE(review): presumably the marker entry handled below turns skipping off;
# that code is not shown here -- confirm.
870 my $skip_ebcdic = $::IS_EBCDIC;
# Consume the list: each iteration takes a pattern and then its expected
# compilation result.
871 while (defined (my $test = shift @tests)) {
# The marker is a lone element, not a pattern with an expected result.
873 if ($test eq 'ebcdic_ok_below_this_marker') {
878 my $expected = shift @tests;
881 skip("test not ported to EBCDIC", 1) if $skip_ebcdic;
# Copy of the expected text with the HIGHEST_CP placeholder replaced by the
# actual hex value; /r leaves $expected itself unmodified.
883 my $display_expected = $expected
884 =~ s/ HIGHEST_CP /$highest_cp_string/xgr;
885 my $test_name = "Verify compilation of $test displays as"
888 my $result = get_compiled($test);
# ANYOFH and ANYOFR results may carry a trailing " (First UTF-8 byte=\xNN"
# annotation, so only require the result to begin with the expected text.
# The match is deliberately not anchored at the end.
889 if ($expected =~ / ^ ANYOF[HR] /x) {
890 like($result, qr/ ^ \Q$expected\E (?:\Q (First UTF-8 byte=\x\E
891 [[:xdigit:]]{2} )? /x, $test_name);
# Everything else must match exactly.
894 is($result, $expected, $test_name);