perl5.git.perl.org Git - perl5.git/blame_incremental

... / ...

Commit	Line	Data
	1	#!./perl
	2	#
	3	# This is a home for regular expression tests that don't fit into
	4	# the format supported by op/regexp.t. If you want to add a test
	5	# that does fit that format, add it to op/re_tests, not here.
	6
	7	$\| = 1;
	8
	9	# Test counter output is generated by a BEGIN block at bottom of file
	10
	11	BEGIN {
	12	chdir 't' if -d 't';
	13	@INC = '../lib';
	14	}
	15	our $Message = "Noname test";
	16
	17	eval 'use Config'; # Defaults assumed if this fails
	18
	19	$x = "abc\ndef\n";
	20
	21	if ($x =~ /^abc/) {print "ok 1\n";} else {print "not ok 1\n";}
	22	if ($x !~ /^def/) {print "ok 2\n";} else {print "not ok 2\n";}
	23
	24	# used to be a test for $*
	25	if ($x =~ /^def/m) {print "ok 3\n";} else {print "not ok 3\n";}
	26
	27	$_ = '123';
	28	if (/^([0-9][0-9]*)/) {print "ok 4\n";} else {print "not ok 4\n";}
	29
	30	if ($x =~ /^xxx/) {print "not ok 5\n";} else {print "ok 5\n";}
	31	if ($x !~ /^abc/) {print "not ok 6\n";} else {print "ok 6\n";}
	32
	33	if ($x =~ /def/) {print "ok 7\n";} else {print "not ok 7\n";}
	34	if ($x !~ /def/) {print "not ok 8\n";} else {print "ok 8\n";}
	35
	36	if ($x !~ /.def/) {print "ok 9\n";} else {print "not ok 9\n";}
	37	if ($x =~ /.def/) {print "not ok 10\n";} else {print "ok 10\n";}
	38
	39	if ($x =~ /\ndef/) {print "ok 11\n";} else {print "not ok 11\n";}
	40	if ($x !~ /\ndef/) {print "not ok 12\n";} else {print "ok 12\n";}
	41
	42	$_ = 'aaabbbccc';
	43	if (/(ab)(c*)/ && $1 eq 'aaabbb' && $2 eq 'ccc') {
	44	print "ok 13\n";
	45	} else {
	46	print "not ok 13\n";
	47	}
	48	if (/(a+b+c+)/ && $1 eq 'aaabbbccc') {
	49	print "ok 14\n";
	50	} else {
	51	print "not ok 14\n";
	52	}
	53
	54	if (/a+b?c+/) {print "not ok 15\n";} else {print "ok 15\n";}
	55
	56	$_ = 'aaabccc';
	57	if (/a+b?c+/) {print "ok 16\n";} else {print "not ok 16\n";}
	58	if (/ab+c/) {print "ok 17\n";} else {print "not ok 17\n";}
	59
	60	$_ = 'aaaccc';
	61	if (/ab?c/) {print "ok 18\n";} else {print "not ok 18\n";}
	62	if (/ab+c/) {print "not ok 19\n";} else {print "ok 19\n";}
	63
	64	$_ = 'abcdef';
	65	if (/bcd\|xyz/) {print "ok 20\n";} else {print "not ok 20\n";}
	66	if (/xyz\|bcd/) {print "ok 21\n";} else {print "not ok 21\n";}
	67
	68	if (m\|bc/*d\|) {print "ok 22\n";} else {print "not ok 22\n";}
	69
	70	if (/^$_$/) {print "ok 23\n";} else {print "not ok 23\n";}
	71
	72	# used to be a test for $*
	73	if ("ab\ncd\n" =~ /^cd/m) {print "ok 24\n";} else {print "not ok 24\n";}
	74
		# Tests 25-27: the match-once operator ?PATTERN? together with reset.
		# %XXX and @XXX both start with the letter X, so the single
		# reset 'X' further down is expected to clear both of them.
		# NOTE(review): a bare ?PATTERN? without a leading "m" is rejected by
		# newer perls (see perlop) -- confirm which perl this file targets.
	75	$XXX{123} = 123;
	76	$XXX{234} = 234;
	77	$XXX{345} = 345;
	78
	79	@XXX = ('ok 25','not ok 25', 'ok 26','not ok 26','not ok 27');
	80	while ($_ = shift(@XXX)) {
		# ?(.*)? succeeds only once until it is re-armed by reset, so a
		# "not ok" entry is printed only if the once-only latch misbehaves.
	81	?(.*)? && (print $1,"\n");
		# Every entry containing "not" re-arms the ?...? search for the next entry.
	82	/not/ && reset;
	83	if (/not ok 26/) {
	84	if ($^O eq 'VMS') {
		# VMS branch: just consume the remaining entry instead of calling reset 'X'.
	85	$_ = shift(@XXX);
	86	}
	87	else {
		# Clears every package variable whose name begins with X, which
		# empties @XXX (ending this loop) and %XXX (checked below).
	88	reset 'X';
	89	}
	90	}
	91	}
	92
		# Test 27: outside VMS, %XXX must now be empty; any surviving key is a failure.
	93	if ($^O ne 'VMS') {
	94	while (($key,$val) = each(%XXX)) {
	95	print "not ok 27\n";
	96	exit;
	97	}
	98	}
	99
	100	print "ok 27\n";
	101
	102	'cde' =~ /[^ab]*/;
	103	'xyz' =~ //;
	104	if ($& eq 'xyz') {print "ok 28\n";} else {print "not ok 28\n";}
	105
	106	$foo = '[^ab]*';
	107	'cde' =~ /$foo/;
	108	'xyz' =~ //;
	109	if ($& eq 'xyz') {print "ok 29\n";} else {print "not ok 29\n";}
	110
	111	$foo = '[^ab]*';
	112	'cde' =~ /$foo/;
	113	'xyz' =~ /$null/;
	114	if ($& eq 'xyz') {print "ok 30\n";} else {print "not ok 30\n";}
	115
	116	$_ = 'abcdefghi';
	117	/def/; # optimized up to cmd
	118	if ("$`:$&:$'" eq 'abc:def:ghi') {print "ok 31\n";} else {print "not ok 31\n";}
	119
	120	/cde/ + 0; # optimized only to spat
	121	if ("$`:$&:$'" eq 'ab:cde:fghi') {print "ok 32\n";} else {print "not ok 32\n";}
	122
	123	/[d][e][f]/; # not optimized
	124	if ("$`:$&:$'" eq 'abc:def:ghi') {print "ok 33\n";} else {print "not ok 33\n";}
	125
	126	$_ = 'now is the {time for all} good men to come to.';
	127	/ {([^}]*)}/;
	128	if ($1 eq 'time for all') {print "ok 34\n";} else {print "not ok 34 $1\n";}
	129
	130	$_ = 'xxx {3,4} yyy zzz';
	131	print /( {3,4})/ ? "ok 35\n" : "not ok 35\n";
	132	print $1 eq ' ' ? "ok 36\n" : "not ok 36\n";
	133	print /( {4,})/ ? "not ok 37\n" : "ok 37\n";
	134	print /( {2,3}.)/ ? "ok 38\n" : "not ok 38\n";
	135	print $1 eq ' y' ? "ok 39\n" : "not ok 39\n";
	136	print /(y{2,3}.)/ ? "ok 40\n" : "not ok 40\n";
	137	print $1 eq 'yyy ' ? "ok 41\n" : "not ok 41\n";
	138	print /x {3,4}/ ? "not ok 42\n" : "ok 42\n";
	139	print /^xxx {3,4}/ ? "not ok 43\n" : "ok 43\n";
	140
	141	$_ = "now is the time for all good men to come to.";
	142	@words = /(\w+)/g;
	143	print join(':',@words) eq "now:is:the:time:for:all:good:men:to:come:to"
	144	? "ok 44\n"
	145	: "not ok 44\n";
	146
	147	@words = ();
	148	while (/\w+/g) {
	149	push(@words, $&);
	150	}
	151	print join(':',@words) eq "now:is:the:time:for:all:good:men:to:come:to"
	152	? "ok 45\n"
	153	: "not ok 45\n";
	154
	155	@words = ();
	156	pos = 0;
	157	while (/to/g) {
	158	push(@words, $&);
	159	}
	160	print join(':',@words) eq "to:to"
	161	? "ok 46\n"
	162	: "not ok 46 `@words'\n";
	163
	164	pos $_ = 0;
	165	@words = /to/g;
	166	print join(':',@words) eq "to:to"
	167	? "ok 47\n"
	168	: "not ok 47 `@words'\n";
	169
	170	$_ = "abcdefghi";
	171
	172	$pat1 = 'def';
	173	$pat2 = '^def';
	174	$pat3 = '.def.';
	175	$pat4 = 'abc';
	176	$pat5 = '^abc';
	177	$pat6 = 'abc$';
	178	$pat7 = 'ghi';
	179	$pat8 = '\w*ghi';
	180	$pat9 = 'ghi$';
	181
	182	$t1=$t2=$t3=$t4=$t5=$t6=$t7=$t8=$t9=0;
	183
	184	for $iter (1..5) {
	185	$t1++ if /$pat1/o;
	186	$t2++ if /$pat2/o;
	187	$t3++ if /$pat3/o;
	188	$t4++ if /$pat4/o;
	189	$t5++ if /$pat5/o;
	190	$t6++ if /$pat6/o;
	191	$t7++ if /$pat7/o;
	192	$t8++ if /$pat8/o;
	193	$t9++ if /$pat9/o;
	194	}
	195
	196	$x = "$t1$t2$t3$t4$t5$t6$t7$t8$t9";
	197	print $x eq '505550555' ? "ok 48\n" : "not ok 48 $x\n";
	198
	199	$xyz = 'xyz';
	200	print "abc" =~ /^abc$\|$xyz/ ? "ok 49\n" : "not ok 49\n";
	201
	202	# perl 4.009 says "unmatched ()"
	203	eval '"abc" =~ /a(bc$)\|$xyz/; $result = "$&:$1"';
	204	print $@ eq "" ? "ok 50\n" : "not ok 50\n";
	205	print $result eq "abc:bc" ? "ok 51\n" : "not ok 51\n";
	206
	207
	208	$_="abcfooabcbar";
	209	$x=/abc/g;
	210	print $` eq "" ? "ok 52\n" : "not ok 52\n" if $x;
	211	$x=/abc/g;
	212	print $` eq "abcfoo" ? "ok 53\n" : "not ok 53\n" if $x;
	213	$x=/abc/g;
	214	print $x == 0 ? "ok 54\n" : "not ok 54\n";
	215	pos = 0;
	216	$x=/ABC/gi;
	217	print $` eq "" ? "ok 55\n" : "not ok 55\n" if $x;
	218	$x=/ABC/gi;
	219	print $` eq "abcfoo" ? "ok 56\n" : "not ok 56\n" if $x;
	220	$x=/ABC/gi;
	221	print $x == 0 ? "ok 57\n" : "not ok 57\n";
	222	pos = 0;
	223	$x=/abc/g;
	224	print $' eq "fooabcbar" ? "ok 58\n" : "not ok 58\n" if $x;
	225	$x=/abc/g;
	226	print $' eq "bar" ? "ok 59\n" : "not ok 59\n" if $x;
	227	$_ .= '';
	228	@x=/abc/g;
	229	print scalar @x == 2 ? "ok 60\n" : "not ok 60\n";
	230
	231	$_ = "abdc";
	232	pos $_ = 2;
	233	/\Gc/gc;
	234	print "not " if (pos $_) != 2;
	235	print "ok 61\n";
	236	/\Gc/g;
	237	print "not " if defined pos $_;
	238	print "ok 62\n";
	239
	240	$out = 1;
	241	'abc' =~ m'a(?{ $out = 2 })b';
	242	print "not " if $out != 2;
	243	print "ok 63\n";
	244
	245	$out = 1;
	246	'abc' =~ m'a(?{ $out = 3 })c';
	247	print "not " if $out != 1;
	248	print "ok 64\n";
	249
	250	$_ = 'foobar1 bar2 foobar3 barfoobar5 foobar6';
	251	@out = /(?<!foo)bar./g;
	252	print "not " if "@out" ne 'bar2 barf';
	253	print "ok 65\n";
	254
	255	# Tests which depend on REG_INFTY
	256	$reg_infty = defined $Config{reg_infty} ? $Config{reg_infty} : 32767;
	257	$reg_infty_m = $reg_infty - 1; $reg_infty_p = $reg_infty + 1;
	258
	259	# As well as failing if the pattern matches do unexpected things, the
	260	# next three tests will fail if you should have picked up a lower-than-
	261	# default value for $reg_infty from Config.pm, but have not.
	262
	263	undef $@;
	264	print "not " if eval q(('aaa' =~ /(a{1,$reg_infty_m})/)[0] ne 'aaa') \|\| $@;
	265	print "ok 66\n";
	266
	267	undef $@;
	268	print "not " if eval q(('a' x $reg_infty_m) !~ /a{$reg_infty_m}/) \|\| $@;
	269	print "ok 67\n";
	270
	271	undef $@;
	272	print "not " if eval q(('a' x ($reg_infty_m - 1)) =~ /a{$reg_infty_m}/) \|\| $@;
	273	print "ok 68\n";
	274
	275	undef $@;
	276	eval "'aaa' =~ /a{1,$reg_infty}/";
	277	print "not " if $@ !~ m%^\QQuantifier in {,} bigger than%;
	278	print "ok 69\n";
	279
	280	eval "'aaa' =~ /a{1,$reg_infty_p}/";
	281	print "not "
	282	if $@ !~ m%^\QQuantifier in {,} bigger than%;
	283	print "ok 70\n";
	284	undef $@;
	285
	286	# Poke a couple more parse failures
	287
	288	$context = 'x' x 256;
	289	eval qq("${context}y" =~ /(?<=$context)y/);
	290	print "not " if $@ !~ m%^\QLookbehind longer than 255 not%;
	291	print "ok 71\n";
	292
	293	# removed test
	294	print "ok 72\n";
	295
	296	# Long Monsters
	297	$test = 73;
	298	for $l (125, 140, 250, 270, 300000, 30) { # Ordered to free memory
	299	$a = 'a' x $l;
	300	print "# length=$l\nnot " unless "ba$a=" =~ /a$a=/;
	301	print "ok $test\n";
	302	$test++;
	303
	304	print "not " if "b$a=" =~ /a$a=/;
	305	print "ok $test\n";
	306	$test++;
	307	}
	308
	309	# 20000 nodes, each taking 3 words per string, and 1 per branch
	310	$long_constant_len = join '\|', 12120 .. 32645;
	311	$long_var_len = join '\|', 8120 .. 28645;
	312	%ans = ( 'ax13876y25677lbc' => 1,
	313	'ax13876y25677mcb' => 0, # not b.
	314	'ax13876y35677nbc' => 0, # Num too big
	315	'ax13876y25677y21378obc' => 1,
	316	'ax13876y25677y21378zbc' => 0, # Not followed by [k-o]
	317	'ax13876y25677y21378y21378kbc' => 1,
	318	'ax13876y25677y21378y21378kcb' => 0, # Not b.
	319	'ax13876y25677y21378y21378y21378kbc' => 0, # 5 runs
	320	);
	321
	322	for ( keys %ans ) {
	323	print "# const-len `$_' not => $ans{$_}\nnot "
	324	if $ans{$_} xor /a(?=([yx]($long_constant_len)){2,4}[k-o]).*b./o;
	325	print "ok $test\n";
	326	$test++;
	327	print "# var-len `$_' not => $ans{$_}\nnot "
	328	if $ans{$_} xor /a(?=([yx]($long_var_len)){2,4}[k-o]).*b./o;
	329	print "ok $test\n";
	330	$test++;
	331	}
	332
	333	$_ = " a (bla()) and x(y b((l)u((e))) and b(l(e)e)e";
	334	$expect = "(bla()) ((l)u((e))) (l(e)e)";
	335
		# matchit: run one m//xg match against $_ looking for a parenthesised
		# group whose parentheses balance.  The nesting depth is kept in the
		# global $c by the (?{ }) code blocks: it is set to 1 after the opening
		# "(", incremented on each further "(" and decremented on each ")".
		# The two (?(?{ ... })(?!)) conditionals force a failure when the depth
		# already reached 0 inside the loop, or is non-zero at the end.
		# The sub's value is that of the m//g itself, so it follows the caller's
		# context (the callers below use both scalar and list context).
		# NOTE(review): the "\|" sequences in the pattern look like an escaping
		# artifact of the blame-page export; the tests below only make sense if
		# they are plain "|" alternations -- confirm against the upstream file.
	336	sub matchit {
	337	m/
	338	(
	339	\(
	340	(?{ $c = 1 }) # Initialize
	341	(?:
	342	(?(?{ $c == 0 }) # PREVIOUS iteration was OK, stop the loop
	343	(?!
	344	) # Fail: will unwind one iteration back
	345	)
	346	(?:
	347	[^()]+ # Match a big chunk
	348	(?=
	349	[()]
	350	) # Do not try to match subchunks
	351	\|
	352	\(
	353	(?{ ++$c })
	354	\|
	355	\)
	356	(?{ --$c })
	357	)
	358	)+ # This may not match with different subblocks
	359	)
	360	(?(?{ $c != 0 })
	361	(?!
	362	) # Fail
	363	) # Otherwise the chunk 1 may succeed with $c>0
	364	/xg;
	365	}
	366
	367	@ans = ();
	368	push @ans, $res while $res = matchit;
	369
	370	print "# ans='@ans'\n# expect='$expect'\nnot " if "@ans" ne "1 1 1";
	371	print "ok $test\n";
	372	$test++;
	373
	374	@ans = matchit;
	375
	376	print "# ans='@ans'\n# expect='$expect'\nnot " if "@ans" ne $expect;
	377	print "ok $test\n";
	378	$test++;
	379
	380	print "not " unless "abc" =~ /^(??{"a"})b/;
	381	print "ok $test\n";
	382	$test++;
	383
	384	my $matched;
	385	$matched = qr/$(?:(?>[^()]+)\|(??{$matched}))*$/;
	386
	387	@ans = @ans1 = ();
	388	push(@ans, $res), push(@ans1, $&) while $res = m/$matched/g;
	389
	390	print "# ans='@ans'\n# expect='$expect'\nnot " if "@ans" ne "1 1 1";
	391	print "ok $test\n";
	392	$test++;
	393
	394	print "# ans1='@ans1'\n# expect='$expect'\nnot " if "@ans1" ne $expect;
	395	print "ok $test\n";
	396	$test++;
	397
	398	@ans = m/$matched/g;
	399
	400	print "# ans='@ans'\n# expect='$expect'\nnot " if "@ans" ne $expect;
	401	print "ok $test\n";
	402	$test++;
	403
	404	@ans = ('a/b' =~ m%(./)?(.)%); # Stack may be bad
	405	print "not " if "@ans" ne 'a/ b';
	406	print "ok $test\n";
	407	$test++;
	408
	409	$code = '{$blah = 45}';
	410	$blah = 12;
	411	eval { /(?$code)/ };
	412	print "not " unless $@ and $@ =~ /not allowed at runtime/ and $blah == 12;
	413	print "ok $test\n";
	414	$test++;
	415
	416	for $code ('{$blah = 45}','=xx') {
	417	$blah = 12;
	418	$res = eval { "xx" =~ /(?$code)/o };
	419	if ($code eq '=xx') {
	420	print "#'$@','$res','$blah'\nnot " unless not $@ and $res;
	421	} else {
	422	print "#'$@','$res','$blah'\nnot " unless $@ and $@ =~ /not allowed at runtime/ and $blah == 12;
	423	}
	424	print "ok $test\n";
	425	$test++;
	426	}
	427
	428	$code = '{$blah = 45}';
	429	$blah = 12;
	430	eval "/(?$code)/";
	431	print "not " if $blah != 45;
	432	print "ok $test\n";
	433	$test++;
	434
	435	$blah = 12;
	436	/(?{$blah = 45})/;
	437	print "not " if $blah != 45;
	438	print "ok $test\n";
	439	$test++;
	440
	441	$x = 'banana';
	442	$x =~ /.a/g;
	443	print "not " unless pos($x) == 2;
	444	print "ok $test\n";
	445	$test++;
	446
	447	$x =~ /.z/gc;
	448	print "not " unless pos($x) == 2;
	449	print "ok $test\n";
	450	$test++;
	451
		# f: identity helper.  Copies its first argument into a lexical and
		# returns that copy; the test just below uses it to pass pos($x)
		# through a subroutine call.
	452	sub f {
	453	my $p = $_[0];
	454	return $p;
	455	}
	456
	457	$x =~ /.a/g;
	458	print "not " unless f(pos($x)) == 4;
	459	print "ok $test\n";
	460	$test++;
	461
	462	$x = $^R = 67;
	463	'foot' =~ /foo(?{$x = 12; 75})[t]/;
	464	print "not " unless $^R eq '75';
	465	print "ok $test\n";
	466	$test++;
	467
	468	$x = $^R = 67;
	469	'foot' =~ /foo(?{$x = 12; 75})[xy]/;
	470	print "not " unless $^R eq '67' and $x eq '12';
	471	print "ok $test\n";
	472	$test++;
	473
	474	$x = $^R = 67;
	475	'foot' =~ /foo(?{ $^R + 12 })((?{ $x = 12; $^R + 17 })[xy])?/;
	476	print "not " unless $^R eq '79' and $x eq '12';
	477	print "ok $test\n";
	478	$test++;
	479
	480	print "not " unless qr/\b\v$/i eq '(?i-xsm:\b\v$)';
	481	print "ok $test\n";
	482	$test++;
	483
	484	print "not " unless qr/\b\v$/s eq '(?s-xim:\b\v$)';
	485	print "ok $test\n";
	486	$test++;
	487
	488	print "not " unless qr/\b\v$/m eq '(?m-xis:\b\v$)';
	489	print "ok $test\n";
	490	$test++;
	491
	492	print "not " unless qr/\b\v$/x eq '(?x-ism:\b\v$)';
	493	print "ok $test\n";
	494	$test++;
	495
	496	print "not " unless qr/\b\v$/xism eq '(?msix:\b\v$)';
	497	print "ok $test\n";
	498	$test++;
	499
	500	print "not " unless qr/\b\v$/ eq '(?-xism:\b\v$)';
	501	print "ok $test\n";
	502	$test++;
	503
	504	$_ = 'xabcx';
	505	foreach $ans ('', 'c') {
	506	/(?<=(?=a)..)((?=c)\|.)/g;
	507	print "# \$1 ='$1'\n# \$ans='$ans'\nnot " unless $1 eq $ans;
	508	print "ok $test\n";
	509	$test++;
	510	}
	511
	512	$_ = 'a';
	513	foreach $ans ('', 'a', '') {
	514	/^\|a\|$/g;
	515	print "# \$& ='$&'\n# \$ans='$ans'\nnot " unless $& eq $ans;
	516	print "ok $test\n";
	517	$test++;
	518	}
	519
		# prefixify($v, $a, $b, $res): replace the first occurrence of $a in $v
		# with $b, treating $a as a literal string (\Q...\E quotes any regex
		# metacharacters), then emit one numbered test line: "ok" when the
		# result equals $res, "not ok" otherwise.
		# Reads and increments the global test counter $test.
	520	sub prefixify {
	521	my($v,$a,$b,$res) = @_;
	522	$v =~ s/\Q$a\E/$b/;
	523	print "not " unless $res eq $v;
	524	print "ok $test\n";
	525	$test++;
	526	}
	527	prefixify('/a/b/lib/arch', "/a/b/lib", 'X/lib', 'X/lib/arch');
	528	prefixify('/a/b/man/arch', "/a/b/man", 'X/man', 'X/man/arch');
	529
	530	$_ = 'var="foo"';
	531	/(\")/;
	532	print "not " unless $1 and /$1/;
	533	print "ok $test\n";
	534	$test++;
	535
	536	$a=qr/(?{++$b})/;
	537	$b = 7;
	538	/$a$a/;
	539	print "not " unless $b eq '9';
	540	print "ok $test\n";
	541	$test++;
	542
	543	$c="$a";
	544	/$a$a/;
	545	print "not " unless $b eq '11';
	546	print "ok $test\n";
	547	$test++;
	548
		# (?{ }) code blocks in patterns interpolated at run time, with and
		# without "use re 'eval'".  $a is a qr// holding (?{++$b}) and $c is
		# the plain-string form of $a (both set just above this block).
	549	{
	550	use re "eval";
		# With re 'eval' in force the string $c may carry a code block too,
		# so ++$b runs three times and $b is expected to reach 14.
	551	/$a$c$a/;
	552	print "not " unless $b eq '14';
	553	print "ok $test\n";
	554	$test++;
	555
		# A package variable and a lexical share the name $lex_a.  The expected
		# results (44 and 43) mean the code block must see the lexical (43),
		# not the localised package variable (2).
	556	local $lex_a = 2;
	557	my $lex_a = 43;
	558	my $lex_b = 17;
	559	my $lex_c = 27;
	560	my $lex_res = ($lex_b =~ qr/$lex_b(?{ $lex_c = $lex_a++ })/);
	561	print "not " unless $lex_res eq '1';
	562	print "ok $test\n";
	563	$test++;
	564	print "not " unless $lex_a eq '44';
	565	print "ok $test\n";
	566	$test++;
	567	print "not " unless $lex_c eq '43';
	568	print "ok $test\n";
	569	$test++;
	570
	571
		# With re 'eval' switched off again the same pattern must die with
		# "Eval-group not allowed", leave $b untouched at 14 and yield no match.
	572	no re "eval";
	573	$match = eval { /$a$c$a/ };
	574	print "not "
	575	unless $b eq '14' and $@ =~ /Eval-group not allowed/ and not $match;
	576	print "ok $test\n";
	577	$test++;
	578	}
	579
		# Same lexical-versus-package-variable check as the qr/$lex_b.../ case
		# above, but with a fully literal pattern (no interpolation) and no
		# "use re 'eval'" in this block.
	580	{
	581	local $lex_a = 2;
	582	my $lex_a = 43;
	583	my $lex_b = 17;
	584	my $lex_c = 27;
		# The code block must read and post-increment the lexical $lex_a (43 -> 44).
	585	my $lex_res = ($lex_b =~ qr/17(?{ $lex_c = $lex_a++ })/);
	586	print "not " unless $lex_res eq '1';
	587	print "ok $test\n";
	588	$test++;
	589	print "not " unless $lex_a eq '44';
	590	print "ok $test\n";
	591	$test++;
	592	print "not " unless $lex_c eq '43';
	593	print "ok $test\n";
	594	$test++;
	595	}
	596
		# A (?{ }) code block must resolve unqualified globals in the package
		# that is current where the pattern is written: inside package aa,
		# $c means $aa::c, and $::c (main's $c) must stay at 3.
		# The matching "ok" lines are printed after the block closes.
	597	{
	598	package aa;
	599	$c = 2;
	600	$::c = 3;
	601	'' =~ /(?{ $c = 4 })/;
	602	print "not " unless $c == 4;
	603	}
	604	print "ok $test\n";
	605	$test++;
	606	print "not " unless $c == 3;
	607	print "ok $test\n";
	608	$test++;
	609
		# must_warn_pat($warn_pat): build a warning-checking callback.
		# The returned sub prints "not " when its first argument (the warning
		# text, when installed as a __WARN__ handler) does not match $warn_pat,
		# which turns the next "ok N" line into "not ok N".
	610	sub must_warn_pat {
	611	my $warn_pat = shift;
	612	return sub { print "not " unless $_[0] =~ /$warn_pat/ }
	613	}
	614
		# must_warn($warn_pat, $code): string-eval $code with warnings enabled
		# and emit one numbered "ok" line, incrementing the global $test.
		# Despite its name, $warn_pat is not a pattern here: it is assigned
		# directly to $SIG{__WARN__}, so it must be a handler such as the sub
		# returned by must_warn_pat().
		# NOTE(review): this sub never prints "not " itself, so a $code that
		# raises no warning at all (or dies inside the eval) still yields
		# "ok" -- confirm whether that is intended.
	615	sub must_warn {
	616	my ($warn_pat, $code) = @_;
		# Localise the whole %SIG so the handler does not outlive this call.
	617	local %SIG;
		# The handler is installed in a BEGIN block so it is already active
		# while $code is being compiled.
	618	eval 'BEGIN { use warnings; $SIG{__WARN__} = $warn_pat };' . $code;
	619	print "ok $test\n";
	620	$test++;
	621	}
	622
	623
	624	sub make_must_warn {
	625	my $warn_pat = shift;
	626	return sub { must_warn(must_warn_pat($warn_pat)) }
	627	}
	628
	629	my $for_future = make_must_warn('reserved for future extensions');
	630
	631	&$for_future('q(a:[b]:) =~ /[x[:foo:]]/');
	632
	633	#&$for_future('q(a=[b]=) =~ /[x[=foo=]]/');
	634	print "ok $test\n"; $test++; # now a fatal croak
	635
	636	#&$for_future('q(a.[b].) =~ /[x[.foo.]]/');
	637	print "ok $test\n"; $test++; # now a fatal croak
	638
	639	# test if failure of patterns returns empty list
	640	$_ = 'aaa';
	641	@_ = /bbb/;
	642	print "not " if @_;
	643	print "ok $test\n";
	644	$test++;
	645
	646	@_ = /bbb/g;
	647	print "not " if @_;
	648	print "ok $test\n";
	649	$test++;
	650
	651	@_ = /(bbb)/;
	652	print "not " if @_;
	653	print "ok $test\n";
	654	$test++;
	655
	656	@_ = /(bbb)/g;
	657	print "not " if @_;
	658	print "ok $test\n";
	659	$test++;
	660
	661	/a(?=.$)/;
	662	print "not " if $#+ != 0 or $#- != 0;
	663	print "ok $test\n";
	664	$test++;
	665
	666	print "not " if $+[0] != 2 or $-[0] != 1;
	667	print "ok $test\n";
	668	$test++;
	669
	670	print "not "
	671	if defined $+[1] or defined $-[1] or defined $+[2] or defined $-[2];
	672	print "ok $test\n";
	673	$test++;
	674
	675	/a(a)(a)/;
	676	print "not " if $#+ != 2 or $#- != 2;
	677	print "ok $test\n";
	678	$test++;
	679
	680	print "not " if $+[0] != 3 or $-[0] != 0;
	681	print "ok $test\n";
	682	$test++;
	683
	684	print "not " if $+[1] != 2 or $-[1] != 1;
	685	print "ok $test\n";
	686	$test++;
	687
	688	print "not " if $+[2] != 3 or $-[2] != 2;
	689	print "ok $test\n";
	690	$test++;
	691
	692	print "not "
	693	if defined $+[3] or defined $-[3] or defined $+[4] or defined $-[4];
	694	print "ok $test\n";
	695	$test++;
	696
	697	/.(a)(b)?(a)/;
	698	print "not " if $#+ != 3 or $#- != 3;
	699	print "ok $test\n";
	700	$test++;
	701
	702	print "not " if $+[0] != 3 or $-[0] != 0;
	703	print "ok $test\n";
	704	$test++;
	705
	706	print "not " if $+[1] != 2 or $-[1] != 1;
	707	print "ok $test\n";
	708	$test++;
	709
	710	print "not " if $+[3] != 3 or $-[3] != 2;
	711	print "ok $test\n";
	712	$test++;
	713
	714	print "not "
	715	if defined $+[2] or defined $-[2] or defined $+[4] or defined $-[4];
	716	print "ok $test\n";
	717	$test++;
	718
	719	/.(a)/;
	720	print "not " if $#+ != 1 or $#- != 1;
	721	print "ok $test\n";
	722	$test++;
	723
	724	print "not " if $+[0] != 2 or $-[0] != 0;
	725	print "ok $test\n";
	726	$test++;
	727
	728	print "not " if $+[1] != 2 or $-[1] != 1;
	729	print "ok $test\n";
	730	$test++;
	731
	732	print "not "
	733	if defined $+[2] or defined $-[2] or defined $+[3] or defined $-[3];
	734	print "ok $test\n";
	735	$test++;
	736
	737	eval { $+[0] = 13; };
	738	print "not "
	739	if $@ !~ /^Modification of a read-only value attempted/;
	740	print "ok $test\n";
	741	$test++;
	742
	743	eval { $-[0] = 13; };
	744	print "not "
	745	if $@ !~ /^Modification of a read-only value attempted/;
	746	print "ok $test\n";
	747	$test++;
	748
	749	eval { @+ = (7, 6, 5); };
	750	print "not "
	751	if $@ !~ /^Modification of a read-only value attempted/;
	752	print "ok $test\n";
	753	$test++;
	754
	755	eval { @- = qw(foo bar); };
	756	print "not "
	757	if $@ !~ /^Modification of a read-only value attempted/;
	758	print "ok $test\n";
	759	$test++;
	760
	761	/.(a)(ba*)?/;
	762	print "#$#-..$#+\nnot " if $#+ != 2 or $#- != 1;
	763	print "ok $test\n";
	764	$test++;
	765
	766	$_ = 'aaa';
	767	pos = 1;
	768	@a = /\Ga/g;
	769	print "not " unless "@a" eq "a a";
	770	print "ok $test\n";
	771	$test++;
	772
	773	$str = 'abcde';
	774	pos $str = 2;
	775
	776	print "not " if $str =~ /^\G/;
	777	print "ok $test\n";
	778	$test++;
	779
	780	print "not " if $str =~ /^.\G/;
	781	print "ok $test\n";
	782	$test++;
	783
	784	print "not " unless $str =~ /^..\G/;
	785	print "ok $test\n";
	786	$test++;
	787
	788	print "not " if $str =~ /^...\G/;
	789	print "ok $test\n";
	790	$test++;
	791
	792	print "not " unless $str =~ /.\G./ and $& eq 'bc';
	793	print "ok $test\n";
	794	$test++;
	795
	796	print "not " unless $str =~ /\G../ and $& eq 'cd';
	797	print "ok $test\n";
	798	$test++;
	799
	800	undef $foo; undef $bar;
	801	print "#'$str','$foo','$bar'\nnot "
	802	unless $str =~ /b(?{$foo = $_; $bar = pos})c/
	803	and $foo eq 'abcde' and $bar eq 2;
	804	print "ok $test\n";
	805	$test++;
	806
	807	undef $foo; undef $bar;
	808	pos $str = undef;
	809	print "#'$str','$foo','$bar'\nnot "
	810	unless $str =~ /b(?{$foo = $_; $bar = pos})c/g
	811	and $foo eq 'abcde' and $bar eq 2 and pos $str eq 3;
	812	print "ok $test\n";
	813	$test++;
	814
	815	$_ = $str;
	816
	817	undef $foo; undef $bar;
	818	print "#'$str','$foo','$bar'\nnot "
	819	unless /b(?{$foo = $_; $bar = pos})c/
	820	and $foo eq 'abcde' and $bar eq 2;
	821	print "ok $test\n";
	822	$test++;
	823
	824	undef $foo; undef $bar;
	825	print "#'$str','$foo','$bar'\nnot "
	826	unless /b(?{$foo = $_; $bar = pos})c/g
	827	and $foo eq 'abcde' and $bar eq 2 and pos eq 3;
	828	print "ok $test\n";
	829	$test++;
	830
	831	undef $foo; undef $bar;
	832	pos = undef;
	833	1 while /b(?{$foo = $_; $bar = pos})c/g;
	834	print "#'$str','$foo','$bar'\nnot "
	835	unless $foo eq 'abcde' and $bar eq 2 and not defined pos;
	836	print "ok $test\n";
	837	$test++;
	838
	839	undef $foo; undef $bar;
	840	$_ = 'abcde\|abcde';
	841	print "#'$str','$foo','$bar','$_'\nnot "
	842	unless s/b(?{$foo = $_; $bar = pos})c/x/g and $foo eq 'abcde\|abcde'
	843	and $bar eq 8 and $_ eq 'axde\|axde';
	844	print "ok $test\n";
	845	$test++;
	846
	847	@res = ();
	848	# List context:
	849	$_ = 'abcde\|abcde';
	850	@dummy = /([ace]).(?{push @res, $1,$2})([ce])(?{push @res, $1,$2})/g;
	851	@res = map {defined $_ ? "'$_'" : 'undef'} @res;
	852	$res = "@res";
	853	print "#'@res' '$_'\nnot "
	854	unless "@res" eq "'a' undef 'a' 'c' 'e' undef 'a' undef 'a' 'c'";
	855	print "ok $test\n";
	856	$test++;
	857
	858	@res = ();
	859	@dummy = /([ace]).(?{push @res, $`,$&,$'})([ce])(?{push @res, $`,$&,$'})/g;
	860	@res = map {defined $_ ? "'$_'" : 'undef'} @res;
	861	$res = "@res";
	862	print "#'@res' '$_'\nnot "
	863	unless "@res" eq
	864	"'' 'ab' 'cde\|abcde' " .
	865	"'' 'abc' 'de\|abcde' " .
	866	"'abcd' 'e\|' 'abcde' " .
	867	"'abcde\|' 'ab' 'cde' " .
	868	"'abcde\|' 'abc' 'de'" ;
	869	print "ok $test\n";
	870	$test++;
	871
	872	#Some more \G anchor checks
	873	$foo='aabbccddeeffgg';
	874
	875	pos($foo)=1;
	876
	877	$foo=~/.\G(..)/g;
	878	iseq($1,'ab');
	879
	880	pos($foo) += 1;
	881	$foo=~/.\G(..)/g;
	882	print "not " unless($1 eq 'cc');
	883	print "ok $test\n";
	884	$test++;
	885
	886	pos($foo) += 1;
	887	$foo=~/.\G(..)/g;
	888	print "not " unless($1 eq 'de');
	889	print "ok $test\n";
	890	$test++;
	891
	892	print "not " unless $foo =~ /\Gef/g;
	893	print "ok $test\n";
	894	$test++;
	895
	896	undef pos $foo;
	897
	898	$foo=~/\G(..)/g;
	899	print "not " unless($1 eq 'aa');
	900	print "ok $test\n";
	901	$test++;
	902
	903	$foo=~/\G(..)/g;
	904	print "not " unless($1 eq 'bb');
	905	print "ok $test\n";
	906	$test++;
	907
	908	pos($foo)=5;
	909	$foo=~/\G(..)/g;
	910	print "not " unless($1 eq 'cd');
	911	print "ok $test\n";
	912	$test++;
	913
	914	$_='123x123';
	915	@res = /(\d*\|x)/g;
	916	print "not " unless('123\|\|x\|123\|' eq join '\|', @res);
	917	print "ok $test\n";
	918	$test++;
	919
	920	# see if matching against temporaries (created via pp_helem()) is safe
	921	{ foo => "ok $test\n".$^X }->{foo} =~ /^(.*)\n/g;
	922	print "$1\n";
	923	$test++;
	924
	925	# See if $1 works inside (?{}) in the presence of saved substrings and
	926	# a changing $_
	927	@a = qw(foo bar);
	928	@b = ();
	929	s/(\w)(?{push @b, $1})/,$1,/g for @a;
	930
	931	print "# \@b='@b', expect 'f o o b a r'\nnot " unless("@b" eq "f o o b a r");
	932	print "ok $test\n";
	933	$test++;
	934
	935	print "not " unless("@a" eq ",f,,o,,o, ,b,,a,,r,");
	936	print "ok $test\n";
	937	$test++;
	938
	939	$brackets = qr{
	940	{ (?> [^{}]+ \| (??{ $brackets }) )* }
	941	}x;
	942
	943	"{{}" =~ $brackets;
	944	print "ok $test\n"; # Did we survive?
	945	$test++;
	946
	947	"something { long { and } hairy" =~ $brackets;
	948	print "ok $test\n"; # Did we survive?
	949	$test++;
	950
	951	"something { long { and } hairy" =~ m/((??{ $brackets }))/;
	952	print "not " unless $1 eq "{ and }";
	953	print "ok $test\n";
	954	$test++;
	955
	956	$_ = "a-a\nxbb";
	957	pos=1;
	958	m/^-.*bb/mg and print "not ";
	959	print "ok $test\n";
	960	$test++;
	961
	962	$text = "aaXbXcc";
	963	pos($text)=0;
	964	$text =~ /\GXb*X/g and print 'not ';
	965	print "ok $test\n";
	966	$test++;
	967
	968	$text = "xA\n" x 500;
	969	$text =~ /^\s*A/m and print 'not ';
	970	print "ok $test\n";
	971	$test++;
	972
	973	$text = "abc dbf";
	974	@res = ($text =~ /.?(b).?\b/g);
	975	"@res" eq 'b b' or print 'not ';
	976	print "ok $test\n";
	977	$test++;
	978
	979	@a = map chr,0..255;
	980
	981	@b = grep(/\S/,@a);
	982	@c = grep(/[^\s]/,@a);
	983	print "not " if "@b" ne "@c";
	984	print "ok $test\n";
	985	$test++;
	986
	987	@b = grep(/\S/,@a);
	988	@c = grep(/[\S]/,@a);
	989	print "not " if "@b" ne "@c";
	990	print "ok $test\n";
	991	$test++;
	992
	993	@b = grep(/\s/,@a);
	994	@c = grep(/[^\S]/,@a);
	995	print "not " if "@b" ne "@c";
	996	print "ok $test\n";
	997	$test++;
	998
	999	@b = grep(/\s/,@a);
	1000	@c = grep(/[\s]/,@a);
	1001	print "not " if "@b" ne "@c";
	1002	print "ok $test\n";
	1003	$test++;
	1004
	1005	@b = grep(/\D/,@a);
	1006	@c = grep(/[^\d]/,@a);
	1007	print "not " if "@b" ne "@c";
	1008	print "ok $test\n";
	1009	$test++;
	1010
	1011	@b = grep(/\D/,@a);
	1012	@c = grep(/[\D]/,@a);
	1013	print "not " if "@b" ne "@c";
	1014	print "ok $test\n";
	1015	$test++;
	1016
	1017	@b = grep(/\d/,@a);
	1018	@c = grep(/[^\D]/,@a);
	1019	print "not " if "@b" ne "@c";
	1020	print "ok $test\n";
	1021	$test++;
	1022
	1023	@b = grep(/\d/,@a);
	1024	@c = grep(/[\d]/,@a);
	1025	print "not " if "@b" ne "@c";
	1026	print "ok $test\n";
	1027	$test++;
	1028
	1029	@b = grep(/\W/,@a);
	1030	@c = grep(/[^\w]/,@a);
	1031	print "not " if "@b" ne "@c";
	1032	print "ok $test\n";
	1033	$test++;
	1034
	1035	@b = grep(/\W/,@a);
	1036	@c = grep(/[\W]/,@a);
	1037	print "not " if "@b" ne "@c";
	1038	print "ok $test\n";
	1039	$test++;
	1040
	1041	@b = grep(/\w/,@a);
	1042	@c = grep(/[^\W]/,@a);
	1043	print "not " if "@b" ne "@c";
	1044	print "ok $test\n";
	1045	$test++;
	1046
	1047	@b = grep(/\w/,@a);
	1048	@c = grep(/[\w]/,@a);
	1049	iseq("@b","@c");
	1050
	1051	# see if backtracking optimization works correctly
	1052	"\n\n" =~ /\n $ \n/x or print "not ";
	1053	print "ok $test\n";
	1054	$test++;
	1055
	1056	"\n\n" =~ /\n* $ \n/x or print "not ";
	1057	print "ok $test\n";
	1058	$test++;
	1059
	1060	"\n\n" =~ /\n+ $ \n/x or print "not ";
	1061	print "ok $test\n";
	1062	$test++;
	1063
	1064	[] =~ /^ARRAY/ or print "# [] \nnot ";
	1065	print "ok $test\n";
	1066	$test++;
	1067
	1068	eval << 'EOE';
	1069	{
	1070	package S;
	1071	use overload '""' => sub { 'Object S' };
	1072	sub new { bless [] }
	1073	}
	1074	$a = 'S'->new;
	1075	EOE
	1076
	1077	$a and $a =~ /^Object\sS/ or print "# '$a' \nnot ";
	1078	print "ok $test\n";
	1079	$test++;
	1080
	1081	# test result of match used as match (!)
	1082	'a1b' =~ ('xyz' =~ /y/) and $` eq 'a' or print "not ";
	1083	print "ok $test\n";
	1084	$test++;
	1085
	1086	'a1b' =~ ('xyz' =~ /t/) and $` eq 'a' or print "not ";
	1087	print "ok $test\n";
	1088	$test++;
	1089
	1090	$w = 0;
	1091	{
	1092	local $SIG{__WARN__} = sub { $w = 1 };
	1093	local $^W = 1;
	1094	$w = 1 if ("1\n" x 102) =~ /^\s*\n/m;
	1095	}
	1096	print $w ? "not " : "", "ok $test\n";
	1097	$test++;
	1098
	1099	my %space = ( spc => " ",
	1100	tab => "\t",
	1101	cr => "\r",
	1102	lf => "\n",
	1103	ff => "\f",
	1104	# There's no \v escape, but the vertical tab miraculously seems
	1105	# to be 11 in both ASCII and EBCDIC.
	1106	vt => chr(11),
	1107	false => "space" );
	1108
	1109	my @space0 = sort grep { $space{$_} =~ /\s/ } keys %space;
	1110	my @space1 = sort grep { $space{$_} =~ /[[:space:]]/ } keys %space;
	1111	my @space2 = sort grep { $space{$_} =~ /[[:blank:]]/ } keys %space;
	1112
	1113	print "not " unless "@space0" eq "cr ff lf spc tab";
	1114	print "ok $test # @space0\n";
	1115	$test++;
	1116
	1117	print "not " unless "@space1" eq "cr ff lf spc tab vt";
	1118	print "ok $test # @space1\n";
	1119	$test++;
	1120
	1121	print "not " unless "@space2" eq "spc tab";
	1122	print "ok $test # @space2\n";
	1123	$test++;
	1124
	1125	# bugid 20001021.005 - this caused a SEGV
	1126	print "not " unless undef =~ /^([^\/])(.)$/;
	1127	print "ok $test\n";
	1128	$test++;
	1129
	1130	# bugid 20000731.001
	1131
	1132	print "not " unless "A \x{263a} B z C" =~ /A . B (??{ "z" }) C/;
	1133	print "ok $test\n";
	1134	$test++;
	1135
	1136	my $ordA = ord('A');
	1137
	1138	$_ = "a\x{100}b";
	1139	if (/(.)(\C)(\C)(.)/) {
	1140	print "ok 232\n";
	1141	if ($1 eq "a") {
	1142	print "ok 233\n";
	1143	} else {
	1144	print "not ok 233\n";
	1145	}
	1146	if ($ordA == 65) { # ASCII (or equivalent), should be UTF-8
	1147	if ($2 eq "\xC4") {
	1148	print "ok 234\n";
	1149	} else {
	1150	print "not ok 234\n";
	1151	}
	1152	if ($3 eq "\x80") {
	1153	print "ok 235\n";
	1154	} else {
	1155	print "not ok 235\n";
	1156	}
	1157	} elsif ($ordA == 193) { # EBCDIC (or equivalent), should be UTF-EBCDIC
	1158	if ($2 eq "\x8C") {
	1159	print "ok 234\n";
	1160	} else {
	1161	print "not ok 234\n";
	1162	}
	1163	if ($3 eq "\x41") {
	1164	print "ok 235\n";
	1165	} else {
	1166	print "not ok 235\n";
	1167	}
	1168	} else {
	1169	for (234..235) {
	1170	print "not ok $_ # ord('A') == $ordA\n";
	1171	}
	1172	}
	1173	if ($4 eq "b") {
	1174	print "ok 236\n";
	1175	} else {
	1176	print "not ok 236\n";
	1177	}
	1178	} else {
	1179	for (232..236) {
	1180	print "not ok $_\n";
	1181	}
	1182	}
	1183	$_ = "\x{100}";
	1184	if (/(\C)/g) {
	1185	print "ok 237\n";
	1186	# currently \C are still tagged as UTF-8
	1187	if ($ordA == 65) {
	1188	if ($1 eq "\xC4") {
	1189	print "ok 238\n";
	1190	} else {
	1191	print "not ok 238\n";
	1192	}
	1193	} elsif ($ordA == 193) {
	1194	if ($1 eq "\x8C") {
	1195	print "ok 238\n";
	1196	} else {
	1197	print "not ok 238\n";
	1198	}
	1199	} else {
	1200	print "not ok 238 # ord('A') == $ordA\n";
	1201	}
	1202	} else {
	1203	for (237..238) {
	1204	print "not ok $_\n";
	1205	}
	1206	}
	1207	if (/(\C)/g) {
	1208	print "ok 239\n";
	1209	# currently \C are still tagged as UTF-8
	1210	if ($ordA == 65) {
	1211	if ($1 eq "\x80") {
	1212	print "ok 240\n";
	1213	} else {
	1214	print "not ok 240\n";
	1215	}
	1216	} elsif ($ordA == 193) {
	1217	if ($1 eq "\x41") {
	1218	print "ok 240\n";
	1219	} else {
	1220	print "not ok 240\n";
	1221	}
	1222	} else {
	1223	print "not ok 240 # ord('A') == $ordA\n";
	1224	}
	1225	} else {
	1226	for (239..240) {
	1227	print "not ok $_\n";
	1228	}
	1229	}
	1230
		# Test 241: $1 must keep the text captured at match time ("abc") even
		# after the variable that was matched against is assigned a new value.
	1231	{
	1232	# japhy -- added 03/03/2001
		# Declare $str, assign to it and match it in one expression; the
		# list assignment to () puts the match in list context.
	1233	() = (my $str = "abc") =~ /(...)/;
	1234	$str = "def";
	1235	print "not " if $1 ne "abc";
	1236	print "ok 241\n";
	1237	}
	1238
	1239	# The 242 and 243 go with the 244 and 245.
	1240	# The trick is that in EBCDIC the explicit numeric range should match
	1241	# (as also in non-EBCDIC) but the explicit alphabetic range should not match.
	1242
	1243	if ("\x8e" =~ /[\x89-\x91]/) {
	1244	print "ok 242\n";
	1245	} else {
	1246	print "not ok 242\n";
	1247	}
	1248
	1249	if ("\xce" =~ /[\xc9-\xd1]/) {
	1250	print "ok 243\n";
	1251	} else {
	1252	print "not ok 243\n";
	1253	}
	1254
	1255	# In most places these tests would succeed since \x8e does not
	1256	# in most character sets match 'i' or 'j' nor would \xce match
	1257	# 'I' or 'J', but strictly speaking these tests are here for
	1258	# the good of EBCDIC, so let's test these only there.
	1259	if (ord('i') == 0x89 && ord('J') == 0xd1) { # EBCDIC
	1260	if ("\x8e" !~ /[i-j]/) {
	1261	print "ok 244\n";
	1262	} else {
	1263	print "not ok 244\n";
	1264	}
	1265	if ("\xce" !~ /[I-J]/) {
	1266	print "ok 245\n";
	1267	} else {
	1268	print "not ok 245\n";
	1269	}
	1270	} else {
	1271	for (244..245) {
	1272	print "ok $_ # Skip: only in EBCDIC\n";
	1273	}
	1274	}
	1275
	1276	print "not " unless "\x{ab}" =~ /\x{ab}/;
	1277	print "ok 246\n";
	1278
	1279	print "not " unless "\x{abcd}" =~ /\x{abcd}/;
	1280	print "ok 247\n";
	1281
	1282	{
	1283	# bug id 20001008.001
	1284
	1285	$test = 248;
	1286	my @x = ("stra\337e 138","stra\337e 138");
	1287	for (@x) {
	1288	s/(\d+)\s*([\w\-]+)/$1 . uc $2/e;
	1289	my($latin) = /^(.+)(?:\s+\d)/;
	1290	print $latin eq "stra\337e" ? "ok $test\n" : # 248,249
	1291	"#latin[$latin]\nnot ok $test\n";
	1292	$test++;
	1293	$latin =~ s/stra\337e/straße/; # \303\237 after the 2nd a
	1294	use utf8; # needed for the raw UTF-8
	1295	$latin =~ s!(s)tr(?:aß\|s+e)!$1tr.!; # \303\237 after the a
	1296	}
	1297	}
	1298
	1299	{
	1300	print "not " unless "ba\xd4c" =~ /([a\xd4]+)/ && $1 eq "a\xd4";
	1301	print "ok 250\n";
	1302
	1303	print "not " unless "ba\xd4c" =~ /([a\xd4]+)/ && $1 eq "a\x{d4}";
	1304	print "ok 251\n";
	1305
	1306	print "not " unless "ba\x{d4}c" =~ /([a\xd4]+)/ && $1 eq "a\x{d4}";
	1307	print "ok 252\n";
	1308
	1309	print "not " unless "ba\x{d4}c" =~ /([a\xd4]+)/ && $1 eq "a\xd4";
	1310	print "ok 253\n";
	1311
	1312	print "not " unless "ba\xd4c" =~ /([a\x{d4}]+)/ && $1 eq "a\xd4";
	1313	print "ok 254\n";
	1314
	1315	print "not " unless "ba\xd4c" =~ /([a\x{d4}]+)/ && $1 eq "a\x{d4}";
	1316	print "ok 255\n";
	1317
	1318	print "not " unless "ba\x{d4}c" =~ /([a\x{d4}]+)/ && $1 eq "a\x{d4}";
	1319	print "ok 256\n";
	1320
	1321	print "not " unless "ba\x{d4}c" =~ /([a\x{d4}]+)/ && $1 eq "a\xd4";
	1322	print "ok 257\n";
	1323	}
	1324
	1325	{
	1326	# the first half of 20001028.003
	1327
	1328	my $X = chr(1448);
	1329	my ($Y) = $X =~ /(.*)/;
	1330	print "not " unless $Y eq v1448 && length($Y) == 1;
	1331	print "ok 258\n";
	1332	}
	1333
	1334	{
	1335	# 20001108.001
	1336
	1337	my $X = "Szab\x{f3},Bal\x{e1}zs";
	1338	my $Y = $X;
	1339	$Y =~ s/(B)/$1/ for 0..3;
	1340	print "not " unless $Y eq $X && $X eq "Szab\x{f3},Bal\x{e1}zs";
	1341	print "ok 259\n";
	1342	}
	1343
	1344	{
	1345	# the second half of 20001028.003
	1346
	1347	my $X = '';
	1348	$X =~ s/^/chr(1488)/e;
	1349	print "not " unless length $X == 1 && ord($X) == 1488;
	1350	print "ok 260\n";
	1351	}
	1352
	1353	{
	1354	# 20000517.001
	1355
	1356	my $x = "\x{100}A";
	1357
	1358	$x =~ s/A/B/;
	1359
	1360	print "not " unless $x eq "\x{100}B" && length($x) == 2;
	1361	print "ok 261\n";
	1362	}
	1363
	1364	{
	1365	# bug id 20001230.002
	1366
	1367	print "not " unless "École" =~ /^\C\C(.)/ && $1 eq 'c';
	1368	print "ok 262\n";
	1369
	1370	print "not " unless "École" =~ /^\C\C(c)/;
	1371	print "ok 263\n";
	1372	}
	1373
	1374	SKIP: {
	1375	$test = 264; # till 575
	1376
	1377	use charnames ":full";
	1378
	1379	# This is far from complete testing, there are dozens of character
	1380	# classes in Unicode. The mixing of literals and \N{...} is
	1381	# intentional so that in non-Latin-1 places we test the native
	1382	# characters, not the Unicode code points.
	1383
	1384	my %s = (
	1385	"a" => 'Ll',
	1386	"\N{CYRILLIC SMALL LETTER A}" => 'Ll',
	1387	"A" => 'Lu',
	1388	"\N{GREEK CAPITAL LETTER ALPHA}" => 'Lu',
	1389	"\N{HIRAGANA LETTER SMALL A}" => 'Lo',
	1390	"\N{COMBINING GRAVE ACCENT}" => 'Mn',
	1391	"0" => 'Nd',
	1392	"\N{ARABIC-INDIC DIGIT ZERO}" => 'Nd',
	1393	"_" => 'N',
	1394	"!" => 'P',
	1395	" " => 'Zs',
	1396	"\0" => 'Cc',
	1397	);
	1398
	1399	for my $char (map { s/^\S+ //; $_ }
	1400	sort map { sprintf("%06x", ord($_))." $_" } keys %s) {
	1401	my $class = $s{$char};
	1402	my $code = sprintf("%06x", ord($char));
	1403	printf "#\n# 0x$code\n#\n";
	1404	print "# IsAlpha\n";
	1405	if ($class =~ /^[LM]/) {
	1406	print "not " unless $char =~ /\p{IsAlpha}/;
	1407	print "ok $test\n"; $test++;
	1408	print "not " if $char =~ /\P{IsAlpha}/;
	1409	print "ok $test\n"; $test++;
	1410	} else {
	1411	print "not " if $char =~ /\p{IsAlpha}/;
	1412	print "ok $test\n"; $test++;
	1413	print "not " unless $char =~ /\P{IsAlpha}/;
	1414	print "ok $test\n"; $test++;
	1415	}
	1416	print "# IsAlnum\n";
	1417	if ($class =~ /^[LMN]/ && $char ne "_") {
	1418	print "not " unless $char =~ /\p{IsAlnum}/;
	1419	print "ok $test\n"; $test++;
	1420	print "not " if $char =~ /\P{IsAlnum}/;
	1421	print "ok $test\n"; $test++;
	1422	} else {
	1423	print "not " if $char =~ /\p{IsAlnum}/;
	1424	print "ok $test\n"; $test++;
	1425	print "not " unless $char =~ /\P{IsAlnum}/;
	1426	print "ok $test\n"; $test++;
	1427	}
	1428	print "# IsASCII\n";
	1429	if (ord("A") == 193) {
	1430	print "ok $test # Skip: in EBCDIC\n"; $test++;
	1431	print "ok $test # Skip: in EBCDIC\n"; $test++;
	1432	} else {
	1433	if ($code le '00007f') {
	1434	print "not " unless $char =~ /\p{IsASCII}/;
	1435	print "ok $test\n"; $test++;
	1436	print "not " if $char =~ /\P{IsASCII}/;
	1437	print "ok $test\n"; $test++;
	1438	} else {
	1439	print "not " if $char =~ /\p{IsASCII}/;
	1440	print "ok $test\n"; $test++;
	1441	print "not " unless $char =~ /\P{IsASCII}/;
	1442	print "ok $test\n"; $test++;
	1443	}
	1444	}
	1445	print "# IsCntrl\n";
	1446	if ($class =~ /^C/) {
	1447	print "not " unless $char =~ /\p{IsCntrl}/;
	1448	print "ok $test\n"; $test++;
	1449	print "not " if $char =~ /\P{IsCntrl}/;
	1450	print "ok $test\n"; $test++;
	1451	} else {
	1452	print "not " if $char =~ /\p{IsCntrl}/;
	1453	print "ok $test\n"; $test++;
	1454	print "not " unless $char =~ /\P{IsCntrl}/;
	1455	print "ok $test\n"; $test++;
	1456	}
	1457	print "# IsBlank\n";
	1458	if ($class =~ /^Z[lp]/ \|\| $char eq " ") {
	1459	print "not " unless $char =~ /\p{IsBlank}/;
	1460	print "ok $test\n"; $test++;
	1461	print "not " if $char =~ /\P{IsBlank}/;
	1462	print "ok $test\n"; $test++;
	1463	} else {
	1464	print "not " if $char =~ /\p{IsBlank}/;
	1465	print "ok $test\n"; $test++;
	1466	print "not " unless $char =~ /\P{IsBlank}/;
	1467	print "ok $test\n"; $test++;
	1468	}
	1469	print "# IsDigit\n";
	1470	if ($class =~ /^Nd$/) {
	1471	print "not " unless $char =~ /\p{IsDigit}/;
	1472	print "ok $test\n"; $test++;
	1473	print "not " if $char =~ /\P{IsDigit}/;
	1474	print "ok $test\n"; $test++;
	1475	} else {
	1476	print "not " if $char =~ /\p{IsDigit}/;
	1477	print "ok $test\n"; $test++;
	1478	print "not " unless $char =~ /\P{IsDigit}/;
	1479	print "ok $test\n"; $test++;
	1480	}
	1481	print "# IsGraph\n";
	1482	if ($class =~ /^([LMNPS])\|Co/) {
	1483	print "not " unless $char =~ /\p{IsGraph}/;
	1484	print "ok $test\n"; $test++;
	1485	print "not " if $char =~ /\P{IsGraph}/;
	1486	print "ok $test\n"; $test++;
	1487	} else {
	1488	print "not " if $char =~ /\p{IsGraph}/;
	1489	print "ok $test\n"; $test++;
	1490	print "not " unless $char =~ /\P{IsGraph}/;
	1491	print "ok $test\n"; $test++;
	1492	}
	1493	print "# IsLower\n";
	1494	if ($class =~ /^Ll$/) {
	1495	print "not " unless $char =~ /\p{IsLower}/;
	1496	print "ok $test\n"; $test++;
	1497	print "not " if $char =~ /\P{IsLower}/;
	1498	print "ok $test\n"; $test++;
	1499	} else {
	1500	print "not " if $char =~ /\p{IsLower}/;
	1501	print "ok $test\n"; $test++;
	1502	print "not " unless $char =~ /\P{IsLower}/;
	1503	print "ok $test\n"; $test++;
	1504	}
	1505	print "# IsPrint\n";
	1506	if ($class =~ /^([LMNPS])\|Co\|Zs/) {
	1507	print "not " unless $char =~ /\p{IsPrint}/;
	1508	print "ok $test\n"; $test++;
	1509	print "not " if $char =~ /\P{IsPrint}/;
	1510	print "ok $test\n"; $test++;
	1511	} else {
	1512	print "not " if $char =~ /\p{IsPrint}/;
	1513	print "ok $test\n"; $test++;
	1514	print "not " unless $char =~ /\P{IsPrint}/;
	1515	print "ok $test\n"; $test++;
	1516	}
	1517	print "# IsPunct\n";
	1518	if ($class =~ /^P/ \|\| $char eq "_") {
	1519	print "not " unless $char =~ /\p{IsPunct}/;
	1520	print "ok $test\n"; $test++;
	1521	print "not " if $char =~ /\P{IsPunct}/;
	1522	print "ok $test\n"; $test++;
	1523	} else {
	1524	print "not " if $char =~ /\p{IsPunct}/;
	1525	print "ok $test\n"; $test++;
	1526	print "not " unless $char =~ /\P{IsPunct}/;
	1527	print "ok $test\n"; $test++;
	1528	}
	1529	print "# IsSpace\n";
	1530	if ($class =~ /^Z/ \|\| ($code =~ /^(0009\|000A\|000B\|000C\|000D)$/)) {
	1531	print "not " unless $char =~ /\p{IsSpace}/;
	1532	print "ok $test\n"; $test++;
	1533	print "not " if $char =~ /\P{IsSpace}/;
	1534	print "ok $test\n"; $test++;
	1535	} else {
	1536	print "not " if $char =~ /\p{IsSpace}/;
	1537	print "ok $test\n"; $test++;
	1538	print "not " unless $char =~ /\P{IsSpace}/;
	1539	print "ok $test\n"; $test++;
	1540	}
	1541	print "# IsUpper\n";
	1542	if ($class =~ /^L[ut]/) {
	1543	print "not " unless $char =~ /\p{IsUpper}/;
	1544	print "ok $test\n"; $test++;
	1545	print "not " if $char =~ /\P{IsUpper}/;
	1546	print "ok $test\n"; $test++;
	1547	} else {
	1548	print "not " if $char =~ /\p{IsUpper}/;
	1549	print "ok $test\n"; $test++;
	1550	print "not " unless $char =~ /\P{IsUpper}/;
	1551	print "ok $test\n"; $test++;
	1552	}
	1553	print "# IsWord\n";
	1554	if ($class =~ /^[LMN]/ \|\| $char eq "_") {
	1555	print "not " unless $char =~ /\p{IsWord}/;
	1556	print "ok $test\n"; $test++;
	1557	print "not " if $char =~ /\P{IsWord}/;
	1558	print "ok $test\n"; $test++;
	1559	} else {
	1560	print "not " if $char =~ /\p{IsWord}/;
	1561	print "ok $test\n"; $test++;
	1562	print "not " unless $char =~ /\P{IsWord}/;
	1563	print "ok $test\n"; $test++;
	1564	}
	1565	}
	1566	}
	1567
	1568	{
	1569	$_ = "abc\x{100}\x{200}\x{300}\x{380}\x{400}defg";
	1570
	1571	if (/(.\x{300})./) {
	1572	print "ok 576\n";
	1573
	1574	print "not " unless $` eq "abc\x{100}" && length($`) == 4;
	1575	print "ok 577\n";
	1576
	1577	print "not " unless $& eq "\x{200}\x{300}\x{380}" && length($&) == 3;
	1578	print "ok 578\n";
	1579
	1580	print "not " unless $' eq "\x{400}defg" && length($') == 5;
	1581	print "ok 579\n";
	1582
	1583	print "not " unless $1 eq "\x{200}\x{300}" && length($1) == 2;
	1584	print "ok 580\n";
	1585	} else {
	1586	for (576..580) { print "not ok $_\n" }
	1587	}
	1588	}
	1589
	1590	{
	1591	# bug id 20010306.008
	1592
	1593	$a = "a\x{1234}";
	1594	# The original bug report had 'no utf8' here but that was irrelevant.
	1595	$a =~ m/\w/; # used to core dump
	1596
	1597	print "ok 581\n";
	1598	}
	1599
	1600	{
	1601	$test = 582;
	1602
	1603	# bugid 20010410.006
	1604	for my $rx (
	1605	'/(.?)\{(.?)\}/csg',
	1606	'/(.?)\{(.?)\}/cg',
	1607	'/(.?)\{(.?)\}/sg',
	1608	'/(.?)\{(.?)\}/g',
	1609	'/(.+?)\{(.+?)\}/csg',
	1610	)
	1611	{
	1612	my($input, $i);
	1613
	1614	$i = 0;
	1615	$input = "a{b}c{d}";
	1616	eval <<EOT;
	1617	while (eval \$input =~ $rx) {
	1618	print "# \\\$1 = '\$1' \\\$2 = '\$2'\n";
	1619	++\$i;
	1620	}
	1621	EOT
	1622	print "not " unless $i == 2;
	1623	print "ok " . $test++ . "\n";
	1624	}
	1625	}
	1626
	1627	{
	1628	# from Robin Houston
	1629
	1630	my $x = "\x{10FFFD}";
	1631	$x =~ s/(.)/$1/g;
	1632	print "not " unless ord($x) == 0x10FFFD && length($x) == 1;
	1633	print "ok 587\n";
	1634	}
	1635
	1636	{
	1637	my $x = "\x7f";
	1638
	1639	print "not " if $x =~ /[\x80-\xff]/;
	1640	print "ok 588\n";
	1641
	1642	print "not " if $x =~ /[\x80-\x{100}]/;
	1643	print "ok 589\n";
	1644
	1645	print "not " if $x =~ /[\x{100}]/;
	1646	print "ok 590\n";
	1647
	1648	print "not " if $x =~ /\p{InLatin1Supplement}/;
	1649	print "ok 591\n";
	1650
	1651	print "not " unless $x =~ /\P{InLatin1Supplement}/;
	1652	print "ok 592\n";
	1653
	1654	print "not " if $x =~ /\p{InLatinExtendedA}/;
	1655	print "ok 593\n";
	1656
	1657	print "not " unless $x =~ /\P{InLatinExtendedA}/;
	1658	print "ok 594\n";
	1659	}
	1660
	1661	{
	1662	my $x = "\x80";
	1663
	1664	print "not " unless $x =~ /[\x80-\xff]/;
	1665	print "ok 595\n";
	1666
	1667	print "not " unless $x =~ /[\x80-\x{100}]/;
	1668	print "ok 596\n";
	1669
	1670	print "not " if $x =~ /[\x{100}]/;
	1671	print "ok 597\n";
	1672
	1673	print "not " unless $x =~ /\p{InLatin1Supplement}/;
	1674	print "ok 598\n";
	1675
	1676	print "not " if $x =~ /\P{InLatin1Supplement}/;
	1677	print "ok 599\n";
	1678
	1679	print "not " if $x =~ /\p{InLatinExtendedA}/;
	1680	print "ok 600\n";
	1681
	1682	print "not " unless $x =~ /\P{InLatinExtendedA}/;
	1683	print "ok 601\n";
	1684	}
	1685
	1686	{
	1687	my $x = "\xff";
	1688
	1689	print "not " unless $x =~ /[\x80-\xff]/;
	1690	print "ok 602\n";
	1691
	1692	print "not " unless $x =~ /[\x80-\x{100}]/;
	1693	print "ok 603\n";
	1694
	1695	print "not " if $x =~ /[\x{100}]/;
	1696	print "ok 604\n";
	1697
	1698	# the next two tests must be ignored on EBCDIC
	1699	print "not " unless $x =~ /\p{InLatin1Supplement}/ or ord("A") == 193;
	1700	print "ok 605\n";
	1701
	1702	print "not " if $x =~ /\P{InLatin1Supplement}/ and ord("A") != 193;
	1703	print "ok 606\n";
	1704
	1705	print "not " if $x =~ /\p{InLatinExtendedA}/;
	1706	print "ok 607\n";
	1707
	1708	print "not " unless $x =~ /\P{InLatinExtendedA}/;
	1709	print "ok 608\n";
	1710	}
	1711
	1712	{
	1713	my $x = "\x{100}";
	1714
	1715	print "not " if $x =~ /[\x80-\xff]/;
	1716	print "ok 609\n";
	1717
	1718	print "not " unless $x =~ /[\x80-\x{100}]/;
	1719	print "ok 610\n";
	1720
	1721	print "not " unless $x =~ /[\x{100}]/;
	1722	print "ok 611\n";
	1723
	1724	print "not " if $x =~ /\p{InLatin1Supplement}/;
	1725	print "ok 612\n";
	1726
	1727	print "not " unless $x =~ /\P{InLatin1Supplement}/;
	1728	print "ok 613\n";
	1729
	1730	print "not " unless $x =~ /\p{InLatinExtendedA}/;
	1731	print "ok 614\n";
	1732
	1733	print "not " if $x =~ /\P{InLatinExtendedA}/;
	1734	print "ok 615\n";
	1735	}
	1736
	1737	{
	1738	# from japhy
	1739	my $w;
	1740	use warnings;
	1741	local $SIG{__WARN__} = sub { $w .= shift };
	1742
	1743	$w = "";
	1744	eval 'qr/(?c)/';
	1745	print "not " if $w !~ /^Useless $\?c$/;
	1746	print "ok 616\n";
	1747
	1748	$w = "";
	1749	eval 'qr/(?-c)/';
	1750	print "not " if $w !~ /^Useless $\?-c$/;
	1751	print "ok 617\n";
	1752
	1753	$w = "";
	1754	eval 'qr/(?g)/';
	1755	print "not " if $w !~ /^Useless $\?g$/;
	1756	print "ok 618\n";
	1757
	1758	$w = "";
	1759	eval 'qr/(?-g)/';
	1760	print "not " if $w !~ /^Useless $\?-g$/;
	1761	print "ok 619\n";
	1762
	1763	$w = "";
	1764	eval 'qr/(?o)/';
	1765	print "not " if $w !~ /^Useless $\?o$/;
	1766	print "ok 620\n";
	1767
	1768	$w = "";
	1769	eval 'qr/(?-o)/';
	1770	print "not " if $w !~ /^Useless $\?-o$/;
	1771	print "ok 621\n";
	1772
	1773	# now test multi-error regexes
	1774
	1775	$w = "";
	1776	eval 'qr/(?g-o)/';
	1777	print "not " if $w !~ /^Useless $\?g$.*\nUseless $\?-o$/;
	1778	print "ok 622\n";
	1779
	1780	$w = "";
	1781	eval 'qr/(?g-c)/';
	1782	print "not " if $w !~ /^Useless $\?g$.*\nUseless $\?-c$/;
	1783	print "ok 623\n";
	1784
	1785	$w = "";
	1786	eval 'qr/(?o-cg)/'; # (?c) means (?g) error won't be thrown
	1787	print "not " if $w !~ /^Useless $\?o$.*\nUseless $\?-c$/;
	1788	print "ok 624\n";
	1789
	1790	$w = "";
	1791	eval 'qr/(?ogc)/';
	1792	print "not " if $w !~ /^Useless $\?o$.\nUseless $\?g$.\nUseless $\?c$/;
	1793	print "ok 625\n";
	1794	}
	1795
	1796	# More Unicode "class" tests
	1797
	1798	{
	1799	use charnames ':full';
	1800
	1801	print "not " unless "\N{LATIN CAPITAL LETTER A}" =~ /\p{InBasicLatin}/;
	1802	print "ok 626\n";
	1803
	1804	print "not " unless "\N{LATIN CAPITAL LETTER A WITH GRAVE}" =~ /\p{InLatin1Supplement}/;
	1805	print "ok 627\n";
	1806
	1807	print "not " unless "\N{LATIN CAPITAL LETTER A WITH MACRON}" =~ /\p{InLatinExtendedA}/;
	1808	print "ok 628\n";
	1809
	1810	print "not " unless "\N{LATIN SMALL LETTER B WITH STROKE}" =~ /\p{InLatinExtendedB}/;
	1811	print "ok 629\n";
	1812
	1813	print "not " unless "\N{KATAKANA LETTER SMALL A}" =~ /\p{InKatakana}/;
	1814	print "ok 630\n";
	1815	}
	1816
	1817	$_ = "foo";
	1818
	1819	eval <<"EOT"; die if $@;
	1820	/f
	1821	o\r
	1822	o
	1823	\$
	1824	/x && print "ok 631\n";
	1825	EOT
	1826
	1827	eval <<"EOT"; die if $@;
	1828	/f
	1829	o
	1830	o
	1831	\$\r
	1832	/x && print "ok 632\n";
	1833	EOT
	1834
	1835	# Test the /o modifier: the interpolated pattern is compiled only once, on the first call of test_o.
	1836	sub test_o { $_[0] =~/$_[1]/o; return $1} # match arg 0 against arg 1 as a pattern; returns capture group 1
	1837	if(test_o('abc','(.)..') eq 'a') { # first call: fixes the pattern as '(.)..'
	1838	print "ok 633\n";
	1839	} else {
	1840	print "not ok 633\n";
	1841	}
	1842	if(test_o('abc','..(.)') eq 'a') { # still 'a', not 'c': the new pattern argument must be ignored because of /o
	1843	print "ok 634\n";
	1844	} else {
	1845	print "not ok 634\n";
	1846	}
	1847
	1848	# 635..639: ID 20010619.003 (of the whitespace characters, only the
	1849	# space itself is supposed to match [:print:], not all of isspace()).
	1850
	1851	print "not " if "\n" =~ /[[:print:]]/;
	1852	print "ok 635\n";
	1853
	1854	print "not " if "\t" =~ /[[:print:]]/;
	1855	print "ok 636\n";
	1856
	1857	# Amazingly form feed (\014) is the same in ASCII and EBCDIC.
	1858	print "not " if "\014" =~ /[[:print:]]/;
	1859	print "ok 637\n";
	1860
	1861	print "not " if "\r" =~ /[[:print:]]/;
	1862	print "ok 638\n";
	1863
	1864	print "not " unless " " =~ /[[:print:]]/;
	1865	print "ok 639\n";
	1866
	1867	##
	1868	## Test basic $^N usage outside of a regex
	1869	##
	1870	$x = "abcdef";
	1871	$T="ok 640\n";if ($x =~ /cde/ and not defined $^N) {print $T} else {print "not $T"};
	1872	$T="ok 641\n";if ($x =~ /(cde)/ and $^N eq "cde") {print $T} else {print "not $T"};
	1873	$T="ok 642\n";if ($x =~ /(c)(d)(e)/ and $^N eq "e") {print $T} else {print "not $T"};
	1874	$T="ok 643\n";if ($x =~ /(c(d)e)/ and $^N eq "cde") {print $T} else {print "not $T"};
	1875	$T="ok 644\n";if ($x =~ /(foo)\|(c(d)e)/ and $^N eq "cde") {print $T} else {print "not $T"};
	1876	$T="ok 645\n";if ($x =~ /(c(d)e)\|(foo)/ and $^N eq "cde") {print $T} else {print "not $T"};
	1877	$T="ok 646\n";if ($x =~ /(c(d)e)\|(abc)/ and $^N eq "abc") {print $T} else {print "not $T"};
	1878	$T="ok 647\n";if ($x =~ /(c(d)e)\|(abc)x/ and $^N eq "cde") {print $T} else {print "not $T"};
	1879	$T="ok 648\n";if ($x =~ /(c(d)e)(abc)?/ and $^N eq "cde") {print $T} else {print "not $T"};
	1880	$T="ok 649\n";if ($x =~ /(?:c(d)e)/ and $^N eq "d" ) {print $T} else {print "not $T"};
	1881	$T="ok 650\n";if ($x =~ /(?:c(d)e)(?:f)/ and $^N eq "d" ) {print $T} else {print "not $T"};
	1882	$T="ok 651\n";if ($x =~ /(?:([abc])\|([def]))*/ and $^N eq "f" ){print $T} else {print "not $T"};
	1883	$T="ok 652\n";if ($x =~ /(?:([ace])\|([bdf]))*/ and $^N eq "f" ){print $T} else {print "not $T"};
	1884	$T="ok 653\n";if ($x =~ /(([ace])\|([bd]))*/ and $^N eq "e" ){print $T} else {print "not $T"};
	1885	{
	1886	$T="ok 654\n";if($x =~ /(([ace])\|([bdf]))*/ and $^N eq "f" ){print $T} else {print "not $T"};
	1887	}
	1888	## test to see if $^N is automatically localized -- it should now
	1889	## have the value set in test 653
	1890	$T="ok 655\n";if ($^N eq "e" ){print $T} else {print "not $T"};
	1891
	1892	##
	1893	## Now test inside (?{...})
	1894	##
	1895	$T="ok 656\n";if ($x =~ /a([abc])(?{$y=$^N})c/ and $y eq "b" ){print $T} else {print "not $T"};
	1896	$T="ok 657\n";if ($x =~ /a([abc]+)(?{$y=$^N})d/ and $y eq "bc"){print $T} else {print "not $T"};
	1897	$T="ok 658\n";if ($x =~ /a([abcdefg]+)(?{$y=$^N})d/ and $y eq "bc"){print $T} else {print "not $T"};
	1898	$T="ok 659\n";if ($x =~ /(a([abcdefg]+)(?{$y=$^N})d)(?{$z=$^N})e/ and $y eq "bc" and $z eq "abcd")
	1899	{print $T} else {print "not $T"};
	1900	$T="ok 660\n";if ($x =~ /(a([abcdefg]+)(?{$y=$^N})de)(?{$z=$^N})/ and $y eq "bc" and $z eq "abcde")
	1901	{print $T} else {print "not $T"};
	1902
	1903	# Test the Unicode script classes
	1904
	1905	print "not " unless chr(0x100) =~ /\p{IsLatin}/; # outside Latin-1
	1906	print "ok 661\n";
	1907
	1908	print "not " unless chr(0x212b) =~ /\p{IsLatin}/; # Angstrom sign, very outside
	1909	print "ok 662\n";
	1910
	1911	print "not " unless chr(0x5d0) =~ /\p{IsHebrew}/; # inside InHebrew
	1912	print "ok 663\n";
	1913
	1914	print "not " unless chr(0xfb4f) =~ /\p{IsHebrew}/; # outside InHebrew
	1915	print "ok 664\n";
	1916
	1917	# # singleton (not in a range, this test must be ignored on EBCDIC)
	1918	# print "not " unless chr(0xb5) =~ /\p{IsGreek}/ or ord("A") == 193;
	1919	# print "ok 665\n";
	1920	print "ok 665 # 0xb5 moved from Greek to Common with Unicode 4.0.1\n";
	1921
	1922	print "not " unless chr(0x37a) =~ /\p{IsGreek}/; # singleton
	1923	print "ok 666\n";
	1924
	1925	print "not " unless chr(0x386) =~ /\p{IsGreek}/; # singleton
	1926	print "ok 667\n";
	1927
	1928	print "not " unless chr(0x387) =~ /\P{IsGreek}/; # not there
	1929	print "ok 668\n";
	1930
	1931	print "not " unless chr(0x388) =~ /\p{IsGreek}/; # range
	1932	print "ok 669\n";
	1933
	1934	print "not " unless chr(0x38a) =~ /\p{IsGreek}/; # range
	1935	print "ok 670\n";
	1936
	1937	print "not " unless chr(0x38b) =~ /\P{IsGreek}/; # not there
	1938	print "ok 671\n";
	1939
	1940	print "not " unless chr(0x38c) =~ /\p{IsGreek}/; # singleton
	1941	print "ok 672\n";
	1942
	1943	if (ord("A") == 65) {
	1944	##
	1945	## Test [:cntrl:]...
	1946	##
	1947	## Should probably put in tests for all the POSIX stuff, but not sure how to
	1948	## guarantee a specific locale......
	1949	##
	1950	$AllBytes = join('', map { chr($_) } 0..255);
	1951	($x = $AllBytes) =~ s/[[:cntrl:]]//g;
	1952	if ($x ne join('', map { chr($_) } 0x20..0x7E, 0x80..0xFF)) {
	1953	print "not ";
	1954	}
	1955	print "ok 673\n";
	1956
	1957	($x = $AllBytes) =~ s/[^[:cntrl:]]//g;
	1958	if ($x ne join('', map { chr($_) } 0..0x1F, 0x7F)) { print "not " }
	1959	print "ok 674\n";
	1960	} else {
	1961	print "ok $_ # Skip: EBCDIC\n" for 673..674;
	1962	}
	1963
	1964	# With /s modifier UTF8 chars were interpreted as bytes
	1965	{
	1966	my $a = "Hello \x{263A} World";
	1967
	1968	my @a = ($a =~ /./gs);
	1969
	1970	print "not " unless $#a == 12;
	1971	print "ok 675\n";
	1972	}
	1973
	1974	@a = ("foo\nbar" =~ /./g);
	1975	print "ok 676\n" if @a == 6 && "@a" eq "f o o b a r";
	1976
	1977	@a = ("foo\nbar" =~ /./gs);
	1978	print "ok 677\n" if @a == 7 && "@a" eq "f o o \n b a r";
	1979
	1980	@a = ("foo\nbar" =~ /\C/g);
	1981	print "ok 678\n" if @a == 7 && "@a" eq "f o o \n b a r";
	1982
	1983	@a = ("foo\nbar" =~ /\C/gs);
	1984	print "ok 679\n" if @a == 7 && "@a" eq "f o o \n b a r";
	1985
	1986	@a = ("foo\n\x{100}bar" =~ /./g);
	1987	print "ok 680\n" if @a == 7 && "@a" eq "f o o \x{100} b a r";
	1988
	1989	@a = ("foo\n\x{100}bar" =~ /./gs);
	1990	print "ok 681\n" if @a == 8 && "@a" eq "f o o \n \x{100} b a r";
	1991
	1992	($a, $b) = map { chr } ord('A') == 65 ? (0xc4, 0x80) : (0x8c, 0x41);
	1993
	1994	@a = ("foo\n\x{100}bar" =~ /\C/g);
	1995	print "ok 682\n" if @a == 9 && "@a" eq "f o o \n $a $b b a r";
	1996
	1997	@a = ("foo\n\x{100}bar" =~ /\C/gs);
	1998	print "ok 683\n" if @a == 9 && "@a" eq "f o o \n $a $b b a r";
	1999
	2000	{
	2001	# [ID 20010814.004] pos() doesn't work when using =~m// in list context
	2002	$_ = "ababacadaea";
	2003	$a = join ":", /b./gc;
	2004	$b = join ":", /a./gc;
	2005	$c = pos;
	2006	print "$a $b $c" eq 'ba:ba ad:ae 10' ? "ok 684\n" : "not ok 684\t# $a $b $c\n";
	2007	}
	2008
	2009	{
	2010	# [ID 20010407.006] matching utf8 return values from functions does not work
	2011
	2012	package ID_20010407_006;
	2013
	2014	sub x {
	2015	"a\x{1234}";
	2016	}
	2017
	2018	my $x = x;
	2019	my $y;
	2020
	2021	$x =~ /(..)/; $y = $1;
	2022	print "not " unless length($y) == 2 && $y eq $x;
	2023	print "ok 685\n";
	2024
	2025	x =~ /(..)/; $y = $1;
	2026	print "not " unless length($y) == 2 && $y eq $x;
	2027	print "ok 686\n";
	2028	}
	2029
	2030
	2031	$test = 687;
	2032
	2033	# Force scalar context on the patern match
	2034	sub ok ($;$) {
	2035	my($ok, $name) = @_;
	2036
	2037	printf "%sok %d - %s\n", ($ok ? "" : "not "), $test,
	2038	($name\|\|$Message)."\tLine ".((caller)[2]);
	2039
	2040	printf "# Failed test at line %d\n", (caller)[2] unless $ok;
	2041
	2042	$test++;
	2043	return $ok;
	2044	}
	2045
	2046	{
	2047	# Check that \x## works. 5.6.1 and 5.005_03 fail some of these.
	2048	$x = "\x4e" . "E";
	2049	ok ($x =~ /^\x4EE$/, "Check only 2 bytes of hex are matched.");
	2050
	2051	$x = "\x4e" . "i";
	2052	ok ($x =~ /^\x4Ei$/, "Check that invalid hex digit stops it (2)");
	2053
	2054	$x = "\x4" . "j";
	2055	ok ($x =~ /^\x4j$/, "Check that invalid hex digit stops it (1)");
	2056
	2057	$x = "\x0" . "k";
	2058	ok ($x =~ /^\xk$/, "Check that invalid hex digit stops it (0)");
	2059
	2060	$x = "\x0" . "x";
	2061	ok ($x =~ /^\xx$/, "\\xx isn't to be treated as \\0");
	2062
	2063	$x = "\x0" . "xa";
	2064	ok ($x =~ /^\xxa$/, "\\xxa isn't to be treated as \\xa");
	2065
	2066	$x = "\x9" . "_b";
	2067	ok ($x =~ /^\x9_b$/, "\\x9_b isn't to be treated as \\x9b");
	2068
	2069	print "# and now again in [] ranges\n";
	2070
	2071	$x = "\x4e" . "E";
	2072	ok ($x =~ /^[\x4EE]{2}$/, "Check only 2 bytes of hex are matched.");
	2073
	2074	$x = "\x4e" . "i";
	2075	ok ($x =~ /^[\x4Ei]{2}$/, "Check that invalid hex digit stops it (2)");
	2076
	2077	$x = "\x4" . "j";
	2078	ok ($x =~ /^[\x4j]{2}$/, "Check that invalid hex digit stops it (1)");
	2079
	2080	$x = "\x0" . "k";
	2081	ok ($x =~ /^[\xk]{2}$/, "Check that invalid hex digit stops it (0)");
	2082
	2083	$x = "\x0" . "x";
	2084	ok ($x =~ /^[\xx]{2}$/, "\\xx isn't to be treated as \\0");
	2085
	2086	$x = "\x0" . "xa";
	2087	ok ($x =~ /^[\xxa]{3}$/, "\\xxa isn't to be treated as \\xa");
	2088
	2089	$x = "\x9" . "_b";
	2090	ok ($x =~ /^[\x9_b]{3}$/, "\\x9_b isn't to be treated as \\x9b");
	2091
	2092	}
	2093
	2094	{
	2095	# Check that \x{##} works. 5.6.1 fails quite a few of these.
	2096
	2097	$x = "\x9b";
	2098	ok ($x =~ /^\x{9_b}$/, "\\x{9_b} is to be treated as \\x9b");
	2099
	2100	$x = "\x9b" . "y";
	2101	ok ($x =~ /^\x{9_b}y$/, "\\x{9_b} is to be treated as \\x9b (again)");
	2102
	2103	$x = "\x9b" . "y";
	2104	ok ($x =~ /^\x{9b_}y$/, "\\x{9b_} is to be treated as \\x9b");
	2105
	2106	$x = "\x9b" . "y";
	2107	ok ($x =~ /^\x{9_bq}y$/, "\\x{9_bc} is to be treated as \\x9b");
	2108
	2109	$x = "\x0" . "y";
	2110	ok ($x =~ /^\x{x9b}y$/, "\\x{x9b} is to be treated as \\x0");
	2111
	2112	$x = "\x0" . "y";
	2113	ok ($x =~ /^\x{0x9b}y$/, "\\x{0x9b} is to be treated as \\x0");
	2114
	2115	$x = "\x9b" . "y";
	2116	ok ($x =~ /^\x{09b}y$/, "\\x{09b} is to be treated as \\x9b");
	2117
	2118	print "# and now again in [] ranges\n";
	2119
	2120	$x = "\x9b";
	2121	ok ($x =~ /^[\x{9_b}]$/, "\\x{9_b} is to be treated as \\x9b");
	2122
	2123	$x = "\x9b" . "y";
	2124	ok ($x =~ /^[\x{9_b}y]{2}$/, "\\x{9_b} is to be treated as \\x9b (again)");
	2125
	2126	$x = "\x9b" . "y";
	2127	ok ($x =~ /^[\x{9b_}y]{2}$/, "\\x{9b_} is to be treated as \\x9b");
	2128
	2129	$x = "\x9b" . "y";
	2130	ok ($x =~ /^[\x{9_bq}y]{2}$/, "\\x{9_bc} is to be treated as \\x9b");
	2131
	2132	$x = "\x0" . "y";
	2133	ok ($x =~ /^[\x{x9b}y]{2}$/, "\\x{x9b} is to be treated as \\x0");
	2134
	2135	$x = "\x0" . "y";
	2136	ok ($x =~ /^[\x{0x9b}y]{2}$/, "\\x{0x9b} is to be treated as \\x0");
	2137
	2138	$x = "\x9b" . "y";
	2139	ok ($x =~ /^[\x{09b}y]{2}$/, "\\x{09b} is to be treated as \\x9b");
	2140	}
	2141
	2142	{
	2143	# high bit bug -- japhy
	2144	my $x = "ab\200d";
	2145	$x =~ /.*?\200/ or print "not ";
	2146	print "ok 715\n";
	2147	}
	2148
	2149	print "# some Unicode properties\n";
	2150
	2151	{
	2152	# Dashes, underbars, case.
	2153	print "not " unless "\x80" =~ /\p{in-latin1_SUPPLEMENT}/;
	2154	print "ok 716\n";
	2155
	2156	# Complement, leading and trailing whitespace.
	2157	print "not " unless "\x80" =~ /\P{ ^ In Latin 1 Supplement }/;
	2158	print "ok 717\n";
	2159
	2160	# No ^In, dashes, case, dash, any intervening (word-break) whitespace.
	2161	# (well, newlines don't work...)
	2162	print "not " unless "\x80" =~ /\p{latin-1 supplement}/;
	2163	print "ok 718\n";
	2164	}
	2165
	2166	{
	2167	print "not " unless "a" =~ /\pL/;
	2168	print "ok 719\n";
	2169
	2170	print "not " unless "a" =~ /\p{IsLl}/;
	2171	print "ok 720\n";
	2172
	2173	print "not " if "a" =~ /\p{IsLu}/;
	2174	print "ok 721\n";
	2175
	2176	print "not " unless "a" =~ /\p{Ll}/;
	2177	print "ok 722\n";
	2178
	2179	print "not " if "a" =~ /\p{Lu}/;
	2180	print "ok 723\n";
	2181
	2182	print "not " unless "A" =~ /\pL/;
	2183	print "ok 724\n";
	2184
	2185	print "not " unless "A" =~ /\p{IsLu}/;
	2186	print "ok 725\n";
	2187
	2188	print "not " if "A" =~ /\p{IsLl}/;
	2189	print "ok 726\n";
	2190
	2191	print "not " unless "A" =~ /\p{Lu}/;
	2192	print "ok 727\n";
	2193
	2194	print "not " if "A" =~ /\p{Ll}/;
	2195	print "ok 728\n";
	2196
	2197	print "not " if "a" =~ /\PL/;
	2198	print "ok 729\n";
	2199
	2200	print "not " if "a" =~ /\P{IsLl}/;
	2201	print "ok 730\n";
	2202
	2203	print "not " unless "a" =~ /\P{IsLu}/;
	2204	print "ok 731\n";
	2205
	2206	print "not " if "a" =~ /\P{Ll}/;
	2207	print "ok 732\n";
	2208
	2209	print "not " unless "a" =~ /\P{Lu}/;
	2210	print "ok 733\n";
	2211
	2212	print "not " if "A" =~ /\PL/;
	2213	print "ok 734\n";
	2214
	2215	print "not " if "A" =~ /\P{IsLu}/;
	2216	print "ok 735\n";
	2217
	2218	print "not " unless "A" =~ /\P{IsLl}/;
	2219	print "ok 736\n";
	2220
	2221	print "not " if "A" =~ /\P{Lu}/;
	2222	print "ok 737\n";
	2223
	2224	print "not " unless "A" =~ /\P{Ll}/;
	2225	print "ok 738\n";
	2226
	2227	}
	2228
	2229	{
	2230	print "not " if "a" =~ /\p{Common}/;
	2231	print "ok 739\n";
	2232
	2233	print "not " unless "1" =~ /\p{Common}/;
	2234	print "ok 740\n";
	2235	}
	2236
	2237	{
	2238	print "not " if "a" =~ /\p{Inherited}/;
	2239	print "ok 741\n";
	2240
	2241	print "not " unless "\x{300}" =~ /\p{Inherited}/;
	2242	print "ok 742\n";
	2243	}
	2244
	2245	{
	2246	# L& and LC are the same
	2247	print "not " unless "a" =~ /\p{LC}/ and "a" =~ /\p{L&}/;
	2248	print "ok 743\n";
	2249
	2250	print "not " if "1" =~ /\p{LC}/ or "1" =~ /\p{L&}/;
	2251	print "ok 744\n";
	2252	}
	2253
	2254	{
	2255	print "not " unless "a" =~ /\p{Lowercase Letter}/;
	2256	print "ok 745\n";
	2257
	2258	print "not " if "A" =~ /\p{lowercaseletter}/;
	2259	print "ok 746\n";
	2260	}
	2261
	2262	{
	2263	print "not " unless "\x{AC00}" =~ /\p{HangulSyllables}/;
	2264	print "ok 747\n";
	2265	}
	2266
	2267	{
	2268	# Script=, Block=, Category=
	2269
	2270	print "not " unless "\x{0100}" =~ /\p{Script=Latin}/;
	2271	print "ok 748\n";
	2272
	2273	print "not " unless "\x{0100}" =~ /\p{Block=LatinExtendedA}/;
	2274	print "ok 749\n";
	2275
	2276	print "not " unless "\x{0100}" =~ /\p{Category=UppercaseLetter}/;
	2277	print "ok 750\n";
	2278	}
	2279
	2280	{
	2281	print "# the basic character classes and Unicode \n";
	2282
	2283	# 0100;LATIN CAPITAL LETTER A WITH MACRON;Lu;0;L;0041 0304;;;;N;LATIN CAPITAL LETTER A MACRON;;;0101;
	2284	print "not " unless "\x{0100}" =~ /\w/;
	2285	print "ok 751\n";
	2286
	2287	# 0660;ARABIC-INDIC DIGIT ZERO;Nd;0;AN;;0;0;0;N;;;;;
	2288	print "not " unless "\x{0660}" =~ /\d/;
	2289	print "ok 752\n";
	2290
	2291	# 1680;OGHAM SPACE MARK;Zs;0;WS;;;;;N;;;;;
	2292	print "not " unless "\x{1680}" =~ /\s/;
	2293	print "ok 753\n";
	2294	}
	2295
	2296	{
	2297	print "# folding matches and Unicode\n";
	2298
	2299	print "not " unless "a\x{100}" =~ /A/i;
	2300	print "ok 754\n";
	2301
	2302	print "not " unless "A\x{100}" =~ /a/i;
	2303	print "ok 755\n";
	2304
	2305	print "not " unless "a\x{100}" =~ /a/i;
	2306	print "ok 756\n";
	2307
	2308	print "not " unless "A\x{100}" =~ /A/i;
	2309	print "ok 757\n";
	2310
	2311	print "not " unless "\x{101}a" =~ /\x{100}/i;
	2312	print "ok 758\n";
	2313
	2314	print "not " unless "\x{100}a" =~ /\x{100}/i;
	2315	print "ok 759\n";
	2316
	2317	print "not " unless "\x{101}a" =~ /\x{101}/i;
	2318	print "ok 760\n";
	2319
	2320	print "not " unless "\x{100}a" =~ /\x{101}/i;
	2321	print "ok 761\n";
	2322
	2323	print "not " unless "a\x{100}" =~ /A\x{100}/i;
	2324	print "ok 762\n";
	2325
	2326	print "not " unless "A\x{100}" =~ /a\x{100}/i;
	2327	print "ok 763\n";
	2328
	2329	print "not " unless "a\x{100}" =~ /a\x{100}/i;
	2330	print "ok 764\n";
	2331
	2332	print "not " unless "A\x{100}" =~ /A\x{100}/i;
	2333	print "ok 765\n";
	2334
	2335	print "not " unless "a\x{100}" =~ /[A]/i;
	2336	print "ok 766\n";
	2337
	2338	print "not " unless "A\x{100}" =~ /[a]/i;
	2339	print "ok 767\n";
	2340
	2341	print "not " unless "a\x{100}" =~ /[a]/i;
	2342	print "ok 768\n";
	2343
	2344	print "not " unless "A\x{100}" =~ /[A]/i;
	2345	print "ok 769\n";
	2346
	2347	print "not " unless "\x{101}a" =~ /[\x{100}]/i;
	2348	print "ok 770\n";
	2349
	2350	print "not " unless "\x{100}a" =~ /[\x{100}]/i;
	2351	print "ok 771\n";
	2352
	2353	print "not " unless "\x{101}a" =~ /[\x{101}]/i;
	2354	print "ok 772\n";
	2355
	2356	print "not " unless "\x{100}a" =~ /[\x{101}]/i;
	2357	print "ok 773\n";
	2358
	2359	}
	2360
	{
	    # Case-insensitive matching between the small and capital forms of a
	    # named character.  Each group checks both directions, once as a plain
	    # atom and once inside a bracketed character class.
	    use charnames ':full';

	    print "# LATIN LETTER A WITH GRAVE\n";
	    my $lower = "\N{LATIN SMALL LETTER A WITH GRAVE}";
	    my $UPPER = "\N{LATIN CAPITAL LETTER A WITH GRAVE}";

	    print $lower =~ m/$UPPER/i   ? "ok 774\n" : "not ok 774\n";
	    print $UPPER =~ m/$lower/i   ? "ok 775\n" : "not ok 775\n";
	    print $lower =~ m/[$UPPER]/i ? "ok 776\n" : "not ok 776\n";
	    print $UPPER =~ m/[$lower]/i ? "ok 777\n" : "not ok 777\n";

	    print "# GREEK LETTER ALPHA WITH VRACHY\n";

	    # $lower holds the SMALL letter and $UPPER the CAPITAL one, as in the
	    # first group (the two assignments used to be crossed).  The same four
	    # pairings are still exercised; only which test number covers which
	    # direction changes.
	    $lower = "\N{GREEK SMALL LETTER ALPHA WITH VRACHY}";
	    $UPPER = "\N{GREEK CAPITAL LETTER ALPHA WITH VRACHY}";

	    print $lower =~ m/$UPPER/i   ? "ok 778\n" : "not ok 778\n";
	    print $UPPER =~ m/$lower/i   ? "ok 779\n" : "not ok 779\n";
	    print $lower =~ m/[$UPPER]/i ? "ok 780\n" : "not ok 780\n";
	    print $UPPER =~ m/[$lower]/i ? "ok 781\n" : "not ok 781\n";

	    print "# LATIN LETTER Y WITH DIAERESIS\n";

	    $lower = "\N{LATIN SMALL LETTER Y WITH DIAERESIS}";
	    $UPPER = "\N{LATIN CAPITAL LETTER Y WITH DIAERESIS}";
	    print $lower =~ m/$UPPER/i   ? "ok 782\n" : "not ok 782\n";
	    print $UPPER =~ m/$lower/i   ? "ok 783\n" : "not ok 783\n";
	    print $lower =~ m/[$UPPER]/i ? "ok 784\n" : "not ok 784\n";
	    print $UPPER =~ m/[$lower]/i ? "ok 785\n" : "not ok 785\n";
	}
	2392
	2393	{
	2394	use warnings;
	2395	use charnames ':full';
	2396
	2397	print "# GREEK CAPITAL LETTER SIGMA vs COMBINING GREEK PERISPOMENI\n";
	2398
	2399	my $SIGMA = "\N{GREEK CAPITAL LETTER SIGMA}";
	2400	my $char = "\N{COMBINING GREEK PERISPOMENI}";
	2401
	2402	# Before #13843 this was failing by matching falsely.
	2403	print "_:$char:_" =~ m/_:$SIGMA:_/i ? "not ok 786\n" : "ok 786\n";
	2404	}
	2405
	2406	{
	2407	print "# \\X\n";
	2408
	2409	use charnames ':full';
	2410
	2411	print "a!" =~ /^(\X)!/ && $1 eq "a" ?
	2412	"ok 787\n" : "not ok 787 # $1\n";
	2413	print "\xDF!" =~ /^(\X)!/ && $1 eq "\xDF" ?
	2414	"ok 788\n" : "not ok 788 # $1\n";
	2415	print "\x{100}!" =~ /^(\X)!/ && $1 eq "\x{100}" ?
	2416	"ok 789\n" : "not ok 789 # $1\n";
	2417	print "\x{100}\x{300}!" =~ /^(\X)!/ && $1 eq "\x{100}\x{300}" ?
	2418	"ok 790\n" : "not ok 790 # $1\n";
	2419	print "\N{LATIN CAPITAL LETTER E}!" =~ /^(\X)!/ &&
	2420	$1 eq "\N{LATIN CAPITAL LETTER E}" ?
	2421	"ok 791\n" : "not ok 791 # $1\n";
	2422	print "\N{LATIN CAPITAL LETTER E}\N{COMBINING GRAVE ACCENT}!" =~
	2423	/^(\X)!/ &&
	2424	$1 eq "\N{LATIN CAPITAL LETTER E}\N{COMBINING GRAVE ACCENT}" ?
	2425	"ok 792\n" : "not ok 792 # $1\n";
	2426	}
	2427
	2428	{
	2429	print "#\\C and \\X\n";
	2430
	2431	print "!abc!" =~ /a\Cc/ ? "ok 793\n" : "not ok 793\n";
	2432	print "!abc!" =~ /a\Xc/ ? "ok 794\n" : "not ok 794\n";
	2433	}
	2434
	2435	{
	2436	print "# FINAL SIGMA\n";
	2437
	2438	my $SIGMA = "\x{03A3}"; # CAPITAL
	2439	my $Sigma = "\x{03C2}"; # SMALL FINAL
	2440	my $sigma = "\x{03C3}"; # SMALL
	2441
	2442	print $SIGMA =~ /$SIGMA/i ? "ok 795\n" : "not ok 795\n";
	2443	print $SIGMA =~ /$Sigma/i ? "ok 796\n" : "not ok 796\n";
	2444	print $SIGMA =~ /$sigma/i ? "ok 797\n" : "not ok 797\n";
	2445
	2446	print $Sigma =~ /$SIGMA/i ? "ok 798\n" : "not ok 798\n";
	2447	print $Sigma =~ /$Sigma/i ? "ok 799\n" : "not ok 799\n";
	2448	print $Sigma =~ /$sigma/i ? "ok 800\n" : "not ok 800\n";
	2449
	2450	print $sigma =~ /$SIGMA/i ? "ok 801\n" : "not ok 801\n";
	2451	print $sigma =~ /$Sigma/i ? "ok 802\n" : "not ok 802\n";
	2452	print $sigma =~ /$sigma/i ? "ok 803\n" : "not ok 803\n";
	2453
	2454	print $SIGMA =~ /[$SIGMA]/i ? "ok 804\n" : "not ok 804\n";
	2455	print $SIGMA =~ /[$Sigma]/i ? "ok 805\n" : "not ok 805\n";
	2456	print $SIGMA =~ /[$sigma]/i ? "ok 806\n" : "not ok 806\n";
	2457
	2458	print $Sigma =~ /[$SIGMA]/i ? "ok 807\n" : "not ok 807\n";
	2459	print $Sigma =~ /[$Sigma]/i ? "ok 808\n" : "not ok 808\n";
	2460	print $Sigma =~ /[$sigma]/i ? "ok 809\n" : "not ok 809\n";
	2461
	2462	print $sigma =~ /[$SIGMA]/i ? "ok 810\n" : "not ok 810\n";
	2463	print $sigma =~ /[$Sigma]/i ? "ok 811\n" : "not ok 811\n";
	2464	print $sigma =~ /[$sigma]/i ? "ok 812\n" : "not ok 812\n";
	2465	}
	2466
	{
	    # Matches "francais" spelled three ways (plain c, precomposed c-cedilla,
	    # and c followed by COMBINING CEDILLA) against ".", \C, \X, \N{...} and
	    # an alternation that is meant to accept all three spellings.
	    print "# parlez-vous?\n";

	    use charnames ':full';

	    print "fran\N{LATIN SMALL LETTER C}ais" =~
	        /fran.ais/ &&
	        $& eq "francais" ?
	        "ok 813\n" : "not ok 813\n";

	    print "fran\N{LATIN SMALL LETTER C WITH CEDILLA}ais" =~
	        /fran.ais/ &&
	        $& eq "fran\N{LATIN SMALL LETTER C WITH CEDILLA}ais" ?
	        "ok 814\n" : "not ok 814\n";

	    print "fran\N{LATIN SMALL LETTER C}ais" =~
	        /fran\Cais/ &&
	        $& eq "francais" ?
	        "ok 815\n" : "not ok 815\n";

	    print "franc\N{COMBINING CEDILLA}ais" =~
	        /franc\C\Cais/ ? # COMBINING CEDILLA is two bytes when encoded
	        "ok 816\n" : "not ok 816\n";

	    print "fran\N{LATIN SMALL LETTER C}ais" =~
	        /fran\Xais/ &&
	        $& eq "francais" ?
	        "ok 817\n" : "not ok 817\n";

	    print "fran\N{LATIN SMALL LETTER C WITH CEDILLA}ais" =~
	        /fran\Xais/ &&
	        $& eq "fran\N{LATIN SMALL LETTER C WITH CEDILLA}ais" ?
	        "ok 818\n" : "not ok 818\n";

	    print "franc\N{COMBINING CEDILLA}ais" =~
	        /fran\Xais/ &&
	        $& eq "franc\N{COMBINING CEDILLA}ais" ?
	        "ok 819\n" : "not ok 819\n";

	    print "fran\N{LATIN SMALL LETTER C WITH CEDILLA}ais" =~
	        /fran\N{LATIN SMALL LETTER C WITH CEDILLA}ais/ &&
	        $& eq "fran\N{LATIN SMALL LETTER C WITH CEDILLA}ais" ?
	        "ok 820\n" : "not ok 820\n";

	    print "franc\N{COMBINING CEDILLA}ais" =~
	        /franc\N{COMBINING CEDILLA}ais/ &&
	        $& eq "franc\N{COMBINING CEDILLA}ais" ?
	        "ok 821\n" : "not ok 821\n";

	    # The group below must be a real alternation ("|").  An escaped pipe
	    # ("\|") would demand a literal "|" in the subject, and none of these
	    # four tests could then match.
	    # NOTE(review): tests 822 and 823 are word-for-word duplicates; kept
	    # as they are so the test numbering is unchanged.
	    print "fran\N{LATIN SMALL LETTER C}ais" =~
	        /fran(?:c\N{COMBINING CEDILLA}?|\N{LATIN SMALL LETTER C WITH CEDILLA})ais/ &&
	        $& eq "francais" ?
	        "ok 822\n" : "not ok 822\n";

	    print "fran\N{LATIN SMALL LETTER C}ais" =~
	        /fran(?:c\N{COMBINING CEDILLA}?|\N{LATIN SMALL LETTER C WITH CEDILLA})ais/ &&
	        $& eq "francais" ?
	        "ok 823\n" : "not ok 823\n";

	    print "fran\N{LATIN SMALL LETTER C WITH CEDILLA}ais" =~
	        /fran(?:c\N{COMBINING CEDILLA}?|\N{LATIN SMALL LETTER C WITH CEDILLA})ais/ &&
	        $& eq "fran\N{LATIN SMALL LETTER C WITH CEDILLA}ais" ?
	        "ok 824\n" : "not ok 824\n";

	    print "franc\N{COMBINING CEDILLA}ais" =~
	        /fran(?:c\N{COMBINING CEDILLA}?|\N{LATIN SMALL LETTER C WITH CEDILLA})ais/ &&
	        $& eq "franc\N{COMBINING CEDILLA}ais" ?
	        "ok 825\n" : "not ok 825\n";
	}
	2536
	2537	{
	2538	print "# Does lingering (and useless) UTF8 flag mess up /i matching?\n";
	2539
	2540	{
	2541	my $regex = "ABcde";
	2542	my $string = "abcDE\x{100}";
	2543	chop($string);
	2544	if ($string =~ m/$regex/i) {
	2545	print "ok 826\n";
	2546	} else {
	2547	print "not ok 826\n";
	2548	}
	2549	}
	2550
	2551	{
	2552	my $regex = "ABcde\x{100}";
	2553	my $string = "abcDE";
	2554	chop($regex);
	2555	if ($string =~ m/$regex/i) {
	2556	print "ok 827\n";
	2557	} else {
	2558	print "not ok 827\n";
	2559	}
	2560	}
	2561
	2562	{
	2563	my $regex = "ABcde\x{100}";
	2564	my $string = "abcDE\x{100}";
	2565	chop($regex);
	2566	chop($string);
	2567	if ($string =~ m/$regex/i) {
	2568	print "ok 828\n";
	2569	} else {
	2570	print "not ok 828\n";
	2571	}
	2572	}
	2573	}
	2574
	2575	{
	2576	print "# more SIGMAs\n";
	2577
	2578	my $SIGMA = "\x{03A3}"; # CAPITAL
	2579	my $Sigma = "\x{03C2}"; # SMALL FINAL
	2580	my $sigma = "\x{03C3}"; # SMALL
	2581
	2582	my $S3 = "$SIGMA$Sigma$sigma";
	2583
	2584	print ":$S3:" =~ /:(($SIGMA)+):/i && $1 eq $S3 && $2 eq $sigma ?
	2585	"ok 829\n" : "not ok 829\n";
	2586	print ":$S3:" =~ /:(($Sigma)+):/i && $1 eq $S3 && $2 eq $sigma ?
	2587	"ok 830\n" : "not ok 830\n";
	2588	print ":$S3:" =~ /:(($sigma)+):/i && $1 eq $S3 && $2 eq $sigma ?
	2589	"ok 831\n" : "not ok 831\n";
	2590
	2591	print ":$S3:" =~ /:(([$SIGMA])+):/i && $1 eq $S3 && $2 eq $sigma ?
	2592	"ok 832\n" : "not ok 832\n";
	2593	print ":$S3:" =~ /:(([$Sigma])+):/i && $1 eq $S3 && $2 eq $sigma ?
	2594	"ok 833\n" : "not ok 833\n";
	2595	print ":$S3:" =~ /:(([$sigma])+):/i && $1 eq $S3 && $2 eq $sigma ?
	2596	"ok 834\n" : "not ok 834\n";
	2597	}
	2598
	2599	{
	2600	print "# LATIN SMALL LETTER SHARP S\n";
	2601
	2602	use charnames ':full';
	2603
	2604	$test= 835;
	2605
	2606	ok("\N{LATIN SMALL LETTER SHARP S}" =~ /\N{LATIN SMALL LETTER SHARP S}/);
	2607	ok("\N{LATIN SMALL LETTER SHARP S}" =~ /\N{LATIN SMALL LETTER SHARP S}/i);
	2608
	2609	ok("\N{LATIN SMALL LETTER SHARP S}" =~ /[\N{LATIN SMALL LETTER SHARP S}]/);
	2610	ok("\N{LATIN SMALL LETTER SHARP S}" =~ /[\N{LATIN SMALL LETTER SHARP S}]/i);
	2611
	2612	ok("ss" =~ /\N{LATIN SMALL LETTER SHARP S}/i);
	2613	ok("SS" =~ /\N{LATIN SMALL LETTER SHARP S}/i);
	2614	ok("ss" =~ /[\N{LATIN SMALL LETTER SHARP S}]/i);
	2615	ok("SS" =~ /[\N{LATIN SMALL LETTER SHARP S}]/i);
	2616
	2617	ok("\N{LATIN SMALL LETTER SHARP S}" =~ /ss/i);
	2618	ok("\N{LATIN SMALL LETTER SHARP S}" =~ /SS/i);
	2619	}
	2620
	2621	{
	2622	print "# more whitespace: U+0085, U+2028, U+2029\n";
	2623
	2624	# U+0085 needs to be forced to be Unicode, the \x{100} does that.
	2625	if ($ordA == 193) {
	2626	print "<\x{100}\x{0085}>" =~ /<\x{100}e>/ ? "ok 845\n" : "not ok 845\n";
	2627	} else {
	2628	print "<\x{100}\x{0085}>" =~ /<\x{100}\s>/ ? "ok 845\n" : "not ok 845\n";
	2629	}
	2630	print "<\x{2028}>" =~ /<\s>/ ? "ok 846\n" : "not ok 846\n";
	2631	print "<\x{2029}>" =~ /<\s>/ ? "ok 847\n" : "not ok 847\n";
	2632	}
	2633
	{
	    print "# . with /s should work on characters, as opposed to bytes\n";

	    my $s = "\x{e4}\x{100}";

	    # This is not expected to match: the point is that
	    # neither should we get "Malformed UTF-8" warnings.
	    print $s =~ /\G(.+?)\n/gcs ?
	        "not ok 848\n" : "ok 848\n";

	    # Walk the string one "." at a time; the pieces must reassemble to $s.
	    my @c;

	    while ($s =~ /\G(.)/gs) {
	        push @c, $1;
	    }

	    print join("", @c) eq $s ? "ok 849\n" : "not ok 849\n";

	    # Run the same tokenising loop over a string of chars < 256 and over
	    # the same string with one wide character appended; apart from that
	    # wide character the collected text must be identical.
	    #
	    # The last group is an alternation: end of string OR newline plus
	    # whitespace.  Written as "\|" it would require a literal pipe, neither
	    # loop would ever iterate, and test 850 would pass by comparing two
	    # empty strings.
	    my $t1 = "Q003\n\n\x{e4}\x{f6}\n\nQ004\n\n\x{e7}"; # test only chars < 256
	    my $r1 = "";
	    while ($t1 =~ / \G ( .+? ) \n\s+ ( .+? ) ( $ | \n\s+ ) /xgcs) {
	        $r1 .= $1 . $2;
	    }

	    my $t2 = $t1 . "\x{100}"; # repeat with a larger char
	    my $r2 = "";
	    while ($t2 =~ / \G ( .+? ) \n\s+ ( .+? ) ( $ | \n\s+ ) /xgcs) {
	        $r2 .= $1 . $2;
	    }
	    $r2 =~ s/\x{100}//;
	    print $r1 eq $r2 ? "ok 850\n" : "not ok 850\n";
	}
	2666
	{
	    # Fixed-width lookbehind must count characters, not bytes, when the
	    # subject contains characters above U+00FF.
	    print "# Unicode lookbehind\n";

	    print "A\x{100}B"        =~ /(?<=A.)B/  ? "ok 851\n" : "not ok 851\n";
	    print "A\x{200}\x{300}B" =~ /(?<=A..)B/ ? "ok 852\n" : "not ok 852\n";
	    print "\x{400}AB"        =~ /(?<=\x{400}.)B/ ? "ok 853\n" : "not ok 853\n";

	    # The subject is two wide characters followed by "B".  The old
	    # spelling "\x{500\x{600}}B" had a misplaced brace, so the string was
	    # not U+0500 U+0600 "B" at all.
	    print "\x{500}\x{600}B"  =~ /(?<=\x{500}.)B/ ? "ok 854\n" : "not ok 854\n";
	}
	2675
	2676	{
	2677	print "# UTF-8 hash keys and /\$/\n";
	2678	# http://www.xray.mpe.mpg.de/mailing-lists/perl5-porters/2002-01/msg01327.html
	2679
	2680	my $u = "a\x{100}";
	2681	my $v = substr($u,0,1);
	2682	my $w = substr($u,1,1);
	2683	my %u = ( $u => $u, $v => $v, $w => $w );
	2684	my $i = 855;
	2685	for (keys %u) {
	2686	my $m1 = /^\w*$/ ? 1 : 0;
	2687	my $m2 = $u{$_}=~/^\w*$/ ? 1 : 0;
	2688	print $m1 == $m2 ? "ok $i\n" : "not ok $i # $m1 $m2\n";
	2689	$i++;
	2690	}
	2691	}
	2692
	2693	{
	2694	print "# [ID 20020124.005]\n";
	2695	# Fixed by #14795.
	2696	my $i = 858;
	2697	for my $char ("a", "\x{df}", "\x{100}"){
	2698	$x = "$char b $char";
	2699	$x =~ s{($char)}{
	2700	"c" =~ /c/;
	2701	"x";
	2702	}ge;
	2703	print substr($x,0,1) eq substr($x,-1,1) ?
	2704	"ok $i\n" : "not ok $i # debug: $x\n";
	2705	$i++;
	2706	}
	2707	}
	2708
	{
	    print "# SEGV in s/// and UTF-8\n";

	    # Replace every non-word character in a UTF-8 string with a space and
	    # compare against the expected result.
	    $s = "s#\x{100}" x 4;
	    $s =~ s/[^\w]/ /g;

	    my $expected = "s \x{100}" x 4;
	    if ($s eq $expected) {
	        print "ok 861\n";
	    }
	    else {
	        print "not ok 861\n";
	    }
	}
	2715
	{
	    print "# UTF-8 bug (maybe alreayd known?)\n";

	    # Substitutions that move a string from bytes to wide characters and
	    # back again.
	    my $u = "foo";
	    $u =~ s/./\x{100}/g;
	    my $all_wide = $u eq "\x{100}\x{100}\x{100}";
	    print $all_wide ? "ok 862\n" : "not ok 862\n";

	    $u = "foobar";
	    $u =~ s/[ao]/\x{100}/g;
	    my $vowels_wide = $u eq "f\x{100}\x{100}b\x{100}r";
	    print $vowels_wide ? "ok 863\n" : "not ok 863\n";

	    # Turn the wide characters back into a plain letter.
	    $u =~ s/\x{100}/e/g;
	    my $back_to_ascii = $u eq "feeber";
	    print $back_to_ascii ? "ok 864\n" : "not ok 864\n";
	}
	2731
	{
	    print "# UTF-8 bug with s///\n";
	    # check utf8/non-utf8 mixtures
	    # try to force all float/anchored check combinations
	    #
	    # The "*" quantifiers in the pattern lists below are essential: the
	    # second and fourth loops expect their patterns to consume the whole
	    # subject, which is only possible when the wide character $c is
	    # optional ("$c*").  Without them "xy$cz" would also interpolate an
	    # undeclared variable $cz instead of $c followed by "z".
	    my $c = "\x{100}";
	    $test = 865;
	    my $subst;

	    # Patterns that require $c can never match the all-ASCII "xxx".
	    for my $re (
	        "xx.*$c", "x.*$c$c", "$c.*xx", "$c$c.*x", "xx.*(?=$c)", "(?=$c).*xx",
	    ) {
	        print "xxx" =~ /$re/ ? "not ok $test\n" : "ok $test\n";
	        ++$test;
	        print +($subst = "xxx") =~ s/$re// ? "not ok $test\n" : "ok $test\n";
	        ++$test;
	    }

	    # With $c optional the pattern matches, and removes, all of "xxx".
	    for my $re ("xx.*$c*", "$c*.*xx") {
	        print "xxx" =~ /$re/ ? "ok $test\n" : "not ok $test\n";
	        ++$test;
	        ($subst = "xxx") =~ s/$re//;
	        print $subst eq '' ? "ok $test\n" : "not ok $test\t# $subst\n";
	        ++$test;
	    }

	    # ASCII-only patterns applied to subjects that end in a wide character.
	    for my $re ("xxy*", "y*xx") {
	        print "xx$c" =~ /$re/ ? "ok $test\n" : "not ok $test\n";
	        ++$test;
	        ($subst = "xx$c") =~ s/$re//;
	        print $subst eq $c ? "ok $test\n" : "not ok $test\n";
	        ++$test;
	        print "xy$c" =~ /$re/ ? "not ok $test\n" : "ok $test\n";
	        ++$test;
	        # NOTE(review): this repeats the plain match above on a copy; the
	        # first loop uses s/$re// at the same position -- confirm intent.
	        print +($subst = "xy$c") =~ /$re/ ? "not ok $test\n" : "ok $test\n";
	        ++$test;
	    }

	    # An optional wide character in the middle of an ASCII pattern.
	    for my $re ("xy$c*z", "x$c*yz") {
	        print "xyz" =~ /$re/ ? "ok $test\n" : "not ok $test\n";
	        ++$test;
	        ($subst = "xyz") =~ s/$re//;
	        print $subst eq '' ? "ok $test\n" : "not ok $test\n";
	        ++$test;
	    }
	}
	2773
	{
	    print "# qr/.../x\n";
	    $test = 893;

	    # A /x pattern whose trailing "#" comment runs to the end of the
	    # pattern; it is used directly, interpolated, and interpolated inside
	    # a capture group.
	    my $R = qr/ A B C # D E/x;

	    my @attempts = (
	        sub { "ABCDE" =~ $R },
	        sub { "ABCDE" =~ m/$R/ },
	        sub { "ABCDE" =~ m/($R)/ },
	    );

	    for my $attempt (@attempts) {
	        # eval traps any die raised while compiling or running the match.
	        my $matched = eval { $attempt->() };
	        print $matched ? "ok $test\n" : "not ok $test\n";
	        $test++;
	    }
	}
	2789
	2790	{
	2791	print "# illegal Unicode properties\n";
	2792	$test = 896;
	2793
	2794	print eval { "a" =~ /\pq / } ? "not ok $test\n" : "ok $test\n";
	2795	$test++;
	2796
	2797	print eval { "a" =~ /\p{qrst} / } ? "not ok $test\n" : "ok $test\n";
	2798	$test++;
	2799	}
	2800
	2801	{
	2802	print "# [ID 20020412.005] wrong pmop flags checked when empty pattern\n";
	2803	# requires reuse of last successful pattern
	2804	$test = 898;
	2805	$test =~ /\d/;
	2806	for (0 .. 1) {
	2807	my $match = ?? + 0;
	2808	if ($match != $_) {
	2809	print "ok $test\n";
	2810	} else {
	2811	printf "not ok %s\t# 'match once' %s on %s iteration\n", $test,
	2812	$match ? 'succeeded' : 'failed', $_ ? 'second' : 'first';
	2813	}
	2814	++$test;
	2815	}
	2816	$test =~ /(\d)/;
	2817	my $result = join '', $test =~ //g;
	2818	if ($result eq $test) {
	2819	print "ok $test\n";
	2820	} else {
	2821	printf "not ok %s\t# expected '%s', got '%s'\n", $test, $test, $result;
	2822	}
	2823	++$test;
	2824	}
	2825
	2826	print "# user-defined character properties\n";
	2827
	# User-defined property used as \p{InKana1}: two explicit code point
	# ranges, U+3040..U+309F and U+30A0..U+30FF.
	# Returns one "start<TAB>end" line per range.  The tab and newline are
	# written as escapes so the table does not depend on heredoc layout,
	# like InGreekSmall further down in this file.
	sub InKana1 {
	    return "3040\t309F\n"
	         . "30A0\t30FF\n";
	}
	2834
	# User-defined property used as \p{InKana2}: the union ("+") of the
	# utf8::InHiragana and utf8::InKatakana properties, one entry per line.
	sub InKana2 {
	    my @entries = ('+utf8::InHiragana', '+utf8::InKatakana');
	    return join '', map { "$_\n" } @entries;
	}
	2841
	# User-defined property used as \p{InKana3}: utf8::InHiragana plus
	# utf8::InKatakana, with utf8::IsCn subtracted ("-").
	sub InKana3 {
	    my @entries = ('+utf8::InHiragana', '+utf8::InKatakana', '-utf8::IsCn');
	    return join '', map { "$_\n" } @entries;
	}
	2849
	# User-defined property used as \p{InNotKana}: the complement ("!") of
	# utf8::InHiragana, minus utf8::InKatakana, plus utf8::IsCn.
	sub InNotKana {
	    my @entries = ('!utf8::InHiragana', '-utf8::InKatakana', '+utf8::IsCn');
	    return join '', map { "$_\n" } @entries;
	}
	2857
	2858	$test = 901;
	2859
	2860	print "\x{3040}" =~ /\p{InKana1}/ ? "ok $test\n" : "not ok $test\n"; $test++;
	2861	print "\x{303F}" =~ /\P{InKana1}/ ? "ok $test\n" : "not ok $test\n"; $test++;
	2862
	2863	print "\x{3040}" =~ /\p{InKana2}/ ? "ok $test\n" : "not ok $test\n"; $test++;
	2864	print "\x{303F}" =~ /\P{InKana2}/ ? "ok $test\n" : "not ok $test\n"; $test++;
	2865
	2866	print "\x{3041}" =~ /\p{InKana3}/ ? "ok $test\n" : "not ok $test\n"; $test++;
	2867	print "\x{3040}" =~ /\P{InKana3}/ ? "ok $test\n" : "not ok $test\n"; $test++;
	2868
	2869	print "\x{3040}" =~ /\p{InNotKana}/ ? "ok $test\n" : "not ok $test\n"; $test++;
	2870	print "\x{3041}" =~ /\P{InNotKana}/ ? "ok $test\n" : "not ok $test\n"; $test++;
	2871
	# User-defined property used as \p{InConsonant}: the range U+0061..U+007F
	# with the five code points 61, 65, 69, 6F and 75 (a, e, i, o, u)
	# subtracted.  Not EBCDIC-aware.
	# The range line uses an explicit tab separator, like InGreekSmall
	# further down in this file.
	sub InConsonant {
	    return "0061\t007f\n"
	         . "-0061\n"
	         . "-0065\n"
	         . "-0069\n"
	         . "-006f\n"
	         . "-0075\n";
	}
	2882
	2883	print "d" =~ /\p{InConsonant}/ ? "ok $test\n" : "not ok $test\n"; $test++;
	2884	print "e" =~ /\P{InConsonant}/ ? "ok $test\n" : "not ok $test\n"; $test++;
	2885
	2886	{
	2887	print "# [ID 20020630.002] utf8 regex only matches 32k\n";
	2888	$test = 911;
	2889	for ([ 'byte', "\x{ff}" ], [ 'utf8', "\x{1ff}" ]) {
	2890	my($type, $char) = @$_;
	2891	for my $len (32000, 32768, 33000) {
	2892	my $s = $char . "f" x $len;
	2893	my $r = $s =~ /$char([f]*)/gc;
	2894	print $r ? "ok $test\n" : "not ok $test\t# <$type x $len> fail\n";
	2895	++$test;
	2896	print +(!$r or pos($s) == $len + 1) ? "ok $test\n"
	2897	: "not ok $test\t# <$type x $len> pos @{[ pos($s) ]}\n";
	2898	++$test;
	2899	}
	2900	}
	2901	}
	2902
	2903	$test = 923;
	2904
	2905	$a = bless qr/foo/, 'Foo';
	2906	print(('goodfood' =~ $a ? '' : 'not '),
	2907	"ok $test\t# reblessed qr// matches\n");
	2908	++$test;
	2909
	2910	print(($a eq '(?-xism:foo)' ? '' : 'not '),
	2911	"ok $test\t# reblessed qr// stringizes\n");
	2912	++$test;
	2913
	2914	$x = "\x{3fe}";
	2915	$z=$y = "\317\276"; # $y is byte representation of $x
	2916
	2917	$a = qr/$x/;
	2918	print(($x =~ $a ? '' : 'not '), "ok $test - utf8 interpolation in qr//\n");
	2919	++$test;
	2920
	2921	print(("a$a" =~ $x ? '' : 'not '),
	2922	"ok $test - stringifed qr// preserves utf8\n");
	2923	++$test;
	2924
	2925	print(("a$x" =~ /^a$a\z/ ? '' : 'not '),
	2926	"ok $test - interpolated qr// preserves utf8\n");
	2927	++$test;
	2928
	2929	print(("a$x" =~ /^a(??{$a})\z/ ? '' : 'not '),
	2930	"ok $test - postponed interpolation of qr// preserves utf8\n");
	2931	++$test;
	2932
	2933	print((length(qr/##/x) == 12 ? '' : 'not '),
	2934	"ok $test - ## in qr// doesn't corrupt memory [perl #17776]\n");
	2935	++$test;
	2936
	2937	{ use re 'eval';
	2938
	2939	print(("$x$x" =~ /^$x(??{$x})\z/ ? '' : 'not '),
	2940	"ok $test - postponed utf8 string in utf8 re matches utf8\n");
	2941	++$test;
	2942
	2943	print(("$y$x" =~ /^$y(??{$x})\z/ ? '' : 'not '),
	2944	"ok $test - postponed utf8 string in non-utf8 re matches utf8\n");
	2945	++$test;
	2946
	2947	print(("$y$x" !~ /^$y(??{$y})\z/ ? '' : 'not '),
	2948	"ok $test - postponed non-utf8 string in non-utf8 re doesn't match utf8\n");
	2949	++$test;
	2950
	2951	print(("$x$x" !~ /^$x(??{$y})\z/ ? '' : 'not '),
	2952	"ok $test - postponed non-utf8 string in utf8 re doesn't match utf8\n");
	2953	++$test;
	2954
	2955	print(("$y$y" =~ /^$y(??{$y})\z/ ? '' : 'not '),
	2956	"ok $test - postponed non-utf8 string in non-utf8 re matches non-utf8\n");
	2957	++$test;
	2958
	2959	print(("$x$y" =~ /^$x(??{$y})\z/ ? '' : 'not '),
	2960	"ok $test - postponed non-utf8 string in utf8 re matches non-utf8\n");
	2961	++$test;
	2962	$y = $z; # reset $y after upgrade
	2963
	2964	print(("$x$y" !~ /^$x(??{$x})\z/ ? '' : 'not '),
	2965	"ok $test - postponed utf8 string in utf8 re doesn't match non-utf8\n");
	2966	++$test;
	2967	$y = $z; # reset $y after upgrade
	2968
	2969	print(("$y$y" !~ /^$y(??{$x})\z/ ? '' : 'not '),
	2970	"ok $test - postponed utf8 string in non-utf8 re doesn't match non-utf8\n");
	2971	++$test;
	2972
	2973	} # no re 'eval'
	2974
	2975	print "# more user-defined character properties\n";
	2976
	# User-defined property used as \p{IsSyriac1}: the ranges U+0712..U+072C
	# and U+0730..U+074A, so U+072F falls in the gap between them.
	# Each line is "start<TAB>end" with the separator written as an escape.
	sub IsSyriac1 {
	    return "0712\t072C\n"
	         . "0730\t074A\n";
	}
	2983
	2984	ok("\x{0712}" =~ /\p{IsSyriac1}/, '\x{0712}, \p{IsSyriac1}');
	2985	ok("\x{072F}" =~ /\P{IsSyriac1}/, '\x{072F}, \P{IsSyriac1}');
	2986
	# Same ranges as IsSyriac1, under a name without the "Is" prefix; used as
	# \p{Syriac1}.
	# Each line is "start<TAB>end" with the separator written as an escape.
	sub Syriac1 {
	    return "0712\t072C\n"
	         . "0730\t074A\n";
	}
	2993
	# U+0712 lies inside the Syriac1 ranges, U+072F in the gap between them.
	# The second label now names \P, the operator the test actually uses
	# (matching the IsSyriac1 pair above).
	ok("\x{0712}" =~ /\p{Syriac1}/, '\x{0712}, \p{Syriac1}');
	ok("\x{072F}" =~ /\P{Syriac1}/, '\x{072F}, \P{Syriac1}');
	2996
	2997	print "# user-defined character properties may lack \\n at the end\n";
	# Property tables that deliberately lack a trailing newline.
	# InGreekSmall is the single range U+03B1..U+03C9.
	sub InGreekSmall {
	    my ($first, $last) = ('03B1', '03C9');
	    return "$first\t$last";
	}

	# InGreekCapital is the range U+0391..U+03A9 with U+03A2 subtracted.
	sub InGreekCapital {
	    return join "\n", "0391\t03A9", "-03A2";
	}
	3000
	3001	ok("\x{03C0}" =~ /\p{InGreekSmall}/, "Small pi");
	3002	ok("\x{03C2}" =~ /\p{InGreekSmall}/, "Final sigma");
	3003	ok("\x{03A0}" =~ /\p{InGreekCapital}/, "Capital PI");
	3004	ok("\x{03A2}" =~ /\P{InGreekCapital}/, "Reserved");
	3005
	# User-defined property used as \p{AsciiHexAndDash}: the union ("+") of
	# utf8::ASCII_Hex_Digit and utf8::Dash, one entry per line.
	sub AsciiHexAndDash {
	    my @entries = ('+utf8::ASCII_Hex_Digit', '+utf8::Dash');
	    return join '', map { "$_\n" } @entries;
	}
	3012
	3013	ok("-" =~ /\p{Dash}/, "'-' is Dash");
	3014	ok("A" =~ /\p{ASCII_Hex_Digit}/, "'A' is ASCII_Hex_Digit");
	3015	ok("-" =~ /\p{AsciiHexAndDash}/, "'-' is AsciiHexAndDash");
	3016	ok("A" =~ /\p{AsciiHexAndDash}/, "'A' is AsciiHexAndDash");
	3017
	3018	{
	3019	print "# Change #18179\n";
	3020	# previously failed with "panic: end_shift
	3021	my $s = "\x{100}" x 5;
	3022	my $ok = $s =~ /(\x{100}{4})/;
	3023	my($ord, $len) = (ord $1, length $1);
	3024	print +($ok && $ord == 0x100 && $len == 4)
	3025	? "ok $test\n" : "not ok $test\t# [#18179] $ok/$ord/$len\n";
	3026	++$test;
	3027	}
	3028
	{
	    # \C matches one byte of the internal representation.  Each section
	    # puts a 1-, 2- or 3-byte sequence in front of "y" and checks how many
	    # \C are needed to reach it.
	    print "# [perl #15763]\n";

	    $a = "x\x{100}";
	    chop $a; # but leaves the UTF-8 flag
	    $a .= "y"; # 1 byte before "y"

	    ok($a =~ /^\C/, 'match one \C on 1-byte UTF-8');
	    ok($a =~ /^\C{1}/, 'match \C{1}');

	    ok($a =~ /^\Cy/, 'match \Cy');
	    ok($a =~ /^\C{1}y/, 'match \C{1}y');

	    $a = "\x{100}y"; # 2 bytes before "y"

	    ok($a =~ /^\C/, 'match one \C on 2-byte UTF-8');
	    ok($a =~ /^\C{1}/, 'match \C{1}');
	    ok($a =~ /^\C\C/, 'match two \C');
	    ok($a =~ /^\C{2}/, 'match \C{2}');

	    ok($a =~ /^\C\C\C/, 'match three \C on 2-byte UTF-8 and a byte');
	    ok($a =~ /^\C{3}/, 'match \C{3}');

	    ok($a =~ /^\C\Cy/, 'match two \C');
	    ok($a =~ /^\C{2}y/, 'match \C{2}');

	    ok($a !~ /^\C\C\Cy/, q{don't match three \Cy});
	    ok($a !~ /^\C{2}\Cy/, q{don't match \C{3}y});

	    $a = "\x{1000}y"; # 3 bytes before "y"

	    ok($a =~ /^\C/, 'match one \C on three-byte UTF-8');
	    ok($a =~ /^\C{1}/, 'match \C{1}');
	    ok($a =~ /^\C\C/, 'match two \C');
	    ok($a =~ /^\C{2}/, 'match \C{2}');
	    ok($a =~ /^\C\C\C/, 'match three \C');
	    ok($a =~ /^\C{3}/, 'match \C{3}');

	    ok($a =~ /^\C\C\C\C/, 'match four \C on three-byte UTF-8 and a byte');
	    ok($a =~ /^\C{4}/, 'match \C{4}');

	    ok($a =~ /^\C\C\Cy/, 'match three \Cy');
	    ok($a =~ /^\C{3}y/, 'match \C{3}y');

	    # Four \C followed by a plain "y", parallel to the three-\C case in
	    # the previous section (this used to end in a stray "\y" escape).
	    ok($a !~ /^\C\C\C\Cy/, q{don't match four \Cy});
	    ok($a !~ /^\C{4}y/, q{don't match \C{4}y});
	}
	3076
	# Negated \s / \d classes against a string that carries the UTF-8 flag
	# but holds only ASCII: upgrade, then chop one character off.
	# From here on $\ makes every print end with a newline.
	$_ = 'aaaaaaaaaa';
	utf8::upgrade($_); chop $_; $\="\n";
	# Labels are single-quoted so "\s" and "\d" print literally.
	ok(/[^\s]+/, 'm/[^\s]/ utf8');
	ok(/[^\d]+/, 'm/[^\d]/ utf8');
	# Both substitutions work on the copy in $a, so $_ keeps its flagged
	# value and the second test does not run on the leftovers of the first.
	ok(($a = $_, $a =~ s/[^\s]+/./g), 's/[^\s]/ utf8');
	ok(($a = $_, $a =~ s/[^\d]+/./g), 's/[^\d]/ utf8');
	3083
	3084	ok("\x{100}" =~ /\x{100}/, "[perl #15397]");
	3085	ok("\x{100}" =~ /(\x{100})/, "[perl #15397]");
	3086	ok("\x{100}" =~ /(\x{100}){1}/, "[perl #15397]");
	3087	ok("\x{100}\x{100}" =~ /(\x{100}){2}/, "[perl #15397]");
	3088	ok("\x{100}\x{100}" =~ /(\x{100})(\x{100})/, "[perl #15397]");
	3089
	3090	$x = "CD";
	3091	$x =~ /(AB)*?CD/;
	3092	ok(!defined $1, "[perl #7471]");
	3093
	3094	$x = "CD";
	3095	$x =~ /(AB)*CD/;
	3096	ok(!defined $1, "[perl #7471]");
	3097
	3098	$pattern = "^(b+?\|a){1,2}c";
	3099	ok("bac" =~ /$pattern/ && $1 eq 'a', "[perl #3547]");
	3100	ok("bbac" =~ /$pattern/ && $1 eq 'a', "[perl #3547]");
	3101	ok("bbbac" =~ /$pattern/ && $1 eq 'a', "[perl #3547]");
	3102	ok("bbbbac" =~ /$pattern/ && $1 eq 'a', "[perl #3547]");
	3103
	3104	{
	3105	# [perl #18232]
	3106	"\x{100}" =~ /(.)/;
	3107	ok( $1 eq "\x{100}", '$1 is utf-8 [perl #18232]' );
	3108	{ 'a' =~ /./; }
	3109	ok( $1 eq "\x{100}", '$1 is still utf-8' );
	3110	ok( $1 ne "\xC4\x80", '$1 is not non-utf-8' );
	3111	}
	3112
	3113	{
	3114	use utf8;
	3115	my $attr = 'Name-1' ;
	3116
	3117	my $NormalChar = qr/[\p{IsDigit}\p{IsLower}\p{IsUpper}]/;
	3118	my $NormalWord = qr/${NormalChar}+?/;
	3119	my $PredNameHyphen = qr/^${NormalWord}(\-${NormalWord})*?$/;
	3120
	3121	$attr =~ /^$/;
	3122	ok( $attr =~ $PredNameHyphen, "[perl #19767] original test" );
	3123	}
	3124
	3125	{
	3126	use utf8;
	3127	"a" =~ m/[b]/;
	3128	ok ( "0" =~ /\p{N}+\z/, "[perl #19767] variant test" );
	3129	}
	3130
	3131	{
	3132
	3133	$p = 1;
	3134	foreach (1,2,3,4) {
	3135	$p++ if /(??{ $p })/
	3136	}
	3137	ok ($p == 5, "[perl #20683] (??{ }) returns stale values");
	3138	{ package P; $a=1; sub TIESCALAR { bless[] } sub FETCH { $a++ } }
	3139	tie $p, P;
	3140	foreach (1,2,3,4) {
	3141	/(??{ $p })/
	3142	}
	3143	ok ( $p == 5, "(??{ }) returns stale values");
	3144	}
	3145
	3146	{
	3147	# Subject: Odd regexp behavior
	3148	# From: Markus Kuhn <Markus.Kuhn@cl.cam.ac.uk>
	3149	# Date: Wed, 26 Feb 2003 16:53:12 +0000
	3150	# Message-Id: <E18o4nw-0008Ly-00@wisbech.cl.cam.ac.uk>
	3151	# To: perl-unicode@perl.org
	3152
	3153	$x = "\x{2019}\nk"; $x =~ s/(\S)\n(\S)/$1 $2/sg;
	3154	ok($x eq "\x{2019} k", "Markus Kuhn 2003-02-26");
	3155
	3156	$x = "b\nk"; $x =~ s/(\S)\n(\S)/$1 $2/sg;
	3157	ok($x eq "b k", "Markus Kuhn 2003-02-26");
	3158
	3159	ok("\x{2019}" =~ /\S/, "Markus Kuhn 2003-02-26");
	3160	}
	3161
	3162	{
	3163	my $i;
	3164	ok('-1-3-5-' eq join('', split /((??{$i++}))/, '-1-3-5-'),
	3165	"[perl #21411] (??{ .. }) corrupts split's stack");
	3166	split /(?{'WOW'})/, 'abc';
	3167	ok('a\|b\|c' eq join ('\|', @_),
	3168	"[perl #21411] (?{ .. }) version of the above");
	3169	}
	3170
	3171	{
	3172	# XXX DAPM 13-Apr-06. Recursive split is still broken. It's only luck it
	3173	# hasn't been crashing. Disable this test until it is fixed properly.
	3174	# XXX also check what it returns rather than just doing ok(1,...)
	3175	# split /(?{ split "" })/, "abc";
	3176	ok(1,'cache_re & "(?{": it dumps core in 5.6.1 & 5.8.0');
	3177	}
	3178
	3179	{
	3180	ok("\x{100}\n" =~ /\x{100}\n$/, "UTF8 length cache and fbm_compile");
	3181	}
	3182
	3183	{
	3184	package Str;
	3185	use overload q/""/ => sub { ${$_[0]}; };
	3186	sub new { my ($c, $v) = @_; bless \$v, $c; }
	3187
	3188	package main;
	3189	$_ = Str->new("a\x{100}/\x{100}b");
	3190	ok(join(":", /\b(.)\x{100}/g) eq "a:/", "re_intuit_start and PL_bostr");
	3191	}
	3192
	3193	{
	3194	$_ = "code: 'x' { '...' }\n"; study;
	3195	my @x; push @x, $& while m/'[^\']*'/gx;
	3196	ok(join(":", @x) eq "'x':'...'",
	3197	"[perl #17757] Parse::RecDescent triggers infinite loop");
	3198	}
	3199
	3200	{
	3201	my $re = qq/^([^X]*)X/;
	3202	utf8::upgrade($re);
	3203	ok("\x{100}X" =~ /$re/, "S_cl_and ANYOF_UNICODE & ANYOF_INVERTED");
	3204	}
	3205
	3206	# bug #22354
	# Runs the same pair of "^" anchor checks from whatever context calls it
	# (stand-alone, or from the replacement part of s///e): "^b" must not
	# match after an embedded newline unless /m is in effect.
	# Takes one argument, the label used to name both tests.
	sub func ($) {
	    my ($label) = @_;
	    my $subject = "a\nb";
	    ok( $subject !~ /^b/, $label );
	    ok( $subject =~ /^b/m, "$label - with /m" );
	}
	3211	func "standalone";
	3212	$_ = "x"; s/x/func "in subst"/e;
	3213	$_ = "x"; s/x/func "in multiline subst"/em;
	3214	#$_ = "x"; /x(?{func "in regexp"})/;
	3215	#$_ = "x"; /x(?{func "in multiline regexp"})/m;
	3216
	3217	# bug RT#19049
	3218	$_="abcdef\n";
	3219	@x = m/./g;
	3220	ok("abcde" eq "$`", 'RT#19049 - global match not setting $`');
	3221
	3222	ok("123\x{100}" =~ /^.1.23\x{100}$/, 'uft8 + multiple floating substr');
	3223
	3224	# LATIN SMALL/CAPITAL LETTER A WITH MACRON
	3225	ok(" \x{101}" =~ qr/\x{100}/i,
	3226	"<20030808193656.5109.1@llama.ni-s.u-net.com>");
	3227
	3228	# LATIN SMALL/CAPITAL LETTER A WITH RING BELOW
	3229	ok(" \x{1E01}" =~ qr/\x{1E00}/i,
	3230	"<20030808193656.5109.1@llama.ni-s.u-net.com>");
	3231
	3232	# DESERET SMALL/CAPITAL LETTER LONG I
	3233	ok(" \x{10428}" =~ qr/\x{10400}/i,
	3234	"<20030808193656.5109.1@llama.ni-s.u-net.com>");
	3235
	3236	# LATIN SMALL/CAPITAL LETTER A WITH RING BELOW + 'X'
	3237	ok(" \x{1E01}x" =~ qr/\x{1E00}X/i,
	3238	"<20030808193656.5109.1@llama.ni-s.u-net.com>");
	3239
	3240	{
	3241	# [perl #23769] Unicode regex broken on simple example
	3242	# regrepeat() didn't handle UTF-8 EXACT case right.
	3243
	3244	my $s = "\x{a0}\x{a0}\x{a0}\x{100}"; chop $s;
	3245
	3246	ok($s =~ /\x{a0}/, "[perl #23769]");
	3247	ok($s =~ /\x{a0}+/, "[perl #23769]");
	3248	ok($s =~ /\x{a0}\x{a0}/, "[perl #23769]");
	3249
	3250	ok("aaa\x{100}" =~ /(a+)/, "[perl #23769] easy invariant");
	3251	ok($1 eq "aaa", "[perl #23769]");
	3252
	3253	ok("\xa0\xa0\xa0\x{100}" =~ /(\xa0+)/, "[perl #23769] regrepeat invariant");
	3254	ok($1 eq "\xa0\xa0\xa0", "[perl #23769]");
	3255
	3256	ok("ababab\x{100} " =~ /((?:ab)+)/, "[perl #23769] hard invariant");
	3257	ok($1 eq "ababab", "[perl #23769]");
	3258
	3259	ok("\xa0\xa1\xa0\xa1\xa0\xa1\x{100}" =~ /((?:\xa0\xa1)+)/, "[perl #23769] hard variant");
	3260	ok($1 eq "\xa0\xa1\xa0\xa1\xa0\xa1", "[perl #23769]");
	3261
	3262	ok("aaa\x{100} " =~ /(a+?)/, "[perl #23769] easy invariant");
	3263	ok($1 eq "a", "[perl #23769]");
	3264
	3265	ok("\xa0\xa0\xa0\x{100} " =~ /(\xa0+?)/, "[perl #23769] regrepeat variant");
	3266	ok($1 eq "\xa0", "[perl #23769]");
	3267
	3268	ok("ababab\x{100} " =~ /((?:ab)+?)/, "[perl #23769] hard invariant");
	3269	ok($1 eq "ab", "[perl #23769]");
	3270
	3271	ok("\xa0\xa1\xa0\xa1\xa0\xa1\x{100}" =~ /((?:\xa0\xa1)+?)/, "[perl #23769] hard variant");
	3272	ok($1 eq "\xa0\xa1", "[perl #23769]");
	3273
	3274	ok("\xc4\xc4\xc4" !~ /(\x{100}+)/, "[perl #23769] don't match first byte of utf8 representation");
	3275	ok("\xc4\xc4\xc4" !~ /(\x{100}+?)/, "[perl #23769] don't match first byte of utf8 representation");
	3276	}
	3277
	3278	for (120 .. 130) {
	3279	my $head = 'x' x $_;
	3280	for my $tail ('\x{0061}', '\x{1234}') {
	3281	ok(
	3282	eval qq{ "$head$tail" =~ /$head$tail/ },
	3283	'\x{...} misparsed in regexp near 127 char EXACT limit'
	3284	);
	3285	}
	3286	}
	3287
	3288	# perl #25269: panic: pp_match start/end pointers
	3289	ok("a-bc" eq eval {
	3290	my($x, $y) = "bca" =~ /^(?=.(a)).(bc)/;
	3291	"$x-$y";
	3292	}, 'captures can move backwards in string');
	3293
	3294	# perl #27940: \cA not recognized in character classes
	3295	ok("a\cAb" =~ /\cA/, '\cA in pattern');
	3296	ok("a\cAb" =~ /[\cA]/, '\cA in character class');
	3297	ok("a\cAb" =~ /[\cA-\cB]/, '\cA in character class range');
	3298	ok("abc" =~ /[^\cA-\cB]/, '\cA in negated character class range');
	3299	ok("a\cBb" =~ /[\cA-\cC]/, '\cB in character class range');
	3300	ok("a\cCbc" =~ /[^\cA-\cB]/, '\cC in negated character class range');
	3301	ok("a\cAb" =~ /(??{"\cA"})/, '\cA in ??{} pattern');
	3302	ok("ab" !~ /a\cIb/x, '\cI in pattern');
	3303
	3304	# perl #28532: optional zero-width match at end of string is ignored
	3305	ok(("abc" =~ /^abc(\z)?/) && defined($1),
	3306	'optional zero-width match at end of string');
	3307	ok(("abc" =~ /^abc(\z)??/) && !defined($1),
	3308	'optional zero-width match at end of string');
	3309
	3310
	3311
	{ # TRIE related
	    # An alternation of identical words must try the code block once, not
	    # once per branch.  The branches are separated by a real "|"; an
	    # escaped "\|" would turn the group into one literal string that
	    # "words" cannot match, leaving @got empty.
	    my @got=();
	    "words"=~/(word|word|word)(?{push @got,$1})s$/;
	    ok(@got==1,"TRIE optimation is working") or warn "# @got";
	    @got=();
	    "words"=~/(word|word|word)(?{push @got,$1})s$/i;
	    ok(@got==1,"TRIEF optimisation is working") or warn "# @got";

	    # Build one large alternation from 100 random integers and check that
	    # every number matches it on its own ...
	    my @nums=map {int rand 1000} 1..100;
	    my $re="(".(join "|",@nums).")";
	    $re=qr/\b$re\b/;

	    foreach (@nums) {
	        ok($_=~/$re/,"Trie nums");
	    }

	    # ... and that a global match over the joined list finds each number
	    # at least as often as it was generated.
	    $_=join " ", @nums;
	    @got=();
	    push @got,$1 while /$re/g;

	    my %count;
	    $count{$_}++ for @got;
	    my $ok=1;
	    for (@nums) {
	        $ok=0 if --$count{$_}<0;
	    }
	    ok($ok,"Trie min count matches");
	}
	3339
	3340
	# TRIE related
	# Each case-insensitive alternation below has one branch that starts with
	# a non-ASCII letter; the target string uses a different code point for
	# that letter, and $1 must be the text as it appears in the target.

	# LATIN SMALL/CAPITAL LETTER A WITH MACRON
	ok(("foba \x{101}foo" =~ qr/(foo|\x{100}foo|bar)/i) && $1 eq "\x{101}foo",
	    "TRIEF + LATIN SMALL/CAPITAL LETTER A WITH MACRON");

	# LATIN SMALL/CAPITAL LETTER A WITH RING BELOW
	ok(("foba \x{1E01}foo" =~ qr/(foo|\x{1E00}foo|bar)/i) && $1 eq "\x{1E01}foo",
	    "TRIEF + LATIN SMALL/CAPITAL LETTER A WITH RING BELOW");

	# DESERET SMALL/CAPITAL LETTER LONG I
	ok(("foba \x{10428}foo" =~ qr/(foo|\x{10400}foo|bar)/i) && $1 eq "\x{10428}foo",
	    "TRIEF + DESERET SMALL/CAPITAL LETTER LONG I");

	# LATIN SMALL/CAPITAL LETTER A WITH RING BELOW + 'X'
	ok(("foba \x{1E01}xfoo" =~ qr/(foo|\x{1E00}Xfoo|bar)/i) && $1 eq "\x{1E01}xfoo",
	    "TRIEF + LATIN SMALL/CAPITAL LETTER A WITH RING BELOW + 'X'");
	3357
	{   # TRIE related
	    # Case-insensitive alternations involving LATIN SMALL LETTER SHARP S.
	    # The sharp-s branch is tried in first, middle and last position, and
	    # the pattern side is also spelled "ss" / "SS".

	    use charnames ':full';

	    $s = "\N{LATIN SMALL LETTER SHARP S}";
	    ok(("foba ba$s" =~ qr/(foo|Ba$s|bar)/i)
	        && $1 eq "ba$s",
	        "TRIEF + LATIN SMALL LETTER SHARP S =~ ss");
	    ok(("foba ba$s" =~ qr/(Ba$s|foo|bar)/i)
	        && $1 eq "ba$s",
	        "TRIEF + LATIN SMALL LETTER SHARP S =~ ss");
	    ok(("foba ba$s" =~ qr/(foo|bar|Ba$s)/i)
	        && $1 eq "ba$s",
	        "TRIEF + LATIN SMALL LETTER SHARP S =~ ss");

	    ok(("foba ba$s" =~ qr/(foo|Bass|bar)/i)
	        && $1 eq "ba$s",
	        "TRIEF + LATIN SMALL LETTER SHARP S =~ ss");

	    ok(("foba ba$s" =~ qr/(foo|BaSS|bar)/i)
	        && $1 eq "ba$s",
	        "TRIEF + LATIN SMALL LETTER SHARP S =~ SS");

	    # Alternatives sharing the prefix "a<sharp s>", followed by a class
	    # and an optional run of sharp-s characters.
	    ok(("foba ba${s}pxySS$s$s" =~ qr/(b(?:a${s}t|a${s}f|a${s}p)[xy]+$s*)/i)
	        && $1 eq "ba${s}pxySS$s$s",
	        "COMMON PREFIX TRIEF + LATIN SMALL LETTER SHARP S");
	}
	3387
	3388
	3389
	# Very large alternation: five ordinary words plus every single character
	# from chr(255) to chr(20000).  Set PERL_SKIP_PSYCHO_TEST to bypass it; a
	# placeholder pass keeps the test count unchanged.
	if ($ENV{PERL_SKIP_PSYCHO_TEST}) {
	    ok(1,'Skipped Psycho');
	}
	else {
	    my @words = qw(these are some normal words);
	    my @single_chars = map { chr } 255 .. 20000;
	    my $psycho = join '|', @words, @single_chars;
	    ok(('these' =~ /($psycho)/) && $1 eq 'these','Pyscho');
	}
	3397
	3398	# [perl #36207] mixed utf8 / latin-1 and case folding
	3399
	{
	    # $utf8 is built together with \x{100} and then chopped, leaving only
	    # \xe9 (presumably still stored in the wide-character encoding);
	    # $latin1 is the same character written as a plain byte.
	    my $utf8 = "\xe9\x{100}"; chop $utf8;
	    my $latin1 = "\xe9";

	    # Wide-encoded target, byte-encoded pattern.
	    ok($utf8 =~ /\xe9/i, "utf8/latin");
	    ok($utf8 =~ /$latin1/i, "utf8/latin runtime");
	    ok($utf8 =~ /(abc|\xe9)/i, "utf8/latin trie");
	    ok($utf8 =~ /(abc|$latin1)/i, "utf8/latin trie runtime");

	    # Byte-encoded target, wide-encoded pattern.
	    ok("\xe9" =~ /$utf8/i, "# TODO latin/utf8");
	    ok("\xe9" =~ /(abc|$utf8)/i, "# latin/utf8 trie");
	    ok($latin1 =~ /$utf8/i, "# TODO latin/utf8 runtime");
	    ok($latin1 =~ /(abc|$utf8)/i, "# latin/utf8 trie runtime");
	}
	3414
	3415	# [perl #37038] Global regular matches generate invalid pointers
	3416
	3417	{ # [perl #37038]: overwrite the matched string and then read a later capture
	3418	my $s = "abcd";
	3419	$s =~ /(..)(..)/g;
	3420	$s = $1; # overwrites the string the captures were taken from
	3421	$s = $2; # $2 must still read as 'cd' after that assignment
	3422	ok($s eq 'cd',
	3423	"# assigning to original string should not corrupt match vars");
	3424	}
	3425
	3426	{ # //g match against the return value of a method call must not die
	3427	package wooosh;
	3428	sub gloople {
	3429	"!";
	3430	}
	3431	package main;
	3432
	3433	my $aeek = bless {}, 'wooosh';
	3434	eval {$aeek->gloople() =~ /(.)/g;}; # only the absence of an exception is checked
	3435	ok($@ eq "", "//g match against return value of sub") or print "# $@\n";
	3436	}
	3437
	3438	{ # same check as the method-call case, using a plain function call in package main
	3439	sub gloople {
	3440	"!";
	3441	}
	3442	eval {gloople() =~ /(.)/g;}; # only the absence of an exception is checked
	3443	ok($@ eq "", "# 26410 didn't affect sub calls for some reason")
	3444	or print "# $@\n";
	3445	}
	3446
	3447	{ # //g against an lvalue method: the second iteration should continue after the first match
	3448	package lv;
	3449	$var = "abc";
	3450	sub variable : lvalue { $var } # returns the package variable itself as an lvalue
	3451
	3452	package main;
	3453	my $o = bless [], "lv";
	3454	my $f = "";
	3455	eval { for (1..2) { $f .= $1 if $o->variable =~ /(.)/g } }; # expected to collect "a" then "b"
	3456	ok($f eq "ab", "pos retained between calls # TODO") or print "# $@\n";
	3457	}
	3458
	3459	{ # same lvalue //g check, using a plain lvalue function in package main
	3460	$var = "abc";
	3461	sub variable : lvalue { $var } # returns the package variable itself as an lvalue
	3462
	3463	my $f = "";
	3464	eval { for (1..2) { $f .= $1 if variable() =~ /(.)/g } }; # expected to collect "a" then "b"
	3465	ok($f eq "ab", "pos retained between calls # TODO") or print "# $@\n";
	3466	}
	3467
	3468	# [perl #37836] Simple Regex causes SEGV when run on specific data
	3469	if ($ordA == 193) { # $ordA is set outside this section; NOTE(review): presumably ord("A"), 193 on EBCDIC - confirm
	3470	print "ok $test # Skip: in EBCDIC\n"; $test++; # hand-written skip line, so the counter is bumped manually
	3471	} else {
	3472	no warnings 'utf8';
	3473	$_ = pack('U0C2', 0xa2, 0xf8); # ill-formed UTF-8
	3474	my $ret = 0;
	3475	eval { $ret = s/[\0]+//g }; # eval so that a die is contained; $ret then stays 0
	3476	ok($ret == 0, "ill-formed UTF-8 doesn't match NUL in class");
	3477	}
	3478
	3479	{ # [perl #38293] chr(65535) should be allowed in regexes
	3480	no warnings 'utf8'; # to allow non-characters
	3481	my($c, $r, $s);
	3482
	3483	$c = chr 0xffff;
	3484	$c =~ s/$c//g; # the character itself is the whole pattern
	3485	ok($c eq "", "U+FFFF, parsed as atom");
	3486
	3487	$c = chr 0xffff;
	3488	$r = "\\$c"; # pattern text: a backslash followed by U+FFFF
	3489	$c =~ s/$r//g;
	3490	ok($c eq "", "U+FFFF backslashed, parsed as atom");
	3491
	3492	$c = chr 0xffff;
	3493	$c =~ s/[$c]//g; # the character as the only member of a bracketed class
	3494	ok($c eq "", "U+FFFF, parsed in class");
	3495
	3496	$c = chr 0xffff;
	3497	$r = "[\\$c]"; # pattern text: a class holding backslash + U+FFFF
	3498	$c =~ s/$r//g;
	3499	ok($c eq "", "U+FFFF backslashed, parsed in class");
	3500
	3501	$s = "A\x{ffff}B";
	3502	$s =~ s/\x{ffff}//i; # case-insensitive literal
	3503	ok($s eq "AB", "U+FFFF, EXACTF");
	3504
	3505	$s = "\x{ffff}A";
	3506	$s =~ s/\bA//; # \b must hold between U+FFFF and "A"
	3507	ok($s eq "\x{ffff}", "U+FFFF, BOUND");
	3508
	3509	$s = "\x{ffff}!";
	3510	$s =~ s/\B!//; # \B must hold between U+FFFF and "!"
	3511	ok($s eq "\x{ffff}", "U+FFFF, NBOUND");
	3512	} # non-characters end
	3513
	{
	    # https://rt.perl.org/rt3/Ticket/Display.html?id=39583
	    # A non-greedy (.*?) has to run across 32767 characters before the
	    # four-delimiter terminator; check the match, the remainder and $1.

	    # The printing characters
	    my @chars = ("A".."Z");
	    my $delim = ",";
	    my $size = 32771 - 4;
	    my $str = '';

	    # Create some random junk.  The counter is implicit, so no package
	    # global is left behind.
	    $str .= $chars[int(rand(@chars))] for 1 .. $size;

	    $str .= ($delim x 4);
	    my $res;
	    my $matched;
	    if ($str =~ s/^(.*?)${delim}{4}//s) {
	        $res = $1;
	        $matched=1;
	    }
	    ok($matched,'pattern matches');
	    ok(length($str)==0,"Empty string");
	    ok(defined($res) && length($res)==$size,"\$1 is correct size");
	}
	3539
	{   # related to [perl #27940]
	    # "@-" and "@+" written directly in a pattern must be taken literally,
	    # whether or not the "@" belongs to a \c@ escape.
	    ok("\0-A" =~ /\c@-A/, '@- should not be interpolated in a pattern');
	    ok("\0\0A" =~ /\c@+A/, '@+ should not be interpolated in a pattern');
	    ok("X\@-A" =~ /X@-A/, '@- should not be interpolated in a pattern');
	    ok("X\@\@A" =~ /X@+A/, '@+ should not be interpolated in a pattern');

	    # \c@ followed by each regex metacharacter that can come after an atom.
	    ok("X\0A" =~ /X\c@?A/,  '\c@?');
	    ok("X\0A" =~ /X\c@*A/,  '\c@*');
	    ok("X\0A" =~ /X\c@(A)/, '\c@(');
	    ok("X\0A" =~ /X(\c@)A/, '\c@)');
	    ok("X\0A" =~ /X\c@|ZA/, '\c@|');

	    # The same with a bare "@".
	    ok("X\@A" =~ /X@?A/,  '@?');
	    ok("X\@A" =~ /X@*A/,  '@*');
	    ok("X\@A" =~ /X@(A)/, '@(');
	    ok("X\@A" =~ /X(@)A/, '@)');
	    ok("X\@A" =~ /X@|ZA/, '@|');

	    # The explicit @{+} / @{-} forms do interpolate; the match on 'abc'
	    # just before gives @+ and @- known contents.
	    local $" = ','; # non-whitespace and non-RE-specific
	    ok('abc' =~ /(.)(.)(.)/, 'the last successful match is bogus');
	    ok("A@+B" =~ /A@{+}B/, 'interpolation of @+ in /@{+}/');
	    ok("A@-B" =~ /A@{-}B/, 'interpolation of @- in /@{-}/');
	    ok("A@+B" =~ /A@{+}B/x, 'interpolation of @+ in /@{+}/x');
	    ok("A@-B" =~ /A@{-}B/x, 'interpolation of @- in /@{-}/x');
	}
	3565
	3566	{ # custom \N{...} names supplied by the Cname module loaded below
	3567	use lib 'lib';
	3568	use Cname;
	3569
	3570	ok('fooB'=~/\N{foo}[\N{B}\N{b}]/,"Passthrough charname");
	3571	$test=1233; my $handle=make_must_warn('Ignoring excess chars from'); # hard-codes the test counter; make_must_warn is defined outside this section
	3572	$handle->('q(xxWxx) =~ /[\N{WARN}]/');
	3573	{
	3574	my $code;
	3575	my $w="";
	3576	local $SIG{__WARN__} = sub { $w.=shift }; # collect warnings into $w
	3577	eval($code=<<'EOFTEST') or die "$@\n$code\n";
	3578	{
	3579	use warnings;
	3580
	3581	#1234
	3582	ok("\0" !~ /[\N{EMPTY-STR}XY]/,
	3583	"Zerolength charname in charclass doesnt match \0");
	3584	1;
	3585	}
	3586	EOFTEST
	3587	ok($w=~/Ignoring zero length/,
	3588	"Got expected zero length warning");
	3589	warn $code; # NOTE(review): unconditional; with the handler above still localized this only appends to $w - looks like leftover debugging
	3590
	3591	}
	3592	$handle= make_must_warn('Ignoring zero length');
	3593	$handle->('qq(\\0) =~ /[\N{EMPTY-STR}XY]/');
	3594	ok('AB'=~/(\N{EVIL})/ && $1 eq 'A',"Charname caching $1");
	3595	ok('ABC'=~/(\N{EVIL})/,"Charname caching $1"); # NOTE(review): same name, longer target; what \N{EVIL} yields depends on Cname - confirm there
	3596	ok('xy'=~/x\N{EMPTY-STR}y/, 'Empty string charname produces NOTHING node');
	3597	ok(''=~/\N{EMPTY-STR}/, 'Empty string charname produces NOTHING node 2');
	3598
	3599	}
	3600	{ # \N{...} names inside classes and literal patterns, using the full charnames table
	3601	print "# MORE LATIN SMALL LETTER SHARP S\n";
	3602
	3603	use charnames ':full';
	3604
	3605	#see also test #835
	3606	ok("ss" =~ /[\N{LATIN SMALL LETTER SHARP S}x]/i,
	3607	"unoptimized named sequence in class 1");
	3608	ok("SS" =~ /[\N{LATIN SMALL LETTER SHARP S}x]/i,
	3609	"unoptimized named sequence in class 2");
	3610	ok("\N{LATIN SMALL LETTER SHARP S}" =~ /[\N{LATIN SMALL LETTER SHARP S}x]/,
	3611	"unoptimized named sequence in class 3");
	3612	ok("\N{LATIN SMALL LETTER SHARP S}" =~ /[\N{LATIN SMALL LETTER SHARP S}x]/i,
	3613	"unoptimized named sequence in class 4");
	3614
	3615	ok('aabc' !~ /a\N{PLUS SIGN}b/,'/a\N{PLUS SIGN}b/ against aabc'); # the named "+" must act as a literal, not a quantifier
	3616	ok('a+bc' =~ /a\N{PLUS SIGN}b/,'/a\N{PLUS SIGN}b/ against a+bc');
	3617	ok('a+bc' =~ /a\N{PLUS SIGN}b/,'/a\N{PLUS SIGN}b/ against a+bc'); # identical to the previous assertion; it still counts towards the plan
	3618
	3619	ok(' A B'=~/\N{SPACE}\N{U+0041}\N{SPACE}\N{U+0042}/,
	3620	'Intermixed named and unicode escapes 1');
	3621	ok("\N{SPACE}\N{U+0041}\N{SPACE}\N{U+0042}"=~
	3622	/\N{SPACE}\N{U+0041}\N{SPACE}\N{U+0042}/,
	3623	'Intermixed named and unicode escapes 2');
	3624	ok("\N{SPACE}\N{U+0041}\N{SPACE}\N{U+0042} 3"=~
	3625	/[\N{SPACE}\N{U+0041}][\N{SPACE}\N{U+0042}]/,
	3626	'Intermixed named and unicode escapes');
	3627	}
	# Self-referential pattern for one balanced {...} group: inside the
	# braces, any number of non-brace runs or nested groups, the latter
	# matched by re-entering $brackets through (??{ }).
	$brackets = qr{
	    {  (?> [^{}]+ | (??{ $brackets }) )* }
	}x;
	# The outer "{" is never closed, so no balanced group starts at position 0.
	ok("{b{c}d" !~ m/^((??{ $brackets }))/, "bracket mismatch");
	3632
	SKIP:{
	    # Recursive <...> matcher using (?1).  Each time a bracketed group is
	    # closed, its inner text ($2) is pushed onto @stack; @expect lists the
	    # values in the order they are expected.
	    our @stack=();
	    my @expect=qw(
	        stuff1
	        stuff2
	        <stuff1>and<stuff2>
	        right
	        <right>
	        <<right>>
	        <<<right>>>
	        <<stuff1>and<stuff2>><<<<right>>>>
	    );

	    local $_='<<<stuff1>and<stuff2>><<<<right>>>>>';
	    ok(/^(<((?:(?>[^<>]+)|(?1))*)>(?{push @stack, $2 }))$/,
	        "Recursion should match");
	    ok(@stack==@expect)
	        or skip("Won't test individual results as count isn't equal",
	                0+@expect);
	    # Compare position by position.  Iterating over the values of @expect
	    # would numify every string to 0 and only ever compare element 0.
	    foreach my $idx (0 .. $#expect) {
	        ok($expect[$idx] eq $stack[$idx],
	            "Expecting '$expect[$idx]' at stack pos #$idx");
	    }

	}
	3658	{ # named capture plus \k backreference: a digit run followed by itself collapses to one copy
	3659	my $s='123453456';
	3660	$s=~s/(?<digits>\d+)\k<digits>/$+{digits}/; # angle-bracket spelling of the group name
	3661	ok($s eq '123456','Named capture (angle brackets) s///');
	3662	$s='123453456';
	3663	$s=~s/(?'digits'\d+)\k'digits'/$+{digits}/; # single-quote spelling of the same construct
	3664	ok($s eq '123456','Named capture (single quotes) s///');
	3665	}
	# iseq($got, $expect [, $name])
	#
	# String-equality assertion for this test file.  Prints one TAP line
	# ("ok N - ..." or "not ok N - ...") numbered from the package variable
	# $test, adds the caller's line number to the description, and increments
	# $test.  When $name is false the package variable $Message is used as
	# the description.  On failure the expected and actual values are printed
	# as "#" diagnostics.  Returns true when the two values compare equal.
	sub iseq($$;$) {
	    my ($got, $expect, $name) = @_;

	    # Quote defined values and spell out undef, so undef and the empty
	    # string compare (and print) differently.
	    $_ = defined($_) ? "'$_'" : "undef"
	        for $got, $expect;

	    my $ok = $got eq $expect;
	    my $line = (caller)[2];

	    printf "%sok %d - %s\n", ($ok ? "" : "not "), $test,
	        ($name || $Message) . "\tLine " . $line;

	    printf "# Failed test at line %d\n" .
	           "# expected: %s\n" .
	           "# result: %s\n",
	           $line, $expect, $got
	        unless $ok;

	    $test++;
	    return $ok;
	}
	3686	{ # %+ after a match with three named groups: element fetch, each, keys and values
	3687	my $s='foo bar baz';
	3688	my (@k,@v,@fetch,$res);
	3689	my $count= 0;
	3690	my @names=qw($+{A} $+{B} $+{C}); # qw does not interpolate: these are literal labels used as test names
	3691	if ($s=~/(?<A>foo)\s+(?<B>bar)?\s+(?<C>baz)/) {
	3692	while (my ($k,$v)=each(%+)) { # count the pairs that each() yields
	3693	$count++;
	3694	}
	3695	@k=sort keys(%+);
	3696	@v=sort values(%+);
	3697	$res=1;
	3698	push @fetch, # pair each named fetch with the numbered capture it should equal
	3699	[ "$+{A}", "$1" ],
	3700	[ "$+{B}", "$2" ],
	3701	[ "$+{C}", "$3" ],
	3702	;
	3703	}
	3704	foreach (0..2) {
	3705	if ($fetch[$_]) {
	3706	iseq($fetch[$_][0],$fetch[$_][1],$names[$_]);
	3707	} else {
	3708	ok(0, $names[$_]); # the match failed, so record a failure and keep the test count stable
	3709	}
	3710	}
	3711	iseq($res,1,"$s~=/(?<A>foo)\s+(?<B>bar)?\s+(?<C>baz)/");
	3712	iseq($count,3,"Got 3 keys in %+ via each");
	3713	iseq(0+@k, 3, 'Got 3 keys in %+ via keys');
	3714	iseq("@k","A B C", "Got expected keys");
	3715	iseq("@v","bar baz foo", "Got expected values");
	3716	eval'
	3717	print for $+{this_key_doesnt_exist};
	3718	';
	3719	ok(!$@,'lvalue $+{...} should not throw an exception'); # the for-alias above uses the missing element in lvalue context
	3720	}
	3721
	3722	# stress test CURLYX/WHILEM.
	3723	#
	3724	# This test includes varying levels of nesting, and according to
	3725	# profiling done against build 28905, exercises every code line in the
	3726	# CURLYX and WHILEM blocks, except those related to LONGJMP, the
	3727	# super-linear cache and warnings. It executes about 0.5M regexes
	3728
	if ($ENV{PERL_SKIP_PSYCHO_TEST}){
	    # "# Skip" is the directive form already used by the EBCDIC skip
	    # earlier in this file; without the "#" the text is only a description.
	    printf "ok %d # Skip: No psycho tests\n", $test++;
	} else {
	    # Twelve capture groups, one per letter a..l, nested at varying depths
	    # under *, + and {n,m} quantifiers.  "z" is accepted inside every
	    # group; "x" appears nowhere in the pattern.
	    my $r = qr/^
	        (?:
	            ( (?:a|z+)+ )
	            (?:
	                ( (?:b|z+){3,}? )
	                (
	                    (?:
	                        (?:
	                            (?:c|z+){1,1}?z
	                        )?
	                        (?:c|z+){1,1}
	                    )*
	                )
	                (?:z*){2,}
	                ( (?:z+|d)+ )
	                (?:
	                    ( (?:e|z+)+ )
	                )*
	                ( (?:f|z+)+ )
	            )*
	            ( (?:z+|g)+ )
	            (?:
	                ( (?:h|z+)+ )
	            )*
	            ( (?:i|z+)+ )
	        )+
	        ( (?:j|z+)+ )
	        (?:
	            ( (?:k|z+)+ )
	        )*
	        ( (?:l|z+)+ )
	    $/x;

	    # Try every combination of "x", a short run and a longer run for each
	    # of the twelve letters.  A string containing "x" must not match; any
	    # other string must match and the twelve captures, concatenated, must
	    # reproduce it.  The first violation is recorded in $msg and ends the
	    # whole search.
	    my $ok = 1;
	    my $msg = "CURLYX stress test";
	    OUTER:
	    for my $a ("x","a","aa") {
	      for my $b ("x","bbb","bbbb") {
	        my $bs = $a.$b;
	        for my $c ("x","c","cc") {
	          my $cs = $bs.$c;
	          for my $d ("x","d","dd") {
	            my $ds = $cs.$d;
	            for my $e ("x","e","ee") {
	              my $es = $ds.$e;
	              for my $f ("x","f","ff") {
	                my $fs = $es.$f;
	                for my $g ("x","g","gg") {
	                  my $gs = $fs.$g;
	                  for my $h ("x","h","hh") {
	                    my $hs = $gs.$h;
	                    for my $i ("x","i","ii") {
	                      my $is = $hs.$i;
	                      for my $j ("x","j","jj") {
	                        my $js = $is.$j;
	                        for my $k ("x","k","kk") {
	                          my $ks = $js.$k;
	                          for my $l ("x","l","ll") {
	                            my $ls = $ks.$l;
	                            if ($ls =~ $r) {
	                              if ($ls =~ /x/) {
	                                $msg .= ": unexpected match for [$ls]";
	                                $ok = 0;
	                                last OUTER;
	                              }
	                              my $cap = "$1$2$3$4$5$6$7$8$9$10$11$12";
	                              unless ($ls eq $cap) {
	                                $msg .= ": capture: [$ls], got [$cap]";
	                                $ok = 0;
	                                last OUTER;
	                              }
	                            }
	                            else {
	                              unless ($ls =~ /x/) {
	                                # Append, like the two branches above, so the
	                                # test name stays in the message.
	                                $msg .= ": failed for [$ls]";
	                                $ok = 0;
	                                last OUTER;
	                              }
	                            }
	                          }
	                        }
	                      }
	                    }
	                  }
	                }
	              }
	            }
	          }
	        }
	      }
	    }
	    ok($ok, $msg);
	}
	3826
	3827	# \, breaks {3,4}: with the comma escaped, {3\,4} must be literal text rather than a quantifier
	3828	ok("xaaay" !~ /xa{3\,4}y/, "\, in a pattern");
	3829	ok("xa{3,4}y" =~ /xa{3\,4}y/, "\, in a pattern");
	3830
	3831	# \c\ followed by _: must be read as the escape \c\ and then a literal "_", not as a backslash-escaped "_"
	3832	ok("x\c_y" !~ /x\c\_y/, "\_ in a pattern");
	3833	ok("x\c\_y" =~ /x\c\_y/, "\_ in a pattern");
	3834
	3835	# \c\ followed by other characters
	3836	for my $c ("z", "\0", "!", chr(254), chr(256)) {
	3837	my $targ = "a\034$c"; # \034 is the character that \c\ stands for in these tests
	3838	my $reg = "a\\c\\$c"; # pattern source: a, \c\, then the raw character
	3839	ok(eval("qq/$targ/ =~ /$reg/"), "\\c\\ in pattern");
	3840	}
	3841
	3842	{ # RT#36046: a //g loop over a pattern without capture groups
	3843	my $str='abc';
	3844	my $count=0;
	3845	my $mval=0;
	3846	my $pval=0;
	3847	while ($str=~/b/g) { $mval=$#-; $pval=$#+; $count++ } # record the last index of @- and @+ inside the loop body
	3848	iseq($mval,0,"\@- should be empty [RT#36046]"); # last index 0: only the whole-match entry exists
	3849	iseq($pval,0,"\@+ should be empty [RT#36046]");
	3850	iseq($count,1,"should have matched once only [RT#36046]");
	3851	}
	3852
	{   # Test the (*PRUNE) pattern
	    # $count records how often the code block is reached before the
	    # forced (*FAIL).
	    our $count = 0;
	    'aaab'=~/a+b?(?{$count++})(*FAIL)/;
	    iseq($count,9,"expect 9 for no (*PRUNE)");
	    $count = 0;
	    'aaab'=~/a+b?(*PRUNE)(?{$count++})(*FAIL)/;
	    iseq($count,3,"expect 3 with (*PRUNE)");
	    local $_='aaab';
	    $count=0;
	    1 while /.(*PRUNE)(?{$count++})(*FAIL)/g;
	    iseq($count,4,"/.(*PRUNE)/");

	    # The same two checks with the verb supplied through (??{ }).
	    $count = 0;
	    'aaab'=~/a+b?(??{'(*PRUNE)'})(?{$count++})(*FAIL)/;
	    iseq($count,3,"expect 3 with (*PRUNE)");
	    local $_='aaab';
	    $count=0;
	    1 while /.(??{'(*PRUNE)'})(?{$count++})(*FAIL)/g;
	    iseq($count,4,"/.(*PRUNE)/");
	}
	{   # Test the (*SKIP) pattern
	    # $count records how often the code block is reached before the
	    # forced (*FAIL).
	    our $count = 0;
	    'aaab'=~/a+b?(*SKIP)(?{$count++})(*FAIL)/;
	    iseq($count,1,"expect 1 with (*SKIP)");
	    local $_='aaab';
	    $count=0;
	    1 while /.(*SKIP)(?{$count++})(*FAIL)/g;
	    iseq($count,4,"/.(*SKIP)/");
	    $_='aaabaaab';
	    $count=0;
	    our @res=();
	    1 while /(a+b?)(*SKIP)(?{$count++; push @res,$1})(*FAIL)/g;
	    iseq($count,2,"Expect 2 with (*SKIP)" );
	    iseq("@res","aaab aaab","adjacent (*SKIP) works as expected" );
	}
	{   # Test the (*SKIP) pattern
	    # Same checks as the plain (*SKIP) block, with a (*MARK:foo) placed
	    # directly before the unnamed (*SKIP); the expected counts are the same.
	    our $count = 0;
	    'aaab'=~/a+b?(*MARK:foo)(*SKIP)(?{$count++})(*FAIL)/;
	    iseq($count,1,"expect 1 with (*SKIP)");
	    local $_='aaab';
	    $count=0;
	    1 while /.(*MARK:foo)(*SKIP)(?{$count++})(*FAIL)/g;
	    iseq($count,4,"/.(*SKIP)/");
	    $_='aaabaaab';
	    $count=0;
	    our @res=();
	    1 while /(a+b?)(*MARK:foo)(*SKIP)(?{$count++; push @res,$1})(*FAIL)/g;
	    iseq($count,2,"Expect 2 with (*SKIP)" );
	    iseq("@res","aaab aaab","adjacent (*SKIP) works as expected" );
	}
	{   # Test the (*SKIP) pattern
	    # Named form: (*SKIP:a) refers to the earlier (*MARK:a); a second,
	    # differently named mark sits between the two.
	    our $count = 0;
	    'aaab'=~/a*(*MARK:a)b?(*MARK:b)(*SKIP:a)(?{$count++})(*FAIL)/;
	    iseq($count,3,"expect 3 with *MARK:a)b?(*MARK:b)(*SKIP:a)");
	    local $_='aaabaaab';
	    $count=0;
	    our @res=();
	    1 while /(a*(*MARK:a)b?)(*MARK:x)(*SKIP:a)(?{$count++; push @res,$1})(*FAIL)/g;
	    iseq($count,5,"Expect 5 with (*MARK:a)b?)(*MARK:x)(*SKIP:a)" );
	    iseq("@res","aaab b aaab b ","adjacent (*MARK:a)b?)(*MARK:x)(*SKIP:a) works as expected" );
	}
	{   # Test the (*COMMIT) pattern
	    # In every case the code block is expected to be reached exactly once
	    # before the forced (*FAIL).
	    our $count = 0;
	    'aaabaaab'=~/a+b?(*COMMIT)(?{$count++})(*FAIL)/;
	    iseq($count,1,"expect 1 with (*COMMIT)");
	    local $_='aaab';
	    $count=0;
	    1 while /.(*COMMIT)(?{$count++})(*FAIL)/g;
	    iseq($count,1,"/.(*COMMIT)/");
	    $_='aaabaaab';
	    $count=0;
	    our @res=();
	    1 while /(a+b?)(*COMMIT)(?{$count++; push @res,$1})(*FAIL)/g;
	    iseq($count,1,"Expect 1 with (*COMMIT)" );
	    iseq("@res","aaab","adjacent (*COMMIT) works as expected" );
	}
	3928	{
	3929	# Test named commits and the $REGERROR var
	3930	our $REGERROR;
	3931	for my $name ('',':foo') # verb without a name, then with the name "foo"
	3932	{
	3933	for my $pat ("(*PRUNE$name)",
	3934	($name? "(*MARK$name)" : "") # the named SKIP case is given a matching MARK in front of it
	3935	. "(*SKIP$name)",
	3936	"(*COMMIT$name)")
	3937	{
	3938	for my $suffix ('(*FAIL)','') # forced failure first, then a successful match
	3939	{
	3940	'aaaab'=~/a+b$pat$suffix/;
	3941	iseq(
	3942	$REGERROR,
	3943	($suffix ? ($name ? 'foo' : "1") : ""), # on failure: the verb name, or "1" when unnamed; on success: empty
	3944	"Test $pat and \$REGERROR $suffix"
	3945	);
	3946	}
	3947	}
	3948	}
	3949	}
	3950	{
	3951	# Test named commits and the $REGERROR var, this time from a package other than main
	3952	package Fnorble;
	3953	our $REGERROR; # refers to $Fnorble::REGERROR inside this block
	3954	for my $name ('',':foo') # verb without a name, then with the name "foo"
	3955	{
	3956	for my $pat ("(*PRUNE$name)",
	3957	($name? "(*MARK$name)" : "") # the named SKIP case is given a matching MARK in front of it
	3958	. "(*SKIP$name)",
	3959	"(*COMMIT$name)")
	3960	{
	3961	for my $suffix ('(*FAIL)','') # forced failure first, then a successful match
	3962	{
	3963	'aaaab'=~/a+b$pat$suffix/;
	3964	::iseq( # iseq is called through the main package, since the current package is Fnorble
	3965	$REGERROR,
	3966	($suffix ? ($name ? 'foo' : "1") : ""), # on failure: the verb name, or "1" when unnamed; on success: empty
	3967	"Test $pat and \$REGERROR $suffix"
	3968	);
	3969	}
	3970	}
	3971	}
	3972	}
	{
	    # Test named commits and the $REGERROR var
	    # Each alternative carries its own named (*COMMIT); after the forced
	    # failure $REGERROR must name the alternative that was taken.
	    local $Message = "\$REGERROR";
	    our $REGERROR;
	    for my $word (qw(bar baz bop)) {
	        $REGERROR="";
	        "aaaaa$word"=~/a+(?:bar(*COMMIT:bar)|baz(*COMMIT:baz)|bop(*COMMIT:bop))(*FAIL)/;
	        iseq($REGERROR,$word);
	    }
	}
	3983	{ #Regression test for perlbug 40684: /m anchors via an interpolated qr// object and via a literal pattern
	3984	local $Message = "RT#40684 tests:";
	3985	my $s = "abc\ndef";
	3986	my $rex = qr'^abc$'m; # single-quote delimiters: the pattern text is not interpolated
	3987	ok($s =~ m/$rex/);
	3988	ok($s =~ m/^abc$/m);
	3989	}
	{
	    # Mindnumbingly simple test of (*THEN)
	    # Neither string can satisfy the first alternative after its (*THEN);
	    # both must still match overall.
	    for ("ABC","BAX") {
	        ok(/A (*THEN) X | B (*THEN) C/x,"Simple (*THEN) test");
	    }
	}
	3996
	{
	    # $parens matches one balanced parenthesised group; (?-1) recurses
	    # into the nearest preceding capture group, so the same qr// can be
	    # interpolated twice into one pattern.
	    local $Message = "Relative Recursion";
	    my $parens=qr/(\((?:[^()]++|(?-1))*+\))/;
	    local $_='foo((2*3)+4-3) + bar(2*(3+4)-1*(2-3))';
	    my ($all,$one,$two)=('','','');
	    if (/foo $parens \s* \+ \s* bar $parens/x) {
	        $all=$&;
	        $one=$1;
	        $two=$2;
	    }
	    iseq($one, '((2*3)+4-3)');
	    iseq($two, '(2*(3+4)-1*(2-3))');
	    iseq($all, 'foo((2*3)+4-3) + bar(2*(3+4)-1*(2-3))');
	    iseq($all, $_);
	}
	4012	{ # atomic group (?>...) with a global substitution; the code block counts completed matches
	4013	my $spaces=" ";
	4014	local $_=join 'bar',$spaces,$spaces; # i.e. $spaces . 'bar' . $spaces
	4015	our $count=0;
	4016	s/(?>\s+bar)(?{$count++})//g;
	4017	iseq($_,$spaces,"SUSPEND final string"); # only the trailing $spaces should remain
	4018	iseq($count,1,"Optimiser should have prevented more than one match");
	4019	}
	{
	    # $^R must hold the value of the last (?{ }) block after a successful
	    # match, and the localized value must be undone when each inner block
	    # exits.
	    local $Message = "RT#36909 test";
	    $^R = 'Nothing';
	    {
	        local $^R = "Bad";
	        ok('x foofoo y' =~ m{
	            (foo) # $^R correctly set
	            (?{ "last regexp code result" })
	        }x);
	        iseq($^R,'last regexp code result');
	    }
	    iseq($^R,'Nothing');
	    {
	        local $^R = "Bad";

	        ok('x foofoo y' =~ m{
	            (?:foo|bar)+ # $^R correctly set
	            (?{"last regexp code result"})
	        }x);
	        iseq($^R,'last regexp code result');
	    }
	    iseq($^R,'Nothing');

	    {
	        local $^R = "Bad";
	        ok('x foofoo y' =~ m{
	            (foo|bar)\1+ # $^R undefined
	            (?{"last regexp code result"})
	        }x);
	        iseq($^R,'last regexp code result');
	    }
	    iseq($^R,'Nothing');
	}
	4053	{ # counts how often the code block after (.*) is reached when the final [bc] can never match
	4054	local $Message="RT#22395";
	4055	our $count;
	4056	for my $l (10,100,1000) {
	4057	$count=0;
	4058	('a' x $l) =~ /(.*)(?{$count++})[bc]/;
	4059	iseq( $count, $l + 1, "# TODO Should be L+1 not L*(L+3)/2 (L=$l)"); # marked TODO in the test name itself
	4060	}
	4061	}
	4062	{ # records the size of @- each time the first code block runs; the trailing ^ makes the overall match fail
	4063	local $Message = "RT#22614";
	4064	local $_='ab';
	4065	our @len=();
	4066	/(.){1,}(?{push @len,0+@-})(.){1,}(?{})^/;
	4067	iseq("@len","2 2 2");
	4068	}
	4069	{ # $& must be set after each s///gi so that all three substitutions are counted
	4070	local $Message = "RT#18209";
	4071	my $text = ' word1 word2 word3 word4 word5 word6 ';
	4072
	4073	my @words = ('word1', 'word3', 'word5');
	4074	my $count;
	4075	foreach my $word (@words){
	4076	$text =~ s/$word\s//gi; # Leave a space to separate words in the resultant str.
	4077	# The following block is the code from the bug report that was not working.
	4078	if($&){
	4079	$count++;
	4080	}
	4081	# End bad block
	4082	}
	4083	iseq($count,3);
	4084	iseq($text,' word2 word4 word6 ');
	4085	}
	{
	    # RT#6893
	    # Each line may start either at the current /g position (\G) or just
	    # after a newline.  The "last if @res>3" guard bounds the loop should
	    # the match ever stop advancing.
	    local $_= qq(A\nB\nC\n);
	    my @res;
	    while (m#(\G|\n)([^\n]*)\n#gsx)
	    {
	        push @res,"$2";
	        last if @res>3;
	    }
	    iseq("@res","A B C","RT#6893: /g pattern shouldn't infinite loop");
	}
	4097
	4098	{
	4099	# From Message-ID: <877ixs6oa6.fsf@k75.linux.bogus>
	4100	my $dow_name= "nada"; # sentinel; must be replaced by the eval'd assignment below
	4101	my $parser = "(\$dow_name) = \$time_string =~ /(D\x{e9}\\ C\x{e9}adaoin\|D\x{e9}\\ Sathairn\|\\w+\|\x{100})/";
	4102	my $time_string = "D\x{e9} C\x{e9}adaoin";
	4103	eval $parser; # the statement is built as a string, so the pattern is compiled only here
	4104	ok(!$@,"Test Eval worked");
	4105	iseq($dow_name,$time_string,"UTF8 trie common prefix extraction");
	4106	}
	4107
	4108	{ # $1 must keep its value when the matched variable is overwritten after a //g match
	4109	my $v;
	4110	($v='bar')=~/(\w+)/g; # assign and match in one expression
	4111	$v='foo'; # overwrite the variable the capture came from
	4112	iseq("$1",'bar','$1 is safe after /g - may fail due to specialized config in pp_hot.c')
	4113	}
	4114	{ # \R1 inside a qr// that is then embedded at different group depths of larger patterns
	4115	local $Message = "http://nntp.perl.org/group/perl.perl5.porters/118663";
	4116	my $qr_barR1 = qr/(bar)\R1/; # NOTE(review): \R1 looks like a relative backreference to the nearest preceding group - confirm against the perlre of this era
	4117	ok("foobarbarxyz" =~ $qr_barR1);
	4118	ok("foobarbarxyz" =~ qr/foo${qr_barR1}xyz/);
	4119	ok("foobarbarxyz" =~ qr/(foo)${qr_barR1}xyz/); # an extra group in front shifts the absolute group numbers
	4120	ok("foobarbarxyz" =~ qr/(foo)(bar)\R1xyz/); # the same pattern written out inline
	4121	ok("foobarbarxyz" =~ qr/(foo${qr_barR1})xyz/); # embedded inside another capture group
	4122	ok("foobarbarxyz" =~ qr/(foo(bar)\R1)xyz/); # the same pattern written out inline
	4123	}
	{
	    # For every combination of atom pattern, quantifier and tail, the
	    # anchored group "(<atom><quant>$)" must capture the whole test
	    # string, both with and without /m.
	    local $Message = "RT#41010";
	    my @tails=('','(?(1))','(|)','()?');
	    my @quants=('*','+');
	    # $doit->(\@patterns, @strings): run every combination against each
	    # string, with $_ aliased to the string under test.
	    my $doit=sub {
	        my $pats= shift;
	        for (@_) {
	            for my $pat (@$pats) {
	                for my $quant (@quants) {
	                    for my $tail (@tails) {
	                        my $re = "($pat$quant\$)$tail";
	                        ok(/$re/ && $1 eq $_,"'$_'=~/$re/");
	                        ok(/$re/m && $1 eq $_,"'$_'=~/$re/m");
	                    }
	                }
	            }
	        }
	    };

	    # Different ways of writing "one digit" ...
	    my @dpats=(
	        '\d',
	        '[1234567890]',
	        '(1|[23]|4|[56]|[78]|[90])',
	        '(?:1|[23]|4|[56]|[78]|[90])',
	        '(1|2|3|4|5|6|7|8|9|0)',
	        '(?:1|2|3|4|5|6|7|8|9|0)',
	    );
	    # ... and "one blank".
	    my @spats=('[ ]',' ','( |\t)','(?: |\t)','[ \t]','\s');
	    my @sstrs=(' ');
	    my @dstrs=('12345');
	    $doit->(\@spats,@sstrs);
	    $doit->(\@dpats,@dstrs);
	}
	4157
	4158	# Test counter is at bottom of file. Put new tests above here.
	4159	#-------------------------------------------------------------------
	4160	# Keep the following tests last -- they may crash perl
	4161	{
	4162	# RT#19049 / RT#38869
	4163	my @list = (
	4164	'ab cdef', # matches regex
	4165	( 'e' x 40000 ) .'ab c' # matches not, but 'ab c' matches part of it
	4166	);
	4167	my $y;
	4168	my $x;
	4169	foreach (@list) {
	4170	m/ab(.+)cd/i; # the ignore-case seems to be important
	4171	$y = $1; # use $1, which might not be from the last match!
	4172	$x = substr($list[0],$-[0],$+[0]-$-[0]); # rebuild the matched text of the first string from the @- / @+ offsets
	4173	}
	4174	iseq($y,' ', # after the failed second match, $1 must still come from the first string
	4175	'pattern in a loop, failure should not affect previous success');
	4176	iseq($x,'ab cd',
	4177	'pattern in a loop, failure should not affect previous success');
	4178	}
	4179
	# A string of 2**15 - 10 "a" characters against a quantified group: the
	# only outcomes anticipated by the diagnostic are a pass or a crash.
	ok(("a" x (2**15 - 10)) =~ /^()(a|bb)*$/, "Recursive stack cracker: #24274")
	    or print "# Unexpected outcome: should pass or crash perl\n";

	# A deferred pattern that expands to one hundred capture groups.
	ok((q(a)x 100) =~ /^(??{'(.)'x 100})/,
	    "Regexp /^(??{'(.)'x 100})/ crashes older perls")
	    or print "# Unexpected outcome: should pass or crash perl\n";
	4186
	{
	    # Substitutions whose pattern ends in, or consists only of,
	    # zero-width lookaround assertions.
	    local $Message = "substitution with lookahead (possible segv)";
	    $_="ns1ns1ns1";
	    s/ns(?=\d)/ns_/g;
	    iseq($_,"ns_1ns_1ns_1");
	    $_="ns1";
	    s/ns(?=\d)/ns_/;
	    iseq($_,"ns_1");
	    # Either alternative is zero-width, so "!Bang!" is inserted at every
	    # position that has a digit after it or before it.
	    $_="123";
	    s/(?=\d+)|(?<=\d)/!Bang!/g;
	    iseq($_,"!Bang!1!Bang!2!Bang!3!Bang!");
	}
	4199
	4200	# Put new tests above the dotted line about a page above this comment
	4201	iseq(0+$::test,$::TestCount,"Got the right number of tests!"); # final self-check: the running counter must equal the planned total
	4202	# Don't forget to update this!  BEGIN runs at compile time, so the plan line is printed before any test output even though the block is at the bottom of the file.
	4203	BEGIN {
	4204	$::TestCount = 1567;
	4205	print "1..$::TestCount\n";
	4206	}
	4207