embedaddon/pcre/perltest.pl - diff

Return to perltest.pl CVS log

Up to [ELWIX - Embedded LightWeight unIX -] / embedaddon / pcre

Diff for /embedaddon/pcre/perltest.pl between versions 1.1 and 1.1.1.2

version 1.1, 2012/02/21 23:05:51	version 1.1.1.2, 2012/02/21 23:50:25
Line 1	Line 1
#! /usr/bin/env perl	#! /usr/bin/env perl

# Program for testing regular expressions with perl to check that PCRE handles	# Program for testing regular expressions with perl to check that PCRE handles
# them the same. This is the version that supports /8 for UTF-8 testing. As it	# them the same. This version supports /8 for UTF-8 testing. However, it needs
# stands, it requires at least Perl 5.8 for UTF-8 support. However, it needs to	# to have "use utf8" at the start for running the UTF-8 tests, but not for
# have "use utf8" at the start for running the UTF-8 tests, but not for the	# the other tests. The only way I've found for doing this is to cat this line
# other tests. The only way I've found for doing this is to cat this line in	# in explicitly in the RunPerlTest script. I've also used this method to supply
# explicitly in the RunPerlTest script.	# "require Encode" for the UTF-8 tests, so that the main test will still run
	# where Encode is not installed.

# use locale; # With this included, \x0b matches \s!	# use locale; # With this included, \x0b matches \s!

# Function for turning a string into a string of printing chars. There are	# Function for turning a string into a string of printing chars.
# currently problems with UTF-8 strings; this fudges round them.

	#require Encode;

sub pchars {	sub pchars {
my($t) = "";	my($t) = "";

Line 21 if ($utf8)	Line 23 if ($utf8)
foreach $c (@p)	foreach $c (@p)
{	{
if ($c >= 32 && $c < 127) { $t .= chr $c; }	if ($c >= 32 && $c < 127) { $t .= chr $c; }
else { $t .= sprintf("\\x{%02x}", $c); }	else { $t .= sprintf("\\x{%02x}", $c);
	}
}	}
}	}

else	else
{	{
foreach $c (split(//, $_[0]))	foreach $c (split(//, $_[0]))
Line 192 for (;;)	Line 194 for (;;)
{	{
printf $outfile "No match";	printf $outfile "No match";
if (defined $REGERROR && $REGERROR != 1)	if (defined $REGERROR && $REGERROR != 1)
{ print $outfile (", mark = $REGERROR"); }	{ printf $outfile (", mark = %s", &pchars($REGERROR)); }
printf $outfile "\n";	printf $outfile "\n";
}	}
else	else
Line 214 for (;;)	Line 216 for (;;)
}	}
splice(@subs, 0, 18);	splice(@subs, 0, 18);
}	}

	# It seems that $REGMARK is not marked as UTF-8 even when use utf8 is
	# set and the input pattern was a UTF-8 string. We can, however, force
	# it to be so marked.

if (defined $REGMARK && $REGMARK != 1)	if (defined $REGMARK && $REGMARK != 1)
{ print $outfile ("MK: $REGMARK\n"); }	{
	$xx = $REGMARK;
	$xx = Encode::decode_utf8($xx) if $utf8;
	printf $outfile ("MK: %s\n", &pchars($xx));
	}
}	}
}	}
}	}

FreeBSD-CVSweb <freebsd-cvsweb@FreeBSD.org>

Legend:
Removed from v.1.1
changed lines
	Added in v.1.1.1.2