||= [], $code);
# 005F: SPACING UNDERSCORE
$op->($Cat->{Word} ||= [], $code)
- if $cat =~ /^[LMN]/ or $code eq "005F";
+ if $cat =~ /^[LMN]/ || $code eq "005F";
$op->($Cat->{Alnum} ||= [], $code)
if $cat =~ /^[LMN]/;
$op->($Cat->{Alpha} ||= [], $code)
if $cat =~ /^Z/ ||
$code =~ /^(0009|000A|000B|000C|000D)$/;
$op->($Cat->{SpacePerl} ||= [], $code)
- if $cat =~ /^Z/ ||
+ if $cat =~ /^Z/ || $code =~ /^(?:0085|2028|2029)$/ ||
$code =~ /^(0009|000A|000C|000D)$/;
$op->($Cat->{Blank} ||= [], $code)
if $code =~ /^(0020|0009)$/ ||
$| = 1;
-print "1..840\n";
+print "1..843\n";
BEGIN {
chdir 't' if -d 't';
# print "SS" =~
# /[\N{LATIN SMALL LETTER SHARP S}]/i ? "ok 842\n" : "not ok 842\n";
}
+
+{
+ # Tests 841-843: check that \s matches U+0085, U+2028 and U+2029.
+ # Each check prints "ok N" on a match and "not ok N" otherwise.
+ print "# more whitespace: U+0085, U+2028, U+2029\n";
+
+ # U+0085 needs to be forced to be Unicode; the \x{100} in the string
+ # (matched literally by the \x{100} in the pattern) does that.
+ print "<\x{100}\x{0085}>" =~ /<\x{100}\s>/ ? "ok 841\n" : "not ok 841\n";
+ # No \x{100} is used for the next two; presumably code points above
+ # 0xFF already make the string Unicode -- TODO confirm.
+ print "<\x{2028}>" =~ /<\s>/ ? "ok 842\n" : "not ok 842\n";
+ print "<\x{2029}>" =~ /<\s>/ ? "ok 843\n" : "not ok 843\n";
+}
+