'FF' => 'FORM FEED (FF)',
'CR' => 'CARRIAGE RETURN (LF)',
'NEL' => 'NEXT LINE (NEL)',
+ # More convenience. For futher convencience,
+ # it is suggested some way using using the NamesList
+ # aliases is implemented.
+ 'ZWNJ' => 'ZERO WIDTH NON-JOINER',
+ 'ZWJ' => 'ZERO WIDTH JOINER',
'BOM' => 'BYTE ORDER MARK',
);
if ($name eq "BYTE ORDER MARK") {
$fname = $name;
- $ord = 0xFFFE;
+ $ord = 0xFEFF;
} else {
## Suck in the code/name list as a big string.
## Lines look like:
##
## Now know where in the string the name starts.
- ## The code, in hex, is befor that.
+ ## The code, in hex, is before that.
##
## The code can be 4-6 characters long, so we've got to sort of
## go look for it, just after the newline that comes before $off[0].
sub viacode
{
if (@_ != 1) {
- carp "charnames::viacode() expects one numeric argument";
+ carp "charnames::viacode() expects one argument";
return ()
}
if ($code > 0x10FFFF) {
carp "Unicode characters only allocated up to 0x10FFFF (you asked for $hex)";
- return "\x{FFFD}";
+ return;
}
return $viacode{$hex} if exists $viacode{$hex};
if ($txt =~ m/^$hex\t\t(.+)/m) {
return $viacode{$hex} = $1;
- } elsif ($hex eq 'FFFE') {
- return $viacode{$hex} = "BYTE ORDER MARK";
} else {
- carp "Unknown charcode '$hex'";
- return "\x{FFFD}";
+ return;
}
}
=head1 NAME
-charnames - define character names for C<\N{named}> string literal escapes.
+charnames - define character names for C<\N{named}> string literal escapes
=head1 SYNOPSIS
Returns undef if no name is known for the code.
-This works only for the standard names, and does not yet aply
+This works only for the standard names, and does not yet apply
to custom translators.
+Notice that the name returned for of U+FEFF is "ZERO WIDTH NO-BREAK
+SPACE", not "BYTE ORDER MARK".
+
=head1 charnames::vianame(code)
Returns the code point indicated by the name.
BYTE ORDER MARK
BOM
-though that is of course not a legal character as such.
+and
+
+ ZWNJ
+ ZWJ
+
+for ZERO WIDTH NON-JOINER and ZERO WIDTH JOINER.
For backward compatibility one can use the old names for
certain C0 and C1 controls