mktables: Set caseless equivalent tables

[perl5.git] / lib / unicore / mktables
diff --git a/lib/unicore/mktables b/lib/unicore/mktables

index 73ca970..1a3f234 100644 (file)
--- a/lib/unicore/mktables
+++ b/lib/unicore/mktables
@@ -6,17 +6,35 @@
  
  # Needs 'no overloading' to run faster on miniperl.  Code commented out at the
  # subroutine objaddr can be used instead to work as far back (untested) as
-# 5.8: needs pack "U".
+# 5.8: needs pack "U".  But almost all occurrences of objaddr have been
+# removed in favor of using 'no overloading'.  You also would have to go
+# through and replace occurrences like:
+#       my $addr = do { no overloading; pack 'J', $self; }
+# with
+#       my $addr = main::objaddr $self;
+# (or reverse commit 9b01bafde4b022706c3d6f947a0963f821b2e50b
+# that instituted the change to main::objaddr, and subsequent commits that
+# changed 0+$self to pack 'J', $self.)
+
+my $start_time;
+BEGIN { # Get the time the script started running; do it at compilation to
+        # get it as close as possible
+    $start_time= time;
+}
+
+
  require 5.010_001;
  use strict;
  use warnings;
  use Carp;
+use Config;
  use File::Find;
  use File::Path;
  use File::Spec;
  use Text::Tabs;
  
  sub DEBUG () { 0 }  # Set to 0 for production; 1 for development
+my $debugging_build = $Config{"ccflags"} =~ /-DDEBUGGING/;
  
  ##########################################################################
  #
@@ -34,7 +52,7 @@ sub DEBUG () { 0 }  # Set to 0 for production; 1 for development
  #   the small actual loop to process the input files and finish up; then
  #   a __DATA__ section, for the .t tests
  #
-# This program works on all releases of Unicode through at least 5.2.  The
+# This program works on all releases of Unicode through at least 6.0.  The
  # outputs have been scrutinized most intently for release 5.1.  The others
  # have been checked for somewhat more than just sanity.  It can handle all
  # existing Unicode character properties in those releases.
@@ -146,7 +164,10 @@ my $map_directory = 'To';        # Where map files go.
  # out.  But all the ones which can be used in regular expression \p{} and \P{}
  # constructs will.  Generally a property will have either its map table or its
  # match tables written but not both.  Again, what gets written is controlled
-# by lists which can easily be changed.
+# by lists which can easily be changed.  Properties have a 'Type', like
+# binary, or string, or enum depending on how many match tables there are and
+# the content of the maps.  This 'Type' is different than a range 'Type', so
+# don't get confused by the two concepts having the same name.
  #
  # For information about the Unicode properties, see Unicode's UAX44 document:
  
@@ -167,11 +188,11 @@ my $unicode_reference_url = 'http://www.unicode.org/reports/tr44/';
  # More information on Unicode version glitches is further down in these
  # introductory comments.
  #
-# This program works on all properties as of 5.2, though the files for some
-# are suppressed from apparent lack of demand for them.  You can change which
-# are output by changing lists in this program.
+# This program works on all non-provisional properties as of 6.0, though the
+# files for some are suppressed from apparent lack of demand for them.  You
+# can change which are output by changing lists in this program.
  #
-# The old version of mktables emphasized the term "Fuzzy" to mean Unocde's
+# The old version of mktables emphasized the term "Fuzzy" to mean Unicode's
  # loose matching rules (from Unicode TR18):
  #
  #    The recommended names for UCD properties and property values are in
@@ -302,7 +323,7 @@ my $unicode_reference_url = 'http://www.unicode.org/reports/tr44/';
  #   is nonsensical.
  #
  # There are no match tables generated for matches of the null string.  These
-# would like like qr/\p{JSN=}/ currently without modifying the regex code.
+# would look like qr/\p{JSN=}/ currently without modifying the regex code.
  # Perhaps something like them could be added if necessary.  The JSN does have
  # a real code point U+110B that maps to the null string, but it is a
  # contributory property, and therefore not output by default.  And it's easily
@@ -341,6 +362,18 @@ my $unicode_reference_url = 'http://www.unicode.org/reports/tr44/';
  # to 1, and every file whose object is in @input_file_objects and doesn't have
  # a 'non_skip => 1,' in its constructor will be skipped.
  #
+# To compare the output tables, it may be useful to specify the -annotate
+# flag.  This causes the tables to expand so there is one entry for each
+# non-algorithmically named code point giving, currently, its name, and its
+# graphic representation if printable (and you have a font that knows about
+# it).  This makes it easier to see what the particular code points are in
+# each output table.  The tables are usable, but because they don't have
+# ranges (for the most part), a Perl using them will run slower.  Non-named
+# code points are annotated with a description of their status, and contiguous
+# ones with the same description will be output as a range rather than
+# individually.  Algorithmically named characters are also output as ranges,
+# except when there are just a few contiguous ones.
+#
  # FUTURE ISSUES
  #
  # The program would break if Unicode were to change its names so that
@@ -390,7 +423,7 @@ my $unicode_reference_url = 'http://www.unicode.org/reports/tr44/';
  # Unicode_Radical_Stroke was listed in those files, so if the Unihan database
  # is present in the directory, a table will be generated for that property.
  # In 5.2, several more properties were added.  For your convenience, the two
-# arrays are initialized with all the 5.2 listed properties that are also in
+# arrays are initialized with all the 6.0 listed properties that are also in
  # earlier releases.  But these are commented out.  You can just uncomment the
  # ones you want, or use them as a template for adding entries for other
  # properties.
@@ -404,7 +437,6 @@ my $unicode_reference_url = 'http://www.unicode.org/reports/tr44/';
  # kPrimaryNumeric property have commas and an unexpected comment.  A filter
  # could be added for these; or for a particular installation, the Unihan.txt
  # file could be edited to fix them.
-# have to be
  #
  # HOW TO ADD A FILE TO BE PROCESSED
  #
@@ -446,7 +478,7 @@ my $unicode_reference_url = 'http://www.unicode.org/reports/tr44/';
  #
  # Here are some observations about some of the issues in early versions:
  #
-# The number of code points in \p{alpha} halve in 2.1.9.  It turns out that
+# The number of code points in \p{alpha} halved in 2.1.9.  It turns out that
  # the reason is that the CJK block starting at 4E00 was removed from PropList,
  # and was not put back in until 3.1.0
  #
@@ -577,6 +609,12 @@ sub uniques {
      # Encapsulated Cleverness".  p. 455 in first edition.
  
      my %seen;
+    # Arguably this breaks encapsulation, if the goal is to permit multiple
+    # distinct objects to stringify to the same value, and be interchangeable.
+    # However, for this program, no two objects stringify identically, and all
+    # lists passed to this function are either objects or strings. So this
+    # doesn't affect correctness, but it does give a couple of percent speedup.
+    no overloading;
      return grep { ! $seen{$_}++ } @_;
  }
  
@@ -600,8 +638,11 @@ my $make_list = 1;             # ? Should we write $file_list.  Set to always
                                 # special things
  my $glob_list = 0;             # ? Should we try to include unknown .txt files
                                 # in the input.
-my $output_range_counts = 1;   # ? Should we include the number of code points
-                               # in ranges in the output
+my $output_range_counts = $debugging_build;   # ? Should we include the number
+                                              # of code points in ranges in
+                                              # the output
+my $annotate = 0;              # ? Should character names be in the output
+
  # Verbosity levels; 0 is quiet
  my $NORMAL_VERBOSITY = 1;
  my $PROGRESS = 2;
@@ -657,6 +698,11 @@ while (@ARGV) {
      elsif ($arg eq '-c') {
          $output_range_counts = ! $output_range_counts
      }
+    elsif ($arg eq '-annotate') {
+        $annotate = 1;
+        $debugging_build = 1;
+        $output_range_counts = 1;
+    }
      else {
          my $with_c = 'with';
          $with_c .= 'out' if $output_range_counts;   # Complements the state
@@ -681,6 +727,10 @@ usage: $0 [-c|-p|-q|-v|-w] [-C dir] [-L filelist] [ -P pod_dir ]
    -maketest   : Make test script 'TestProp.pl' in current (or -C directory),
                  overrides -T
    -makelist   : Rewrite the file list $file_list based on current setup
+  -annotate   : Output an annotation for each character in the table files;
+                useful for debugging mktables, looking at diffs; but is slow,
+                memory intensive; resulting tables are usable but slow and
+                very large.
    -check A B  : Executes $0 only if A and B are the same
  END
      }
@@ -688,7 +738,7 @@ END
  
  # Stores the most-recently changed file.  If none have changed, can skip the
  # build
-my $youngest = -M $0;   # Do this before the chdir!
+my $most_recent = (stat $0)[9];   # Do this before the chdir!
  
  # Change directories now, because need to read 'version' early.
  if ($use_directory) {
@@ -763,11 +813,11 @@ if ($v_version gt v3.2.0) {
                                  'Canonical_Combining_Class=Attached_Below_Left'
  }
  
-# These are listed in the Property aliases file in 5.2, but Unihan is ignored
+# These are listed in the Property aliases file in 6.0, but Unihan is ignored
  # unless explicitly added.
  if ($v_version ge v5.2.0) {
      my $unihan = 'Unihan; remove from list if using Unihan';
-    foreach my $table qw (
+    foreach my $table (qw (
                             kAccountingNumeric
                             kOtherNumeric
                             kPrimaryNumeric
@@ -783,7 +833,7 @@ if ($v_version ge v5.2.0) {
                             kIRG_USource
                             kIRG_VSource
                             kRSUnicode
-                        )
+                        ))
      {
          $why_suppress_if_empty_warn_if_not{$table} = $unihan;
      }
@@ -806,10 +856,10 @@ my %why_obsolete;    # Documentation only
  
      my $other_properties = 'other properties';
      my $contributory = "Used by Unicode internally for generating $other_properties and not intended to be used stand-alone";
+    my $why_no_expand  = "Deprecated by Unicode: less useful than UTF-specific calculations";  # Shared reason for the Expands_On_* entries
+    my $why_no_expand  = "Deprecated by Unicode: less useful than UTF-specific calculations",
  
      %why_deprecated = (
-        'Grapheme_Link' => 'Deprecated by Unicode.  Use ccc=vr (Canonical_Combining_Class=Virama) instead',
+        'Grapheme_Link' => 'Deprecated by Unicode:  Duplicates ccc=vr (Canonical_Combining_Class=Virama)',
          'Jamo_Short_Name' => $contributory,
          'Line_Break=Surrogate' => 'Deprecated by Unicode because surrogates should never appear in well-formed text, and therefore shouldn\'t be the basis for line breaking',
          'Other_Alphabetic' => $contributory,
@@ -823,7 +873,7 @@ my %why_obsolete;    # Documentation only
      );
  
      %why_suppressed = (
-        # There is a lib/unicore/Decomposition.pl (used by normalize.pm) which
+        # There is a lib/unicore/Decomposition.pl (used by Normalize.pm) which
          # contains the same information, but without the algorithmically
          # determinable Hangul syllables'.  This file is not published, so its
          # existence is not noted in the comment.
@@ -840,10 +890,7 @@ my %why_obsolete;    # Documentation only
          'Name' => "Accessible via 'use charnames;'",
          'Name_Alias' => "Accessible via 'use charnames;'",
  
-        # These are sort of jumping the gun; deprecation is proposed for
-        # Unicode version 6.0, but they have never been exposed by Perl, and
-        # likely are soon to be deprecated, so best not to expose them.
-        FC_NFKC_Closure => 'Use NFKC_Casefold instead',
+        FC_NFKC_Closure => 'Supplanted in usage by NFKC_Casefold; otherwise not useful',
          Expands_On_NFC => $why_no_expand,
          Expands_On_NFD => $why_no_expand,
          Expands_On_NFKC => $why_no_expand,
@@ -865,9 +912,15 @@ my %why_obsolete;    # Documentation only
  
  if ($v_version ge 4.0.0) {
      $why_stabilized{'Hyphen'} = 'Use the Line_Break property instead; see www.unicode.org/reports/tr14';
+    if ($v_version ge 6.0.0) {
+        $why_deprecated{'Hyphen'} = 'Supplanted by Line_Break property values; see www.unicode.org/reports/tr14';
+    }
  }
-if ($v_version ge 5.2.0) {
+if ($v_version ge 5.2.0 && $v_version lt 6.0.0) {   # 5.2 up to, not including, 6.0
      $why_obsolete{'ISO_Comment'} = 'Code points for it have been removed';
  }
+elsif ($v_version ge 6.0.0) {   # Was unreachable when nested in the 'lt 6.0.0' test
+    $why_deprecated{'ISO_Comment'} = 'No longer needed for chart generation; otherwise not useful, and code points for it have been removed';
+}
  
  # Probably obsolete forever
@@ -886,7 +939,7 @@ END
  
  # If you are using the Unihan database, you need to add the properties that
  # you want to extract from it to this table.  For your convenience, the
-# properties in the 5.2 PropertyAliases.txt file are listed, commented out
+# properties in the 6.0 PropertyAliases.txt file are listed, commented out
  my @cjk_properties = split "\n", <<'END';
  #cjkAccountingNumeric; kAccountingNumeric
  #cjkOtherNumeric; kOtherNumeric
@@ -905,7 +958,7 @@ my @cjk_properties = split "\n", <<'END';
  END
  
  # Similarly for the property values.  For your convenience, the lines in the
-# 5.2 PropertyAliases.txt file are listed.  Just remove the first BUT NOT both
+# 6.0 PropertyAliases.txt file are listed.  Just remove the first BUT NOT both
  # '#' marks
  my @cjk_property_values = split "\n", <<'END';
  ## @missing: 0000..10FFFF; cjkAccountingNumeric; NaN
@@ -988,6 +1041,10 @@ my %ignored_files = (
      'ReadMe.txt' => 'Just comments',
      'README.TXT' => 'Just comments',
      'StandardizedVariants.txt' => 'Only for glyph changes, not a Unicode character property.  Does not fit into current scheme where one code point is mapped',
+    'EmojiSources.txt' => 'Not of general utility: for Japanese legacy cell-phone applications',
+    'IndicMatraCategory.txt' => 'Provisional',
+    'IndicSyllabicCategory.txt' => 'Provisional',
+    'ScriptExtensions.txt' => 'Provisional',
  );
  
  ### End of externally interesting definitions, except for @input_file_objects
@@ -1079,6 +1136,7 @@ my $IF_NOT_EQUIVALENT = 1; # Replace only under certain conditions; details in
  my $UNCONDITIONALLY = 2;   # Replace without conditions.
  my $MULTIPLE = 4;          # Don't replace, but add a duplicate record if
                             # already there
+my $CROAK = 5;             # Die with an error if already there
  
  # Flags to give property statuses.  The phrases are to remind maintainers that
  # if the flag is changed, the indefinite article referring to it in the
@@ -1111,7 +1169,8 @@ my %status_past_participles = (
      $DEPRECATED => 'deprecated',
  );
  
-# The format of the values of the map tables:
+# The format of the values of the tables:
+my $EMPTY_FORMAT = "";
  my $BINARY_FORMAT = 'b';
  my $DECIMAL_FORMAT = 'd';
  my $FLOAT_FORMAT = 'f';
@@ -1119,6 +1178,7 @@ my $INTEGER_FORMAT = 'i';
  my $HEX_FORMAT = 'x';
  my $RATIONAL_FORMAT = 'r';
  my $STRING_FORMAT = 's';
+my $DECOMP_STRING_FORMAT = 'c';
  
  my %map_table_formats = (
      $BINARY_FORMAT => 'binary',
@@ -1127,7 +1187,8 @@ my %map_table_formats = (
      $INTEGER_FORMAT => 'integer',
      $HEX_FORMAT => 'positive hex whole number; a code point',
      $RATIONAL_FORMAT => 'rational: an integer or a fraction',
-    $STRING_FORMAT => 'arbitrary string',
+    $STRING_FORMAT => 'string',
+    $DECOMP_STRING_FORMAT => 'Perl\'s internal (Normalize.pm) decomposition mapping',
  );
  
  # Unicode didn't put such derived files in a separate directory at first.
@@ -1143,13 +1204,30 @@ my %nv_floating_to_rational; # maps numeric values floating point numbers to
                               # their rational equivalent
  my %loose_property_name_of; # Loosely maps property names to standard form
  
+# Most properties are immune to caseless matching, otherwise you would get
+# nonsensical results, as properties are a function of a code point, not
+# everything that is caselessly equivalent to that code point.  For example,
+# Changes_When_Case_Folded('s') should be false, whereas caselessly it would
+# be true because 's' and 'S' are equivalent caselessly.  However,
+# traditionally, [:upper:] and [:lower:] are equivalent caselessly, so we
+# extend that concept to those very few properties that are like this.  Each
+# such property will match the full range caselessly.  They are hard-coded in
+# the program; it's not worth trying to make it general as it's extremely
+# unlikely that they will ever change.
+my %caseless_equivalent_to;
+
  # These constant names and values were taken from the Unicode standard,
  # version 5.1, section 3.12.  They are used in conjunction with Hangul
-# syllables
-my $SBase = 0xAC00;
-my $LBase = 0x1100;
-my $VBase = 0x1161;
-my $TBase = 0x11A7;
+# syllables.  The '_string' versions are so generated tables can retain the
+# hex format, which is the more familiar value
+my $SBase_string = "0xAC00";
+my $SBase = CORE::hex $SBase_string;
+my $LBase_string = "0x1100";
+my $LBase = CORE::hex $LBase_string;
+my $VBase_string = "0x1161";
+my $VBase = CORE::hex $VBase_string;
+my $TBase_string = "0x11A7";
+my $TBase = CORE::hex $TBase_string;
  my $SCount = 11172;
  my $LCount = 19;
  my $VCount = 21;
@@ -1185,6 +1263,8 @@ my $MAX_FLOATING_SLOP = 10 ** - $MIN_FRACTION_LENGTH; # And in floating terms
  my $gc;
  my $perl;
  my $block;
+my $perl_charname;
+my $print;
  
  # Are there conflicting names because of beginning with 'In_', or 'Is_'
  my $has_In_conflicts = 0;
@@ -1216,7 +1296,143 @@ sub objaddr($) {
      no overloading; # If overloaded, numifying below won't work.
  
      # Numifying a ref gives its address.
-    return 0 + $_[0];
+    return pack 'J', $_[0];
+}
+
+# These are used only if $annotate is true.
+# The entire range of Unicode characters is examined to populate these
+# after all the input has been processed.  But most can be skipped, as they
+# have the same descriptive phrases, such as being unassigned
+my @viacode;            # Contains the 1 million character names
+my @printable;          # boolean: And are those characters printable?
+my @annotate_char_type; # Contains a type of those characters, specifically
+                        # for the purposes of annotation.
+my $annotate_ranges;    # A map of ranges of code points that have the same
+                        # name for the purposes of annotation.  They map to the
+                        # upper edge of the range, so that the end point can
+                        # be immediately found.  This is used to skip ahead to
+                        # the end of a range, and avoid processing each
+                        # individual code point in it.
+my $unassigned_sans_noncharacters; # A Range_List of the unassigned
+                                   # characters, but excluding those which are
+                                   # also noncharacter code points
+
+# The annotation types are an extension of the regular range types, though
+# some of the latter are folded into one.  Make the new types negative to
+# avoid conflicting with the regular types
+my $SURROGATE_TYPE = -1;
+my $UNASSIGNED_TYPE = -2;
+my $PRIVATE_USE_TYPE = -3;
+my $NONCHARACTER_TYPE = -4;
+my $CONTROL_TYPE = -5;
+my $UNKNOWN_TYPE = -6;  # Used only if there is a bug in this program
+
+sub populate_char_info ($) {
+    # Used only with the $annotate option.  Fills in the @viacode, @printable,
+    # and @annotate_char_type entries for the input code point $i.  In non-void
+    # context, returns the end point of the contiguous range found to share
+    # essentially the same info as $i, or $i itself if no range was determined
+
+    my $i = shift;
+    Carp::carp_extra_args(\@_) if main::DEBUG && @_;
+
+    $viacode[$i] = $perl_charname->value_of($i) || "";
+
+    # A character is initially taken as printable if the $print table contains
+    # it, but the branches below force that off for code points that get a
+    # generic name (surrogates, private use, controls, unassigned, etc.).
+    $printable[$i] = $print->contains($i);
+
+    $annotate_char_type[$i] = $perl_charname->type_of($i) || 0;
+
+    # Only these two regular types are treated specially for annotation
+    # purposes; any other type is folded to 0
+    $annotate_char_type[$i] = 0 if $annotate_char_type[$i] != $CP_IN_NAME
+                                && $annotate_char_type[$i] != $HANGUL_SYLLABLE;
+
+    # Give a generic name to all code points that don't have a real name.
+    # We output ranges, if applicable, for these.  Also calculate the end
+    # point of the range.
+    my $end;    # Stays undefined if no range is determined
+    if (! $viacode[$i]) {
+        if ($gc-> table('Surrogate')->contains($i)) {
+            $viacode[$i] = 'Surrogate';
+            $annotate_char_type[$i] = $SURROGATE_TYPE;
+            $printable[$i] = 0;
+            $end = $gc->table('Surrogate')->containing_range($i)->end;
+        }
+        elsif ($gc-> table('Private_use')->contains($i)) {
+            $viacode[$i] = 'Private Use';
+            $annotate_char_type[$i] = $PRIVATE_USE_TYPE;
+            $printable[$i] = 0;
+            $end = $gc->table('Private_Use')->containing_range($i)->end;
+        }
+        elsif (Property::property_ref('Noncharacter_Code_Point')-> table('Y')->
+                                                                contains($i))
+        {
+            $viacode[$i] = 'Noncharacter';
+            $annotate_char_type[$i] = $NONCHARACTER_TYPE;
+            $printable[$i] = 0;
+            $end = property_ref('Noncharacter_Code_Point')->table('Y')->
+                                                    containing_range($i)->end;
+        }
+        elsif ($gc-> table('Control')->contains($i)) {
+            $viacode[$i] = 'Control';
+            $annotate_char_type[$i] = $CONTROL_TYPE;
+            $printable[$i] = 0;
+            $end = 0x81 if $i == 0x80;  # Hard-code this one known case
+        }
+        elsif ($gc-> table('Unassigned')->contains($i)) {
+            $viacode[$i] = 'Unassigned, block=' . $block-> value_of($i);
+            $annotate_char_type[$i] = $UNASSIGNED_TYPE;
+            $printable[$i] = 0;
+
+            # Because we name the unassigned by the blocks they are in, it
+            # can't go past the end of that block, and it also can't go past
+            # the unassigned range it is in.  The special table makes sure
+            # that the non-characters, which are unassigned, are separated
+            # out.
+            $end = min($block->containing_range($i)->end,
+                       $unassigned_sans_noncharacters-> containing_range($i)->
+                                                                         end);
+        }
+        else {
+            Carp::my_carp_bug("Can't figure out how to annotate "
+                              . sprintf("U+%04X", $i)
+                              . ".  Proceeding anyway.");
+            $viacode[$i] = 'UNKNOWN';
+            $annotate_char_type[$i] = $UNKNOWN_TYPE;
+            $printable[$i] = 0;
+        }
+    }
+
+    # Here, has a name, but if it's one in which the code point number is
+    # appended to the name, do that.
+    elsif ($annotate_char_type[$i] == $CP_IN_NAME) {
+        $viacode[$i] .= sprintf("-%04X", $i);
+        $end = $perl_charname->containing_range($i)->end;
+    }
+
+    # And here, has a name, but if it's a hangul syllable one, replace it with
+    # the correct name from the Unicode algorithm
+    elsif ($annotate_char_type[$i] == $HANGUL_SYLLABLE) {
+        use integer;    # So the divisions below truncate
+        my $SIndex = $i - $SBase;
+        my $L = $LBase + $SIndex / $NCount;
+        my $V = $VBase + ($SIndex % $NCount) / $TCount;
+        my $T = $TBase + $SIndex % $TCount;
+        $viacode[$i] = "HANGUL SYLLABLE $Jamo{$L}$Jamo{$V}";
+        $viacode[$i] .= $Jamo{$T} if $T != $TBase;
+        $end = $perl_charname->containing_range($i)->end;
+    }
+
+    return if ! defined wantarray;  # Void context: nothing to return
+    return $i if ! defined $end;    # If not a range, return the input
+
+    # Save this whole range so the end point can be found quickly later
+    $annotate_ranges->add_map($i, $end, $end);
+
+    return $end;
  }
  
  # Commented code below should work on Perl 5.8.
@@ -1241,7 +1457,7 @@ sub objaddr($) {
  #    bless $_[0], 'main::Fake';
  #
  #    # Numifying a ref gives its address.
-#    my $addr = 0 + $_[0];
+#    my $addr = pack 'J', $_[0];
  #
  #    # Return to original class
  #    bless $_[0], $pkg;
@@ -1431,7 +1647,7 @@ package main;
              # Use typeglob to give the anonymous subroutine the name we want
              *$destroy_name = sub {
                  my $self = shift;
-                my $addr = main::objaddr($self);
+                my $addr = do { no overloading; pack 'J', $self; };
  
                  $self->$destroy_callback if $destroy_callback;
                  foreach my $field (keys %{$package_fields{$package}}) {
@@ -1477,7 +1693,7 @@ package main;
          # "protection" is only by convention.  All that happens is that the
          # accessor functions' names begin with an underscore.  So instead of
          # calling set_foo, the call is _set_foo.  (Real protection could be
-        # accomplished by having a new subroutine, end_package called at the
+        # accomplished by having a new subroutine, end_package, called at the
          # end of each package, and then storing the __LINE__ ranges and
          # checking them on every accessor.  But that is way overkill.)
  
@@ -1530,16 +1746,15 @@ package main;
                      return Carp::carp_too_few_args(\@_, 2) if main::DEBUG && @_ < 2;
                      my $self = shift;
                      my $value = shift;
+                    my $addr = do { no overloading; pack 'J', $self; };
                      Carp::carp_extra_args(\@_) if main::DEBUG && @_;
                      if (ref $value) {
-                        return if grep { $value == $_ }
-                                            @{$field->{main::objaddr $self}};
+                        return if grep { $value == $_ } @{$field->{$addr}};
                      }
                      else {
-                        return if grep { $value eq $_ }
-                                            @{$field->{main::objaddr $self}};
+                        return if grep { $value eq $_ } @{$field->{$addr}};
                      }
-                    push @{$field->{main::objaddr $self}}, $value;
+                    push @{$field->{$addr}}, $value;
                      return;
                  }
              }
@@ -1565,7 +1780,7 @@ package main;
                      *$subname = sub {
                          use strict "refs";
                          Carp::carp_extra_args(\@_) if main::DEBUG && @_ > 1;
-                        my $addr = main::objaddr $_[0];
+                        my $addr = do { no overloading; pack 'J', $_[0]; };
                          if (ref $field->{$addr} ne 'ARRAY') {
                              my $type = ref $field->{$addr};
                              $type = 'scalar' unless $type;
@@ -1587,7 +1802,8 @@ package main;
                      *$subname = sub {
                          use strict "refs";
                          Carp::carp_extra_args(\@_) if main::DEBUG && @_ > 1;
-                        return $field->{main::objaddr $_[0]};
+                        no overloading;
+                        return $field->{pack 'J', $_[0]};
                      }
                  }
              }
@@ -1601,7 +1817,8 @@ package main;
                          Carp::carp_extra_args(\@_) if @_ > 2;
                      }
                      # $self is $_[0]; $value is $_[1]
-                    $field->{main::objaddr $_[0]} = $_[1];
+                    no overloading;
+                    $field->{pack 'J', $_[0]} = $_[1];
                      return;
                  }
              }
@@ -1761,7 +1978,7 @@ sub trace { return main::trace(@_); }
          my $class = shift;
  
          my $self = bless \do{ my $anonymous_scalar }, $class;
-        my $addr = main::objaddr($self);
+        my $addr = do { no overloading; pack 'J', $self; };
  
          # Set defaults
          $handler{$addr} = \&main::process_generic_property_file;
@@ -1852,7 +2069,7 @@ sub trace { return main::trace(@_); }
          my $self = shift;
          Carp::carp_extra_args(\@_) if main::DEBUG && @_;
  
-        my $addr = main::objaddr $self;
+        my $addr = do { no overloading; pack 'J', $self; };
  
          my $file = $file{$addr};
  
@@ -2022,7 +2239,7 @@ END
          my $self = shift;
          Carp::carp_extra_args(\@_) if main::DEBUG && @_;
  
-        my $addr = main::objaddr $self;
+        my $addr = do { no overloading; pack 'J', $self; };
  
          # Here the file is open (or if the handle is not a ref, is an open
          # 'virtual' file).  Get the next line; any inserted lines get priority
@@ -2167,7 +2384,7 @@ END
  #        # an each_line_handler() on the line.
  #
  #        my $self = shift;
-#        my $addr = main::objaddr $self;
+#        my $addr = do { no overloading; pack 'J', $self; };
  #
  #        foreach my $inserted_ref (@{$added_lines{$addr}}) {
  #            my ($adjusted, $line) = @{$inserted_ref};
@@ -2208,7 +2425,8 @@ END
          # Each inserted line is an array, with the first element being 0 to
          # indicate that this line hasn't been adjusted, and needs to be
          # processed.
-        push @{$added_lines{main::objaddr $self}}, map { [ 0, $_ ] } @_;
+        no overloading;
+        push @{$added_lines{pack 'J', $self}}, map { [ 0, $_ ] } @_;
          return;
      }
  
@@ -2231,7 +2449,8 @@ END
  
          # Each inserted line is an array, with the first element being 1 to
          # indicate that this line has been adjusted
-        push @{$added_lines{main::objaddr $self}}, map { [ 1, $_ ] } @_;
+        no overloading;
+        push @{$added_lines{pack 'J', $self}}, map { [ 1, $_ ] } @_;
          return;
      }
  
@@ -2244,7 +2463,7 @@ END
          my $self = shift;
          Carp::carp_extra_args(\@_) if main::DEBUG && @_;
  
-        my $addr = main::objaddr $self;
+        my $addr = do { no overloading; pack 'J', $self; };
  
          # If not accepting a list return, just return the first one.
          return shift @{$missings{$addr}} unless wantarray;
@@ -2257,7 +2476,9 @@ END
      sub _insert_property_into_line {
          # Add a property field to $_, if this file requires it.
  
-        my $property = $property{main::objaddr shift};
+        my $self = shift;
+        my $addr = do { no overloading; pack 'J', $self; };
+        my $property = $property{$addr};
          Carp::carp_extra_args(\@_) if main::DEBUG && @_;
  
          $_ =~ s/(;|$)/; $property$1/;
@@ -2275,7 +2496,7 @@ END
          my $message = shift;
          Carp::carp_extra_args(\@_) if main::DEBUG && @_;
  
-        my $addr = main::objaddr $self;
+        my $addr = do { no overloading; pack 'J', $self; };
  
          $message = 'Unexpected line' unless $message;
  
@@ -2286,7 +2507,7 @@ END
          # increment the count of how many times it has occurred
          unless ($errors{$addr}->{$message}) {
              Carp::my_carp("$message in '$_' in "
-                            . $file{main::objaddr $self}
+                            . $file{$addr}
                              . " at line $..  Skipping this line;");
              $errors{$addr}->{$message} = 1;
          }
@@ -2340,7 +2561,7 @@ package Multi_Default;
          my $class = shift;
  
          my $self = bless \do{my $anonymous_scalar}, $class;
-        my $addr = main::objaddr($self);
+        my $addr = do { no overloading; pack 'J', $self; };
  
          while (@_ > 1) {
              my $default = shift;
@@ -2358,7 +2579,7 @@ package Multi_Default;
          my $self = shift;
          Carp::carp_extra_args(\@_) if main::DEBUG && @_;
  
-        my $addr = main::objaddr $self;
+        my $addr = do { no overloading; pack 'J', $self; };
  
          return each %{$class_defaults{$addr}};
      }
@@ -2405,7 +2626,7 @@ package Alias;
          my $class = shift;
  
          my $self = bless \do { my $anonymous_scalar }, $class;
-        my $addr = main::objaddr($self);
+        my $addr = do { no overloading; pack 'J', $self; };
  
          $name{$addr} = shift;
          $loose_match{$addr} = shift;
@@ -2467,7 +2688,7 @@ sub trace { return main::trace(@_); }
          my $class = shift;
  
          my $self = bless \do { my $anonymous_scalar }, $class;
-        my $addr = main::objaddr($self);
+        my $addr = do { no overloading; pack 'J', $self; };
  
          $start{$addr} = shift;
          $end{$addr} = shift;
@@ -2497,7 +2718,7 @@ sub trace { return main::trace(@_); }
  
      sub _operator_stringify {
          my $self = shift;
-        my $addr = main::objaddr $self;
+        my $addr = do { no overloading; pack 'J', $self; };
  
          # Output it like '0041..0065 (value)'
          my $return = sprintf("%04X", $start{$addr})
@@ -2520,7 +2741,7 @@ sub trace { return main::trace(@_); }
          my $self = shift;
          Carp::carp_extra_args(\@_) if main::DEBUG && @_;
  
-        my $addr = main::objaddr $self;
+        my $addr = do { no overloading; pack 'J', $self; };
  
          return $standard_form{$addr} if defined $standard_form{$addr};
          return $value{$addr};
@@ -2533,7 +2754,7 @@ sub trace { return main::trace(@_); }
          my $indent = shift;
          Carp::carp_extra_args(\@_) if main::DEBUG && @_;
  
-        my $addr = main::objaddr $self;
+        my $addr = do { no overloading; pack 'J', $self; };
  
          my $return = $indent
                      . sprintf("%04X", $start{$addr})
@@ -2568,13 +2789,6 @@ package _Range_List_Base;
  # There are a number of methods to manipulate range lists, and some operators
  # are overloaded to handle them.
  
-# Because of the slowness of pure Perl objaddr() on miniperl, and measurements
-# showing this package was using a lot of real time calculating that, the code
-# was changed to only calculate it once per call stack.  This is done by
-# consistently using the package variable $addr in routines, and only calling
-# objaddr() if it isn't defined, and setting that to be local, so that callees
-# will have it already.  It would be a good thing to change this. XXX
-
  sub trace { return main::trace(@_); }
  
  { # Closure
@@ -2622,7 +2836,7 @@ sub trace { return main::trace(@_); }
          return _union($class, $initialize, %args) if defined $initialize;
  
          $self = bless \do { my $anonymous_scalar }, $class;
-        local $addr = main::objaddr($self);
+        my $addr = do { no overloading; pack 'J', $self; };
  
          # Optional parent object, only for debug info.
          $owner_name_of{$addr} = delete $args{'Owner'};
@@ -2654,7 +2868,7 @@ sub trace { return main::trace(@_); }
  
      sub _operator_stringify {
          my $self = shift;
-        local $addr = main::objaddr($self) if !defined $addr;
+        my $addr = do { no overloading; pack 'J', $self; };
  
          return "Range_List attached to '$owner_name_of{$addr}'"
                                                  if $owner_name_of{$addr};
@@ -2712,7 +2926,8 @@ sub trace { return main::trace(@_); }
              if (! defined $arg) {
                  my $message = "";
                  if (defined $self) {
-                    $message .= $owner_name_of{main::objaddr $self};
+                    no overloading;
+                    $message .= $owner_name_of{pack 'J', $self};
                  }
                  Carp::my_carp_bug($message .= "Undefined argument to _union.  No union done.");
                  return;
@@ -2733,7 +2948,8 @@ sub trace { return main::trace(@_); }
              else {
                  my $message = "";
                  if (defined $self) {
-                    $message .= $owner_name_of{main::objaddr $self};
+                    no overloading;
+                    $message .= $owner_name_of{pack 'J', $self};
                  }
                  Carp::my_carp_bug($message . "Cannot take the union of a $type.  No union done.");
                  return;
@@ -2773,9 +2989,8 @@ sub trace { return main::trace(@_); }
          my $self = shift;
          Carp::carp_extra_args(\@_) if main::DEBUG && @_;
  
-        local $addr = main::objaddr($self) if ! defined $addr;
-
-        return scalar @{$ranges{$addr}};
+        no overloading;
+        return scalar @{$ranges{pack 'J', $self}};
      }
  
      sub min {
@@ -2788,7 +3003,7 @@ sub trace { return main::trace(@_); }
          my $self = shift;
          Carp::carp_extra_args(\@_) if main::DEBUG && @_;
  
-        local $addr = main::objaddr($self) if ! defined $addr;
+        my $addr = do { no overloading; pack 'J', $self; };
  
          # If the range list is empty, return a large value that isn't adjacent
          # to any that could be in the range list, for simpler tests
@@ -2805,8 +3020,6 @@ sub trace { return main::trace(@_); }
          my $codepoint = shift;
          Carp::carp_extra_args(\@_) if main::DEBUG && @_;
  
-        local $addr = main::objaddr $self if ! defined $addr;
-
          my $i = $self->_search_ranges($codepoint);
          return 0 unless defined $i;
  
@@ -2814,24 +3027,51 @@ sub trace { return main::trace(@_); }
          #   range[$i-1]->end < $codepoint <= range[$i]->end
          # So is in the table if and only if it is at least the start position
          # of range $i.
-        return 0 if $ranges{$addr}->[$i]->start > $codepoint;
+        no overloading;
+        return 0 if $ranges{pack 'J', $self}->[$i]->start > $codepoint;
          return $i + 1;
      }
  
-    sub value_of {
-        # Returns the value associated with the code point, undef if none
+    sub containing_range {
+        # Returns the range object that contains the code point, undef if none
  
          my $self = shift;
          my $codepoint = shift;
          Carp::carp_extra_args(\@_) if main::DEBUG && @_;
  
-        local $addr = main::objaddr $self if ! defined $addr;
-
          my $i = $self->contains($codepoint);
          return unless $i;
  
          # contains() returns 1 beyond where we should look
-        return $ranges{$addr}->[$i-1]->value;
+        no overloading;
+        return $ranges{pack 'J', $self}->[$i-1];
+    }
+
+    sub value_of {
+        # Look up the value that this range list associates with a code
+        # point.  Finding the enclosing range is delegated to
+        # containing_range(); when that yields no range, nothing is returned
+        # (undef in scalar context, the empty list in list context).
+
+        # Remove the expected arguments from @_ so that anything left over
+        # can be reported as extra when debugging.
+        my ($self, $codepoint) = splice @_, 0, 2;
+        Carp::carp_extra_args(\@_) if main::DEBUG && @_;
+
+        my $enclosing = $self->containing_range($codepoint);
+        return defined $enclosing ? $enclosing->value : ();
+    }
+
+    sub type_of {
+        # Report the type of whichever range holds the given code point.
+        # Finding the enclosing range is delegated to containing_range();
+        # when that yields no range, nothing is returned (undef in scalar
+        # context, the empty list in list context).
+
+        # Remove the expected arguments from @_ so that anything left over
+        # can be reported as extra when debugging.
+        my ($self, $codepoint) = splice @_, 0, 2;
+        Carp::carp_extra_args(\@_) if main::DEBUG && @_;
+
+        my $enclosing = $self->containing_range($codepoint);
+        return defined $enclosing ? $enclosing->type : ();
      }
  
      sub _search_ranges {
@@ -2845,7 +3085,7 @@ sub trace { return main::trace(@_); }
          my $code_point = shift;
          Carp::carp_extra_args(\@_) if main::DEBUG && @_;
  
-        local $addr = main::objaddr $self if ! defined $addr;
+        my $addr = do { no overloading; pack 'J', $self; };
  
          return if $code_point > $max{$addr};
          my $r = $ranges{$addr};                # The current list of ranges
@@ -2950,10 +3190,10 @@ sub trace { return main::trace(@_); }
          #
          # The range list is kept sorted so that the range with the lowest
          # starting position is first in the list, and generally, adjacent
-        # ranges with the same values are merged into single larger one (see
+        # ranges with the same values are merged into a single larger one (see
          # exceptions below).
          #
-        # There are more parameters, all are key => value pairs:
+        # There are more parameters; all are key => value pairs:
          #   Type    gives the type of the value.  It is only valid for '+'.
          #           All ranges have types; if this parameter is omitted, 0 is
          #           assumed.  Ranges with type 0 are assumed to obey the
@@ -2977,7 +3217,7 @@ sub trace { return main::trace(@_); }
          #       => $IF_NOT_EQUIVALENT means to replace the existing values
          #                         with this one if they are not equivalent.
          #                         Ranges are equivalent if their types are the
-        #                         same, and they are the same string, or if
+        #                         same, and they are the same string; or if
          #                         both are type 0 ranges, if their Unicode
          #                         standard forms are identical.  In this last
          #                         case, the routine chooses the more "modern"
@@ -2993,11 +3233,13 @@ sub trace { return main::trace(@_); }
          #                         existing one, but has a different value,
          #                         don't replace the existing one, but insert
          #                         this one, so that the same range can occur
-        #                         multiple times.
+        #                         multiple times.  They are stored LIFO, so
+        #                         that the final one inserted is the first one
+        #                         returned in an ordered search of the table.
          #       => anything else  is the same as => $IF_NOT_EQUIVALENT
          #
-        # "same value" means identical for type-0 ranges, and it means having
-        # the same standard forms for non-type-0 ranges.
+        # "same value" means identical for non-type-0 ranges, and it means
+        # having the same standard forms for type-0 ranges.
  
          return Carp::carp_too_few_args(\@_, 5) if main::DEBUG && @_ < 5;
  
@@ -3019,7 +3261,7 @@ sub trace { return main::trace(@_); }
  
          Carp::carp_extra_args(\%args) if main::DEBUG && %args;
  
-        local $addr = main::objaddr($self) if ! defined $addr;
+        my $addr = do { no overloading; pack 'J', $self; };
  
          if ($operation ne '+' && $operation ne '-') {
              Carp::my_carp_bug("$owner_name_of{$addr}First parameter to _add_delete must be '+' or '-'.  No action taken.");
@@ -3222,23 +3464,60 @@ sub trace { return main::trace(@_); }
              return;
          }
  
-        # Here, we have taken care of the case where $replace is $NO, which
-        # means that whatever action we now take is done unconditionally.  It
-        # still could be that this call will result in a no-op, if duplicates
-        # aren't allowed, and we are inserting a range that merely duplicates
-        # data already in the range list; or also if deleting a non-existent
-        # range.
-        # $i still points to the first potential affected range.  Now find the
-        # highest range affected, which will determine the length parameter to
-        # splice.  (The input range can span multiple existing ones.)  While
-        # we are looking through the range list, see also if this is an
-        # insertion that will change the values of at least one of the
-        # affected ranges.  We don't need to do this check unless this is an
-        # insertion of non-multiples, and also since this is a boolean, we
-        # don't need to do it if have already determined that it will make a
-        # change; just unconditionally change them.  $cdm is created to be 1
-        # if either of these is true. (The 'c' in the name comes from below)
-        my $cdm = ($operation eq '-' || $replace == $MULTIPLE);
+        # Here, we have taken care of the case where $replace is $NO.
+        # Remember that here, r[$i-1]->end < $start <= r[$i]->end
+        # If inserting a multiple record, this is where it goes, before the
+        # first (if any) existing one.  This implies an insertion, and no
+        # change to any existing ranges.  Note that $i can be -1 if this new
+        # range doesn't actually duplicate any existing, and comes at the
+        # beginning of the list.
+        if ($replace == $MULTIPLE) {
+
+            if ($start != $end) {
+                Carp::my_carp_bug("$owner_name_of{$addr}Can't cope with adding a multiple record when the range ($start..$end) contains more than one code point.  No action taken.");
+                return;
+            }
+
+            # Don't add an exact duplicate, as it isn't really a multiple
+            if ($end >= $r->[$i]->start) {
+                if ($r->[$i]->start != $r->[$i]->end) {
+                    Carp::my_carp_bug("$owner_name_of{$addr}Can't cope with adding a multiple record when the other range ($r->[$i]) contains more than one code point.  No action taken.");
+                    return;
+                }
+                return if $value eq $r->[$i]->value && $type eq $r->[$i]->type;
+            }
+
+            trace "Adding multiple record at $i with $start..$end, $value" if main::DEBUG && $to_trace;
+            my @return = splice @$r,
+                                $i,
+                                0,
+                                Range->new($start,
+                                           $end,
+                                           Value => $value,
+                                           Type => $type);
+            if (main::DEBUG && $to_trace) {
+                trace "After splice:";
+                trace 'i-2=[', $i-2, ']', $r->[$i-2] if $i >= 2;
+                trace 'i-1=[', $i-1, ']', $r->[$i-1] if $i >= 1;
+                trace "i  =[", $i, "]", $r->[$i] if $i >= 0;
+                trace 'i+1=[', $i+1, ']', $r->[$i+1] if $i < @$r - 1;
+                trace 'i+2=[', $i+2, ']', $r->[$i+2] if $i < @$r - 2;
+                trace 'i+3=[', $i+3, ']', $r->[$i+3] if $i < @$r - 3;
+            }
+            return @return;
+        }
+
+        # Here, we have taken care of $NO and $MULTIPLE replaces.  This leaves
+        # delete, insert, and replace either unconditionally or if not
+        # equivalent.  $i still points to the first potential affected range.
+        # Now find the highest range affected, which will determine the length
+        # parameter to splice.  (The input range can span multiple existing
+        # ones.)  If this isn't a deletion, while we are looking through the
+        # range list, see also if this is a replacement rather than a clean
+        # insertion; that is if it will change the values of at least one
+        # existing range.  Start off assuming it is an insert, until we find
+        # it isn't.
+        my $clean_insert = $operation eq '+';
          my $j;        # This will point to the highest affected range
  
          # For non-zero types, the standard form is the value itself;
@@ -3251,12 +3530,19 @@ sub trace { return main::trace(@_); }
              # searching
              last if $end < $r->[$j]->start;
  
-            # Here, overlaps the range at $j.  If the value's don't match,
-            # and this is supposedly an insertion, it becomes a change
-            # instead.  This is what the 'c' stands for in $cdm.
-            if (! $cdm) {
+            # Here, overlaps the range at $j.  If the values don't match,
+            # and so far we think this is a clean insertion, it becomes a
+            # non-clean insertion, i.e., a 'change' or 'replace' instead.
+            if ($clean_insert) {
                  if ($r->[$j]->standard_form ne $standard_form) {
-                    $cdm = 1;
+                    $clean_insert = 0;
+                    if ($replace == $CROAK) {
+                        main::croak("The range to add "
+                        . sprintf("%04X", $start)
+                        . '-'
+                        . sprintf("%04X", $end)
+                        . " with value '$value' overlaps an existing range $r->[$j]");
+                    }
                  }
                  else {
  
@@ -3270,7 +3556,7 @@ sub trace { return main::trace(@_); }
                          # same, but the non-standardized values aren't.  If
                          # replacing unconditionally, then replace
                          if( $replace == $UNCONDITIONALLY) {
-                            $cdm = 1;
+                            $clean_insert = 0;
                          }
                          else {
  
@@ -3284,13 +3570,13 @@ sub trace { return main::trace(@_); }
                                              && $pre_existing =~ /[a-z]/;
  
                              if ($old_mixed != $new_mixed) {
-                                $cdm = 1 if $new_mixed;
+                                $clean_insert = 0 if $new_mixed;
                                  if (main::DEBUG && $to_trace) {
-                                    if ($cdm) {
-                                        trace "Replacing $pre_existing with $value";
+                                    if ($clean_insert) {
+                                        trace "Retaining $pre_existing over $value";
                                      }
                                      else {
-                                        trace "Retaining $pre_existing over $value";
+                                        trace "Replacing $pre_existing with $value";
                                      }
                                  }
                              }
@@ -3304,13 +3590,13 @@ sub trace { return main::trace(@_); }
                                  my $old_punct = $pre_existing =~ /[-_]/;
  
                                  if ($old_punct != $new_punct) {
-                                    $cdm = 1 if $new_punct;
+                                    $clean_insert = 0 if $new_punct;
                                      if (main::DEBUG && $to_trace) {
-                                        if ($cdm) {
-                                            trace "Replacing $pre_existing with $value";
+                                        if ($clean_insert) {
+                                            trace "Retaining $pre_existing over $value";
                                          }
                                          else {
-                                            trace "Retaining $pre_existing over $value";
+                                            trace "Replacing $pre_existing with $value";
                                          }
                                      }
                                  }   # else existing one is just as "good";
@@ -3333,44 +3619,6 @@ sub trace { return main::trace(@_); }
          $j--;        # $j now points to the highest affected range.
          trace "Final affected range is $j: $r->[$j]" if main::DEBUG && $to_trace;
  
-        # If inserting a multiple record, this is where it goes, after all the
-        # existing ones for this range.  This implies an insertion, and no
-        # change to any existing ranges.  Note that $j can be -1 if this new
-        # range doesn't actually duplicate any existing, and comes at the
-        # beginning of the list, in which case we can handle it like any other
-        # insertion, and is easier to do so.
-        if ($replace == $MULTIPLE && $j >= 0) {
-
-            # This restriction could be remedied with a little extra work, but
-            # it won't hopefully ever be necessary
-            if ($r->[$j]->start != $r->[$j]->end) {
-                Carp::my_carp_bug("$owner_name_of{$addr}Can't cope with adding a multiple when the other range ($r->[$j]) contains more than one code point.  No action taken.");
-                return;
-            }
-
-            # Don't add an exact duplicate, as it isn't really a multiple
-            return if $value eq $r->[$j]->value && $type eq $r->[$j]->type;
-
-            trace "Adding multiple record at $j+1 with $start..$end, $value" if main::DEBUG && $to_trace;
-            my @return = splice @$r,
-                                $j+1,
-                                0,
-                                Range->new($start,
-                                           $end,
-                                           Value => $value,
-                                           Type => $type);
-            if (main::DEBUG && $to_trace) {
-                trace "After splice:";
-                trace 'j-2=[', $j-2, ']', $r->[$j-2] if $j >= 2;
-                trace 'j-1=[', $j-1, ']', $r->[$j-1] if $j >= 1;
-                trace "j  =[", $j, "]", $r->[$j] if $j >= 0;
-                trace 'j+1=[', $j+1, ']', $r->[$j+1] if $j < @$r - 1;
-                trace 'j+2=[', $j+2, ']', $r->[$j+2] if $j < @$r - 2;
-                trace 'j+3=[', $j+3, ']', $r->[$j+3] if $j < @$r - 3;
-            }
-            return @return;
-        }
-
          # Here, have taken care of $NO and $MULTIPLE replaces.
          # $j points to the highest affected range.  But it can be < $i or even
          # -1.  These happen only if the insertion is entirely in the gap
@@ -3396,8 +3644,9 @@ sub trace { return main::trace(@_); }
          }
          else {
  
-            # Here the entire input range is not in the gap before $i.  There
-            # is an affected one, and $j points to the highest such one.
+            # Here part of the input range is not in the gap before $i.  Thus,
+            # there is at least one affected one, and $j points to the highest
+            # such one.
  
              # At this point, here is the situation:
              # This is not an insertion of a multiple, nor of tentative ($NO)
@@ -3413,21 +3662,21 @@ sub trace { return main::trace(@_); }
              #   r[$i-1]->end < $start <= $end <= r[$j]->end
              #
              # Also:
-            #   $cdm is a boolean which is set true if and only if this is a
-            #        change or deletion (multiple was handled above).  In
-            #        other words, it could be renamed to be just $cd.
+            #   $clean_insert is a boolean which is set true if and only if
+            #        this is a "clean insertion", i.e., not a change nor a
+            #        deletion (multiple was handled above).
  
              # We now have enough information to decide if this call is a no-op
-            # or not.  It is a no-op if it is a deletion of a non-existent
-            # range, or an insertion of already existing data.
+            # or not.  It is a no-op if this is an insertion of already
+            # existing data.
  
-            if (main::DEBUG && $to_trace && ! $cdm
+            if (main::DEBUG && $to_trace && $clean_insert
                                           && $i == $j
                                           && $start >= $r->[$i]->start)
              {
                      trace "no-op";
              }
-            return if ! $cdm      # change or delete => not no-op
+            return if $clean_insert
                        && $i == $j # more than one affected range => not no-op
  
                        # Here, r[$i-1]->end < $start <= $end <= r[$i]->end
@@ -3464,7 +3713,7 @@ sub trace { return main::trace(@_); }
              $extends_above = ($j+1 < $range_list_size
                              && $r->[$j+1]->start == $end +1
                              && $r->[$j+1]->standard_form eq $standard_form
-                            && $r->[$j-1]->type == $type);
+                            && $r->[$j+1]->type == $type);
          }
          if ($extends_below && $extends_above) { # Adds to both
              $splice_start--;     # start replace at element below
@@ -3489,7 +3738,7 @@ sub trace { return main::trace(@_); }
                  # Here the new element adds to the one below, but not to the
                  # one above.  If inserting, and only to that one range,  can
                  # just change its ending to include the new one.
-                if ($length == 0 && ! $cdm) {
+                if ($length == 0 && $clean_insert) {
                      $r->[$i-1]->set_end($end);
                      trace "inserted range extends range to below so it is now $r->[$i-1]" if main::DEBUG && $to_trace;
                      return;
@@ -3505,7 +3754,7 @@ sub trace { return main::trace(@_); }
  
                  # Here the new element adds to the one above, but not below.
                  # Mirror the code above
-                if ($length == 0 && ! $cdm) {
+                if ($length == 0 && $clean_insert) {
                      $r->[$j+1]->set_start($start);
                      trace "inserted range extends range to above so it is now $r->[$j+1]" if main::DEBUG && $to_trace;
                      return;
@@ -3586,7 +3835,7 @@ sub trace { return main::trace(@_); }
              trace "i  =[", $i, "]", $r->[$i];
              trace 'i+1=[', $i+1, ']', $r->[$i+1] if $i < @$r - 1;
              trace 'i+2=[', $i+2, ']', $r->[$i+2] if $i < @$r - 2;
-            trace "removed @return";
+            trace "removed ", @return if @return;
          }
  
          # An actual deletion could have changed the maximum in the list.
@@ -3603,9 +3852,8 @@ sub trace { return main::trace(@_); }
          my $self = shift;
          Carp::carp_extra_args(\@_) if main::DEBUG && @_;
  
-        local $addr = main::objaddr $self if ! defined $addr;
-
-        undef $each_range_iterator{$addr};
+        no overloading;
+        undef $each_range_iterator{pack 'J', $self};
          return;
      }
  
@@ -3616,7 +3864,7 @@ sub trace { return main::trace(@_); }
          my $self = shift;
          Carp::carp_extra_args(\@_) if main::DEBUG && @_;
  
-        local $addr = main::objaddr($self) if ! defined $addr;
+        my $addr = do { no overloading; pack 'J', $self; };
  
          return if $self->is_empty;
  
@@ -3633,7 +3881,7 @@ sub trace { return main::trace(@_); }
          my $self = shift;
          Carp::carp_extra_args(\@_) if main::DEBUG && @_;
  
-        local $addr = main::objaddr($self) if ! defined $addr;
+        my $addr = do { no overloading; pack 'J', $self; };
  
          my $count = 0;
          foreach my $range (@{$ranges{$addr}}) {
@@ -3656,8 +3904,8 @@ sub trace { return main::trace(@_); }
          my $self = shift;
          Carp::carp_extra_args(\@_) if main::DEBUG && @_;
  
-        local $addr = main::objaddr($self) if ! defined $addr;
-        return scalar @{$ranges{$addr}} == 0;
+        no overloading;
+        return scalar @{$ranges{pack 'J', $self}} == 0;
      }
  
      sub hash {
@@ -3668,7 +3916,7 @@ sub trace { return main::trace(@_); }
          my $self = shift;
          Carp::carp_extra_args(\@_) if main::DEBUG && @_;
  
-        local $addr = main::objaddr($self) if ! defined $addr;
+        my $addr = do { no overloading; pack 'J', $self; };
  
          # These are quickly computable.  Return looks like 'min..max;count'
          return $self->min . "..$max{$addr};" . scalar @{$ranges{$addr}};
@@ -3940,7 +4188,35 @@ sub trace { return main::trace(@_); }
          return $self->_add_delete('+', $start, $end, "");
      }
  
-    my $non_ASCII = (ord('A') != 65);   # Assumes test on same platform
+    sub matches_identically_to {
+        # Return a boolean as to whether or not two Range_Lists match identical
+        # sets of code points.
+        #
+        # Parameters:
+        #   $self   the invocant
+        #   $other  the object to compare it with; it is called with the same
+        #           max, min, range_count, count, and ranges methods as $self
+        #
+        # Returns 1 if all the quick tests agree and every corresponding pair
+        # of ranges has the same start and end; 0 otherwise.  The loop looks
+        # only at the start and end of each range.
+
+        my $self = shift;
+        my $other = shift;
+        Carp::carp_extra_args(\@_) if main::DEBUG && @_;
+
+        # These are ordered in increasing real time to figure out (at least
+        # until a patch changes that and doesn't change this)
+        return 0 if $self->max != $other->max;
+        return 0 if $self->min != $other->min;
+        return 0 if $self->range_count != $other->range_count;
+        return 0 if $self->count != $other->count;
+
+        # Here they could be identical because all the tests above passed.
+        # The loop below is somewhat simpler since we know they have the same
+        # number of elements.  Compare range by range, until we reach the end
+        # or find something that differs.
+        #
+        # The per-iteration lexicals are deliberately not named $a and $b:
+        # those are the package variables that sort() uses, and hiding them
+        # with 'my' would break any sort block later added to this scope.
+        my @self_ranges = $self->ranges;
+        my @other_ranges = $other->ranges;
+        for my $i (0 .. $#self_ranges) {
+            my $self_range = $self_ranges[$i];
+            my $other_range = $other_ranges[$i];
+            trace "self $self_range; other $other_range" if main::DEBUG && $to_trace;
+            return 0 if $self_range->start != $other_range->start
+                        || $self_range->end != $other_range->end;
+        }
+        return 1;
+    }
  
      sub is_code_point_usable {
          # This used only for making the test script.  See if the input
@@ -3954,21 +4230,10 @@ sub trace { return main::trace(@_); }
  
          return 0 if $code < 0;                # Never use a negative
  
-        # For non-ASCII, we shun the characters that don't have Perl encoding-
-        # independent symbols for them.  'A' is such a symbol, so is "\n".
-        return $try_hard if $non_ASCII
-                            && $code <= 0xFF
-                            && ($code >= 0x7F
-                                || ($code >= 0x0E && $code <= 0x1F)
-                                || ($code >= 0x01 && $code <= 0x06)
-                                || $code == 0x0B);
-
          # shun null.  I'm (khw) not sure why this was done, but NULL would be
          # the character very frequently used.
          return $try_hard if $code == 0x0000;
  
-        return 0 if $try_hard;  # XXX Temporary until fix utf8.c
-
          # shun non-character code points.
          return $try_hard if $code >= 0xFDD0 && $code <= 0xFDEF;
          return $try_hard if ($code & 0xFFFE) == 0xFFFE; # includes FFFF
@@ -3987,7 +4252,7 @@ sub trace { return main::trace(@_); }
          my $self = shift;
          Carp::carp_extra_args(\@_) if main::DEBUG && @_;
  
-        my $addr = main::objaddr($self);
+        my $addr = do { no overloading; pack 'J', $self; };
  
          # On first pass, don't choose less desirable code points; if no good
          # one is found, repeat, allowing a less desirable one to be selected.
@@ -4151,6 +4416,10 @@ sub trace { return main::trace(@_); }
      # A comment about its being obsolete, or whatever non normal status it has
      main::set_access('status_info', \%status_info, 'r');
  
+    my %caseless_equivalent;
+    # The table this is equivalent to under /i matching, if any.
+    main::set_access('caseless_equivalent', \%caseless_equivalent, 'r', 's');
+
      my %range_size_1;
      # Is the table to be output with each range only a single code point?
      # This is done to avoid breaking existing code that may have come to rely
@@ -4168,6 +4437,12 @@ sub trace { return main::trace(@_); }
      # The constructor can override the global flag of the same name.
      main::set_access('output_range_counts', \%output_range_counts, 'r');
  
+    my %format;
+    # The format of the entries of the table.  This is calculated from the
+    # data in the table (or passed in the constructor).  This is an enum,
+    # e.g., $STRING_FORMAT.
+    main::set_access('format', \%format, 'r', 'p_s');
+
      sub new {
          # All arguments are key => value pairs, which you can see below, most
          # of which match fields documented above.  Otherwise: Pod_Entry,
@@ -4179,7 +4454,7 @@ sub trace { return main::trace(@_); }
          my $class = shift;
  
          my $self = bless \do { my $anonymous_scalar }, $class;
-        my $addr = main::objaddr($self);
+        my $addr = do { no overloading; pack 'J', $self; };
  
          my %args = @_;
  
@@ -4188,6 +4463,7 @@ sub trace { return main::trace(@_); }
          $full_name{$addr} = delete $args{'Full_Name'};
          my $complete_name = $complete_name{$addr}
                            = delete $args{'Complete_Name'};
+        $format{$addr} = delete $args{'Format'};
          $internal_only{$addr} = delete $args{'Internal_Only_Warning'} || 0;
          $output_range_counts{$addr} = delete $args{'Output_Range_Counts'};
          $property{$addr} = delete $args{'_Property'};
@@ -4195,6 +4471,7 @@ sub trace { return main::trace(@_); }
          $status{$addr} = delete $args{'Status'} || $NORMAL;
          $status_info{$addr} = delete $args{'_Status_Info'} || "";
          $range_size_1{$addr} = delete $args{'Range_Size_1'} || 0;
+        $caseless_equivalent{$addr} = delete $args{'Caseless_Equivalent'} || 0;
  
          my $description = delete $args{'Description'};
          my $externally_ok = delete $args{'Externally_Ok'};
@@ -4236,7 +4513,11 @@ sub trace { return main::trace(@_); }
              # lists of properties or tables that have particular statuses; if
              # not, is normal.  The lists are prioritized so the most serious
              # ones are checked first
-            if (exists $why_suppressed{$complete_name}) {
+            if (exists $why_suppressed{$complete_name}
+                # Don't suppress if overridden
+                && ! grep { $_ eq $complete_name{$addr} }
+                                                    @output_mapped_properties)
+            {
                  $status{$addr} = $SUPPRESSED;
              }
              elsif (exists $why_deprecated{$complete_name}) {
@@ -4299,13 +4580,19 @@ sub trace { return main::trace(@_); }
  
      # Here are the methods that are required to be defined by any derived
      # class
-    for my $sub qw(
+    for my $sub (qw(
+                    handle_special_range
                      append_to_body
                      pre_body
-                )
-                # append_to_body and pre_body are called in the write() method
-                # to add stuff after the main body of the table, but before
-                # its close; and to prepend stuff before the beginning of the
+                ))
+                # write() knows how to write out normal ranges, but it calls
+                # handle_special_range() when it encounters a non-normal one.
+                # append_to_body() is called by it after it has handled all
+                # ranges to add anything after the main portion of the table.
+                # And finally, pre_body() is called after all this to build up
+                # anything that should appear before the main portion of the
+                # table.  Doing it this way allows things in the middle to
+                # affect what should appear before the main portion of the
                  # table.
      {
          no strict "refs";
@@ -4327,7 +4614,8 @@ sub trace { return main::trace(@_); }
      sub ranges {
          # Returns the array of ranges associated with this table.
  
-        return $range_list{main::objaddr shift}->ranges;
+        no overloading;
+        return $range_list{pack 'J', shift}->ranges;
      }
  
      sub add_alias {
@@ -4363,7 +4651,7 @@ sub trace { return main::trace(@_); }
          # release
          $name = ucfirst($name) unless $name =~ /^k[A-Z]/;
  
-        my $addr = main::objaddr $self;
+        my $addr = do { no overloading; pack 'J', $self; };
  
          # Figure out if should be loosely matched if not already specified.
          if (! defined $loose_match) {
@@ -4424,7 +4712,8 @@ sub trace { return main::trace(@_); }
  
          # This name may be shorter than any existing ones, so clear the cache
          # of the shortest, so will have to be recalculated.
-        undef $short_name{main::objaddr $self};
+        no overloading;
+        undef $short_name{pack 'J', $self};
          return;
      }
  
@@ -4447,7 +4736,7 @@ sub trace { return main::trace(@_); }
          my $nominal_length_ptr = shift;
          Carp::carp_extra_args(\@_) if main::DEBUG && @_;
  
-        my $addr = main::objaddr $self;
+        my $addr = do { no overloading; pack 'J', $self; };
  
          # For efficiency, don't recalculate, but this means that adding new
          # aliases could change what the shortest is, so the code that does
@@ -4522,7 +4811,8 @@ sub trace { return main::trace(@_); }
          chomp $description;
          Carp::carp_extra_args(\@_) if main::DEBUG && @_;
  
-        push @{$description{main::objaddr $self}}, $description;
+        no overloading;
+        push @{$description{pack 'J', $self}}, $description;
  
          return;
      }
@@ -4534,19 +4824,24 @@ sub trace { return main::trace(@_); }
          chomp $note;
          Carp::carp_extra_args(\@_) if main::DEBUG && @_;
  
-        push @{$note{main::objaddr $self}}, $note;
+        no overloading;
+        push @{$note{pack 'J', $self}}, $note;
  
          return;
      }
  
      sub add_comment { # Adds the parameter as a comment.
  
+        return unless $debugging_build;
+
          my $self = shift;
          my $comment = shift;
          Carp::carp_extra_args(\@_) if main::DEBUG && @_;
  
          chomp $comment;
-        push @{$comment{main::objaddr $self}}, $comment;
+
+        no overloading;
+        push @{$comment{pack 'J', $self}}, $comment;
  
          return;
      }
@@ -4559,7 +4854,8 @@ sub trace { return main::trace(@_); }
          my $self = shift;
          Carp::carp_extra_args(\@_) if main::DEBUG && @_;
  
-        my @list = @{$comment{main::objaddr $self}};
+        my $addr = do { no overloading; pack 'J', $self; };
+        my @list = @{$comment{$addr}};
          return @list if wantarray;
          my $return = "";
          foreach my $sentence (@list) {
@@ -4576,13 +4872,14 @@ sub trace { return main::trace(@_); }
          # initialization for range lists.
  
          my $self = shift;
+        my $addr = do { no overloading; pack 'J', $self; };
          my $initialization = shift;
          Carp::carp_extra_args(\@_) if main::DEBUG && @_;
  
          # Replace the current range list with a new one of the same exact
          # type.
-        my $class = ref $range_list{main::objaddr $self};
-        $range_list{main::objaddr $self} = $class->new(Owner => $self,
+        my $class = ref $range_list{$addr};
+        $range_list{$addr} = $class->new(Owner => $self,
                                          Initialize => $initialization);
          return;
  
@@ -4598,12 +4895,16 @@ sub trace { return main::trace(@_); }
          my $return = "";
          $return .= $DEVELOPMENT_ONLY if $compare_versions;
          $return .= $HEADER;
-        $return .= $INTERNAL_ONLY if $internal_only{main::objaddr $self};
+        no overloading;
+        $return .= $INTERNAL_ONLY if $internal_only{pack 'J', $self};
          return $return;
      }
  
      sub write {
-        # Write a representation of the table to its file.
+        # Write a representation of the table to its file.  It calls several
+        # functions furnished by sub-classes of this abstract base class to
+        # handle non-normal ranges, to add stuff before the table, and at its
+        # end.
  
          my $self = shift;
          my $tab_stops = shift;       # The number of tab stops over to put any
@@ -4613,21 +4914,33 @@ sub trace { return main::trace(@_); }
                                       # the range
          Carp::carp_extra_args(\@_) if main::DEBUG && @_;
  
-        my $addr = main::objaddr($self);
+        my $addr = do { no overloading; pack 'J', $self; };
  
          # Start with the header
-        my @OUT = $self->header;
+        my @HEADER = $self->header;
  
          # Then the comments
-        push @OUT, "\n", main::simple_fold($comment{$addr}, '# '), "\n"
+        push @HEADER, "\n", main::simple_fold($comment{$addr}, '# '), "\n"
                                                          if $comment{$addr};
  
-        # Then any pre-body stuff.
-        my $pre_body = $self->pre_body;
-        push @OUT, $pre_body, "\n" if $pre_body;
-
-        # The main body looks like a 'here' document
-        push @OUT, "return <<'END';\n";
+        # Things discovered processing the main body of the document may
+        # affect what gets output before it, therefore pre_body() isn't called
+        # until after all other processing of the table is done.
+
+        # The main body looks like a 'here' document.  If annotating, get rid
+        # of the comments before passing to the caller, as some callers, such
+        # as charnames.pm, can't cope with them.  (Outputting range counts
+        # also introduces comments, but these don't show up in the tables that
+        # can't cope with comments, and there aren't that many of them that
+        # it's worth the extra real time to get rid of them).
+        my @OUT;
+        if ($annotate) {
+            # Use the line below in Perls that don't have /r
+            #push @OUT, 'return join "\n",  map { s/\s*#.*//mg; $_ } split "\n", <<\'END\';' . "\n";
+            push @OUT, "return <<'END' =~ s/\\s*#.*//mgr;\n";
+        } else {
+            push @OUT, "return <<'END';\n";
+        }
  
          if ($range_list{$addr}->is_empty) {
  
@@ -4639,24 +4952,49 @@ sub trace { return main::trace(@_); }
          }
          else {
              my $range_size_1 = $range_size_1{$addr};
+            my $format;            # Used only in $annotate option
+            my $include_name;      # Used only in $annotate option
+
+            if ($annotate) {
+
+                # If annotating each code point, must print 1 per line.
+                # $range_size_1 could be a reference to a subroutine, and we
+                # don't want to lose that, so set it only if not already set.
+                $range_size_1 = 1 if ! $range_size_1;
+
+                $format = $self->format;
+
+                # The name of the character is output only for tables that
+                # don't already include the name in the output.
+                my $property = $self->property;
+                $include_name =
+                    !  ($property == $perl_charname
+                        || $property == main::property_ref('Unicode_1_Name')
+                        || $property == main::property_ref('Name')
+                        || $property == main::property_ref('Name_Alias')
+                       );
+            }
  
              # Output each range as part of the here document.
+            RANGE:
              for my $set ($range_list{$addr}->ranges) {
+                if ($set->type != 0) {
+                    $self->handle_special_range($set);
+                    next RANGE;
+                }
                  my $start = $set->start;
                  my $end   = $set->end;
                  my $value  = $set->value;
  
                  # Don't output ranges whose value is the one to suppress
-                next if defined $suppress_value && $value eq $suppress_value;
+                next RANGE if defined $suppress_value
+                              && $value eq $suppress_value;
  
-                # If has or wants a single point range output
-                if ($start == $end || $range_size_1) {
-                    for my $i ($start .. $end) {
-                        push @OUT, sprintf "%04X\t\t%s\n", $i, $value;
-                    }
-                }
-                else  {
-                    push @OUT, sprintf "%04X\t%04X\t%s", $start, $end, $value;
+                # If this is a multi-code-point range, and the table doesn't
+                # need one code point per line, output it as a single range
+                if ($start != $end && ! $range_size_1) {
+                    push @OUT, sprintf "%04X\t%04X", $start, $end;
+                    $OUT[-1] .= "\t$value" if $value ne "";
  
                      # Add a comment with the size of the range, if requested.
                      # Expand Tabs to make sure they all start in the same
@@ -4676,6 +5014,166 @@ sub trace { return main::trace(@_); }
                                              $count);
                          $OUT[-1] = Text::Tabs::unexpand($OUT[-1]);
                      }
+                    next RANGE;
+                }
+
+                # Here to output a single code point per line
+
+                # If not to annotate, use the simple formats
+                if (! $annotate) {
+
+                    # Use any passed in subroutine to output.
+                    if (ref $range_size_1 eq 'CODE') {
+                        for my $i ($start .. $end) {
+                            push @OUT, &{$range_size_1}($i, $value);
+                        }
+                    }
+                    else {
+
+                        # Here, caller is ok with default output.
+                        for (my $i = $start; $i <= $end; $i++) {
+                            push @OUT, sprintf "%04X\t\t%s\n", $i, $value;
+                        }
+                    }
+                    next RANGE;
+                }
+
+                # Here, wants annotation.
+                for (my $i = $start; $i <= $end; $i++) {
+
+                    # Get character information if don't have it already
+                    main::populate_char_info($i)
+                                        if ! defined $viacode[$i];
+                    my $type = $annotate_char_type[$i];
+
+                    # Figure out if should output the next code points as part
+                    # of a range or not.  If this is not in an annotation
+                    # range, then won't output as a range, so returns $i.
+                    # Otherwise use the end of the annotation range, but no
+                    # further than the maximum possible end point of the loop.
+                    my $range_end = main::min($annotate_ranges->value_of($i)
+                                                                        || $i,
+                                               $end);
+
+                    # Use a range if it is a range, and either is one of the
+                    # special annotation ranges, or the range is more than 3
+                    # long.  This last case causes the algorithmically named
+                    # code points to be output individually in spans of at
+                    # most 3, as they are the ones whose $type is > 0.
+                    if ($range_end != $i
+                        && ( $type < 0 || $range_end - $i > 2))
+                    {
+                        # Here is to output a range.  We don't allow a
+                        # caller-specified output format--just use the
+                        # standard one.
+                        push @OUT, sprintf "%04X\t%04X\t%s\t#", $i,
+                                                                $range_end,
+                                                                $value;
+                        my $range_name = $viacode[$i];
+
+                        # For the code points which end in their hex value, we
+                        # eliminate that from the output annotation, and
+                        # capitalize only the first letter of each word.
+                        if ($type == $CP_IN_NAME) {
+                            my $hex = sprintf "%04X", $i;
+                            $range_name =~ s/-$hex$//;
+                            my @words = split " ", $range_name;
+                            for my $word (@words) {
+                                $word = ucfirst(lc($word)) if $word ne 'CJK';
+                            }
+                            $range_name = join " ", @words;
+                        }
+                        elsif ($type == $HANGUL_SYLLABLE) {
+                            $range_name = "Hangul Syllable";
+                        }
+
+                        $OUT[-1] .= " $range_name" if $range_name;
+
+                        # Include the number of code points in the range
+                        my $count = main::clarify_number($range_end - $i + 1);
+                        $OUT[-1] .= " [$count]\n";
+
+                        # Skip to the end of the range
+                        $i = $range_end;
+                    }
+                    else { # Not in a range.
+                        my $comment = "";
+
+                        # When outputting the names of each character, use
+                        # the character itself if printable
+                        $comment .= "'" . chr($i) . "' " if $printable[$i];
+
+                        # To make it more readable, use a minimum indentation
+                        my $comment_indent;
+
+                        # Determine the annotation
+                        if ($format eq $DECOMP_STRING_FORMAT) {
+
+                            # This is very specialized, with the type of
+                            # decomposition beginning the line enclosed in
+                            # <...>, and the code points that the code point
+                            # decomposes to separated by blanks.  Create two
+                            # strings, one of the printable characters, and
+                            # one of their official names.
+                            (my $map = $value) =~ s/ \ * < .*? > \ +//x;
+                            my $tostr = "";
+                            my $to_name = "";
+                            my $to_chr = "";
+                            foreach my $to (split " ", $map) {
+                                $to = CORE::hex $to;
+                                $to_name .= " + " if $to_name;
+                                $to_chr .= chr($to);
+                                main::populate_char_info($to)
+                                                    if ! defined $viacode[$to];
+                                $to_name .=  $viacode[$to];
+                            }
+
+                            $comment .=
+                                    "=> '$to_chr'; $viacode[$i] => $to_name";
+                            $comment_indent = 25;   # Determined by experiment
+                        }
+                        else {
+
+                            # Assume that any table that has hex format is a
+                            # mapping of one code point to another.
+                            if ($format eq $HEX_FORMAT) {
+                                my $decimal_value = CORE::hex $value;
+                                main::populate_char_info($decimal_value)
+                                        if ! defined $viacode[$decimal_value];
+                                $comment .= "=> '"
+                                         . chr($decimal_value)
+                                         . "'; " if $printable[$decimal_value];
+                            }
+                            $comment .= $viacode[$i] if $include_name
+                                                        && $viacode[$i];
+                            if ($format eq $HEX_FORMAT) {
+                                my $decimal_value = CORE::hex $value;
+                                $comment .= " => $viacode[$decimal_value]"
+                                                    if $viacode[$decimal_value];
+                            }
+
+                            # If including the name, no need to indent, as the
+                            # name will already be way across the line.
+                            $comment_indent = ($include_name) ? 0 : 60;
+                        }
+
+                        # Use any passed in routine to output the base part of
+                        # the line.
+                        if (ref $range_size_1 eq 'CODE') {
+                            my $base_part = &{$range_size_1}($i, $value);
+                            chomp $base_part;
+                            push @OUT, $base_part;
+                        }
+                        else {
+                            push @OUT, sprintf "%04X\t\t%s", $i, $value;
+                        }
+
+                        # And add the annotation.
+                        $OUT[-1] = sprintf "%-*s\t# %s", $comment_indent,
+                                                         $OUT[-1],
+                                                         $comment if $comment;
+                        $OUT[-1] .= "\n";
+                    }
                  }
              } # End of loop through all the table's ranges
          }
@@ -4688,10 +5186,18 @@ sub trace { return main::trace(@_); }
          # And finish the here document.
          push @OUT, "END\n";
  
+        # Done with the main portion of the body.  Can now figure out what
+        # should appear before it in the file.
+        my $pre_body = $self->pre_body;
+        push @HEADER, $pre_body, "\n" if $pre_body;
+
          # All these files have a .pl suffix
          $file_path{$addr}->[-1] .= '.pl';
  
-        main::write($file_path{$addr}, \@OUT);
+        main::write($file_path{$addr},
+                    $annotate,      # utf8 iff annotating
+                    \@HEADER,
+                    \@OUT);
          return;
      }
  
@@ -4701,7 +5207,7 @@ sub trace { return main::trace(@_); }
          my $info = shift;   # Any message associated with it.
          Carp::carp_extra_args(\@_) if main::DEBUG && @_;
  
-        my $addr = main::objaddr($self);
+        my $addr = do { no overloading; pack 'J', $self; };
  
          $status{$addr} = $status;
          $status_info{$addr} = $info;
@@ -4716,7 +5222,7 @@ sub trace { return main::trace(@_); }
          my $self = shift;
          Carp::carp_extra_args(\@_) if main::DEBUG && @_;
  
-        my $addr = main::objaddr $self;
+        my $addr = do { no overloading; pack 'J', $self; };
  
          $locked{$addr} = "";
  
@@ -4744,7 +5250,7 @@ sub trace { return main::trace(@_); }
          my $self = shift;
          Carp::carp_extra_args(\@_) if main::DEBUG && @_;
  
-        my $addr = main::objaddr $self;
+        my $addr = do { no overloading; pack 'J', $self; };
  
          return 0 if ! $locked{$addr};
          Carp::my_carp_bug("Can't modify a locked table. Stack trace of locking:\n$locked{$addr}\n\n");
@@ -4755,37 +5261,42 @@ sub trace { return main::trace(@_); }
          my $self = shift;
          # Rest of parameters passed on
  
-        @{$file_path{main::objaddr $self}} = @_;
+        no overloading;
+        @{$file_path{pack 'J', $self}} = @_;
          return
      }
  
      # Accessors for the range list stored in this table.  First for
      # unconditional
-    for my $sub qw(
+    for my $sub (qw(
+                    containing_range
                      contains
                      count
                      each_range
                      hash
                      is_empty
+                    matches_identically_to
                      max
                      min
                      range_count
                      reset_each_range
+                    type_of
                      value_of
-                )
+                ))
      {
          no strict "refs";
          *$sub = sub {
              use strict "refs";
              my $self = shift;
-            return $range_list{main::objaddr $self}->$sub(@_);
+            no overloading;
+            return $range_list{pack 'J', $self}->$sub(@_);
          }
      }
  
      # Then for ones that should fail if locked
-    for my $sub qw(
+    for my $sub (qw(
                      delete_range
-                )
+                ))
      {
          no strict "refs";
          *$sub = sub {
@@ -4793,7 +5304,8 @@ sub trace { return main::trace(@_); }
              my $self = shift;
  
              return if $self->carp_if_locked;
-            return $range_list{main::objaddr $self}->$sub(@_);
+            no overloading;
+            return $range_list{pack 'J', $self}->$sub(@_);
          }
      }
  
@@ -4848,26 +5360,11 @@ sub trace { return main::trace(@_); }
                      \%anomalous_entries,
                      'readable_array');
  
-    my %format;
-    # The format of the entries of the table.  This is calculated from the
-    # data in the table (or passed in the constructor).  This is an enum e.g.,
-    # $STRING_FORMAT
-    main::set_access('format', \%format);
-
      my %core_access;
      # This is a string, solely for documentation, indicating how one can get
      # access to this property via the Perl core.
      main::set_access('core_access', \%core_access, 'r', 's');
  
-    my %has_specials;
-    # Boolean set when non-zero map-type ranges are added to this table,
-    # which happens in only a few tables.  This is purely for performance, to
-    # avoid having to search through every table upon output, so if all the
-    # non-zero maps got deleted before output, this would remain set, and the
-    # only penalty would be performance.  Currently, most map tables that get
-    # output have specials in them, so this doesn't help that much anyway.
-    main::set_access('has_specials', \%has_specials);
-
      my %to_output_map;
      # Boolean as to whether or not to write out this map table
      main::set_access('to_output_map', \%to_output_map, 's');
@@ -4884,7 +5381,6 @@ sub trace { return main::trace(@_); }
  
          my $core_access = delete $args{'Core_Access'};
          my $default_map = delete $args{'Default_Map'};
-        my $format = delete $args{'Format'};
          my $property = delete $args{'_Property'};
          my $full_name = delete $args{'Full_Name'};
          # Rest of parameters passed on
@@ -4899,12 +5395,11 @@ sub trace { return main::trace(@_); }
                                      _Range_List => $range_list,
                                      %args);
  
-        my $addr = main::objaddr $self;
+        my $addr = do { no overloading; pack 'J', $self; };
  
          $anomalous_entries{$addr} = [];
          $core_access{$addr} = $core_access;
          $default_map{$addr} = $default_map;
-        $format{$addr} = $format;
  
          $self->initialize($initialize) if defined $initialize;
  
@@ -4951,9 +5446,7 @@ sub trace { return main::trace(@_); }
          # Can't change the table if locked.
          return if $self->carp_if_locked;
  
-        my $addr = main::objaddr $self;
-
-        $has_specials{$addr} = 1 if $type;
+        my $addr = do { no overloading; pack 'J', $self; };
  
          $self->_range_list->add_map($lower, $upper,
                                      $string,
@@ -4969,7 +5462,7 @@ sub trace { return main::trace(@_); }
          my $self = shift;
          Carp::carp_extra_args(\@_) if main::DEBUG && @_;
  
-        my $addr = main::objaddr $self;
+        my $addr = do { no overloading; pack 'J', $self; };
  
          return "" unless @{$anomalous_entries{$addr}};
          return join("\n", @{$anomalous_entries{$addr}}) . "\n";
@@ -4996,8 +5489,8 @@ sub trace { return main::trace(@_); }
              return;
          }
  
-        my $addr = main::objaddr $self;
-        my $other_addr = main::objaddr $other;
+        my $addr = do { no overloading; pack 'J', $self; };
+        my $other_addr = do { no overloading; pack 'J', $other; };
  
          local $to_trace = 0 if main::DEBUG;
  
@@ -5014,11 +5507,6 @@ sub trace { return main::trace(@_); }
                                            Replace => $UNCONDITIONALLY);
          }
  
-        # Copy the specials information from the other table to $self
-        if ($has_specials{$other_addr}) {
-            $has_specials{$addr} = 1;
-        }
-
          return;
      }
  
@@ -5030,7 +5518,7 @@ sub trace { return main::trace(@_); }
          my $map = shift;
          Carp::carp_extra_args(\@_) if main::DEBUG && @_;
  
-        my $addr = main::objaddr $self;
+        my $addr = do { no overloading; pack 'J', $self; };
  
          # Convert the input to the standard equivalent, if any (won't have any
          # for $STRING properties)
@@ -5075,7 +5563,7 @@ sub trace { return main::trace(@_); }
          my $self = shift;
          Carp::carp_extra_args(\@_) if main::DEBUG && @_;
  
-        my $addr = main::objaddr $self;
+        my $addr = do { no overloading; pack 'J', $self; };
  
          # If overridden, use that
          return $to_output_map{$addr} if defined $to_output_map{$addr};
@@ -5114,13 +5602,15 @@ sub trace { return main::trace(@_); }
          # Just before output, create the comment that heads the file
          # containing this table.
  
+        return unless $debugging_build;
+
          my $self = shift;
          Carp::carp_extra_args(\@_) if main::DEBUG && @_;
  
          # No sense generating a comment if aren't going to write it out.
          return if ! $self->to_output_map;
  
-        my $addr = main::objaddr $self;
+        my $addr = do { no overloading; pack 'J', $self; };
  
          my $property = $self->property;
  
@@ -5282,17 +5772,138 @@ END
  
      my %swash_keys; # Makes sure don't duplicate swash names.
  
+    # The remaining variables are temporaries used while writing each table,
+    # to output special ranges.  (Reset in write(); read back in pre_body().)
+    my $has_hangul_syllables;
+    my @multi_code_point_maps;  # Map is to more than one code point.
+
+    # The key is the base name of the code point, and the value is a hash
+    # whose 'low' and 'high' elements are parallel arrays giving the bounds
+    # of each range that uses this base name.
+    my %names_ending_in_code_point;
+
+    # Inverse mapping.  The list of ranges that have these kinds of
+    # names.  Each element is a hash containing the low and high code
+    # points of the range and its base name.
+    my @code_points_ending_in_code_point;
+
+    sub handle_special_range {
+        # Called by write() for each range that can't go in the main body of
+        # the table.  $range is that range.  Nothing is written here; what is
+        # needed is saved in the temporaries declared above, from which
+        # pre_body() later generates the special-case output.
+
+        my $self = shift;
+        my $range = shift;
+        Carp::carp_extra_args(\@_) if main::DEBUG && @_;
+
+        my $addr = do { no overloading; pack 'J', $self; };
+        my $type = $range->type;
+        my $low = $range->start;
+        my $high = $range->end;
+        my $map = $range->value;
+
+        # No need to output the range if it maps to the default.
+        return if $map eq $default_map{$addr};
+
+        # Switch based on the map type...
+        if ($type == $HANGUL_SYLLABLE) {
+
+            # These are entirely algorithmically determinable based on
+            # some constants furnished by Unicode; for now, just set a
+            # flag to indicate that we have them.  After everything is
+            # figured out, we will output the code that does the algorithm.
+            $has_hangul_syllables = 1;
+        }
+        elsif ($type == $CP_IN_NAME) {
+
+            # Code points whose name ends in their code point are also
+            # algorithmically determinable, but need information about the map
+            # to do so.  Both the map and its inverse are stored in data
+            # structures output in the file.
+            push @{$names_ending_in_code_point{$map}->{'low'}}, $low;
+            push @{$names_ending_in_code_point{$map}->{'high'}}, $high;
+
+            push @code_points_ending_in_code_point, { low => $low,
+                                                        high => $high,
+                                                        name => $map
+                                                    };
+        }
+        elsif ($type == $MULTI_CP || $type == $NULL) {
+
+            # Multi-code point maps and null string maps have an entry
+            # for each code point in the range.  They use the same
+            # output format.
+            CODE_POINT: for my $code_point ($low .. $high) {
+
+                # The pack() below can't cope with surrogates.
+                if ($code_point >= 0xD800 && $code_point <= 0xDFFF) {
+                    Carp::my_carp("Surrogate code point '$code_point' in mapping to '$map' in $self.  No map created");
+                    next CODE_POINT;
+                }
+
+                # Generate the hash entries for these in the form that
+                # utf8.c understands.
+                my $tostr = "";
+                my $to_name = "";
+                my $to_chr = "";
+                foreach my $to (split " ", $map) {
+                    if ($to !~ /^$code_point_re$/) {
+                        Carp::my_carp("Illegal code point '$to' in mapping '$map' from $code_point in $self.  No map created");
+                        next CODE_POINT;    # As promised: no partial map
+                    }
+                    $tostr .= sprintf "\\x{%s}", $to;
+                    $to = CORE::hex $to;
+                    if ($annotate) {
+                        $to_name .= " + " if $to_name;
+                        $to_chr .= chr($to);
+                        main::populate_char_info($to)
+                                            if ! defined $viacode[$to];
+                        $to_name .=  $viacode[$to];
+                    }
+                }
+
+                # The key is the UTF-8 encoding of the code point, written
+                # as a string of \xHH byte escapes; the value is $tostr.
+                my $utf8 = sprintf(qq["%s" => "$tostr",],
+                        join("", map { sprintf "\\x%02X", $_ }
+                            unpack("U0C*", pack("U", $code_point))));
+
+                # Add a comment so that a human reader can more easily
+                # see what's going on.
+                push @multi_code_point_maps,
+                        sprintf("%-45s # U+%04X", $utf8, $code_point);
+                if (! $annotate) {
+                    $multi_code_point_maps[-1] .= " => $map";
+                }
+                else {
+                    main::populate_char_info($code_point)
+                                    if ! defined $viacode[$code_point];
+                    $multi_code_point_maps[-1] .= " '"
+                        . chr($code_point)
+                        . "' => '$to_chr'; $viacode[$code_point] => $to_name";
+                }
+            }
+        }
+        else {
+            Carp::my_carp("Unrecognized map type '$type' in '$range' in $self.  Not written");
+        }
+
+        return;
+    }
+
      sub pre_body {
          # Returns the string that should be output in the file before the main
-        # body of this table.  This includes some hash entries identifying the
-        # format of the body, and what the single value should be for all
-        # ranges missing from it.  It also includes any code points which have
-        # map_types that don't go in the main table.
+        # body of this table.  It isn't called until the main body is
+        # calculated, saving a pass.  The string includes some hash entries
+        # identifying the format of the body, and what the single value should
+        # be for all ranges missing from it.  It also includes any code points
+        # which have map_types that don't go in the main table.
  
          my $self = shift;
          Carp::carp_extra_args(\@_) if main::DEBUG && @_;
  
-        my $addr = main::objaddr $self;
+        my $addr = do { no overloading; pack 'J', $self; };
  
          my $name = $self->property->swash_name;
  
@@ -5306,180 +5917,76 @@ END
          }
          $swash_keys{$name} = "$self";
  
-        my $default_map = $default_map{$addr};
-
          my $pre_body = "";
-        if ($has_specials{$addr}) {
-
-            # Here, some maps with non-zero type have been added to the table.
-            # Go through the table and handle each of them.  None will appear
-            # in the body of the table, so delete each one as we go.  The
-            # code point count has already been calculated, so ok to delete
-            # now.
-
-            my @multi_code_point_maps;
-            my $has_hangul_syllables = 0;
-
-            # The key is the base name of the code point, and the value is an
-            # array giving all the ranges that use this base name.  Each range
-            # is actually a hash giving the 'low' and 'high' values of it.
-            my %names_ending_in_code_point;
-
-            # Inverse mapping.  The list of ranges that have these kinds of
-            # names.  Each element contains the low, high, and base names in a
-            # hash.
-            my @code_points_ending_in_code_point;
-
-            my $range_map = $self->_range_list;
-            foreach my $range ($range_map->ranges) {
-                next unless $range->type != 0;
-                my $low = $range->start;
-                my $high = $range->end;
-                my $map = $range->value;
-                my $type = $range->type;
-
-                # No need to output the range if it maps to the default.  And
-                # the write method won't output it either, so no need to
-                # delete it to keep it from being output, and is faster to
-                # skip than to delete anyway.
-                next if $map eq $default_map;
-
-                # Delete the range to keep write() from trying to output it
-                $range_map->delete_range($low, $high);
-
-                # Switch based on the map type...
-                if ($type == $HANGUL_SYLLABLE) {
-
-                    # These are entirely algorithmically determinable based on
-                    # some constants furnished by Unicode; for now, just set a
-                    # flag to indicate that have them.  Below we will output
-                    # the code that does the algorithm.
-                    $has_hangul_syllables = 1;
-                }
-                elsif ($type == $CP_IN_NAME) {
-
-                    # If the name ends in the code point it represents, are
-                    # also algorithmically determinable, but need information
-                    # about the map to do so.  Both the map and its inverse
-                    # are stored in data structures output in the file.
-                    push @{$names_ending_in_code_point{$map}->{'low'}}, $low;
-                    push @{$names_ending_in_code_point{$map}->{'high'}}, $high;
-
-                    push @code_points_ending_in_code_point, { low => $low,
-                                                              high => $high,
-                                                              name => $map
-                                                            };
-                }
-                elsif ($range->type == $MULTI_CP || $range->type == $NULL) {
-
-                    # Multi-code point maps and null string maps have an entry
-                    # for each code point in the range.  They use the same
-                    # output format.
-                    for my $code_point ($low .. $high) {
-
-                        # The pack() below can't cope with surrogates.
-                        if ($code_point >= 0xD800 && $code_point <= 0xDFFF) {
-                            Carp::my_carp("Surrogage code point '$code_point' in mapping to '$map' in $self.  No map created");
-                            next;
-                        }
  
-                        # Generate the hash entries for these in the form that
-                        # utf8.c understands.
-                        my $tostr = "";
-                        foreach my $to (split " ", $map) {
-                            if ($to !~ /^$code_point_re$/) {
-                                Carp::my_carp("Illegal code point '$to' in mapping '$map' from $code_point in $self.  No map created");
-                                next;
-                            }
-                            $tostr .= sprintf "\\x{%s}", $to;
-                        }
-
-                        # I (khw) have never waded through this line to
-                        # understand it well enough to comment it.
-                        my $utf8 = sprintf(qq["%s" => "$tostr",],
-                                join("", map { sprintf "\\x%02X", $_ }
-                                    unpack("U0C*", pack("U", $code_point))));
-
-                        # Add a comment so that a human reader can more easily
-                        # see what's going on.
-                        push @multi_code_point_maps,
-                                sprintf("%-45s # U+%04X => %s", $utf8,
-                                                                $code_point,
-                                                                $map);
-                    }
-                }
-                else {
-                    Carp::my_carp("Unrecognized map type '$range->type' in '$range' in $self.  Using type 0 instead");
-                    $range_map->add_map($low, $high, $map, Replace => $UNCONDITIONALLY, Type => 0);
-                }
-            } # End of loop through all ranges
-
-            # Here have gone through the whole file.  If actually generated
-            # anything for each map type, add its respective header and
-            # trailer
-            if (@multi_code_point_maps) {
-                $pre_body .= <<END;
+        # Here we assume we were called after having gone through the whole
+        # file.  If we actually generated anything for a map type, add its
+        # respective header and trailer.
+        if (@multi_code_point_maps) {
+            $pre_body .= <<END;
  
  # Some code points require special handling because their mappings are each to
  # multiple code points.  These do not appear in the main body, but are defined
  # in the hash below.
  
-# The key: UTF-8 _bytes_, the value: UTF-8 (speed hack)
+# Each key is the string of N bytes that together make up the UTF-8 encoding
+# for the code point.  (i.e. the same as looking at the code point's UTF-8
+# under "use bytes").  Each value is the UTF-8 of the translation, for speed.
  %utf8::ToSpec$name = (
  END
-                $pre_body .= join("\n", @multi_code_point_maps) . "\n);\n";
-            }
-
-            if ($has_hangul_syllables || @code_points_ending_in_code_point) {
-
-                # Convert these structures to output format.
-                my $code_points_ending_in_code_point =
-                    main::simple_dumper(\@code_points_ending_in_code_point,
-                                        ' ' x 8);
-                my $names = main::simple_dumper(\%names_ending_in_code_point,
-                                                ' ' x 8);
-
-                # Do the same with the Hangul names,
-                my $jamo;
-                my $jamo_l;
-                my $jamo_v;
-                my $jamo_t;
-                my $jamo_re;
-                if ($has_hangul_syllables) {
-
-                    # Construct a regular expression of all the possible
-                    # combinations of the Hangul syllables.
-                    my @L_re;   # Leading consonants
-                    for my $i ($LBase .. $LBase + $LCount - 1) {
-                        push @L_re, $Jamo{$i}
-                    }
-                    my @V_re;   # Middle vowels
-                    for my $i ($VBase .. $VBase + $VCount - 1) {
-                        push @V_re, $Jamo{$i}
-                    }
-                    my @T_re;   # Trailing consonants
-                    for my $i ($TBase + 1 .. $TBase + $TCount - 1) {
-                        push @T_re, $Jamo{$i}
-                    }
-
-                    # The whole re is made up of the L V T combination.
-                    $jamo_re = '('
-                               . join ('|', sort @L_re)
-                               . ')('
-                               . join ('|', sort @V_re)
-                               . ')('
-                               . join ('|', sort @T_re)
-                               . ')?';
-
-                    # These hashes needed by the algorithm were generated
-                    # during reading of the Jamo.txt file
-                    $jamo = main::simple_dumper(\%Jamo, ' ' x 8);
-                    $jamo_l = main::simple_dumper(\%Jamo_L, ' ' x 8);
-                    $jamo_v = main::simple_dumper(\%Jamo_V, ' ' x 8);
-                    $jamo_t = main::simple_dumper(\%Jamo_T, ' ' x 8);
+            $pre_body .= join("\n", @multi_code_point_maps) . "\n);\n";
+        }
+
+        if ($has_hangul_syllables || @code_points_ending_in_code_point) {
+
+            # Convert these structures to output format.
+            my $code_points_ending_in_code_point =
+                main::simple_dumper(\@code_points_ending_in_code_point,
+                                    ' ' x 8);
+            my $names = main::simple_dumper(\%names_ending_in_code_point,
+                                            ' ' x 8);
+
+            # Do the same with the Hangul names,
+            my $jamo;
+            my $jamo_l;
+            my $jamo_v;
+            my $jamo_t;
+            my $jamo_re;
+            if ($has_hangul_syllables) {
+
+                # Construct a regular expression of all the possible
+                # combinations of the Hangul syllables.
+                my @L_re;   # Leading consonants
+                for my $i ($LBase .. $LBase + $LCount - 1) {
+                    push @L_re, $Jamo{$i}
+                }
+                my @V_re;   # Middle vowels
+                for my $i ($VBase .. $VBase + $VCount - 1) {
+                    push @V_re, $Jamo{$i}
+                }
+                my @T_re;   # Trailing consonants
+                for my $i ($TBase + 1 .. $TBase + $TCount - 1) {
+                    push @T_re, $Jamo{$i}
                  }
  
-                $pre_body .= <<END;
+                # The whole re is made up of the L V T combination.
+                $jamo_re = '('
+                            . join ('|', sort @L_re)
+                            . ')('
+                            . join ('|', sort @V_re)
+                            . ')('
+                            . join ('|', sort @T_re)
+                            . ')?';
+
+                # These hashes needed by the algorithm were generated
+                # during reading of the Jamo.txt file
+                $jamo = main::simple_dumper(\%Jamo, ' ' x 8);
+                $jamo_l = main::simple_dumper(\%Jamo_L, ' ' x 8);
+                $jamo_v = main::simple_dumper(\%Jamo_V, ' ' x 8);
+                $jamo_t = main::simple_dumper(\%Jamo_T, ' ' x 8);
+            }
+
+            $pre_body .= <<END;
  
  # To achieve significant memory savings when this file is read in,
  # algorithmically derivable code points are omitted from the main body below.
@@ -5506,10 +6013,10 @@ $names
  $code_points_ending_in_code_point
      );
  END
-                # Earlier releases didn't have Jamos.  No sense outputting
-                # them unless will be used.
-                if ($has_hangul_syllables) {
-                    $pre_body .= <<END;
+            # Earlier releases didn't have Jamos.  No sense outputting
+            # them unless they will be used.
+            if ($has_hangul_syllables) {
+                $pre_body .= <<END;
  
      # Convert from code point to Jamo short name for use in composing Hangul
      # syllable names
@@ -5541,19 +6048,19 @@ $jamo_t
      # These constants names and values were taken from the Unicode standard,
      # version 5.1, section 3.12.  They are used in conjunction with Hangul
      # syllables
-    my \$SBase = 0xAC00;
-    my \$LBase = 0x1100;
-    my \$VBase = 0x1161;
-    my \$TBase = 0x11A7;
-    my \$SCount = 11172;
-    my \$LCount = 19;
-    my \$VCount = 21;
-    my \$TCount = 28;
+    my \$SBase = $SBase_string;
+    my \$LBase = $LBase_string;
+    my \$VBase = $VBase_string;
+    my \$TBase = $TBase_string;
+    my \$SCount = $SCount;
+    my \$LCount = $LCount;
+    my \$VCount = $VCount;
+    my \$TCount = $TCount;
      my \$NCount = \$VCount * \$TCount;
  END
-                } # End of has Jamos
+            } # End of has Jamos
  
-                $pre_body .= << 'END';
+            $pre_body .= << 'END';
  
      sub name_to_code_point_special {
          my $name = shift;
@@ -5561,8 +6068,8 @@ END
          # Returns undef if not one of the specially handled names; otherwise
          # returns the code point equivalent to the input name
  END
-                if ($has_hangul_syllables) {
-                    $pre_body .= << 'END';
+            if ($has_hangul_syllables) {
+                $pre_body .= << 'END';
  
          if (substr($name, 0, $HANGUL_SYLLABLE_LENGTH) eq $HANGUL_SYLLABLE) {
              $name = substr($name, $HANGUL_SYLLABLE_LENGTH);
@@ -5573,8 +6080,8 @@ END
              return ($L * $VCount + $V) * $TCount + $T + $SBase;
          }
  END
-                }
-                $pre_body .= << 'END';
+            }
+            $pre_body .= << 'END';
  
          # Name must end in '-code_point' for this to handle.
          if ($name !~ /^ (.*) - ($code_point_re) $/x) {
@@ -5608,8 +6115,8 @@ END
          # Returns the name of a code point if algorithmically determinable;
          # undef if not
  END
-                if ($has_hangul_syllables) {
-                    $pre_body .= << 'END';
+            if ($has_hangul_syllables) {
+                $pre_body .= << 'END';
  
          # If in the Hangul range, calculate the name based on Unicode's
          # algorithm
@@ -5619,13 +6126,13 @@ END
              my $L = $LBase + $SIndex / $NCount;
              my $V = $VBase + ($SIndex % $NCount) / $TCount;
              my $T = $TBase + $SIndex % $TCount;
-            $name = "$HANGUL_SYLLABLE $Jamo{$L}$Jamo{$V}";
+            $name = "$HANGUL_SYLLABLE$Jamo{$L}$Jamo{$V}";
              $name .= $Jamo{$T} if $T != $TBase;
              return $name;
          }
  END
-                }
-                $pre_body .= << 'END';
+            }
+            $pre_body .= << 'END';
  
          # Look through list of these code points for one in range.
          foreach my $hash (@code_points_ending_in_code_point) {
@@ -5639,13 +6146,50 @@ END
  } # End closure
  
  END
-            } # End of has hangul or code point in name maps.
-        } # End of has specials
+        } # End of has hangul or code point in name maps.
+
+        my $format = $self->format;
+
+        my $return = <<END;
+# The name this swash is to be known by, with the format of the mappings in
+# the main body of the table, and what all code points missing from this file
+# map to.
+\$utf8::SwashInfo{'To$name'}{'format'} = '$format'; # $map_table_formats{$format}
+END
+        my $default_map = $default_map{$addr};
+        $return .= "\$utf8::SwashInfo{'To$name'}{'missing'} = '$default_map';";
+
+        if ($default_map eq $CODE_POINT) {
+            $return .= ' # code point maps to itself';
+        }
+        elsif ($default_map eq "") {
+            $return .= ' # code point maps to the null string';
+        }
+        $return .= "\n";
+
+        $return .= $pre_body;
+
+        return $return;
+    }
+
+    sub write {
+        # Write the table to the file.
+
+        my $self = shift;
+        Carp::carp_extra_args(\@_) if main::DEBUG && @_;
+
+        my $addr = do { no overloading; pack 'J', $self; };
+
+        # Clear the temporaries
+        $has_hangul_syllables = 0;
+        undef @multi_code_point_maps;
+        undef %names_ending_in_code_point;
+        undef @code_points_ending_in_code_point;
  
          # Calculate the format of the table if not already done.
-        my $format = $format{$addr};
-        my $property = $self->property;
-        my $type = $property->type;
+        my $format = $self->format;
+        my $type = $self->property->type;
+        my $default_map = $self->default_map;
          if (! defined $format) {
              if ($type == $BINARY) {
  
@@ -5676,6 +6220,8 @@ END
                      # most restrictive, and so on.
                      $format = $DECIMAL_FORMAT;
                      foreach my $range (@ranges) {
+                        next if $range->type != 0;  # Non-normal ranges don't
+                                                    # affect the main body
                          my $map = $range->value;
                          if ($map ne $default_map) {
                              last if $format eq $STRING_FORMAT;  # already at
@@ -5701,53 +6247,27 @@ END
              }
          } # end of calculating format
  
-        my $return = <<END;
-# The name this swash is to be known by, with the format of the mappings in
-# the main body of the table, and what all code points missing from this file
-# map to.
-\$utf8::SwashInfo{'To$name'}{'format'} = '$format'; # $map_table_formats{$format}
-END
-        my $missing = $default_map;
-        if ($missing eq $CODE_POINT
+        if ($default_map eq $CODE_POINT
              && $format ne $HEX_FORMAT
-            && ! defined $format{$addr})    # Is expected if was manually set
+            && ! defined $self->format)    # manual settings are always
+                                           # considered ok
          {
              Carp::my_carp_bug("Expecting hex format for mapping table for $self, instead got '$format'")
          }
-        $format{$addr} = $format;
-        $return .= "\$utf8::SwashInfo{'To$name'}{'missing'} = '$missing';";
-        if ($missing eq $CODE_POINT) {
-            $return .= ' # code point maps to itself';
-        }
-        elsif ($missing eq "") {
-            $return .= ' # code point maps to the null string';
-        }
-        $return .= "\n";
-
-        $return .= $pre_body;
-
-        return $return;
-    }
-
-    sub write {
-        # Write the table to the file.
-
-        my $self = shift;
-        Carp::carp_extra_args(\@_) if main::DEBUG && @_;
  
-        my $addr = main::objaddr $self;
+        $self->_set_format($format);
  
          return $self->SUPER::write(
              ($self->property == $block)
                  ? 7     # block file needs more tab stops
                  : 3,
-            $default_map{$addr});   # don't write defaulteds
+            $default_map);   # don't write defaulteds
      }
  
      # Accessors for the underlying list that should fail if locked.
-    for my $sub qw(
+    for my $sub (qw(
                      add_duplicate
-                )
+                ))
      {
          no strict "refs";
          *$sub = sub {
@@ -5859,6 +6379,7 @@ sub trace { return main::trace(@_); }
          # Optional
          my $initialize = delete $args{'Initialize'};
          my $matches_all = delete $args{'Matches_All'} || 0;
+        my $format = delete $args{'Format'};
          # Rest of parameters passed on.
  
          my $range_list = Range_List->new(Initialize => $initialize,
@@ -5875,15 +6396,15 @@ sub trace { return main::trace(@_); }
          # places in this program that assume an equal sign)
          $complete = $property->full_name . "=$complete" if $property != $perl;
  
-
          my $self = $class->SUPER::new(%args,
                                        Name => $name,
                                        Complete_Name => $complete,
                                        Full_Name => $full_name,
                                        _Property => $property,
                                        _Range_List => $range_list,
+                                      Format => $EMPTY_FORMAT,
                                        );
-        my $addr = main::objaddr $self;
+        my $addr = do { no overloading; pack 'J', $self; };
  
          $conflicting{$addr} = [ ];
          $equivalents{$addr} = [ ];
@@ -5892,6 +6413,10 @@ sub trace { return main::trace(@_); }
          $leader{$addr} = $self;
          $parent{$addr} = $self;
  
+        if (defined $format && $format ne $EMPTY_FORMAT) {
+            Carp::my_carp_bug("'Format' must be '$EMPTY_FORMAT' in a match table instead of '$format'.  Using '$EMPTY_FORMAT'");
+        }
+
          return $self;
      }
  
@@ -5924,7 +6449,7 @@ sub trace { return main::trace(@_); }
  
                          return if $self->carp_if_locked;
  
-                        my $addr = main::objaddr $self;
+                        my $addr = do { no overloading; pack 'J', $self; };
  
                          if (ref $other) {
  
@@ -5991,7 +6516,7 @@ sub trace { return main::trace(@_); }
                                          # be an optional parameter.
          Carp::carp_extra_args(\@_) if main::DEBUG && @_;
  
-        my $addr = main::objaddr $self;
+        my $addr = do { no overloading; pack 'J', $self; };
  
          # Check if the conflicting name is exactly the same as any existing
          # alias in this table (as long as there is a real object there to
@@ -6020,7 +6545,7 @@ sub trace { return main::trace(@_); }
          return;
      }
  
-    sub is_equivalent_to {
+    sub is_set_equivalent_to {
          # Return boolean of whether or not the other object is a table of this
          # type and has been marked equivalent to this one.
  
@@ -6033,53 +6558,16 @@ sub trace { return main::trace(@_); }
          unless ($other->isa(__PACKAGE__)) {
              my $ref_other = ref $other;
              my $ref_self = ref $self;
-            Carp::my_carp_bug("Argument to 'is_equivalent_to' must be another $ref_self, not a '$ref_other'.  $other not set equivalent to $self.");
+            Carp::my_carp_bug("Argument to 'is_set_equivalent_to' must be another $ref_self, not a '$ref_other'.  $other not set equivalent to $self.");
              return 0;
          }
  
          # Two tables are equivalent if they have the same leader.
-        return $leader{main::objaddr $self}
-                == $leader{main::objaddr $other};
+        no overloading;
+        return $leader{pack 'J', $self} == $leader{pack 'J', $other};
          return;
      }
  
-    sub matches_identically_to {
-        # Return a boolean as to whether or not two tables match identical
-        # sets of code points.
-
-        my $self = shift;
-        my $other = shift;
-        Carp::carp_extra_args(\@_) if main::DEBUG && @_;
-
-        unless ($other->isa(__PACKAGE__)) {
-            my $ref_other = ref $other;
-            my $ref_self = ref $self;
-            Carp::my_carp_bug("Argument to 'matches_identically_to' must be another $ref_self, not a '$ref_other'.  $other not set equivalent to $self.");
-            return 0;
-        }
-
-        # These are ordered in increasing real time to figure out (at least
-        # until a patch changes that and doesn't change this)
-        return 0 if $self->max != $other->max;
-        return 0 if $self->min != $other->min;
-        return 0 if $self->range_count != $other->range_count;
-        return 0 if $self->count != $other->count;
-
-        # Here they could be identical because all the tests above passed.
-        # The loop below is somewhat simpler since we know they have the same
-        # number of elements.  Compare range by range, until reach the end or
-        # find something that differs.
-        my @a_ranges = $self->_range_list->ranges;
-        my @b_ranges = $other->_range_list->ranges;
-        for my $i (0 .. @a_ranges - 1) {
-            my $a = $a_ranges[$i];
-            my $b = $b_ranges[$i];
-            trace "self $a; other $b" if main::DEBUG && $to_trace;
-            return 0 if $a->start != $b->start || $a->end != $b->end;
-        }
-        return 1;
-    }
-
      sub set_equivalent_to {
          # Set $self equivalent to the parameter table.
          # The required Related => 'x' parameter is a boolean indicating
@@ -6090,7 +6578,7 @@ sub trace { return main::trace(@_); }
          # not quite so many.
          # If they are related, one must be a perl extension.  This is because
          # we can't guarantee that Unicode won't change one or the other in a
-        # later release even if they are idential now.
+        # later release even if they are identical now.
  
          my $self = shift;
          my $other = shift;
@@ -6110,23 +6598,31 @@ sub trace { return main::trace(@_); }
  
          # If already are equivalent, no need to re-do it;  if subroutine
          # returns null, it found an error, also do nothing
-        my $are_equivalent = $self->is_equivalent_to($other);
+        my $are_equivalent = $self->is_set_equivalent_to($other);
          return if ! defined $are_equivalent || $are_equivalent;
  
-        my $current_leader = ($related)
-                             ? $parent{main::objaddr $self}
-                             : $leader{main::objaddr $self};
+        my $addr = do { no overloading; pack 'J', $self; };
+        my $current_leader = ($related) ? $parent{$addr} : $leader{$addr};
  
-        if ($related &&
-            ! $other->perl_extension
-            && ! $current_leader->perl_extension)
-        {
-            Carp::my_carp_bug("set_equivalent_to should have 'Related => 0 for equivalencing two Unicode properties.  Assuming $self is not related to $other");
-            $related = 0;
+        if ($related) {
+            if ($current_leader->perl_extension) {
+                if ($other->perl_extension) {
+                    Carp::my_carp_bug("Use add_alias() to set two Perl tables '$self' and '$other', equivalent.");
+                    return;
+                }
+            } elsif (! $other->perl_extension) {
+                Carp::my_carp_bug("set_equivalent_to should have 'Related => 0 for equivalencing two Unicode properties.  Assuming $self is not related to $other");
+                $related = 0;
+            }
+        }
+
+        if (! $self->is_empty && ! $self->matches_identically_to($other)) {
+            Carp::my_carp_bug("$self should be empty or match identically to $other.  Not setting equivalent");
+            return;
          }
  
-        my $leader = main::objaddr $current_leader;
-        my $other_addr = main::objaddr $other;
+        my $leader = do { no overloading; pack 'J', $current_leader; };
+        my $other_addr = do { no overloading; pack 'J', $other; };
  
          # Any tables that are equivalent to or children of this table must now
          # instead be equivalent to or (children) to the new leader (parent),
@@ -6137,11 +6633,12 @@ sub trace { return main::trace(@_); }
          my $status = $other->status;
          my $status_info = $other->status_info;
          my $matches_all = $matches_all{other_addr};
+        my $caseless_equivalent = $other->caseless_equivalent;
          foreach my $table ($current_leader, @{$equivalents{$leader}}) {
              next if $table == $other;
              trace "setting $other to be the leader of $table, status=$status" if main::DEBUG && $to_trace;
  
-            my $table_addr = main::objaddr $table;
+            my $table_addr = do { no overloading; pack 'J', $table; };
              $leader{$table_addr} = $other;
              $matches_all{$table_addr} = $matches_all;
              $self->_set_range_list($other->_range_list);
@@ -6150,6 +6647,7 @@ sub trace { return main::trace(@_); }
                  $parent{$table_addr} = $other;
                  push @{$children{$other_addr}}, $table;
                  $table->set_status($status, $status_info);
+                $self->set_caseless_equivalent($caseless_equivalent);
              }
          }
  
@@ -6191,11 +6689,13 @@ sub trace { return main::trace(@_); }
          # ones that share the same file.  It lists all such tables, ordered so
          # that related ones are together.
  
+        return unless $debugging_build;
+
          my $leader = shift;   # Should only be called on the leader table of
                                # an equivalent group
          Carp::carp_extra_args(\@_) if main::DEBUG && @_;
  
-        my $addr = main::objaddr $leader;
+        my $addr = do { no overloading; pack 'J', $leader; };
  
          if ($leader{$addr} != $leader) {
              Carp::my_carp_bug(<<END
@@ -6250,7 +6750,7 @@ END
                  && $parent == $property->table('N')
                  && defined (my $yes = $property->table('Y')))
              {
-                my $yes_addr = main::objaddr $yes;
+                my $yes_addr = do { no overloading; pack 'J', $yes; };
                  @yes_perl_synonyms
                      = grep { $_->property == $perl }
                                      main::uniques($yes,
@@ -6266,11 +6766,12 @@ END
              my @conflicting;        # Will hold the table conflicts.
  
              # Look at the parent, any yes synonyms, and all the children
+            my $parent_addr = do { no overloading; pack 'J', $parent; };
              for my $table ($parent,
                             @yes_perl_synonyms,
-                           @{$children{main::objaddr $parent}})
+                           @{$children{$parent_addr}})
              {
-                my $table_addr = main::objaddr $table;
+                my $table_addr = do { no overloading; pack 'J', $table; };
                  my $table_property = $table->property;
  
                  # Tables are separated by a blank line to create a grouping.
@@ -6516,10 +7017,10 @@ END
      }
  
      # Accessors for the underlying list
-    for my $sub qw(
+    for my $sub (qw(
                      get_valid_code_point
                      get_invalid_code_point
-                )
+                ))
      {
          no strict "refs";
          *$sub = sub {
@@ -6586,7 +7087,7 @@ sub trace { return main::trace(@_) if main::DEBUG && $to_trace }
          # each of them is stored in %alias_to_property_of as they are defined.
          # But it's possible that this subroutine will be called with some
          # variant, so if the initial lookup fails, it is repeated with the
-        # standarized form of the input name.  If found, besides returning the
+        # standardized form of the input name.  If found, besides returning the
          # result, the input name is added to the list so future calls won't
          # have to do the conversion again.
  
@@ -6687,7 +7188,7 @@ sub trace { return main::trace(@_) if main::DEBUG && $to_trace }
          my %args = @_;
  
          $self = bless \do { my $anonymous_scalar }, $class;
-        my $addr = main::objaddr $self;
+        my $addr = do { no overloading; pack 'J', $self; };
  
          $directory{$addr} = delete $args{'Directory'};
          $file{$addr} = delete $args{'File'};
@@ -6740,14 +7241,15 @@ sub trace { return main::trace(@_) if main::DEBUG && $to_trace }
                          . " argument to '-='.  Subtraction ignored.");
              return $self;
          }
-        elsif ($reversed) {   # Shouldnt happen in a -=, but just in case
+        elsif ($reversed) {   # Shouldn't happen in a -=, but just in case
              Carp::my_carp_bug("Can't cope with a "
              .  __PACKAGE__
              . " being the first parameter in a '-='.  Subtraction ignored.");
              return $self;
          }
          else {
-            $map{main::objaddr $self}->delete_range($other, $other);
+            no overloading;
+            $map{pack 'J', $self}->delete_range($other, $other);
          }
          return $self;
      }
@@ -6760,7 +7262,7 @@ sub trace { return main::trace(@_) if main::DEBUG && $to_trace }
          my $name = shift;
          my %args = @_;
  
-        my $addr = main::objaddr $self;
+        my $addr = do { no overloading; pack 'J', $self; };
  
          my $table = $table_ref{$addr}{$name};
          my $standard_name = main::standardize($name);
@@ -6828,7 +7330,7 @@ sub trace { return main::trace(@_) if main::DEBUG && $to_trace }
          my $name = shift;
          Carp::carp_extra_args(\@_) if main::DEBUG && @_;
  
-        my $addr = main::objaddr $self;
+        my $addr = do { no overloading; pack 'J', $self; };
  
          return $table_ref{$addr}{$name} if defined $table_ref{$addr}{$name};
  
@@ -6846,7 +7348,8 @@ sub trace { return main::trace(@_) if main::DEBUG && $to_trace }
          # Return a list of pointers to all the match tables attached to this
          # property
  
-        return main::uniques(values %{$table_ref{main::objaddr shift}});
+        no overloading;
+        return main::uniques(values %{$table_ref{pack 'J', shift}});
      }
  
      sub directory {
@@ -6855,7 +7358,7 @@ sub trace { return main::trace(@_) if main::DEBUG && $to_trace }
          # priority;  'undef' is returned if the type isn't defined;
          # or $map_directory for everything else.
  
-        my $addr = main::objaddr shift;
+        my $addr = do { no overloading; pack 'J', shift; };
  
          return $directory{$addr} if defined $directory{$addr};
          return undef if $type{$addr} == $UNKNOWN;
@@ -6876,7 +7379,7 @@ sub trace { return main::trace(@_) if main::DEBUG && $to_trace }
          my $self = shift;
          Carp::carp_extra_args(\@_) if main::DEBUG && @_;
  
-        my $addr = main::objaddr $self;
+        my $addr = do { no overloading; pack 'J', $self; };
  
          return $file{$addr} if defined $file{$addr};
          return $map{$addr}->external_name;
@@ -6892,7 +7395,7 @@ sub trace { return main::trace(@_) if main::DEBUG && $to_trace }
          # The whole point of this pseudo property is match tables.
          return 1 if $self == $perl;
  
-        my $addr = main::objaddr $self;
+        my $addr = do { no overloading; pack 'J', $self; };
  
          # Don't generate tables of code points that match the property values
          # of a string property.  Such a list would most likely have many
@@ -6926,8 +7429,8 @@ sub trace { return main::trace(@_) if main::DEBUG && $to_trace }
              return;
          }
  
-        return $map{main::objaddr $self}->
-                map_add_or_replace_non_nulls($map{main::objaddr $other});
+        no overloading;
+        return $map{pack 'J', $self}->map_add_or_replace_non_nulls($map{pack 'J', $other});
      }
  
      sub set_type {
@@ -6946,7 +7449,7 @@ sub trace { return main::trace(@_) if main::DEBUG && $to_trace }
              return;
          }
  
-        $type{main::objaddr $self} = $type;
+        { no overloading; $type{pack 'J', $self} = $type; }
          return if $type != $BINARY;
  
          my $yes = $self->table('Y');
@@ -6976,7 +7479,7 @@ sub trace { return main::trace(@_) if main::DEBUG && $to_trace }
          my $map = shift;    # What the range maps to.
          # Rest of parameters passed on.
  
-        my $addr = main::objaddr $self;
+        my $addr = do { no overloading; pack 'J', $self; };
  
          # If haven't the type of the property, gather information to figure it
          # out.
@@ -7028,7 +7531,7 @@ sub trace { return main::trace(@_) if main::DEBUG && $to_trace }
          my $self = shift;
          Carp::carp_extra_args(\@_) if main::DEBUG && @_;
  
-        my $addr = main::objaddr($self);
+        my $addr = do { no overloading; pack 'J', $self; };
  
          my $type = $type{$addr};
  
@@ -7082,7 +7585,7 @@ sub trace { return main::trace(@_) if main::DEBUG && $to_trace }
  
      # Most of the accessors for a property actually apply to its map table.
      # Setup up accessor functions for those, referring to %map
-    for my $sub qw(
+    for my $sub (qw(
                      add_alias
                      add_anomalous_entry
                      add_comment
@@ -7093,6 +7596,7 @@ sub trace { return main::trace(@_) if main::DEBUG && $to_trace }
                      aliases
                      comment
                      complete_name
+                    containing_range
                      core_access
                      count
                      default_map
@@ -7125,9 +7629,10 @@ sub trace { return main::trace(@_) if main::DEBUG && $to_trace }
                      status
                      status_info
                      to_output_map
+                    type_of
                      value_of
                      write
-                )
+                ))
                      # 'property' above is for symmetry, so that one can take
                      # the property of a property and get itself, and so don't
                      # have to distinguish between properties and tables in
@@ -7137,7 +7642,8 @@ sub trace { return main::trace(@_) if main::DEBUG && $to_trace }
          *$sub = sub {
              use strict "refs";
              my $self = shift;
-            return $map{main::objaddr $self}->$sub(@_);
+            no overloading;
+            return $map{pack 'J', $self}->$sub(@_);
          }
      }
  
@@ -7158,7 +7664,7 @@ sub join_lines($) {
      # A blank separates the joined lines except if there is a break; an extra
      # blank is inserted after a period ending a line.
  
-    # Intialize the return with the first line.
+    # Initialize the return with the first line.
      my ($return, @lines) = split "\n", shift;
  
      # If the first line is null, it was an empty line, add the \n back in
@@ -7400,19 +7906,15 @@ sub force_unlink ($) {
      return;
  }
  
-sub write ($\@) {
-    # Given a filename and a reference to an array of lines, write the lines
-    # to the file
+sub write ($$@) {
+    # Given a filename, a boolean for whether to write it as UTF-8, and
+    # references to arrays of lines, write the lines of each array to the file
      # Filename can be given as an arrayref of directory names
  
-    my $file  = shift;
-    my $lines_ref = shift;
-    Carp::carp_extra_args(\@_) if main::DEBUG && @_;
+    return Carp::carp_too_few_args(\@_, 3) if main::DEBUG && @_ < 3;
  
-    if (! defined $lines_ref) {
-        Carp::my_carp("Missing lines to write parameter for $file.  Writing skipped;");
-        return;
-    }
+    my $file  = shift;
+    my $use_utf8 = shift;
  
      # Get into a single string if an array, and get rid of, in Unix terms, any
      # leading '.'
@@ -7425,15 +7927,6 @@ sub write ($\@) {
  
      push @files_actually_output, $file;
  
-    my $text;
-    if (@$lines_ref) {
-        $text = join "", @$lines_ref;
-    }
-    else {
-        $text = "";
-        Carp::my_carp("Output file '$file' is empty; writing it anyway;");
-    }
-
      force_unlink ($file);
  
      my $OUT;
@@ -7441,10 +7934,20 @@ sub write ($\@) {
          Carp::my_carp("can't open $file for output.  Skipping this file: $!");
          return;
      }
+
+    binmode $OUT, ":utf8" if $use_utf8;
+
+    while (defined (my $lines_ref = shift)) {
+        unless (@$lines_ref) {
+            Carp::my_carp("An array of lines for writing to file '$file' is empty; writing it anyway;");
+        }
+
+        print $OUT @$lines_ref or die Carp::my_carp("write to '$file' failed: $!");
+    }
+    close $OUT or die Carp::my_carp("close '$file' failed: $!");
+
      print "$file written.\n" if $verbosity >= $VERBOSE;
  
-    print $OUT $text;
-    close $OUT;
      return;
  }
  
@@ -7463,7 +7966,7 @@ sub Standardize($) {
      $name =~ s/^\s+//g;
      $name =~ s/\s+$//g;
  
-    # Convert interior white space and hypens into underscores.
+    # Convert interior white space and hyphens into underscores.
      $name =~ s/ (?<= .) [ -]+ (.) /_$1/xg;
  
      # Capitalize the letter following an underscore, and convert a sequence of
@@ -7491,6 +7994,30 @@ sub standardize ($) {
      return lc $name;
  }
  
+sub utf8_heavy_name ($$) {
+    # Returns the name that utf8_heavy.pl will use to find a table, built from
+    # $table's property and $alias's name.  XXX perhaps this function should
+    # be placed somewhere, like Heavy.pl, so that utf8_heavy can use it
+    # directly without duplicating code that can get out of sync.
+
+    my $table = shift;
+    my $alias = shift;
+    Carp::carp_extra_args(\@_) if main::DEBUG && @_;
+
+    my $property = $table->property;
+    $property = ($property == $perl)
+                ? ""                # 'perl' is never explicitly stated
+                : standardize($property->name) . '=';
+    if ($alias->loose_match) {  # Loose: the alias name is standardized too
+        return $property . standardize($alias->name);
+    }
+    else {                      # Otherwise the result is only lowercased
+        return lc ($property . $alias->name);
+    }
+
+    return;     # Not reached; both branches above return
+}
+
  {   # Closure
  
      my $indent_increment = " " x 2;
@@ -7545,10 +8072,11 @@ sub standardize ($) {
          else {
  
              # Keep track of cycles in the input, and refuse to infinitely loop
-            if (defined $already_output{main::objaddr $item}) {
+            my $addr = do { no overloading; pack 'J', $item; };
+            if (defined $already_output{$addr}) {
                  return "${indent}ALREADY OUTPUT: $item\n";
              }
-            $already_output{main::objaddr $item} = $item;
+            $already_output{$addr} = $item;
  
              if (ref $item eq 'ARRAY') {
                  my $using_brackets;
@@ -7665,7 +8193,7 @@ sub dump_inside_out {
      my $fields_ref = shift;
      Carp::carp_extra_args(\@_) if main::DEBUG && @_;
  
-    my $addr = main::objaddr $object;
+    my $addr = do { no overloading; pack 'J', $object; };
  
      my %hash;
      foreach my $key (keys %$fields_ref) {
@@ -7693,7 +8221,7 @@ sub _operator_dot {
          }
          else {
              my $ref = ref $$which;
-            my $addr = main::objaddr $$which;
+            my $addr = do { no overloading; pack 'J', $$which; };
              $$which = "$ref ($addr)";
          }
      }
@@ -7711,7 +8239,8 @@ sub _operator_equal {
  
      return 0 unless defined $other;
      return 0 unless ref $other;
-    return main::objaddr $self == main::objaddr $other;
+    no overloading;
+    return $self == $other;
  }
  
  sub _operator_not_equal {
@@ -7772,7 +8301,7 @@ sub finish_property_setup {
          }
      }
  
-    # This entry is still missing as of 5.2, perhaps because no short name for
+    # This entry is still missing as of 6.0, perhaps because no short name for
      # it.
      if (-e 'NameAliases.txt') {
          my $aliases = property_ref('Name_Alias');
@@ -7804,9 +8333,9 @@ sub finish_property_setup {
      my $fold = property_ref('Case_Folding');
      $fold->set_file('Fold') if defined $fold;
  
-    # utf8.c can't currently cope with non range-size-1 for these, and even if
-    # it were changed to do so, someone else may be using them, expecting the
-    # old style
+    # utf8.c has a different meaning for non range-size-1 for map properties
+    # that this program doesn't currently handle; and even if it were changed
+    # to do so, some other code may be using them expecting range size 1.
      foreach my $property (qw {
                                  Case_Folding
                                  Lowercase_Mapping
@@ -7862,7 +8391,7 @@ sub finish_property_setup {
          ;
  
          # The defaults apply only to unassigned characters
-        $default_R .= '$gc->table("Cn") & $default;';
+        $default_R .= '$gc->table("Unassigned") & $default;';
  
          if ($v_version lt v3.0.0) {
              $default = Multi_Default->new(R => $default_R, 'L');
@@ -7882,7 +8411,7 @@ sub finish_property_setup {
              if ($v_version ge 3.1.0) {
                  $default_AL .= '$default->delete_range(0xFDD0, 0xFDEF);';
              }
-            $default_AL .= '$gc->table("Cn") & $default';
+            $default_AL .= '$gc->table("Unassigned") & $default';
              $default = Multi_Default->new(AL => $default_AL,
                                            R => $default_R,
                                            'L');
@@ -8497,6 +9026,17 @@ END
      return @return;
  }
  
+sub output_perl_charnames_line ($$) {
+
+    # Returns one Perl_charnames entry: the first argument as hex using 5
+    # digits instead of four, a tab, the second argument, and a newline.  This
+    # makes the entries a constant length, and simplifies charnames.pm which
+    # this table is for.  Unicode can have 6 digit ordinals, but they are all
+    # private use or noncharacters which have no names, so won't be in it.
+
+    return sprintf "%05X\t%s\n", $_[0], $_[1];
+}
+
  { # Closure
      # This is used to store the range list of all the code points usable when
      # the little used $compare_versions feature is enabled.
@@ -8513,11 +9053,11 @@ END
          # 0374          ; NFD_QC; N
          # 003C..003E    ; Math
          #
-        # the fields are: "codepoint range ; property; map"
+        # the fields are: "codepoint-range ; property; map"
          #
          # meaning the codepoints in the range all have the value 'map' under
          # 'property'.
-        # Beginning and trailing white space in each field are not signficant.
+        # Beginning and trailing white space in each field are not significant.
          # Note there is not a trailing semi-colon in the above.  A trailing
          # semi-colon means the map is a null-string.  An omitted map, as
          # opposed to a null-string, is assumed to be 'Y', based on Unicode
@@ -8537,8 +9077,8 @@ END
          # file, in any order, interspersed in any way.  The first time a
          # property is seen, it gets information about that property and
          # caches it for quick retrieval later.  It also normalizes the maps
-        # so that only one of many synonym is stored.  The Unicode input files
-        # do use some multiple synonyms.
+        # so that only one of many synonyms is stored.  The Unicode input
+        # files do use some multiple synonyms.
  
          my $file = shift;
          Carp::carp_extra_args(\@_) if main::DEBUG && @_;
@@ -8672,7 +9212,7 @@ END
                      $file->carp_bad_line("Unexpected property '$property_name'.  Skipped");
                      next LINE;
                  }
-                $property_addr = main::objaddr($property_object);
+                { no overloading; $property_addr = pack 'J', $property_object; }
  
                  # Defer changing names until have a line that is acceptable
                  # (the 'next' statement above means is unacceptable)
@@ -8724,7 +9264,7 @@ END
                                              if $file->has_missings_defaults;
                      foreach my $default_ref (@missings_list) {
                          my $default = $default_ref->[0];
-                        my $addr = objaddr property_ref($default_ref->[1]);
+                        my $addr = do { no overloading; pack 'J', property_ref($default_ref->[1]); };
  
                          # For string properties, the default is just what the
                          # file says, but non-string properties should already
@@ -8847,19 +9387,17 @@ END
  
                  # If the map begins with a special command to us (enclosed in
                  # delimiters), extract the command(s).
-                if (substr($map, 0, 1) eq $CMD_DELIM) {
-                    while ($map =~ s/ ^ $CMD_DELIM (.*?) $CMD_DELIM //x) {
-                        my $command = $1;
-                        if ($command =~  / ^ $REPLACE_CMD= (.*) /x) {
-                            $replace = $1;
-                        }
-                        elsif ($command =~  / ^ $MAP_TYPE_CMD= (.*) /x) {
-                            $map_type = $1;
-                        }
-                        else {
-                           $file->carp_bad_line("Unknown command line: '$1'");
-                           next LINE;
-                        }
+                while ($map =~ s/ ^ $CMD_DELIM (.*?) $CMD_DELIM //x) {
+                    my $command = $1;
+                    if ($command =~  / ^ $REPLACE_CMD= (.*) /x) {
+                        $replace = $1;
+                    }
+                    elsif ($command =~  / ^ $MAP_TYPE_CMD= (.*) /x) {
+                        $map_type = $1;
+                    }
+                    else {
+                        $file->carp_bad_line("Unknown command line: '$1'");
+                        next LINE;
                      }
                  }
              }
@@ -8939,23 +9477,6 @@ END
      }
  }
  
-# XXX Unused until revise charnames;
-#sub check_and_handle_compound_name {
-#    This looks at Name properties for parenthesized components and splits
-#    them off.  Thus it finds FF as an equivalent to Form Feed.
-#    my $code_point = shift;
-#    my $name = shift;
-#    if ($name =~ /^ ( .*? ) ( \s* ) \( ( [^)]* ) \) (.*) $/x) {
-#        #local $to_trace = 1 if main::DEBUG;
-#        trace $1, $2, $3, $4 if main::DEBUG && $to_trace;
-#        push @more_Names, "$code_point; $1";
-#        push @more_Names, "$code_point; $3";
-#        Carp::my_carp_bug("Expecting blank space before left parenthesis in '$_'.  Proceeding and assuming it was there;") if $2 ne " ";
-#        Carp::my_carp_bug("Not expecting anything after the right parenthesis in '$_'.  Proceeding and ignoring that;") if $4 ne "";
-#    }
-#    return;
-#}
-
  { # Closure for UnicodeData.txt handling
  
      # This file was the first one in the UCD; its design leads to some
@@ -8963,7 +9484,7 @@ END
      # 0041;LATIN CAPITAL LETTER A;Lu;0;L;;;;;N;;;;0061;
      # The fields in order are:
      my $i = 0;            # The code point is in field 0, and is shifted off.
-    my $NAME = $i++;      # character name (e.g. "LATIN CAPITAL LETTER A")
+    my $CHARNAME = $i++;  # character name (e.g. "LATIN CAPITAL LETTER A")
      my $CATEGORY = $i++;  # category (e.g. "Lu")
      my $CCC = $i++;       # Canonical combining class (e.g. "230")
      my $BIDI = $i++;      # directional class (e.g. "L")
@@ -8982,7 +9503,14 @@ END
  
      # This routine in addition outputs these extra fields:
      my $DECOMP_TYPE = $i++; # Decomposition type
-    my $DECOMP_MAP = $i++;  # Must be last; another decomposition mapping
+
+    # These fields are modifications of ones above, and are usually
+    # suppressed; they must come last, as for speed, the loop upper bound is
+    # normally set to ignore them
+    my $NAME = $i++;        # This is the strict name field, not the one that
+                            # charnames uses.
+    my $DECOMP_MAP = $i++;  # Strict decomposition mapping; not the one used
+                            # by Unicode::Normalize
      my $last_field = $i - 1;
  
      # All these are read into an array for each line, with the indices defined
@@ -8995,31 +9523,44 @@ END
      $field_names[$BIDI] = 'Bidi_Class';
      $field_names[$CATEGORY] = 'General_Category';
      $field_names[$CCC] = 'Canonical_Combining_Class';
+    $field_names[$CHARNAME] = 'Perl_Charnames';
      $field_names[$COMMENT] = 'ISO_Comment';
      $field_names[$DECOMP_MAP] = 'Decomposition_Mapping';
      $field_names[$DECOMP_TYPE] = 'Decomposition_Type';
-    $field_names[$LOWER] = 'Simple_Lowercase_Mapping';
+    $field_names[$LOWER] = 'Lowercase_Mapping';
      $field_names[$MIRRORED] = 'Bidi_Mirrored';
      $field_names[$NAME] = 'Name';
      $field_names[$NUMERIC] = 'Numeric_Value';
      $field_names[$NUMERIC_TYPE_OTHER_DIGIT] = 'Numeric_Type';
      $field_names[$PERL_DECIMAL_DIGIT] = 'Perl_Decimal_Digit';
      $field_names[$PERL_DECOMPOSITION] = 'Perl_Decomposition_Mapping';
-    $field_names[$TITLE] = 'Simple_Titlecase_Mapping';
+    $field_names[$TITLE] = 'Titlecase_Mapping';
      $field_names[$UNICODE_1_NAME] = 'Unicode_1_Name';
-    $field_names[$UPPER] = 'Simple_Uppercase_Mapping';
-
-    # Some of these need a little more explanation.  The $PERL_DECIMAL_DIGIT
-    # field does not lead to an official Unicode property, but is used in
-    # calculating the Numeric_Type.  Perl however, creates a file from this
-    # field, so a Perl property is created from it.  Similarly, the Other
-    # Digit field is used only for calculating the Numeric_Type, and so it can
-    # be safely re-used as the place to store the value for Numeric_Type;
-    # hence it is referred to as $NUMERIC_TYPE_OTHER_DIGIT.  The input field
-    # named $PERL_DECOMPOSITION is a combination of both the decomposition
-    # mapping and its type.  Perl creates a file containing exactly this
-    # field, so it is used for that.  The two properties are separated into
-    # two extra output fields, $DECOMP_MAP and $DECOMP_TYPE.
+    $field_names[$UPPER] = 'Uppercase_Mapping';
+
+    # Some of these need a little more explanation:
+    # The $PERL_DECIMAL_DIGIT field does not lead to an official Unicode
+    #   property, but is used in calculating the Numeric_Type.  Perl however,
+    #   creates a file from this field, so a Perl property is created from it.
+    # Similarly, the Other_Digit field is used only for calculating the
+    #   Numeric_Type, and so it can be safely re-used as the place to store
+    #   the value for Numeric_Type; hence it is referred to as
+    #   $NUMERIC_TYPE_OTHER_DIGIT.
+    # The input field named $PERL_DECOMPOSITION is a combination of both the
+    #   decomposition mapping and its type.  Perl creates a file containing
+    #   exactly this field, so it is used for that.  The two properties are
+    #   separated into two extra output fields, $DECOMP_MAP and $DECOMP_TYPE.
+    #   $DECOMP_MAP is usually suppressed (unless the lists are changed to
+    #   output it), as Perl doesn't use it directly.
+    # The input field named here $CHARNAME is used to construct the
+    #   Perl_Charnames property, which is a combination of the Name property
+    #   (which the input field contains), and the Unicode_1_Name property, and
+    #   others from other files.  Since the strict Name property is not used
+    #   by Perl, this field is used for the table that Perl does use.  The
+    #   strict Name property table is usually suppressed (unless the lists are
+    #   changed to output it), so it is accumulated in a separate field,
+    #   $NAME, which to save time is discarded unless the table is actually to
+    #   be output.
  
      # This file is processed like most in this program.  Control is passed to
      # process_generic_property_file() which calls filter_UnicodeData_line()
@@ -9048,7 +9589,7 @@ END
      # the code point and name on each line.  This was actually the hardest
      # thing to design around.  The code points in those ranges may actually
      # have real maps not given by these two lines.  These maps will either
-    # be algorthimically determinable, or in the extracted files furnished
+    # be algorithmically determinable, or in the extracted files furnished
      # with the UCD.  In the event of conflicts between these extracted files,
      # and this one, Unicode says that this one prevails.  But it shouldn't
      # prevail for conflicts that occur in these ranges.  The data from the
@@ -9066,10 +9607,26 @@ END
          my $file = shift;
          Carp::carp_extra_args(\@_) if main::DEBUG && @_;
  
+        # Create a new property specially located that is a combination of the
+        # various Name properties: Name, Unicode_1_Name, Named Sequences, and
+        # Name_Alias properties.  (The final duplicates elements of the
+        # first.)  A comment for it will later be constructed based on the
+        # actual properties present and used
+        $perl_charname = Property->new('Perl_Charnames',
+                       Core_Access => '\N{...} and "use charnames"',
+                       Default_Map => "",
+                       Directory => File::Spec->curdir(),
+                       File => 'Name',
+                       Internal_Only_Warning => 1,
+                       Perl_Extension => 1,
+                       Range_Size_1 => \&output_perl_charnames_line,
+                       Type => $STRING,
+                       );
+
          my $Perl_decomp = Property->new('Perl_Decomposition_Mapping',
                                          Directory => File::Spec->curdir(),
                                          File => 'Decomposition',
-                                        Format => $STRING_FORMAT,
+                                        Format => $DECOMP_STRING_FORMAT,
                                          Internal_Only_Warning => 1,
                                          Perl_Extension => 1,
                                          Default_Map => $CODE_POINT,
@@ -9117,12 +9674,18 @@ numerals.
  END
          ));
  
-        # This property is not used for generating anything else, and is
-        # usually not output.  By making it last in the list, we can just
+        # These properties are not used for generating anything else, and are
+        # usually not output.  By making them last in the list, we can just
          # change the high end of the loop downwards to avoid the work of
-        # generating a table that is just going to get thrown away.
-        if (! property_ref('Decomposition_Mapping')->to_output_map) {
-            $last_field--;
+        # generating a table(s) that is/are just going to get thrown away.
+        if (! property_ref('Decomposition_Mapping')->to_output_map
+            && ! property_ref('Name')->to_output_map)
+        {
+            $last_field = min($NAME, $DECOMP_MAP) - 1;
+        } elsif (property_ref('Decomposition_Mapping')->to_output_map) {
+            $last_field = $DECOMP_MAP;
+        } elsif (property_ref('Name')->to_output_map) {
+            $last_field = $NAME;
          }
          return;
      }
@@ -9243,7 +9806,7 @@ END
          # Certain fields just haven't been empty so far in any Unicode
          # version, so don't look at those, namely $MIRRORED, $BIDI, $CCC,
          # $CATEGORY.  This leaves just the two fields, and so we hard-code in
-        # the defaults; which are verly unlikely to ever change.
+        # the defaults; which are very unlikely to ever change.
          $fields[$UPPER] = $CODE_POINT if $fields[$UPPER] eq "";
          $fields[$LOWER] = $CODE_POINT if $fields[$LOWER] eq "";
  
@@ -9256,62 +9819,53 @@ END
          #   D7A3;<Hangul Syllable, Last>;Lo;0;L;;;;;N;;;;;
          # that define ranges.  These should be processed after the fields are
          # adjusted above, as they may override some of them; but mostly what
-        # is left is to possibly adjust the $NAME field.  The names of all the
+        # is left is to possibly adjust the $CHARNAME field.  The names of all the
          # paired lines start with a '<', but this is also true of '<control>',
          # which isn't one of these special ones.
-        if ($fields[$NAME] eq '<control>') {
+        if ($fields[$CHARNAME] eq '<control>') {
  
              # Some code points in this file have the pseudo-name
              # '<control>', but the official name for such ones is the null
-            # string.
+            # string.  For charnames.pm, we use the Unicode version 1 name.
              $fields[$NAME] = "";
+            $fields[$CHARNAME] = $fields[$UNICODE_1_NAME];
  
              # We had better not be in between range lines.
              if ($in_range) {
-                $file->carp_bad_line("Expecting a closing range line, not a $fields[$NAME]'.  Trying anyway");
+                $file->carp_bad_line("Expecting a closing range line, not a $fields[$CHARNAME]'.  Trying anyway");
                  $in_range = 0;
              }
          }
-        elsif (substr($fields[$NAME], 0, 1) ne '<') {
+        elsif (substr($fields[$CHARNAME], 0, 1) ne '<') {
  
              # Here is a non-range line.  We had better not be in between range
              # lines.
              if ($in_range) {
-                $file->carp_bad_line("Expecting a closing range line, not a $fields[$NAME]'.  Trying anyway");
+                $file->carp_bad_line("Expecting a closing range line, not a $fields[$CHARNAME]'.  Trying anyway");
                  $in_range = 0;
              }
-            # XXX until charnames catches up.
-#            if ($fields[$NAME] =~ s/- $cp $//x) {
-#
-#                # These are code points whose names end in their code points,
-#                # which means the names are algorithmically derivable from the
-#                # code points.  To shorten the output Name file, the algorithm
-#                # for deriving these is placed in the file instead of each
-#                # code point, so they have map type $CP_IN_NAME
-#                $fields[$NAME] = $CMD_DELIM
-#                                 . $MAP_TYPE_CMD
-#                                 . '='
-#                                 . $CP_IN_NAME
-#                                 . $CMD_DELIM
-#                                 . $fields[$NAME];
-#            }
-
-            # Some official names are really two alternate names with one in
-            # parentheses.  What we do here is use the full official one for
-            # the standard property (stored just above), but for the charnames
-            # table, we add two more entries, one for each of the alternate
-            # ones.
-            # elsif name ne ""
-            #check_and_handle_compound_name($cp, $fields[$NAME]);
-            #check_and_handle_compound_name($cp, $unicode_1_name);
-            # XXX until charnames catches up.
-        }
-        elsif ($fields[$NAME] =~ /^<(.+), First>$/) {
-            $fields[$NAME] = $1;
+            if ($fields[$CHARNAME] =~ s/- $cp $//x) {
+
+                # These are code points whose names end in their code points,
+                # which means the names are algorithmically derivable from the
+                # code points.  To shorten the output Name file, the algorithm
+                # for deriving these is placed in the file instead of each
+                # code point, so they have map type $CP_IN_NAME
+                $fields[$CHARNAME] = $CMD_DELIM
+                                 . $MAP_TYPE_CMD
+                                 . '='
+                                 . $CP_IN_NAME
+                                 . $CMD_DELIM
+                                 . $fields[$CHARNAME];
+            }
+            $fields[$NAME] = $fields[$CHARNAME];
+        }
+        elsif ($fields[$CHARNAME] =~ /^<(.+), First>$/) {
+            $fields[$CHARNAME] = $fields[$NAME] = $1;
  
              # Here we are at the beginning of a range pair.
              if ($in_range) {
-                $file->carp_bad_line("Expecting a closing range line, not a beginning one, $fields[$NAME]'.  Trying anyway");
+                $file->carp_bad_line("Expecting a closing range line, not a beginning one, $fields[$CHARNAME]'.  Trying anyway");
              }
              $in_range = 1;
  
@@ -9321,20 +9875,22 @@ END
              $force_output = 1;
  
          }
-        elsif ($fields[$NAME] !~ s/^<(.+), Last>$/$1/) {
-            $file->carp_bad_line("Unexpected name starting with '<' $fields[$NAME].  Ignoring this line.");
+        elsif ($fields[$CHARNAME] !~ s/^<(.+), Last>$/$1/) {
+            $file->carp_bad_line("Unexpected name starting with '<' $fields[$CHARNAME].  Ignoring this line.");
              $_ = "";
              return;
          }
          else { # Here, we are at the last line of a range pair.
  
              if (! $in_range) {
-                $file->carp_bad_line("Unexpected end of range $fields[$NAME] when not in one.  Ignoring this line.");
+                $file->carp_bad_line("Unexpected end of range $fields[$CHARNAME] when not in one.  Ignoring this line.");
                  $_ = "";
                  return;
              }
              $in_range = 0;
  
+            $fields[$NAME] = $fields[$CHARNAME];
+
              # Check that the input is valid: that the closing of the range is
              # the same as the beginning.
              foreach my $i (0 .. $last_field) {
@@ -9343,8 +9899,8 @@ END
              }
  
              # The processing differs depending on the type of range,
-            # determined by its $NAME
-            if ($fields[$NAME] =~ /^Hangul Syllable/) {
+            # determined by its $CHARNAME
+            if ($fields[$CHARNAME] =~ /^Hangul Syllable/) {
  
                  # Check that the data looks right.
                  if ($decimal_previous_cp != $SBase) {
@@ -9368,20 +9924,22 @@ END
  
                  # This range is stored in our internal structure with its
                  # own map type, different from all others.
-                $previous_fields[$NAME] = $CMD_DELIM
+                $previous_fields[$CHARNAME] = $previous_fields[$NAME]
+                                        = $CMD_DELIM
                                            . $MAP_TYPE_CMD
                                            . '='
                                            . $HANGUL_SYLLABLE
                                            . $CMD_DELIM
-                                          . $fields[$NAME];
+                                          . $fields[$CHARNAME];
              }
-            elsif ($fields[$NAME] =~ /^CJK/) {
+            elsif ($fields[$CHARNAME] =~ /^CJK/) {
  
                  # The name for these contains the code point itself, and all
                  # are defined to have the same base name, regardless of what
                  # is in the file.  They are stored in our internal structure
                  # with a map type of $CP_IN_NAME
-                $previous_fields[$NAME] = $CMD_DELIM
+                $previous_fields[$CHARNAME] = $previous_fields[$NAME]
+                                        = $CMD_DELIM
                                             . $MAP_TYPE_CMD
                                             . '='
                                             . $CP_IN_NAME
@@ -9396,10 +9954,10 @@ END
                  # null, as there are no names for the private use and
                  # surrogate code points.
  
-                $previous_fields[$NAME] = "";
+                $previous_fields[$CHARNAME] = $previous_fields[$NAME] = "";
              }
              else {
-                $file->carp_bad_line("Unexpected code point range $fields[$NAME] because category is $fields[$CATEGORY].  Attempting to process it.");
+                $file->carp_bad_line("Unexpected code point range $fields[$CHARNAME] because category is $fields[$CATEGORY].  Attempting to process it.");
              }
  
              # The first line of the range caused everything else to be output,
@@ -9428,6 +9986,7 @@ END
              # code in this subroutine that does the same thing, but doesn't
              # know about these ranges.
              $_ = "";
+
              return;
          }
  
@@ -9649,6 +10208,32 @@ END
          }
          return;
      }
+
+    sub filter_v6_ucd {
+        # Operates on the input line held in $_, rewriting it in place.
+        # Unicode 6.0 co-opted the name BELL for U+1F514, so change the input
+        # to pretend that U+0007 is ALERT instead, and for Perl 5.14, don't
+        # allow the BELL name for U+1F514, so that the old usage can be
+        # deprecated for one cycle.
+        # The U+070F line is patched as well; all other lines are untouched.
+        return if $_ !~ /^(?:0007|1F514|070F);/;
+        # The -1 limit keeps trailing empty fields so the join restores them
+        my ($code_point, @fields) = split /\s*;\s*/, $_, -1;
+        if ($code_point eq '0007') {
+            $fields[$CHARNAME] = "ALERT";
+        }
+        elsif ($code_point eq '070F') { # Unicode Corrigendum #8; see
+                            # http://www.unicode.org/versions/corrigendum8.html
+            $fields[$BIDI] = "AL";
+        }
+        elsif ($^V lt v5.15.0) { # U+1F514.  For 5.16 will convert to use Unicode's name
+            $fields[$CHARNAME] = "";
+        }
+        # Rebuild the line; white space around the ';' separators is dropped
+        $_ = join ';', $code_point, @fields;
+
+        return;
+    }
  } # End closure for UnicodeData
  
  sub process_GCB_test {
@@ -9671,7 +10256,6 @@ sub process_NamedSequences {
      #
      # This just adds the sequence to an array for later handling
  
-    return; # XXX Until charnames catches up
      my $file = shift;
      Carp::carp_extra_args(\@_) if main::DEBUG && @_;
  
@@ -9682,7 +10266,12 @@ sub process_NamedSequences {
                  "Doesn't look like 'KHMER VOWEL SIGN OM;17BB 17C6'");
              next;
          }
-        push @named_sequences, "$sequence\t\t$name";
+
+        # Note single \t in keeping with special output format of
+        # Perl_charnames.  But it turns out that the code points don't have to
+        # be 5 digits long, like the rest, based on the internal workings of
+        # charnames.pm.  This could be easily changed for consistency.
+        push @named_sequences, "$sequence\t$name";
      }
      return;
  }
@@ -9757,26 +10346,35 @@ sub filter_arabic_shaping_line {
  
  sub setup_special_casing {
      # SpecialCasing.txt contains the non-simple case change mappings.  The
-    # simple ones are in UnicodeData.txt, and should already have been read
-    # in.
-    # This routine initializes the full mappings to the simple, then as each
-    # line is processed, it overrides the simple ones.
+    # simple ones are in UnicodeData.txt, which should already have been read
+    # in to the full property data structures, so as to initialize these with
+    # the simple ones.  Then the SpecialCasing.txt entries overwrite the ones
+    # which have different full mappings.
+
+    # This routine sees if the simple mappings are to be output, and if so,
+    # copies what has already been put into the full mapping tables, while
+    # they still contain only the simple mappings.
+
+    # The reason it is done this way is that the simple mappings are probably
+    # not going to be output, so it saves work to initialize the full tables
+    # with the simple mappings, and then overwrite those relatively few
+    # entries in them that have different full mappings, and thus skip the
+    # simple mapping tables altogether.
  
      my $file= shift;
      Carp::carp_extra_args(\@_) if main::DEBUG && @_;
  
      # For each of the case change mappings...
      foreach my $case ('lc', 'tc', 'uc') {
+        my $full = property_ref($case);
+        unless (defined $full && ! $full->is_empty) {
+            Carp::my_carp_bug("Need to process UnicodeData before SpecialCasing.  Only special casing will be generated.");
+        }
  
          # The simple version's name in each mapping merely has an 's' in front
          # of the full one's
          my $simple = property_ref('s' . $case);
-        unless (defined $simple && ! $simple->is_empty) {
-            Carp::my_carp_bug("Need to process UnicodeData before SpecialCasing.  Only special casing will be generated.");
-        }
-
-        # Initialize the full case mappings with the simple ones.
-        property_ref($case)->initialize($simple);
+        $simple->initialize($full) if $simple->to_output_map();
      }
  
      return;
@@ -9806,7 +10404,7 @@ sub filter_special_casing_line {
      # implemented, it would be by hard-coding in the casing functions in the
      # Perl core, not through tables.  But if there is a new condition we don't
      # know about, output a warning.  We know about all the conditions through
-    # 5.2
+    # 6.0
      if ($fields[4] ne "") {
          my @conditions = split ' ', $fields[4];
          if ($conditions[0] ne 'tr'  # We know that these languages have
@@ -9884,6 +10482,7 @@ sub filter_old_style_case_folding {
      # it takes no part in anything we do.
      my $to_output_simple;
  
+    # XXX
      # These are experimental, perhaps will need these to pass to regcomp.c to
      # handle the cases where for example the Kelvin sign character folds to k,
      # and in regcomp, we need to know which of the characters can have a
@@ -9952,7 +10551,7 @@ sub filter_old_style_case_folding {
              $file->insert_adjusted_lines("$range; Simple_Case_Folding; $map");
          }
  
-        # Experimental, see comment above
+        # XXX Experimental, see comment above
          if ($type ne 'S' && hex($range) >= 256) {   # assumes range is 1 point
              my @folded = split ' ', $map;
              if (hex $folded[0] < 256 && @folded == 1) {
@@ -9967,7 +10566,7 @@ sub filter_old_style_case_folding {
      }
  
      sub post_fold {
-        # Experimental, see comment above
+        # XXX Experimental, see comment above
          return;
  
          #local $to_trace = 1 if main::DEBUG;
@@ -10302,7 +10901,7 @@ sub filter_blocks_lines {
          #                                one.
          #   Titlecase                    duplicates UnicodeData.txt: gc=lt
          #   Unassigned Code Value        duplicates UnicodeData.txt: gc=cn
-        #   Zero-width                   never made into offical property;
+        #   Zero-width                   never made into official property;
          #                                subset of gc=cf
          # Most of the properties have the same names in this file as in later
          # versions, but a couple do not.
@@ -10443,7 +11042,8 @@ sub finish_Unicode() {
  
                  # Add mappings to the property for each code point in the list
                  foreach my $range ($list->ranges) {
-                    $property->add_map($range->start, $range->end, $default);
+                    $property->add_map($range->start, $range->end, $default,
+                    Replace => $CROAK);
                  }
              }
  
@@ -10470,11 +11070,12 @@ sub finish_Unicode() {
          }
  
          # Add any remaining code points to the mapping, using the default for
-        # missing code points
+        # missing code points.
          if (defined (my $default_map = $property->default_map)) {
-            foreach my $range ($property->inverse_list->ranges) {
-                $property->add_map($range->start, $range->end, $default_map);
-            }
+
+            # This fills in any missing values with the default.
+            $property->add_map(0, $LAST_UNICODE_CODEPOINT,
+                               $default_map, Replace => $NO);
  
              # Make sure there is a match table for the default
              if (! defined $property->table($default_map)) {
@@ -10567,19 +11168,17 @@ END
          $LC->initialize($gc->table('Ll') + $gc->table('Lu'));
  
          # Lt not in release 1.
-        $LC += $gc->table('Lt') if defined $gc->table('Lt');
+        if (defined $gc->table('Lt')) {
+            $LC += $gc->table('Lt');
+            $gc->table('Lt')->set_caseless_equivalent($LC);
+        }
      }
      $LC->add_description('[\p{Ll}\p{Lu}\p{Lt}]');
  
+    $gc->table('Ll')->set_caseless_equivalent($LC);
+    $gc->table('Lu')->set_caseless_equivalent($LC);
+
      my $Cs = $gc->table('Cs');
-    if (defined $Cs) {
-        $Cs->add_note('Mostly not usable in Perl.');
-        $Cs->add_comment(join_lines(<<END
-Surrogates are used exclusively for I/O in UTF-16, and should not appear in
-Unicode text, and hence their use will generate (usually fatal) messages
-END
-        ));
-    }
  
  
      # Folding information was introduced later into Unicode data.  To get
@@ -10627,7 +11226,8 @@ sub compile_perl() {
      # range, with their names prefaced by 'Posix', to signify that these match
      # what the Posix standard says they should match.  A couple are
      # effectively this, but the name doesn't have 'Posix' in it because there
-    # just isn't any Posix equivalent.
+    # just isn't any Posix equivalent.  'XPosix' are the Posix tables extended
+    # to the full Unicode range, by our guesses as to what is appropriate.
  
      # 'Any' is all code points.  As an error check, instead of just setting it
      # to be that, construct it to be the union of all the major categories
@@ -10687,12 +11287,17 @@ sub compile_perl() {
      my $Unicode_Lower = property_ref('Lowercase');
      if (defined $Unicode_Lower && ! $Unicode_Lower->is_empty) {
          $Lower->set_equivalent_to($Unicode_Lower->table('Y'), Related => 1);
+        $Unicode_Lower->table('Y')->set_caseless_equivalent(property_ref('Cased')->table('Y'));
+        $Unicode_Lower->table('N')->set_caseless_equivalent(property_ref('Cased')->table('N'));
+        $Lower->set_caseless_equivalent(property_ref('Cased')->table('Y'));
+
      }
      else {
          $Lower->set_equivalent_to($gc->table('Lowercase_Letter'),
                                                                  Related => 1);
      }
-    $perl->add_match_table("PosixLower",
+    $Lower->add_alias('XPosixLower');
+    my $Posix_Lower = $perl->add_match_table("PosixLower",
                              Description => "[a-z]",
                              Initialize => $Lower & $ASCII,
                              );
@@ -10701,12 +11306,16 @@ sub compile_perl() {
      my $Unicode_Upper = property_ref('Uppercase');
      if (defined $Unicode_Upper && ! $Unicode_Upper->is_empty) {
          $Upper->set_equivalent_to($Unicode_Upper->table('Y'), Related => 1);
+        $Unicode_Upper->table('Y')->set_caseless_equivalent(property_ref('Cased')->table('Y'));
+        $Unicode_Upper->table('N')->set_caseless_equivalent(property_ref('Cased')->table('N'));
+        $Upper->set_caseless_equivalent(property_ref('Cased')->table('Y'));
      }
      else {
          $Upper->set_equivalent_to($gc->table('Uppercase_Letter'),
                                                                  Related => 1);
      }
-    $perl->add_match_table("PosixUpper",
+    $Upper->add_alias('XPosixUpper');
+    my $Posix_Upper = $perl->add_match_table("PosixUpper",
                              Description => "[A-Z]",
                              Initialize => $Upper & $ASCII,
                              );
@@ -10715,20 +11324,25 @@ sub compile_perl() {
      # otherwise present
      my $Title = $perl->add_match_table('Title');
      my $lt = $gc->table('Lt');
-    if (defined $lt) {
-        $Title->set_equivalent_to($lt, Related => 1);
-    }
+
+    # Earlier versions of mktables had this related to $lt since they have
+    # identical code points, but their casefolds are not equivalent, and so
+    # now must be kept as separate entities.
+    $Title += $lt if defined $lt;
  
      # If this Unicode version doesn't have Cased, set up our own.  From
      # Unicode 5.1: Definition D120: A character C is defined to be cased if
      # and only if C has the Lowercase or Uppercase property or has a
      # General_Category value of Titlecase_Letter.
-    unless (defined property_ref('Cased')) {
+    my $Unicode_Cased = property_ref('Cased');
+    unless (defined $Unicode_Cased) {
          my $cased = $perl->add_match_table('Cased',
                          Initialize => $Lower + $Upper + $Title,
                          Description => 'Uppercase or Lowercase or Titlecase',
                          );
+        $Unicode_Cased = $cased;
      }
+    $Title->set_caseless_equivalent($Unicode_Cased->table('Y'));
  
      # Similarly, set up our own Case_Ignorable property if this Unicode
      # version doesn't have it.  From Unicode 5.1: Definition D121: A character
@@ -10800,32 +11414,39 @@ sub compile_perl() {
          $Alpha += $gc->table('Nl') if defined $gc->table('Nl');
          $Alpha->add_description('Alphabetic');
      }
-    $perl->add_match_table("PosixAlpha",
+    $Alpha->add_alias('XPosixAlpha');
+    my $Posix_Alpha = $perl->add_match_table("PosixAlpha",
                              Description => "[A-Za-z]",
                              Initialize => $Alpha & $ASCII,
                              );
+    $Posix_Upper->set_caseless_equivalent($Posix_Alpha);
+    $Posix_Lower->set_caseless_equivalent($Posix_Alpha);
  
      my $Alnum = $perl->add_match_table('Alnum',
                          Description => 'Alphabetic and (Decimal) Numeric',
                          Initialize => $Alpha + $gc->table('Decimal_Number'),
                          );
+    $Alnum->add_alias('XPosixAlnum');
      $perl->add_match_table("PosixAlnum",
                              Description => "[A-Za-z0-9]",
                              Initialize => $Alnum & $ASCII,
                              );
  
      my $Word = $perl->add_match_table('Word',
-                                Description => '\w, including beyond ASCII',
+                                Description => '\w, including beyond ASCII;'
+                                            . ' = \p{Alnum} + \pM + \p{Pc}',
                                  Initialize => $Alnum + $gc->table('Mark'),
                                  );
+    $Word->add_alias('XPosixWord');
      my $Pc = $gc->table('Connector_Punctuation'); # 'Pc' Not in release 1
      $Word += $Pc if defined $Pc;
  
      # This is a Perl extension, so the name doesn't begin with Posix.
-    $perl->add_match_table('PerlWord',
+    my $PerlWord = $perl->add_match_table('PerlWord',
                      Description => '\w, restricted to ASCII = [A-Za-z0-9_]',
                      Initialize => $Word & $ASCII,
                      );
+    $PerlWord->add_alias('PosixWord');
  
      my $Blank = $perl->add_match_table('Blank',
                                  Description => '\h, Horizontal white space',
@@ -10838,6 +11459,7 @@ sub compile_perl() {
                                              -   0x200B, # ZWSP
                                  );
      $Blank->add_alias('HorizSpace');        # Another name for it.
+    $Blank->add_alias('XPosixBlank');
      $perl->add_match_table("PosixBlank",
                              Description => "\\t and ' '",
                              Initialize => $Blank & $ASCII,
@@ -10859,24 +11481,28 @@ sub compile_perl() {
                  Description => '\s including beyond ASCII plus vertical tab',
                  Initialize => $Blank + $VertSpace,
      );
+    $Space->add_alias('XPosixSpace');
      $perl->add_match_table("PosixSpace",
                              Description => "\\t, \\n, \\cK, \\f, \\r, and ' '.  (\\cK is vertical tab)",
                              Initialize => $Space & $ASCII,
                              );
  
      # Perl's traditional space doesn't include Vertical Tab
-    my $SpacePerl = $perl->add_match_table('SpacePerl',
+    my $XPerlSpace = $perl->add_match_table('XPerlSpace',
                                    Description => '\s, including beyond ASCII',
                                    Initialize => $Space - 0x000B,
                                  );
-    $perl->add_match_table('PerlSpace',
+    $XPerlSpace->add_alias('SpacePerl');    # A pre-existing synonym
+    my $PerlSpace = $perl->add_match_table('PerlSpace',
                              Description => '\s, restricted to ASCII',
-                            Initialize => $SpacePerl & $ASCII,
+                            Initialize => $XPerlSpace & $ASCII,
                              );
  
+
      my $Cntrl = $perl->add_match_table('Cntrl',
                                          Description => 'Control characters');
      $Cntrl->set_equivalent_to($gc->table('Cc'), Related => 1);
+    $Cntrl->add_alias('XPosixCntrl');
      $perl->add_match_table("PosixCntrl",
                              Description => "ASCII control characters: NUL, SOH, STX, ETX, EOT, ENQ, ACK, BEL, BS, HT, LF, VT, FF, CR, SO, SI, DLE, DC1, DC2, DC3, DC4, NAK, SYN, ETB, CAN, EOM, SUB, ESC, FS, GS, RS, US, and DEL",
                              Initialize => $Cntrl & $ASCII,
@@ -10893,35 +11519,42 @@ sub compile_perl() {
                          Description => 'Characters that are graphical',
                          Initialize => ~ ($Space + $controls),
                          );
+    $Graph->add_alias('XPosixGraph');
      $perl->add_match_table("PosixGraph",
                              Description =>
                                  '[-!"#$%&\'()*+,./:;<>?@[\\\]^_`{|}~0-9A-Za-z]',
                              Initialize => $Graph & $ASCII,
                              );
  
-    my $Print = $perl->add_match_table('Print',
+    $print = $perl->add_match_table('Print',
                          Description => 'Characters that are graphical plus space characters (but no controls)',
                          Initialize => $Blank + $Graph - $gc->table('Control'),
                          );
+    $print->add_alias('XPosixPrint');
      $perl->add_match_table("PosixPrint",
-                            Description => 
+                            Description =>
                                '[- 0-9A-Za-z!"#$%&\'()*+,./:;<>?@[\\\]^_`{|}~]',
-                            Initialize => $Print & $ASCII,
+                            Initialize => $print & $ASCII,
                              );
  
      my $Punct = $perl->add_match_table('Punct');
      $Punct->set_equivalent_to($gc->table('Punctuation'), Related => 1);
  
      # \p{punct} doesn't include the symbols, which posix does
+    my $XPosixPunct = $perl->add_match_table('XPosixPunct',
+                    Description => '\p{Punct} + ASCII-range \p{Symbol}',
+                    Initialize => $gc->table('Punctuation')
+                                + ($ASCII & $gc->table('Symbol')),
+        );
      $perl->add_match_table('PosixPunct',
          Description => '[-!"#$%&\'()*+,./:;<>?@[\\\]^_`{|}~]',
-        Initialize => $ASCII & ($gc->table('Punctuation')
-                                + $gc->table('Symbol')),
+        Initialize => $ASCII & $XPosixPunct,
          );
  
      my $Digit = $perl->add_match_table('Digit',
-                            Description => '\d, extended beyond just [0-9]');
+                            Description => '[0-9] + all other decimal digits');
      $Digit->set_equivalent_to($gc->table('Decimal_Number'), Related => 1);
+    $Digit->add_alias('XPosixDigit');
      my $PosixDigit = $perl->add_match_table("PosixDigit",
                                              Description => '[0-9]',
                                              Initialize => $Digit & $ASCII,
@@ -10929,6 +11562,7 @@ sub compile_perl() {
  
      # Hex_Digit was not present in first release
      my $Xdigit = $perl->add_match_table('XDigit');
+    $Xdigit->add_alias('XPosixXDigit');
      my $Hex = property_ref('Hex_Digit');
      if (defined $Hex && ! $Hex->is_empty) {
          $Xdigit->set_equivalent_to($Hex->table('Y'), Related => 1);
@@ -10940,6 +11574,10 @@ sub compile_perl() {
                                0xFF10..0xFF19, 0xFF21..0xFF26, 0xFF41..0xFF46]);
          $Xdigit->add_description('[0-9A-Fa-f] and corresponding fullwidth versions, like U+FF10: FULLWIDTH DIGIT ZERO');
      }
+    $perl->add_match_table('PosixXDigit',
+                            Initialize => $ASCII & $Xdigit,
+                            Description => '[0-9A-Fa-f]',
+                        );
  
      my $dt = property_ref('Decomposition_Type');
      $dt->add_match_table('Non_Canon', Full_Name => 'Non_Canonical',
@@ -11046,24 +11684,7 @@ sub compile_perl() {
          $lv_lvt_v->add_comment('For use in \X; matches: HST=LV | HST=LVT | HST=V');
      }
  
-    # Create a new property specially located that is a combination of the
-    # various Name properties: Name, Unicode_1_Name, Named Sequences, and
-    # Name_Alias properties.  (The final duplicates elements of the first.)  A
-    # comment for it is constructed based on the actual properties present and
-    # used
-    my $perl_charname = Property->new('Perl_Charnames',
-                                Core_Access => '\N{...} and charnames.pm',
-                                Default_Map => "",
-                                Directory => File::Spec->curdir(),
-                                File => 'Name',
-                                Internal_Only_Warning => 1,
-                                Perl_Extension => 1,
-                                Range_Size_1 => 1,
-                                Type => $STRING,
-                                Initialize => property_ref('Unicode_1_Name'),
-                                );
-    # Name overrides Unicode_1_Name
-    $perl_charname->property_add_or_replace_non_nulls(property_ref('Name'));
+    # Was previously constructed to contain both Name and Unicode_1_Name
      my @composition = ('Name', 'Unicode_1_Name');
  
      if (@named_sequences) {
@@ -11088,7 +11709,7 @@ sub compile_perl() {
          $alias_sentence = <<END;
  The Name_Alias property adds duplicate code point entries with a corrected
  name.  The original (less correct, but still valid) name will be physically
-first.
+last.
  END
      }
      my $comment;
@@ -11100,27 +11721,6 @@ END
          $comment .= ", and $composition[-1]";
      }
  
-    # Wait for charnames to catch up
-#    foreach my $entry (@more_Names,
-#                        split "\n", <<"END"
-#000A; LF
-#000C; FF
-#000D; CR
-#0085; NEL
-#200C; ZWNJ
-#200D; ZWJ
-#FEFF; BOM
-#FEFF; BYTE ORDER MARK
-#END
-#    ) {
-#        #local $to_trace = 1 if main::DEBUG;
-#        trace $entry if main::DEBUG && $to_trace;
-#        my ($code_point, $name) = split /\s*;\s*/, $entry;
-#        $code_point = hex $code_point;
-#        trace $code_point, $name if main::DEBUG && $to_trace;
-#        $perl_charname->add_duplicate($code_point, $name);
-#    }
-#    #$perl_charname->add_comment("This file is for charnames.pm.  It is the union of the $comment properties, plus certain commonly used but unofficial names, such as 'FF' and 'ZWNJ'.  Unicode_1_Name entries are used only for otherwise nameless code points.$alias_sentence");
      $perl_charname->add_comment(join_lines( <<END
  This file is for charnames.pm.  It is the union of the $comment properties.
  Unicode_1_Name entries are used only for otherwise nameless code
@@ -11193,7 +11793,7 @@ END
          my $description_start = "Code point's usage introduced in version ";
          $first_age->add_description($description_start . $first_age->name);
  
-        # To construct the accumlated values, for each of the age tables
+        # To construct the accumulated values, for each of the age tables
          # starting with the 2nd earliest, merge the earliest with it, to get
          # all those code points existing in the 2nd earliest.  Repeat merging
          # the new 2nd earliest with the 3rd earliest to get all those existing
@@ -11247,6 +11847,24 @@ END
          }
      }
  
+    # Here done with all the basic stuff.  Ready to populate the information
+    # about each character if annotating them.
+    if ($annotate) {
+
+        # See comments at its declaration
+        $annotate_ranges = Range_Map->new;
+
+        # This separates out the non-characters from the other unassigneds, so
+        # can give different annotations for each.
+        $unassigned_sans_noncharacters = Range_List->new(
+         Initialize => $gc->table('Unassigned')
+                       & property_ref('Noncharacter_Code_Point')->table('N'));
+
+        for (my $i = 0; $i <= $LAST_UNICODE_CODEPOINT; $i++ ) {
+            $i = populate_char_info($i);    # Note sets $i so may cause skips
+        }
+    }
+
      return;
  }
  
@@ -11412,7 +12030,7 @@ sub add_perl_synonyms() {
                  # name.  We could be in trouble, but not if this is just a
                  # synonym for another table that we have already made a child
                  # of the pre-existing one.
-                if ($pre_existing->is_equivalent_to($actual)) {
+                if ($pre_existing->is_set_equivalent_to($actual)) {
                      trace "$pre_existing is already equivalent to $actual; adding alias perl=$proposed_name to it" if main::DEBUG && $to_trace;
                      $pre_existing->add_alias($proposed_name);
                      next;
@@ -11512,7 +12130,7 @@ END
  
  sub register_file_for_name($$$) {
      # Given info about a table and a datafile that it should be associated
-    # with, register that assocation
+    # with, register that association
  
      my $table = shift;
      my $directory_ref = shift;   # Array of the directory path for the file
@@ -11557,19 +12175,18 @@ sub register_file_for_name($$$) {
          my $deprecated = ($table->status eq $DEPRECATED)
                           ? $table->status_info
                           : "";
+        my $caseless_equivalent = $table->caseless_equivalent;
  
          # And for each of the table's aliases...  This inner loop eventually
          # goes through all aliases in the UCD that we generate regex match
          # files for
          foreach my $alias ($table->aliases) {
-            my $name = $alias->name;
+            my $standard = utf8_heavy_name($table, $alias);
  
              # Generate an entry in either the loose or strict hashes, which
              # will translate the property and alias names combination into the
              # file where the table for them is stored.
-            my $standard;
              if ($alias->loose_match) {
-                $standard = $property . standardize($alias->name);
                  if (exists $loose_to_file_of{$standard}) {
                      Carp::my_carp("Can't change file registered to $loose_to_file_of{$standard} to '$sub_filename'.");
                  }
@@ -11578,7 +12195,6 @@ sub register_file_for_name($$$) {
                  }
              }
              else {
-                $standard = lc ($property . $name);
                  if (exists $stricter_to_file_of{$standard}) {
                      Carp::my_carp("Can't change file registered to $stricter_to_file_of{$standard} to '$sub_filename'.");
                  }
@@ -11591,7 +12207,7 @@ sub register_file_for_name($$$) {
                      # will work.  Also note that this assumes that such a
                      # number is matched strictly; so if that were to change,
                      # this would be wrong.
-                    if ((my $integer_name = $name)
+                    if ((my $integer_name = $alias->name)
                              =~ s/^ ( -? \d+ ) \.0+ $ /$1/x)
                      {
                          $stricter_to_file_of{$property . $integer_name}
@@ -11604,6 +12220,11 @@ sub register_file_for_name($$$) {
              if ($deprecated) {
                  $utf8::why_deprecated{$sub_filename} = $deprecated;
              }
+
+            # And a substitute table, if any, for case-insensitive matching
+            if ($caseless_equivalent != 0) {
+                $caseless_equivalent_to{$standard} = $caseless_equivalent;
+            }
          }
      }
  
@@ -12016,7 +12637,6 @@ sub make_table_pod_entries($) {
                  # expression, but with only one of 'Single', 'Short' if there
                  # are both items.
                  if ($short_name || $single_form || $table->conflicting) {
-                    $parenthesized .= '(';
                      $parenthesized .= "Short: $short_name" if $short_name;
                      if ($short_name && $single_form) {
                          $parenthesized .= ', ';
@@ -12036,18 +12656,16 @@ sub make_table_pod_entries($) {
              # to go on every entry.
              my $conflicting = join " NOR ", $table->conflicting;
              if ($conflicting) {
-                $parenthesized .= '(' if ! $parenthesized;
-                $parenthesized .=  '; ' if $parenthesized ne '(';
+                $parenthesized .=  '; ' if $parenthesized ne "";
                  $parenthesized .= "NOT $conflicting";
              }
-            $parenthesized .= ')' if $parenthesized;
  
-            push @info, $parenthesized if $parenthesized;
+            push @info, "($parenthesized)" if $parenthesized;
  
              if ($table_property != $perl && $table->perl_extension) {
                  push @info, '(Perl extension)';
              }
-            push @info, "($string_count)" if $output_range_counts;
+            push @info, "($string_count)";
  
              # Now, we have both the entry and info so add them to the
              # list of all the properties.
@@ -12358,7 +12976,7 @@ both single and compound forms.
  B<Compound forms> consist of two components, separated by an equals sign or a
  colon.  The first component is the property name, and the second component is
  the particular value of the property to match against, for example,
-'\\p{Script: Greek}' or '\\p{Script=Greek}' both mean to match characters
+'\\p{Script: Greek}' and '\\p{Script=Greek}' both mean to match characters
  whose Script property is Greek.
  
  B<Single forms>, like '\\p{Greek}', are mostly Perl-defined shortcuts for
@@ -12410,29 +13028,28 @@ adjacent to (but within) the braces and the colon or equal sign.
  =back
  
  Some properties are considered obsolete, but still available.  There are
-several varieties of obsolesence:
+several varieties of obsolescence:
  
  =over 4
  
  =item Obsolete
  
  Properties marked with $a_bold_obsolete in the table are considered
-obsolete.  At the time of this writing (Unicode version 5.2) there is no
-information in the Unicode standard about the implications of a property being
  obsolete.
  
  =item Stabilized
  
-Obsolete properties may be stabilized.  This means that they are not actively
-maintained by Unicode, and will not be extended as new characters are added to
-the standard.  Such properties are marked with $a_bold_stabilized in the
-table.  At the time of this writing (Unicode version 5.2) there is no further
-information in the Unicode standard about the implications of a property being
-stabilized.
+Obsolete properties may be stabilized.  Such a determination does not indicate
+that the property should or should not be used; instead it is a declaration
+that the property will not be maintained nor extended for newly encoded
+characters.  Such properties are marked with $a_bold_stabilized in the
+table.
  
  =item Deprecated
  
-Obsolete properties may be deprecated.  This means that their use is strongly
+An obsolete property may be deprecated, perhaps because its original intent
+has been replaced by another property or because its specification was somehow
+defective.  This means that its use is strongly
  discouraged, so much so that a warning will be issued if used, unless the
  regular expression is in the scope of a C<S<no warnings 'deprecated'>>
  statement.  $A_bold_deprecated flags each such entry in the table, and
@@ -12455,7 +13072,7 @@ flags each such entry in the table.
  @block_warning
  
  The table below has two columns.  The left column contains the \\p{}
-constructs to look up, possibly preceeded by the flags mentioned above; and
+constructs to look up, possibly preceded by the flags mentioned above; and
  the right column contains information about them, like a description, or
  synonyms.  It shows both the single and compound forms for each property that
  has them.  If the left column is a short name for a property, the right column
@@ -12540,8 +13157,8 @@ Case_Folding is accessible through the /i modifier in regular expressions.
  
  The Name property is accessible through the \\N{} interpolation in
  double-quoted strings and regular expressions, but both usages require a C<use
-charnames;> to be specified, which also contains related functions viacode()
-and vianame().
+charnames;> to be specified, which also contains related functions viacode(),
+vianame(), and string_vianame().
  
  =head1 Unicode regular expression properties that are NOT accepted by Perl
  
@@ -12557,8 +13174,9 @@ the properties are listed enclosed in (parentheses).
  =back
  
  An installation can choose to allow any of these to be matched by changing the
-controlling lists contained in the program C<\$Config{privlib}>/F<unicore/$0>
-and then re-running F<$0>.  (C<\%Config> is available from the Config module).
+controlling lists contained in the program
+C<\$Config{privlib}>/F<unicore/mktables> and then re-running F<mktables>.
+(C<\%Config> is available from the Config module).
  
  =head1 Files in the I<To> directory (for serious hackers only)
  
@@ -12581,14 +13199,14 @@ accessible through the Perl core, although some may be accessed indirectly.
  For example, the uc() function implements the Uppercase_Mapping property and
  uses the F<Upper.pl> file found in this directory.
  
-The available files with their properties (short names in parentheses),
-and any flags or comments about them, are:
+The available files in the current installation, with their properties (short
+names in parentheses), and any flags or comments about them, are:
  
  @map_tables_actually_output
  
  An installation can choose to change which files are generated by changing the
-controlling lists contained in the program C<\$Config{privlib}>/F<unicore/$0>
-and then re-running F<$0>.
+controlling lists contained in the program
+C<\$Config{privlib}>/F<unicore/mktables> and then re-running F<mktables>.
  
  Each of these files defines two hash entries to help reading programs decipher
  it.  One of them looks like this:
@@ -12628,8 +13246,8 @@ L<perlunicode>
  
  END
  
-    # And write it.
-    main::write([ $pod_directory, "$pod_file.pod" ], @OUT);
+    # And write it.  The 0 means no utf8.
+    main::write([ $pod_directory, "$pod_file.pod" ], 0, \@OUT);
      return;
  }
  
@@ -12687,10 +13305,29 @@ END
      push @heavy, <<END;
  );
  
+# A few properties have different behavior under /i matching.  This maps
+# those to substitute files to use under /i.
+\%utf8::caseless_equivalent = (
+END
+
+
+    # We set the key to the file when we associated files with tables, but we
+    # couldn't do the same for the value then, as we might not have the file
+    # for the alternate table figured out at that time.
+    foreach my $cased (keys %caseless_equivalent_to) {
+        my @path = $caseless_equivalent_to{$cased}->file_path;
+        my $path = join '/', @path[1, -1];
+        $path =~ s/\.pl//;
+        $utf8::caseless_equivalent_to{$cased} = $path;
+    }
+    push @heavy, simple_dumper (\%utf8::caseless_equivalent_to, ' ' x 4);
+    push @heavy, <<END;
+);
+
  1;
  END
  
-    main::write("Heavy.pl", @heavy);
+    main::write("Heavy.pl", 0, \@heavy);  # The 0 means no utf8.
      return;
  }
  
@@ -13007,7 +13644,7 @@ sub write_all_tables() {
              $filename = $table->file;
          }
  
-        # Use specified filename if avaliable, or default to property's
+        # Use specified filename if available, or default to property's
          # shortest name.  We need an 8.3 safe filename (which means "an 8
          # safe" filename, since after the dot is only 'pl', which is < 3)
          # The 2nd parameter is if the filename shouldn't be changed, and
@@ -13067,12 +13704,11 @@ sub generate_separator($) {
              . $spaces_after;
  }
  
-sub generate_tests($$$$$$) {
+sub generate_tests($$$$$) {
      # This used only for making the test script.  It generates test cases that
      # are expected to compile successfully in perl.  Note that the lhs and
      # rhs are assumed to already be as randomized as the caller wants.
  
-    my $file_handle = shift;   # Where to output the tests
      my $lhs = shift;           # The property: what's to the left of the colon
                                 #  or equals separator
      my $rhs = shift;           # The property value; what's to the right
@@ -13089,35 +13725,31 @@ sub generate_tests($$$$$$) {
      # The whole 'property=value'
      my $name = "$lhs$separator$rhs";
  
+    my @output;
      # Create a complete set of tests, with complements.
      if (defined $valid_code) {
-        printf $file_handle
-                    qq/Expect(1, $valid_code, '\\p{$name}', $warning);\n/;
-        printf $file_handle
-                    qq/Expect(0, $valid_code, '\\p{^$name}', $warning);\n/;
-        printf $file_handle
-                    qq/Expect(0, $valid_code, '\\P{$name}', $warning);\n/;
-        printf $file_handle
-                    qq/Expect(1, $valid_code, '\\P{^$name}', $warning);\n/;
+       push @output, <<"EOC"
+Expect(1, $valid_code, '\\p{$name}', $warning);
+Expect(0, $valid_code, '\\p{^$name}', $warning);
+Expect(0, $valid_code, '\\P{$name}', $warning);
+Expect(1, $valid_code, '\\P{^$name}', $warning);
+EOC
      }
      if (defined $invalid_code) {
-        printf $file_handle
-                    qq/Expect(0, $invalid_code, '\\p{$name}', $warning);\n/;
-        printf $file_handle
-                    qq/Expect(1, $invalid_code, '\\p{^$name}', $warning);\n/;
-        printf $file_handle
-                    qq/Expect(1, $invalid_code, '\\P{$name}', $warning);\n/;
-        printf $file_handle
-                    qq/Expect(0, $invalid_code, '\\P{^$name}', $warning);\n/;
-    }
-    return;
+       push @output, <<"EOC"
+Expect(0, $invalid_code, '\\p{$name}', $warning);
+Expect(1, $invalid_code, '\\p{^$name}', $warning);
+Expect(1, $invalid_code, '\\P{$name}', $warning);
+Expect(0, $invalid_code, '\\P{^$name}', $warning);
+EOC
+    }
+    return @output;
  }
  
-sub generate_error($$$$) {
+sub generate_error($$$) {
      # This used only for making the test script.  It generates test cases that
      # are expected to not only not match, but to be syntax or similar errors
  
-    my $file_handle = shift;        # Where to output to.
      my $lhs = shift;                # The property: what's to the left of the
                                      # colon or equals separator
      my $rhs = shift;                # The property value; what's to the right
@@ -13134,9 +13766,10 @@ sub generate_error($$$$) {
  
      my $property = $lhs . $separator . $rhs;
  
-    print $file_handle qq/Error('\\p{$property}');\n/;
-    print $file_handle qq/Error('\\P{$property}');\n/;
-    return;
+    return <<"EOC";
+Error('\\p{$property}');
+Error('\\P{$property}');
+EOC
  }
  
  # These are used only for making the test script
@@ -13302,14 +13935,6 @@ sub make_property_test_script() {
  
      $t_path = 'TestProp.pl' unless defined $t_path; # the traditional name
  
-    force_unlink ($t_path);
-    push @files_actually_output, $t_path;
-    my $OUT;
-    if (not open $OUT, "> $t_path") {
-        Carp::my_carp("Can't open $t_path.  Skipping: $!");
-        return;
-    }
-
      # Keep going down an order of magnitude
      # until find that adding this quantity to
      # 1 remains 1; but put an upper limit on
@@ -13326,7 +13951,10 @@ sub make_property_test_script() {
                              # use previous one
          $min_floating_slop = $next;
      }
-    print $OUT $HEADER, <DATA>;
+
+    # It doesn't matter whether the elements of this array contain single lines
+    # or multiple lines. main::write doesn't count the lines.
+    my @output;
  
      foreach my $property (property_ref('*')) {
          foreach my $table ($property->tables) {
@@ -13361,10 +13989,9 @@ sub make_property_test_script() {
                  my $already_error = ! $table->file_path;
  
                  # Generate error cases for this alias.
-                generate_error($OUT,
-                                $property_name,
-                                $table_name,
-                                $already_error);
+                push @output, generate_error($property_name,
+                                             $table_name,
+                                             $already_error);
  
                  # If the table is guaranteed to always generate an error,
                  # quit now without generating success cases.
@@ -13385,13 +14012,12 @@ sub make_property_test_script() {
                      # Don't output duplicate test cases.
                      if (! exists $test_generated{$test_name}) {
                          $test_generated{$test_name} = 1;
-                        generate_tests($OUT,
-                                        $property_name,
-                                        $standard,
-                                        $valid,
-                                        $invalid,
-                                        $warning,
-                                    );
+                        push @output, generate_tests($property_name,
+                                                     $standard,
+                                                     $valid,
+                                                     $invalid,
+                                                     $warning,
+                                                 );
                      }
                      $random = randomize_loose_name($table_name)
                  }
@@ -13403,13 +14029,12 @@ sub make_property_test_script() {
                  my $test_name = "$property_name=$random";
                  if (! exists $test_generated{$test_name}) {
                      $test_generated{$test_name} = 1;
-                    generate_tests($OUT,
-                                    $property_name,
-                                    $random,
-                                    $valid,
-                                    $invalid,
-                                    $warning,
-                                );
+                    push @output, generate_tests($property_name,
+                                                 $random,
+                                                 $valid,
+                                                 $invalid,
+                                                 $warning,
+                                             );
  
                      # If the name is a rational number, add tests for the
                      # floating point equivalent.
@@ -13451,24 +14076,22 @@ sub make_property_test_script() {
                                          if abs($table_name - $existing)
                                                  < $MAX_FLOATING_SLOP;
                                  }
-                                generate_error($OUT,
-                                            $property_name,
-                                            $table_name,
-                                            1   # 1 => already an error
-                                );
+                                push @output, generate_error($property_name,
+                                                             $table_name,
+                                                             1   # 1 => already an error
+                                              );
                              }
                              else {
  
                                  # Here the number of digits exceeds the
                                  # minimum we think is needed.  So generate a
                                  # success test case for it.
-                                generate_tests($OUT,
-                                                $property_name,
-                                                $table_name,
-                                                $valid,
-                                                $invalid,
-                                                $warning,
-                                );
+                                push @output, generate_tests($property_name,
+                                                             $table_name,
+                                                             $valid,
+                                                             $invalid,
+                                                             $warning,
+                                             );
                              }
                          }
                      }
@@ -13477,12 +14100,12 @@ sub make_property_test_script() {
          }
      }
  
-    foreach my $test (@backslash_X_tests) {
-        print $OUT "Test_X('$test');\n";
-    }
-
-    print $OUT "Finished();\n";
-    close $OUT;
+    &write($t_path,
+           0,           # Not utf8;
+           [<DATA>,
+            @output,
+            (map {"Test_X('$_');\n"} @backslash_X_tests),
+            "Finished();\n"]);
      return;
  }
  
@@ -13572,7 +14195,12 @@ my @input_file_objects = (
                                              ? \&filter_v1_ucd
                                              : ($v_version eq v2.1.5)
                                                  ? \&filter_v2_1_5_ucd
-                                                : undef),
+
+                                                # And for 5.14 Perls with 6.0,
+                                                # have to also make changes
+                                                : ($v_version ge v6.0.0)
+                                                    ? \&filter_v6_ucd
+                                                    : undef),
  
                                              # And the main filter
                                              \&filter_UnicodeData_line,
@@ -13757,15 +14385,19 @@ File::Find::find({
  }, File::Spec->curdir());
  
  my @mktables_list_output_files;
+my $old_start_time = 0;
  
-if ($write_unchanged_files) {
+if (! -e $file_list) {
+    print "'$file_list' doesn't exist, so forcing rebuild.\n" if $verbosity >= $VERBOSE;
+    $write_unchanged_files = 1;
+} elsif ($write_unchanged_files) {
      print "Not checking file list '$file_list'.\n" if $verbosity >= $VERBOSE;
  }
  else {
      print "Reading file list '$file_list'\n" if $verbosity >= $VERBOSE;
      my $file_handle;
      if (! open $file_handle, "<", $file_list) {
-        Carp::my_carp("Failed to open '$file_list' (this is expected to be missing the first time); turning on -globlist option instead: $!");
+        Carp::my_carp("Failed to open '$file_list'; turning on -globlist option instead: $!");
          $glob_list = 1;
      }
      else {
@@ -13776,6 +14408,9 @@ else {
          for my $list ( \@input, \@mktables_list_output_files ) {
              while (<$file_handle>) {
                  s/^ \s+ | \s+ $//xg;
+                if (/^ \s* \# .* Autogenerated\ starting\ on\ (\d+)/x) {
+                    $old_start_time = $1;
+                }
                  next if /^ \s* (?: \# .* )? $/x;
                  last if /^ =+ $/x;
                  my ( $file ) = split /\t/;
@@ -13883,12 +14518,12 @@ if ( $verbosity >= $VERBOSE ) {
           "Checking ".scalar( @mktables_list_output_files )." output files.\n";
  }
  
-# We set $youngest to be the most recently changed input file, including this
-# program itself (done much earlier in this file)
+# We set $most_recent to the modification time of the newest input file,
+# including this program itself (done much earlier in this file)
  foreach my $in (@input_files) {
-    my $age = -M $in;
-    next unless defined $age;        # Keep going even if missing a file
-    $youngest = $age if $age < $youngest;
+    next unless -e $in;        # Keep going even if missing a file
+    my $mod_time = (stat $in)[9];
+    $most_recent = $mod_time if $mod_time > $most_recent;
  
      # See that the input files have distinct names, to warn someone if they
      # are adding a new one
@@ -13901,30 +14536,31 @@ foreach my $in (@input_files) {
      }
  }
  
-my $ok = ! $write_unchanged_files
-        && scalar @mktables_list_output_files;        # If none known, rebuild
+my $rebuild = $write_unchanged_files    # Rebuild: if unconditional rebuild
+              || ! scalar @mktables_list_output_files  # or if no outputs known
+              || $old_start_time < $most_recent;       # or out-of-date
  
  # Now we check to see if any output file is no newer than the most recent
  # input; if so, we need to continue on, otherwise we can presumably bail.
-if ($ok) {
+if (! $rebuild) {
      foreach my $out (@mktables_list_output_files) {
          if ( ! file_exists($out)) {
              print "'$out' is missing.\n" if $verbosity >= $VERBOSE;
-            $ok = 0;
+            $rebuild = 1;
              last;
           }
          #local $to_trace = 1 if main::DEBUG;
-        trace $youngest, -M $out if main::DEBUG && $to_trace;
-        if ( -M $out > $youngest ) {
-            #trace "$out: age: ", -M $out, ", youngest: $youngest\n" if main::DEBUG && $to_trace;
+        trace $most_recent, (stat $out)[9] if main::DEBUG && $to_trace;
+        if ( (stat $out)[9] <= $most_recent ) {
+            #trace "$out:  most recent mod time: ", (stat $out)[9], ", youngest: $most_recent\n" if main::DEBUG && $to_trace;
              print "'$out' is too old.\n" if $verbosity >= $VERBOSE;
-            $ok = 0;
+            $rebuild = 1;
              last;
          }
      }
  }
-if ($ok) {
-    print "Files seem to be ok, not bothering to rebuild.\n";
+if (! $rebuild) {
+    print "Files seem to be ok, not bothering to rebuild.  Add '-w' option to force build\n";
      exit(0);
  }
  print "Must rebuild tables.\n" if $verbosity >= $VERBOSE;
@@ -13967,15 +14603,16 @@ if ( $file_list and $make_list ) {
          return
      }
      else {
+        my $localtime = localtime $start_time;
          print $ofh <<"END";
  #
  # $file_list -- File list for $0.
  #
-#   Autogenerated on @{[scalar localtime]}
+#   Autogenerated starting on $start_time ($localtime)
  #
  # - First section is input files
  #   ($0 itself is not listed but is automatically considered an input)
-# - Section seperator is /^=+\$/
+# - Section separator is /^=+\$/
  # - Second section is a list of output files.
  # - Lines matching /^\\s*#/ are treated as comments
  #   which along with blank lines are ignored.
@@ -14024,6 +14661,11 @@ __DATA__
  use strict;
  use warnings;
  
+# If run outside the normal test suite on an ASCII platform, you can
+# just create a latin1_to_native() function that just returns its
+# inputs, because that's the only function used from test.pl
+require "test.pl";
+
  # Test qr/\X/ and the \p{} regular expression constructs.  This file is
  # constructed by mktables from the tables it generates, so if mktables is
  # buggy, this won't necessarily catch those bugs.  Tests are generated for all
@@ -14036,42 +14678,6 @@ use warnings;
  my $Tests = 0;
  my $Fails = 0;
  
-my $non_ASCII = (ord('A') != 65);
-
-# The 256 8-bit characters in ASCII ordinal order, with the ones that don't
-# have Perl names replaced by -1
-my @ascii_ordered_chars = (
-    "\0",
-    (-1) x 6,
-    "\a", "\b", "\t", "\n",
-    -1,   # No Vt
-    "\f", "\r",
-    (-1) x 18,
-    " ", "!", "\"", "#", '$', "%", "&", "'",
-    "(", ")", "*", "+", ",", "-", ".", "/",
-    "0", "1", "2", "3", "4", "5", "6", "7", "8", "9",
-    ":", ";", "<", "=", ">", "?", "@",
-    "A", "B", "C", "D", "E", "F", "G", "H", "I", "J", "K", "L", "M",
-    "N", "O", "P", "Q", "R", "S", "T", "U", "V", "W", "X", "Y", "Z",
-    "[", "\\", "]", "^", "_", "`",
-    "a", "b", "c", "d", "e", "f", "g", "h", "i", "j", "k", "l", "m",
-    "n", "o", "p", "q", "r", "s", "t", "u", "v", "w", "x", "y", "z",
-    "{", "|", "}", "~",
-    (-1) x 129
-);
-
-sub ASCII_ord_to_native ($) {
-    # Converts input ordinal number to the native one, if can be done easily.
-    # Returns -1 otherwise.
-
-    my $ord = shift;
-
-    return $ord if $ord > 255 || ! $non_ASCII;
-    my $result = $ascii_ordered_chars[$ord];
-    return $result if $result eq '-1';
-    return ord($result);
-}
-
  sub Expect($$$$) {
      my $expected = shift;
      my $ord = shift;
@@ -14079,17 +14685,7 @@ sub Expect($$$$) {
      my $warning_type = shift;   # Type of warning message, like 'deprecated'
                                  # or empty if none
      my $line   = (caller)[2];
-
-    # Convert the non-ASCII code points expressible as characters to their
-    # ASCII equivalents, and skip the others.
-    $ord = ASCII_ord_to_native($ord);
-    if ($ord < 0) {
-        $Tests++;
-        print "ok $Tests - "
-              . sprintf("\"\\x{%04X}\"", $ord)
-              . " =~ $regex # Skipped: non-ASCII\n";
-        return;
-    }
+    $ord = ord(latin1_to_native(chr($ord)));
  
      # Convert the code point to hex form
      my $string = sprintf "\"\\x{%04X}\"", $ord;
@@ -14220,13 +14816,7 @@ sub Test_X($) {
          my $this_string = "";
          my $this_display = "";
          foreach my $code_point (@code_points) {
-            my $ord = ASCII_ord_to_native(hex $code_point);
-            if ($ord < 0) {
-                $Tests++;
-                print "ok $Tests - String containing $code_point =~ /(\\X)/g # Skipped: non-ASCII\n";
-                return;
-            }
-            $this_string .= chr $ord;
+            $this_string .= latin1_to_native(chr(hex $code_point));
              $this_display .= "\\x{$code_point}";
          }