Clean up -Dy debugging

[perl5.git] / op.c
diff --git a/op.c b/op.c

index b9abc1c..66d773f 100644 (file)
--- a/op.c
+++ b/op.c
@@ -164,6 +164,7 @@ recursive, but it's recursive on basic blocks, not on tree nodes.
  #include "keywords.h"
  #include "feature.h"
  #include "regcomp.h"
  #include "keywords.h"
  #include "feature.h"
  #include "regcomp.h"
+#include "invlist_inline.h"
  
  #define CALL_PEEP(o) PL_peepp(aTHX_ o)
  #define CALL_RPEEP(o) PL_rpeepp(aTHX_ o)
  
  #define CALL_PEEP(o) PL_peepp(aTHX_ o)
  #define CALL_RPEEP(o) PL_rpeepp(aTHX_ o)
@@ -208,13 +209,26 @@ S_prune_chain_head(OP** op_p)
  #define SIZE_TO_PSIZE(x)       (((x) + sizeof(I32 *) - 1)/sizeof(I32 *))
  #define DIFF(o,p)              ((size_t)((I32 **)(p) - (I32**)(o)))
  
  #define SIZE_TO_PSIZE(x)       (((x) + sizeof(I32 *) - 1)/sizeof(I32 *))
  #define DIFF(o,p)              ((size_t)((I32 **)(p) - (I32**)(o)))
  
-/* malloc a new op slab (suitable for attaching to PL_compcv) */
+/* requires double parens and aTHX_ */
+#define DEBUG_S_warn(args)                                            \
+    DEBUG_S(                                                           \
+       PerlIO_printf(Perl_debug_log, "%s", SvPVx_nolen(Perl_mess args)) \
+    )
+
+
+/* malloc a new op slab (suitable for attaching to PL_compcv).
+ * sz is in units of pointers */
  
  static OPSLAB *
  
  static OPSLAB *
-S_new_slab(pTHX_ size_t sz)
+S_new_slab(pTHX_ OPSLAB *head, size_t sz)
  {
  {
+    OPSLAB *slab;
+
+    /* opslot_offset is only U16 */
+    assert(sz  < U16_MAX);
+
  #ifdef PERL_DEBUG_READONLY_OPS
  #ifdef PERL_DEBUG_READONLY_OPS
-    OPSLAB *slab = (OPSLAB *) mmap(0, sz * sizeof(I32 *),
+    slab = (OPSLAB *) mmap(0, sz * sizeof(I32 *),
                                    PROT_READ|PROT_WRITE,
                                    MAP_ANON|MAP_PRIVATE, -1, 0);
      DEBUG_m(PerlIO_printf(Perl_debug_log, "mapped %lu at %p\n",
                                    PROT_READ|PROT_WRITE,
                                    MAP_ANON|MAP_PRIVATE, -1, 0);
      DEBUG_m(PerlIO_printf(Perl_debug_log, "mapped %lu at %p\n",
@@ -223,23 +237,23 @@ S_new_slab(pTHX_ size_t sz)
         perror("mmap failed");
         abort();
      }
         perror("mmap failed");
         abort();
      }
-    slab->opslab_size = (U16)sz;
  #else
  #else
-    OPSLAB *slab = (OPSLAB *)PerlMemShared_calloc(sz, sizeof(I32 *));
+    slab = (OPSLAB *)PerlMemShared_calloc(sz, sizeof(I32 *));
  #endif
  #endif
+    slab->opslab_size = (U16)sz;
+
  #ifndef WIN32
      /* The context is unused in non-Windows */
      PERL_UNUSED_CONTEXT;
  #endif
  #ifndef WIN32
      /* The context is unused in non-Windows */
      PERL_UNUSED_CONTEXT;
  #endif
-    slab->opslab_first = (OPSLOT *)((I32 **)slab + sz - 1);
+    slab->opslab_free_space = sz - DIFF(slab, &slab->opslab_slots);
+    slab->opslab_head = head ? head : slab;
+    DEBUG_S_warn((aTHX_ "allocated new op slab sz 0x%x, %p, head slab %p",
+        (unsigned int)slab->opslab_size, (void*)slab,
+        (void*)(slab->opslab_head)));
      return slab;
  }
  
      return slab;
  }
  
-/* requires double parens and aTHX_ */
-#define DEBUG_S_warn(args)                                            \
-    DEBUG_S(                                                           \
-       PerlIO_printf(Perl_debug_log, "%s", SvPVx_nolen(Perl_mess args)) \
-    )
  
  /* Returns a sz-sized block of memory (suitable for holding an op) from
   * a free slot in the chain of op slabs attached to PL_compcv.
  
  /* Returns a sz-sized block of memory (suitable for holding an op) from
   * a free slot in the chain of op slabs attached to PL_compcv.
@@ -250,11 +264,11 @@ S_new_slab(pTHX_ size_t sz)
  void *
  Perl_Slab_Alloc(pTHX_ size_t sz)
  {
  void *
  Perl_Slab_Alloc(pTHX_ size_t sz)
  {
-    OPSLAB *slab;
+    OPSLAB *head_slab; /* first slab in the chain */
      OPSLAB *slab2;
      OPSLOT *slot;
      OP *o;
      OPSLAB *slab2;
      OPSLOT *slot;
      OP *o;
-    size_t opsz, space;
+    size_t opsz;
  
      /* We only allocate ops from the slab during subroutine compilation.
         We find the slab via PL_compcv, hence that must be non-NULL. It could
  
      /* We only allocate ops from the slab during subroutine compilation.
         We find the slab via PL_compcv, hence that must be non-NULL. It could
@@ -277,11 +291,11 @@ Perl_Slab_Alloc(pTHX_ size_t sz)
         details.  */
      if (!CvSTART(PL_compcv)) {
         CvSTART(PL_compcv) =
         details.  */
      if (!CvSTART(PL_compcv)) {
         CvSTART(PL_compcv) =
-           (OP *)(slab = S_new_slab(aTHX_ PERL_SLAB_SIZE));
+           (OP *)(head_slab = S_new_slab(aTHX_ NULL, PERL_SLAB_SIZE));
         CvSLABBED_on(PL_compcv);
         CvSLABBED_on(PL_compcv);
-       slab->opslab_refcnt = 2; /* one for the CV; one for the new OP */
+       head_slab->opslab_refcnt = 2; /* one for the CV; one for the new OP */
      }
      }
-    else ++(slab = (OPSLAB *)CvSTART(PL_compcv))->opslab_refcnt;
+    else ++(head_slab = (OPSLAB *)CvSTART(PL_compcv))->opslab_refcnt;
  
      opsz = SIZE_TO_PSIZE(sz);
      sz = opsz + OPSLOT_HEADER_P;
  
      opsz = SIZE_TO_PSIZE(sz);
      sz = opsz + OPSLOT_HEADER_P;
@@ -289,16 +303,24 @@ Perl_Slab_Alloc(pTHX_ size_t sz)
      /* The slabs maintain a free list of OPs. In particular, constant folding
         will free up OPs, so it makes sense to re-use them where possible. A
         freed up slot is used in preference to a new allocation.  */
      /* The slabs maintain a free list of OPs. In particular, constant folding
         will free up OPs, so it makes sense to re-use them where possible. A
         freed up slot is used in preference to a new allocation.  */
-    if (slab->opslab_freed) {
-       OP **too = &slab->opslab_freed;
+    if (head_slab->opslab_freed) {
+       OP **too = &head_slab->opslab_freed;
         o = *too;
         o = *too;
-       DEBUG_S_warn((aTHX_ "found free op at %p, slab %p", (void*)o, (void*)slab));
-       while (o && DIFF(OpSLOT(o), OpSLOT(o)->opslot_next) < sz) {
+        DEBUG_S_warn((aTHX_ "found free op at %p, slab %p, head slab %p",
+            (void*)o,
+            (I32**)OpSLOT(o) - OpSLOT(o)->opslot_offset,
+            (void*)head_slab));
+
+       while (o && OpSLOT(o)->opslot_size < sz) {
             DEBUG_S_warn((aTHX_ "Alas! too small"));
             o = *(too = &o->op_next);
             if (o) { DEBUG_S_warn((aTHX_ "found another free op at %p", (void*)o)); }
         }
         if (o) {
             DEBUG_S_warn((aTHX_ "Alas! too small"));
             o = *(too = &o->op_next);
             if (o) { DEBUG_S_warn((aTHX_ "found another free op at %p", (void*)o)); }
         }
         if (o) {
+            DEBUG_S_warn((aTHX_ "realloced  op at %p, slab %p, head slab %p",
+                (void*)o,
+                (I32**)OpSLOT(o) - OpSLOT(o)->opslot_offset,
+                (void*)head_slab));
             *too = o->op_next;
             Zero(o, opsz, I32 *);
             o->op_slabbed = 1;
             *too = o->op_next;
             Zero(o, opsz, I32 *);
             o->op_slabbed = 1;
@@ -306,48 +328,45 @@ Perl_Slab_Alloc(pTHX_ size_t sz)
         }
      }
  
         }
      }
  
-#define INIT_OPSLOT \
-           slot->opslot_slab = slab;                   \
-           slot->opslot_next = slab2->opslab_first;    \
-           slab2->opslab_first = slot;                 \
+#define INIT_OPSLOT(s) \
+           slot->opslot_offset = DIFF(slab2, slot) ;   \
+           slot->opslot_size = s;                      \
+           slab2->opslab_free_space -= s;              \
             o = &slot->opslot_op;                       \
             o->op_slabbed = 1
  
      /* The partially-filled slab is next in the chain. */
             o = &slot->opslot_op;                       \
             o->op_slabbed = 1
  
      /* The partially-filled slab is next in the chain. */
-    slab2 = slab->opslab_next ? slab->opslab_next : slab;
-    if ((space = DIFF(&slab2->opslab_slots, slab2->opslab_first)) < sz) {
+    slab2 = head_slab->opslab_next ? head_slab->opslab_next : head_slab;
+    if (slab2->opslab_free_space  < sz) {
         /* Remaining space is too small. */
         /* Remaining space is too small. */
-
         /* If we can fit a BASEOP, add it to the free chain, so as not
            to waste it. */
         /* If we can fit a BASEOP, add it to the free chain, so as not
            to waste it. */
-       if (space >= SIZE_TO_PSIZE(sizeof(OP)) + OPSLOT_HEADER_P) {
+       if (slab2->opslab_free_space >= SIZE_TO_PSIZE(sizeof(OP)) + OPSLOT_HEADER_P) {
             slot = &slab2->opslab_slots;
             slot = &slab2->opslab_slots;
-           INIT_OPSLOT;
+           INIT_OPSLOT(slab2->opslab_free_space);
             o->op_type = OP_FREED;
             o->op_type = OP_FREED;
-           o->op_next = slab->opslab_freed;
-           slab->opslab_freed = o;
+           o->op_next = head_slab->opslab_freed;
+           head_slab->opslab_freed = o;
         }
  
         /* Create a new slab.  Make this one twice as big. */
         }
  
         /* Create a new slab.  Make this one twice as big. */
-       slot = slab2->opslab_first;
-       while (slot->opslot_next) slot = slot->opslot_next;
-       slab2 = S_new_slab(aTHX_
-                           (DIFF(slab2, slot)+1)*2 > PERL_MAX_SLAB_SIZE
-                                       ? PERL_MAX_SLAB_SIZE
-                                       : (DIFF(slab2, slot)+1)*2);
-       slab2->opslab_next = slab->opslab_next;
-       slab->opslab_next = slab2;
+       slab2 = S_new_slab(aTHX_ head_slab,
+                           slab2->opslab_size  > PERL_MAX_SLAB_SIZE / 2
+                                ? PERL_MAX_SLAB_SIZE
+                                : slab2->opslab_size * 2);
+       slab2->opslab_next = head_slab->opslab_next;
+       head_slab->opslab_next = slab2;
      }
      }
-    assert(DIFF(&slab2->opslab_slots, slab2->opslab_first) >= sz);
+    assert(slab2->opslab_size >= sz);
  
      /* Create a new op slot */
  
      /* Create a new op slot */
-    slot = (OPSLOT *)((I32 **)slab2->opslab_first - sz);
+    slot = (OPSLOT *)
+                ((I32 **)&slab2->opslab_slots
+                                + slab2->opslab_free_space - sz);
      assert(slot >= &slab2->opslab_slots);
      assert(slot >= &slab2->opslab_slots);
-    if (DIFF(&slab2->opslab_slots, slot)
-        < SIZE_TO_PSIZE(sizeof(OP)) + OPSLOT_HEADER_P)
-       slot = &slab2->opslab_slots;
-    INIT_OPSLOT;
-    DEBUG_S_warn((aTHX_ "allocating op at %p, slab %p", (void*)o, (void*)slab));
+    INIT_OPSLOT(sz);
+    DEBUG_S_warn((aTHX_ "allocating op at %p, slab %p, head slab %p",
+        (void*)o, (void*)slab2, (void*)head_slab));
  
    gotit:
      /* moresib == 0, op_sibling == 0 implies a solitary unattached op */
  
    gotit:
      /* moresib == 0, op_sibling == 0 implies a solitary unattached op */
@@ -446,7 +465,10 @@ Perl_Slab_Free(pTHX_ void *op)
      o->op_type = OP_FREED;
      o->op_next = slab->opslab_freed;
      slab->opslab_freed = o;
      o->op_type = OP_FREED;
      o->op_next = slab->opslab_freed;
      slab->opslab_freed = o;
-    DEBUG_S_warn((aTHX_ "free op at %p, recorded in slab %p", (void*)o, (void*)slab));
+    DEBUG_S_warn((aTHX_ "freeing    op at %p, slab %p, head slab %p",
+        (void*)o,
+        (I32**)OpSLOT(o) - OpSLOT(o)->opslot_offset,
+        (void*)slab));
      OpslabREFCNT_dec_padok(slab);
  }
  
      OpslabREFCNT_dec_padok(slab);
  }
  
@@ -514,10 +536,13 @@ Perl_opslab_force_free(pTHX_ OPSLAB *slab)
      PERL_ARGS_ASSERT_OPSLAB_FORCE_FREE;
      slab2 = slab;
      do {
      PERL_ARGS_ASSERT_OPSLAB_FORCE_FREE;
      slab2 = slab;
      do {
-        OPSLOT *slot;
-       for (slot = slab2->opslab_first;
-            slot->opslot_next;
-            slot = slot->opslot_next) {
+        OPSLOT *slot = (OPSLOT*)
+                    ((I32**)&slab2->opslab_slots + slab2->opslab_free_space);
+        OPSLOT *end  = (OPSLOT*)
+                        ((I32**)slab2 + slab2->opslab_size);
+       for (; slot < end;
+                slot = (OPSLOT*) ((I32**)slot + slot->opslot_size) )
+        {
             if (slot->opslot_op.op_type != OP_FREED
              && !(slot->opslot_op.op_savefree
  #ifdef DEBUGGING
             if (slot->opslot_op.op_type != OP_FREED
              && !(slot->opslot_op.op_savefree
  #ifdef DEBUGGING
@@ -616,7 +641,7 @@ S_too_few_arguments_pv(pTHX_ OP *o, const char* name, U32 flags)
      yyerror_pv(Perl_form(aTHX_ "Not enough arguments for %s", name), flags);
      return o;
  }
      yyerror_pv(Perl_form(aTHX_ "Not enough arguments for %s", name), flags);
      return o;
  }
- 
+
  STATIC OP *
  S_too_many_arguments_pv(pTHX_ OP *o, const char *name, U32 flags)
  {
  STATIC OP *
  S_too_many_arguments_pv(pTHX_ OP *o, const char *name, U32 flags)
  {
@@ -642,7 +667,7 @@ S_bad_type_gv(pTHX_ I32 n, GV *gv, const OP *kid, const char *t)
  {
      SV * const namesv = cv_name((CV *)gv, NULL, 0);
      PERL_ARGS_ASSERT_BAD_TYPE_GV;
  {
      SV * const namesv = cv_name((CV *)gv, NULL, 0);
      PERL_ARGS_ASSERT_BAD_TYPE_GV;
- 
+
      yyerror_pv(Perl_form(aTHX_ "Type of arg %d to %" SVf " must be %s (not %s)",
                  (int)n, SVfARG(namesv), t, OP_DESC(kid)), SvUTF8(namesv));
  }
      yyerror_pv(Perl_form(aTHX_ "Type of arg %d to %" SVf " must be %s (not %s)",
                  (int)n, SVfARG(namesv), t, OP_DESC(kid)), SvUTF8(namesv));
  }
@@ -680,16 +705,22 @@ Perl_allocmy(pTHX_ const char *const name, const STRLEN len, const U32 flags)
                  && isIDFIRST_utf8_safe((U8 *)name+1, name + len))
              || (name[1] == '_' && len > 2)))
      {
                  && isIDFIRST_utf8_safe((U8 *)name+1, name + len))
              || (name[1] == '_' && len > 2)))
      {
+        const char * const type =
+              PL_parser->in_my == KEY_sigvar ? "subroutine signature" :
+              PL_parser->in_my == KEY_state  ? "\"state\""     : "\"my\"";
+
         if (!(flags & SVf_UTF8 && UTF8_IS_START(name[1]))
          && isASCII(name[1])
          && (!isPRINT(name[1]) || strchr("\t\n\r\f", name[1]))) {
         if (!(flags & SVf_UTF8 && UTF8_IS_START(name[1]))
          && isASCII(name[1])
          && (!isPRINT(name[1]) || strchr("\t\n\r\f", name[1]))) {
-           /* diag_listed_as: Can't use global %s in "%s" */
-           yyerror(Perl_form(aTHX_ "Can't use global %c^%c%.*s in \"%s\"",
-                             name[0], toCTRL(name[1]), (int)(len - 2), name + 2,
-                             PL_parser->in_my == KEY_state ? "state" : "my"));
+           /* diag_listed_as: Can't use global %s in %s */
+           yyerror(Perl_form(aTHX_ "Can't use global %c^%c%.*s in %s",
+                             name[0], toCTRL(name[1]),
+                              (int)(len - 2), name + 2,
+                             type));
         } else {
         } else {
-           yyerror_pv(Perl_form(aTHX_ "Can't use global %.*s in \"%s\"", (int) len, name,
-                             PL_parser->in_my == KEY_state ? "state" : "my"), flags & SVf_UTF8);
+           yyerror_pv(Perl_form(aTHX_ "Can't use global %.*s in %s",
+                              (int) len, name,
+                             type), flags & SVf_UTF8);
         }
      }
  
         }
      }
  
@@ -1008,7 +1039,7 @@ Perl_op_clear(pTHX_ OP *o)
         /** Bug #15654
           Even if op_clear does a pad_free for the target of the op,
           pad_free doesn't actually remove the sv that exists in the pad;
         /** Bug #15654
           Even if op_clear does a pad_free for the target of the op,
           pad_free doesn't actually remove the sv that exists in the pad;
-         instead it lives on. This results in that it could be reused as 
+         instead it lives on. This results in that it could be reused as
           a target later on when the pad was reallocated.
         **/
          if(o->op_targ) {
           a target later on when the pad was reallocated.
         **/
          if(o->op_targ) {
@@ -1028,7 +1059,7 @@ Perl_op_clear(pTHX_ OP *o)
      case OP_TRANS:
      case OP_TRANSR:
         if (   (o->op_type == OP_TRANS || o->op_type == OP_TRANSR)
      case OP_TRANS:
      case OP_TRANSR:
         if (   (o->op_type == OP_TRANS || o->op_type == OP_TRANSR)
-            && (o->op_private & (OPpTRANS_FROM_UTF|OPpTRANS_TO_UTF)))
+            && (o->op_private & OPpTRANS_USE_SVOP))
          {
  #ifdef USE_ITHREADS
             if (cPADOPo->op_padix > 0) {
          {
  #ifdef USE_ITHREADS
             if (cPADOPo->op_padix > 0) {
@@ -1271,31 +1302,45 @@ S_forget_pmop(pTHX_ PMOP *const o)
             }
         }
      }
             }
         }
      }
-    if (PL_curpm == o) 
+    if (PL_curpm == o)
         PL_curpm = NULL;
  }
  
         PL_curpm = NULL;
  }
  
+
  STATIC void
  S_find_and_forget_pmops(pTHX_ OP *o)
  {
  STATIC void
  S_find_and_forget_pmops(pTHX_ OP *o)
  {
+    OP* top_op = o;
+
      PERL_ARGS_ASSERT_FIND_AND_FORGET_PMOPS;
  
      PERL_ARGS_ASSERT_FIND_AND_FORGET_PMOPS;
  
-    if (o->op_flags & OPf_KIDS) {
-        OP *kid = cUNOPo->op_first;
-       while (kid) {
-           switch (kid->op_type) {
-           case OP_SUBST:
-           case OP_SPLIT:
-           case OP_MATCH:
-           case OP_QR:
-               forget_pmop((PMOP*)kid);
-           }
-           find_and_forget_pmops(kid);
-           kid = OpSIBLING(kid);
-       }
+    while (1) {
+        switch (o->op_type) {
+        case OP_SUBST:
+        case OP_SPLIT:
+        case OP_MATCH:
+        case OP_QR:
+            forget_pmop((PMOP*)o);
+        }
+
+        if (o->op_flags & OPf_KIDS) {
+            o = cUNOPo->op_first;
+            continue;
+        }
+
+        while (1) {
+            if (o == top_op)
+                return; /* at top; no parents/siblings to try */
+            if (OpHAS_SIBLING(o)) {
+                o = o->op_sibparent; /* process next sibling */
+                break;
+            }
+            o = o->op_sibparent; /* try parent's next sibling */
+        }
      }
  }
  
      }
  }
  
+
  /*
  =for apidoc op_null
  
  /*
  =for apidoc op_null
  
@@ -1600,39 +1645,58 @@ not be called directly.
  =cut
  */
  
  =cut
  */
  
+
  OP *
  Perl_op_linklist(pTHX_ OP *o)
  {
  OP *
  Perl_op_linklist(pTHX_ OP *o)
  {
-    OP *first;
+
+    OP **prevp;
+    OP *kid;
+    OP * top_op = o;
  
      PERL_ARGS_ASSERT_OP_LINKLIST;
  
  
      PERL_ARGS_ASSERT_OP_LINKLIST;
  
-    if (o->op_next)
-       return o->op_next;
+    while (1) {
+        /* Descend down the tree looking for any unprocessed subtrees to
+         * do first */
+        if (!o->op_next) {
+            if (o->op_flags & OPf_KIDS) {
+                o = cUNOPo->op_first;
+                continue;
+            }
+            o->op_next = o; /* leaf node; link to self initially */
+        }
  
  
-    /* establish postfix order */
-    first = cUNOPo->op_first;
-    if (first) {
-        OP *kid;
-       o->op_next = LINKLIST(first);
-       kid = first;
-       for (;;) {
-            OP *sibl = OpSIBLING(kid);
-            if (sibl) {
-                kid->op_next = LINKLIST(sibl);
-                kid = sibl;
-           } else {
-               kid->op_next = o;
-               break;
-           }
-       }
-    }
-    else
-       o->op_next = o;
+        /* if we're at the top level, there either weren't any children
+         * to process, or we've worked our way back to the top. */
+        if (o == top_op)
+            return o->op_next;
+
+        /* o is now processed. Next, process any sibling subtrees */
+
+        if (OpHAS_SIBLING(o)) {
+            o = OpSIBLING(o);
+            continue;
+        }
+
+        /* Done all the subtrees at this level. Go back up a level and
+         * link the parent in with all its (processed) children.
+         */
  
  
-    return o->op_next;
+        o = o->op_sibparent;
+        assert(!o->op_next);
+        prevp = &(o->op_next);
+        kid   = (o->op_flags & OPf_KIDS) ? cUNOPo->op_first : NULL;
+        while (kid) {
+            *prevp = kid->op_next;
+            prevp = &(kid->op_next);
+            kid = OpSIBLING(kid);
+        }
+        *prevp = o;
+    }
  }
  
  }
  
+
  static OP *
  S_scalarkids(pTHX_ OP *o)
  {
  static OP *
  S_scalarkids(pTHX_ OP *o)
  {
@@ -1962,6 +2026,8 @@ Perl_scalar(pTHX_ OP *o)
  }
  
  
  }
  
  
+/* apply void context to the optree arg */
+
  OP *
  Perl_scalarvoid(pTHX_ OP *arg)
  {
  OP *
  Perl_scalarvoid(pTHX_ OP *arg)
  {
@@ -3053,6 +3119,8 @@ S_maybe_multiconcat(pTHX_ OP *o)
              && (SvPOK(sv) || SvIOK(sv))
              && (!SvGMAGICAL(sv))
          ) {
              && (SvPOK(sv) || SvIOK(sv))
              && (!SvGMAGICAL(sv))
          ) {
+            if (argop->op_private & OPpCONST_STRICT)
+                no_bareword_allowed(argop);
              argp++->p = sv;
              utf8   |= cBOOL(SvUTF8(sv));
              nconst++;
              argp++->p = sv;
              utf8   |= cBOOL(SvUTF8(sv));
              nconst++;
@@ -3192,7 +3260,7 @@ S_maybe_multiconcat(pTHX_ OP *o)
              sv_utf8_upgrade_nomg(sv);
          argp->p = SvPV_nomg(sv, argp->len);
          total_len += argp->len;
              sv_utf8_upgrade_nomg(sv);
          argp->p = SvPV_nomg(sv, argp->len);
          total_len += argp->len;
-        
+
          /* see if any strings would grow if converted to utf8 */
          if (!utf8) {
              variant += variant_under_utf8_count((U8 *) argp->p,
          /* see if any strings would grow if converted to utf8 */
          if (!utf8) {
              variant += variant_under_utf8_count((U8 *) argp->p,
@@ -3431,7 +3499,7 @@ S_maybe_multiconcat(pTHX_ OP *o)
              lastkidop = pmop;
      }
  
              lastkidop = pmop;
      }
  
-    /* Optimise 
+    /* Optimise
       *    target  = A.B.C...
       *    target .= A.B.C...
       */
       *    target  = A.B.C...
       *    target .= A.B.C...
       */
@@ -3913,25 +3981,6 @@ S_finalize_op(pTHX_ OP* o)
      } while (( o = traverse_op_tree(top, o)) != NULL);
  }
  
      } while (( o = traverse_op_tree(top, o)) != NULL);
  }
  
-/*
-=for apidoc op_lvalue
-
-Propagate lvalue ("modifiable") context to an op and its children.
-C<type> represents the context type, roughly based on the type of op that
-would do the modifying, although C<local()> is represented by C<OP_NULL>,
-because it has no op type of its own (it is signalled by a flag on
-the lvalue op).
-
-This function detects things that can't be modified, such as C<$x+1>, and
-generates errors for them.  For example, C<$x+1 = 2> would cause it to be
-called with an op of type C<OP_ADD> and a C<type> argument of C<OP_SASSIGN>.
-
-It also flags things that need to behave specially in an lvalue context,
-such as C<$$x = 5> which might have to vivify a reference in C<$x>.
-
-=cut
-*/
-
  static void
  S_mark_padname_lvalue(pTHX_ PADNAME *pn)
  {
  static void
  S_mark_padname_lvalue(pTHX_ PADNAME *pn)
  {
@@ -3969,126 +4018,160 @@ S_vivifies(const OPCODE type)
      return 0;
  }
  
      return 0;
  }
  
+
+/* apply lvalue reference (aliasing) context to the optree o.
+ * E.g. in
+ *     \($x,$y) = (...)
+ * o would be the list ($x,$y) and type would be OP_AASSIGN.
+ * It may descend and apply this to children too, for example in
+ * \( $cond ? $x : $y) = (...)
+ */
+
  static void
  S_lvref(pTHX_ OP *o, I32 type)
  {
      dVAR;
      OP *kid;
  static void
  S_lvref(pTHX_ OP *o, I32 type)
  {
      dVAR;
      OP *kid;
-    switch (o->op_type) {
-    case OP_COND_EXPR:
-       for (kid = OpSIBLING(cUNOPo->op_first); kid;
-            kid = OpSIBLING(kid))
-           S_lvref(aTHX_ kid, type);
-       /* FALLTHROUGH */
-    case OP_PUSHMARK:
-       return;
-    case OP_RV2AV:
-       if (cUNOPo->op_first->op_type != OP_GV) goto badref;
-       o->op_flags |= OPf_STACKED;
-       if (o->op_flags & OPf_PARENS) {
-           if (o->op_private & OPpLVAL_INTRO) {
-                yyerror(Perl_form(aTHX_ "Can't modify reference to "
-                     "localized parenthesized array in list assignment"));
-               return;
-           }
-         slurpy:
-            OpTYPE_set(o, OP_LVAVREF);
-           o->op_private &= OPpLVAL_INTRO|OPpPAD_STATE;
-           o->op_flags |= OPf_MOD|OPf_REF;
-           return;
-       }
-       o->op_private |= OPpLVREF_AV;
-       goto checkgv;
-    case OP_RV2CV:
-       kid = cUNOPo->op_first;
-       if (kid->op_type == OP_NULL)
-           kid = cUNOPx(OpSIBLING(kUNOP->op_first))
-               ->op_first;
-       o->op_private = OPpLVREF_CV;
-       if (kid->op_type == OP_GV)
-           o->op_flags |= OPf_STACKED;
-       else if (kid->op_type == OP_PADCV) {
-           o->op_targ = kid->op_targ;
-           kid->op_targ = 0;
-           op_free(cUNOPo->op_first);
-           cUNOPo->op_first = NULL;
-           o->op_flags &=~ OPf_KIDS;
-       }
-       else goto badref;
-       break;
-    case OP_RV2HV:
-       if (o->op_flags & OPf_PARENS) {
-         parenhash:
-           yyerror(Perl_form(aTHX_ "Can't modify reference to "
-                                "parenthesized hash in list assignment"));
-               return;
-       }
-       o->op_private |= OPpLVREF_HV;
-       /* FALLTHROUGH */
-    case OP_RV2SV:
-      checkgv:
-       if (cUNOPo->op_first->op_type != OP_GV) goto badref;
-       o->op_flags |= OPf_STACKED;
-       break;
-    case OP_PADHV:
-       if (o->op_flags & OPf_PARENS) goto parenhash;
-       o->op_private |= OPpLVREF_HV;
-       /* FALLTHROUGH */
-    case OP_PADSV:
-       PAD_COMPNAME_GEN_set(o->op_targ, PERL_INT_MAX);
-       break;
-    case OP_PADAV:
-       PAD_COMPNAME_GEN_set(o->op_targ, PERL_INT_MAX);
-       if (o->op_flags & OPf_PARENS) goto slurpy;
-       o->op_private |= OPpLVREF_AV;
-       break;
-    case OP_AELEM:
-    case OP_HELEM:
-       o->op_private |= OPpLVREF_ELEM;
-       o->op_flags   |= OPf_STACKED;
-       break;
-    case OP_ASLICE:
-    case OP_HSLICE:
-        OpTYPE_set(o, OP_LVREFSLICE);
-       o->op_private &= OPpLVAL_INTRO;
-       return;
-    case OP_NULL:
-       if (o->op_flags & OPf_SPECIAL)          /* do BLOCK */
-           goto badref;
-       else if (!(o->op_flags & OPf_KIDS))
-           return;
-       if (o->op_targ != OP_LIST) {
-           S_lvref(aTHX_ cBINOPo->op_first, type);
-           return;
-       }
-       /* FALLTHROUGH */
-    case OP_LIST:
-       for (kid = cLISTOPo->op_first; kid; kid = OpSIBLING(kid)) {
-           assert((kid->op_flags & OPf_WANT) != OPf_WANT_VOID);
-           S_lvref(aTHX_ kid, type);
-       }
-       return;
-    case OP_STUB:
-       if (o->op_flags & OPf_PARENS)
-           return;
-       /* FALLTHROUGH */
-    default:
-      badref:
-       /* diag_listed_as: Can't modify reference to %s in %s assignment */
-       yyerror(Perl_form(aTHX_ "Can't modify reference to %s in %s",
-                    o->op_type == OP_NULL && o->op_flags & OPf_SPECIAL
-                     ? "do block"
-                     : OP_DESC(o),
-                    PL_op_desc[type]));
-       return;
-    }
-    OpTYPE_set(o, OP_LVREF);
-    o->op_private &=
-       OPpLVAL_INTRO|OPpLVREF_ELEM|OPpLVREF_TYPE|OPpPAD_STATE;
-    if (type == OP_ENTERLOOP)
-       o->op_private |= OPpLVREF_ITER;
+    OP * top_op = o;
+
+    while (1) {
+        switch (o->op_type) {
+        case OP_COND_EXPR:
+            o = OpSIBLING(cUNOPo->op_first);
+            continue;
+
+        case OP_PUSHMARK:
+            goto do_next;
+
+        case OP_RV2AV:
+            if (cUNOPo->op_first->op_type != OP_GV) goto badref;
+            o->op_flags |= OPf_STACKED;
+            if (o->op_flags & OPf_PARENS) {
+                if (o->op_private & OPpLVAL_INTRO) {
+                     yyerror(Perl_form(aTHX_ "Can't modify reference to "
+                          "localized parenthesized array in list assignment"));
+                    goto do_next;
+                }
+              slurpy:
+                OpTYPE_set(o, OP_LVAVREF);
+                o->op_private &= OPpLVAL_INTRO|OPpPAD_STATE;
+                o->op_flags |= OPf_MOD|OPf_REF;
+                goto do_next;
+            }
+            o->op_private |= OPpLVREF_AV;
+            goto checkgv;
+
+        case OP_RV2CV:
+            kid = cUNOPo->op_first;
+            if (kid->op_type == OP_NULL)
+                kid = cUNOPx(OpSIBLING(kUNOP->op_first))
+                    ->op_first;
+            o->op_private = OPpLVREF_CV;
+            if (kid->op_type == OP_GV)
+                o->op_flags |= OPf_STACKED;
+            else if (kid->op_type == OP_PADCV) {
+                o->op_targ = kid->op_targ;
+                kid->op_targ = 0;
+                op_free(cUNOPo->op_first);
+                cUNOPo->op_first = NULL;
+                o->op_flags &=~ OPf_KIDS;
+            }
+            else goto badref;
+            break;
+
+        case OP_RV2HV:
+            if (o->op_flags & OPf_PARENS) {
+              parenhash:
+                yyerror(Perl_form(aTHX_ "Can't modify reference to "
+                                     "parenthesized hash in list assignment"));
+                    goto do_next;
+            }
+            o->op_private |= OPpLVREF_HV;
+            /* FALLTHROUGH */
+        case OP_RV2SV:
+          checkgv:
+            if (cUNOPo->op_first->op_type != OP_GV) goto badref;
+            o->op_flags |= OPf_STACKED;
+            break;
+
+        case OP_PADHV:
+            if (o->op_flags & OPf_PARENS) goto parenhash;
+            o->op_private |= OPpLVREF_HV;
+            /* FALLTHROUGH */
+        case OP_PADSV:
+            PAD_COMPNAME_GEN_set(o->op_targ, PERL_INT_MAX);
+            break;
+
+        case OP_PADAV:
+            PAD_COMPNAME_GEN_set(o->op_targ, PERL_INT_MAX);
+            if (o->op_flags & OPf_PARENS) goto slurpy;
+            o->op_private |= OPpLVREF_AV;
+            break;
+
+        case OP_AELEM:
+        case OP_HELEM:
+            o->op_private |= OPpLVREF_ELEM;
+            o->op_flags   |= OPf_STACKED;
+            break;
+
+        case OP_ASLICE:
+        case OP_HSLICE:
+            OpTYPE_set(o, OP_LVREFSLICE);
+            o->op_private &= OPpLVAL_INTRO;
+            goto do_next;
+
+        case OP_NULL:
+            if (o->op_flags & OPf_SPECIAL)             /* do BLOCK */
+                goto badref;
+            else if (!(o->op_flags & OPf_KIDS))
+                goto do_next;
+
+            /* The code formerly only recursed into the first child of
+             * a non ex-list OP_NULL. If we ever encounter such a null op with
+             * more than one child, we need to decide whether it's OK to
+             * process *all* its kids or not. */
+            assert(o->op_targ == OP_LIST
+                    || !(OpHAS_SIBLING(cBINOPo->op_first)));
+            /* FALLTHROUGH */
+        case OP_LIST:
+            o = cLISTOPo->op_first;
+            continue;
+
+        case OP_STUB:
+            if (o->op_flags & OPf_PARENS)
+                goto do_next;
+            /* FALLTHROUGH */
+        default:
+          badref:
+            /* diag_listed_as: Can't modify reference to %s in %s assignment */
+            yyerror(Perl_form(aTHX_ "Can't modify reference to %s in %s",
+                         o->op_type == OP_NULL && o->op_flags & OPf_SPECIAL
+                          ? "do block"
+                          : OP_DESC(o),
+                         PL_op_desc[type]));
+            goto do_next;
+        }
+
+        OpTYPE_set(o, OP_LVREF);
+        o->op_private &=
+            OPpLVAL_INTRO|OPpLVREF_ELEM|OPpLVREF_TYPE|OPpPAD_STATE;
+        if (type == OP_ENTERLOOP)
+            o->op_private |= OPpLVREF_ITER;
+
+      do_next:
+        while (1) {
+            if (o == top_op)
+                return; /* at top; no parents/siblings to try */
+            if (OpHAS_SIBLING(o)) {
+                o = o->op_sibparent;
+                break;
+            }
+            o = o->op_sibparent; /* try parent's next sibling */
+        }
+    } /* while */
  }
  
  }
  
+
  PERL_STATIC_INLINE bool
  S_potential_mod_type(I32 type)
  {
  PERL_STATIC_INLINE bool
  S_potential_mod_type(I32 type)
  {
@@ -4097,35 +4180,69 @@ S_potential_mod_type(I32 type)
         || type == OP_REFGEN    || type == OP_LEAVESUBLV;
  }
  
         || type == OP_REFGEN    || type == OP_LEAVESUBLV;
  }
  
+
+/*
+=for apidoc op_lvalue
+
+Propagate lvalue ("modifiable") context to an op and its children.
+C<type> represents the context type, roughly based on the type of op that
+would do the modifying, although C<local()> is represented by C<OP_NULL>,
+because it has no op type of its own (it is signalled by a flag on
+the lvalue op).
+
+This function detects things that can't be modified, such as C<$x+1>, and
+generates errors for them.  For example, C<$x+1 = 2> would cause it to be
+called with an op of type C<OP_ADD> and a C<type> argument of C<OP_SASSIGN>.
+
+It also flags things that need to behave specially in an lvalue context,
+such as C<$$x = 5> which might have to vivify a reference in C<$x>.
+
+=cut
+
+Perl_op_lvalue_flags() is a non-API lower-level interface to
+op_lvalue().  The flags param has these bits:
+    OP_LVALUE_NO_CROAK:  return rather than croaking on error
+
+*/
+
  OP *
  Perl_op_lvalue_flags(pTHX_ OP *o, I32 type, U32 flags)
  {
      dVAR;
  OP *
  Perl_op_lvalue_flags(pTHX_ OP *o, I32 type, U32 flags)
  {
      dVAR;
-    OP *kid;
-    /* -1 = error on localize, 0 = ignore localize, 1 = ok to localize */
-    int localize = -1;
+    OP *top_op = o;
  
      if (!o || (PL_parser && PL_parser->error_count))
         return o;
  
  
      if (!o || (PL_parser && PL_parser->error_count))
         return o;
  
+    while (1) {
+    OP *kid;
+    /* -1 = error on localize, 0 = ignore localize, 1 = ok to localize */
+    int localize = -1;
+    OP *next_kid = NULL;
+
      if ((o->op_private & OPpTARGET_MY)
         && (PL_opargs[o->op_type] & OA_TARGLEX))/* OPp share the meaning */
      {
      if ((o->op_private & OPpTARGET_MY)
         && (PL_opargs[o->op_type] & OA_TARGLEX))/* OPp share the meaning */
      {
-       return o;
+       goto do_next;
      }
  
      }
  
-    assert( (o->op_flags & OPf_WANT) != OPf_WANT_VOID );
+    /* elements of a list might be in void context because the list is
+       in scalar context or because they are attribute sub calls */
+    if ((o->op_flags & OPf_WANT) == OPf_WANT_VOID)
+        goto do_next;
  
      if (type == OP_PRTF || type == OP_SPRINTF) type = OP_ENTERSUB;
  
      switch (o->op_type) {
      case OP_UNDEF:
         PL_modcount++;
  
      if (type == OP_PRTF || type == OP_SPRINTF) type = OP_ENTERSUB;
  
      switch (o->op_type) {
      case OP_UNDEF:
         PL_modcount++;
-       return o;
+       goto do_next;
+
      case OP_STUB:
         if ((o->op_flags & OPf_PARENS))
             break;
         goto nomod;
      case OP_STUB:
         if ((o->op_flags & OPf_PARENS))
             break;
         goto nomod;
+
      case OP_ENTERSUB:
         if ((type == OP_UNDEF || type == OP_REFGEN || type == OP_LOCK) &&
             !(o->op_flags & OPf_STACKED)) {
      case OP_ENTERSUB:
         if ((type == OP_UNDEF || type == OP_REFGEN || type == OP_LOCK) &&
             !(o->op_flags & OPf_STACKED)) {
@@ -4191,7 +4308,7 @@ Perl_op_lvalue_flags(pTHX_ OP *o, I32 type, U32 flags)
                                       "subroutine call of &%" SVf " in %s",
                                       SVfARG(namesv), PL_op_desc[type]),
                             SvUTF8(namesv));
                                       "subroutine call of &%" SVf " in %s",
                                       SVfARG(namesv), PL_op_desc[type]),
                             SvUTF8(namesv));
-                return o;
+                goto do_next;
             }
         }
         /* FALLTHROUGH */
             }
         }
         /* FALLTHROUGH */
@@ -4206,7 +4323,7 @@ Perl_op_lvalue_flags(pTHX_ OP *o, I32 type, U32 flags)
                       ? "do block"
                       : OP_DESC(o)),
                      type ? PL_op_desc[type] : "local"));
                       ? "do block"
                       : OP_DESC(o)),
                      type ? PL_op_desc[type] : "local"));
-       return o;
+       goto do_next;
  
      case OP_PREINC:
      case OP_PREDEC:
  
      case OP_PREINC:
      case OP_PREDEC:
@@ -4241,6 +4358,12 @@ Perl_op_lvalue_flags(pTHX_ OP *o, I32 type, U32 flags)
             goto nomod;
         else {
             const I32 mods = PL_modcount;
             goto nomod;
         else {
             const I32 mods = PL_modcount;
+            /* we recurse rather than iterate here because we need to
+             * calculate and use the delta applied to PL_modcount by the
+             * first child. So in something like
+             *     ($x, ($y) x 3) = split;
+             * split knows that 4 elements are wanted
+             */
             modkids(cBINOPo->op_first, type);
             if (type != OP_AASSIGN)
                 goto nomod;
             modkids(cBINOPo->op_first, type);
             if (type != OP_AASSIGN)
                 goto nomod;
@@ -4258,8 +4381,7 @@ Perl_op_lvalue_flags(pTHX_ OP *o, I32 type, U32 flags)
  
      case OP_COND_EXPR:
         localize = 1;
  
      case OP_COND_EXPR:
         localize = 1;
-       for (kid = OpSIBLING(cUNOPo->op_first); kid; kid = OpSIBLING(kid))
-           op_lvalue(kid, type);
+        next_kid = OpSIBLING(cUNOPo->op_first);
         break;
  
      case OP_RV2AV:
         break;
  
      case OP_RV2AV:
@@ -4269,7 +4391,7 @@ Perl_op_lvalue_flags(pTHX_ OP *o, I32 type, U32 flags)
             /* Treat \(@foo) like ordinary list, but still mark it as modi-
                fiable since some contexts need to know.  */
             o->op_flags |= OPf_MOD;
             /* Treat \(@foo) like ordinary list, but still mark it as modi-
                fiable since some contexts need to know.  */
             o->op_flags |= OPf_MOD;
-           return o;
+           goto do_next;
         }
         /* FALLTHROUGH */
      case OP_RV2GV:
         }
         /* FALLTHROUGH */
      case OP_RV2GV:
@@ -4293,23 +4415,27 @@ Perl_op_lvalue_flags(pTHX_ OP *o, I32 type, U32 flags)
      case OP_DBSTATE:
         PL_modcount = RETURN_UNLIMITED_NUMBER;
         break;
      case OP_DBSTATE:
         PL_modcount = RETURN_UNLIMITED_NUMBER;
         break;
+
      case OP_KVHSLICE:
      case OP_KVASLICE:
      case OP_AKEYS:
         if (type == OP_LEAVESUBLV)
             o->op_private |= OPpMAYBE_LVSUB;
          goto nomod;
      case OP_KVHSLICE:
      case OP_KVASLICE:
      case OP_AKEYS:
         if (type == OP_LEAVESUBLV)
             o->op_private |= OPpMAYBE_LVSUB;
          goto nomod;
+
      case OP_AVHVSWITCH:
         if (type == OP_LEAVESUBLV
          && (o->op_private & OPpAVHVSWITCH_MASK) + OP_EACH == OP_KEYS)
             o->op_private |= OPpMAYBE_LVSUB;
          goto nomod;
      case OP_AVHVSWITCH:
         if (type == OP_LEAVESUBLV
          && (o->op_private & OPpAVHVSWITCH_MASK) + OP_EACH == OP_KEYS)
             o->op_private |= OPpMAYBE_LVSUB;
          goto nomod;
+
      case OP_AV2ARYLEN:
         PL_hints |= HINT_BLOCK_SCOPE;
         if (type == OP_LEAVESUBLV)
             o->op_private |= OPpMAYBE_LVSUB;
         PL_modcount++;
         break;
      case OP_AV2ARYLEN:
         PL_hints |= HINT_BLOCK_SCOPE;
         if (type == OP_LEAVESUBLV)
             o->op_private |= OPpMAYBE_LVSUB;
         PL_modcount++;
         break;
+
      case OP_RV2SV:
         ref(cUNOPo->op_first, o->op_type);
         localize = 1;
      case OP_RV2SV:
         ref(cUNOPo->op_first, o->op_type);
         localize = 1;
@@ -4338,7 +4464,7 @@ Perl_op_lvalue_flags(pTHX_ OP *o, I32 type, U32 flags)
             /* Treat \(@foo) like ordinary list, but still mark it as modi-
                fiable since some contexts need to know.  */
             o->op_flags |= OPf_MOD;
             /* Treat \(@foo) like ordinary list, but still mark it as modi-
                fiable since some contexts need to know.  */
             o->op_flags |= OPf_MOD;
-           return o;
+           goto do_next;
         }
         if (scalar_mod_type(o, type))
             goto nomod;
         }
         if (scalar_mod_type(o, type))
             goto nomod;
@@ -4375,6 +4501,9 @@ Perl_op_lvalue_flags(pTHX_ OP *o, I32 type, U32 flags)
         if (type == OP_LEAVESUBLV)
             o->op_private |= OPpMAYBE_LVSUB;
         if (o->op_flags & OPf_KIDS && OpHAS_SIBLING(cBINOPo->op_first)) {
         if (type == OP_LEAVESUBLV)
             o->op_private |= OPpMAYBE_LVSUB;
         if (o->op_flags & OPf_KIDS && OpHAS_SIBLING(cBINOPo->op_first)) {
+            /* we recurse rather than iterate here because the child
+             * needs to be processed with a different 'type' parameter */
+
             /* substr and vec */
             /* If this op is in merely potential (non-fatal) modifiable
                context, then apply OP_ENTERSUB context to
             /* substr and vec */
             /* If this op is in merely potential (non-fatal) modifiable
                context, then apply OP_ENTERSUB context to
@@ -4409,7 +4538,7 @@ Perl_op_lvalue_flags(pTHX_ OP *o, I32 type, U32 flags)
      case OP_LINESEQ:
         localize = 0;
         if (o->op_flags & OPf_KIDS)
      case OP_LINESEQ:
         localize = 0;
         if (o->op_flags & OPf_KIDS)
-           op_lvalue(cLISTOPo->op_last, type);
+           next_kid = cLISTOPo->op_last;
         break;
  
      case OP_NULL:
         break;
  
      case OP_NULL:
@@ -4442,30 +4571,31 @@ Perl_op_lvalue_flags(pTHX_ OP *o, I32 type, U32 flags)
                  /* this should trigger a "Can't modify transliteration" err */
                  op_lvalue(sib, type);
              }
                  /* this should trigger a "Can't modify transliteration" err */
                  op_lvalue(sib, type);
              }
-            op_lvalue(cBINOPo->op_first, type);
+            next_kid = cBINOPo->op_first;
+            /* we assume OP_NULLs which aren't ex-list have no more than 2
+             * children. If this assumption is wrong, increase the scan
+             * limit below */
+            assert(   !OpHAS_SIBLING(next_kid)
+                   || !OpHAS_SIBLING(OpSIBLING(next_kid)));
              break;
         }
         /* FALLTHROUGH */
      case OP_LIST:
         localize = 0;
              break;
         }
         /* FALLTHROUGH */
      case OP_LIST:
         localize = 0;
-       for (kid = cLISTOPo->op_first; kid; kid = OpSIBLING(kid))
-           /* elements might be in void context because the list is
-              in scalar context or because they are attribute sub calls */
-           if ( (kid->op_flags & OPf_WANT) != OPf_WANT_VOID )
-               op_lvalue(kid, type);
+       next_kid = cLISTOPo->op_first;
         break;
  
      case OP_COREARGS:
         break;
  
      case OP_COREARGS:
-       return o;
+       goto do_next;
  
      case OP_AND:
      case OP_OR:
         if (type == OP_LEAVESUBLV
          || !S_vivifies(cLOGOPo->op_first->op_type))
  
      case OP_AND:
      case OP_OR:
         if (type == OP_LEAVESUBLV
          || !S_vivifies(cLOGOPo->op_first->op_type))
-           op_lvalue(cLOGOPo->op_first, type);
-       if (type == OP_LEAVESUBLV
+           next_kid = cLOGOPo->op_first;
+       else if (type == OP_LEAVESUBLV
          || !S_vivifies(OpSIBLING(cLOGOPo->op_first)->op_type))
          || !S_vivifies(OpSIBLING(cLOGOPo->op_first)->op_type))
-           op_lvalue(OpSIBLING(cLOGOPo->op_first), type);
+           next_kid = OpSIBLING(cLOGOPo->op_first);
         goto nomod;
  
      case OP_SREFGEN:
         goto nomod;
  
      case OP_SREFGEN:
@@ -4477,8 +4607,8 @@ Perl_op_lvalue_flags(pTHX_ OP *o, I32 type, U32 flags)
             Perl_ck_warner_d(aTHX_
                      packWARN(WARN_EXPERIMENTAL__DECLARED_REFS),
                     "Declaring references is experimental");
             Perl_ck_warner_d(aTHX_
                      packWARN(WARN_EXPERIMENTAL__DECLARED_REFS),
                     "Declaring references is experimental");
-           op_lvalue(cUNOPo->op_first, OP_NULL);
-           return o;
+           next_kid = cUNOPo->op_first;
+           goto do_next;
         }
         if (type != OP_AASSIGN && type != OP_SASSIGN
          && type != OP_ENTERLOOP)
         }
         if (type != OP_AASSIGN && type != OP_SASSIGN
          && type != OP_ENTERLOOP)
@@ -4508,7 +4638,7 @@ Perl_op_lvalue_flags(pTHX_ OP *o, I32 type, U32 flags)
         if (o->op_type == OP_REFGEN)
             op_null(cUNOPx(cUNOPo->op_first)->op_first); /* pushmark */
         op_null(o);
         if (o->op_type == OP_REFGEN)
             op_null(cUNOPx(cUNOPo->op_first)->op_first); /* pushmark */
         op_null(o);
-       return o;
+       goto do_next;
  
      case OP_SPLIT:
          if ((o->op_private & OPpSPLIT_ASSIGN)) {
  
      case OP_SPLIT:
          if ((o->op_private & OPpSPLIT_ASSIGN)) {
@@ -4527,7 +4657,7 @@ Perl_op_lvalue_flags(pTHX_ OP *o, I32 type, U32 flags)
         their argument is a filehandle; thus \stat(".") should not set
         it. AMS 20011102 */
      if (type == OP_REFGEN && OP_IS_STAT(o->op_type))
         their argument is a filehandle; thus \stat(".") should not set
         it. AMS 20011102 */
      if (type == OP_REFGEN && OP_IS_STAT(o->op_type))
-        return o;
+        goto do_next;
  
      if (type != OP_LEAVESUBLV)
          o->op_flags |= OPf_MOD;
  
      if (type != OP_LEAVESUBLV)
          o->op_flags |= OPf_MOD;
@@ -4552,9 +4682,40 @@ Perl_op_lvalue_flags(pTHX_ OP *o, I32 type, U32 flags)
      else if (type != OP_GREPSTART && type != OP_ENTERSUB
               && type != OP_LEAVESUBLV && o->op_type != OP_ENTERSUB)
         o->op_flags |= OPf_REF;
      else if (type != OP_GREPSTART && type != OP_ENTERSUB
               && type != OP_LEAVESUBLV && o->op_type != OP_ENTERSUB)
         o->op_flags |= OPf_REF;
-    return o;
+
+  do_next:
+    while (!next_kid) {
+        if (o == top_op)
+            return top_op; /* at top; no parents/siblings to try */
+        if (OpHAS_SIBLING(o)) {
+            next_kid = o->op_sibparent;
+            if (!OpHAS_SIBLING(next_kid)) {
+                /* a few node types don't recurse into their second child */
+                OP *parent = next_kid->op_sibparent;
+                I32 ptype  = parent->op_type;
+                if (   (ptype == OP_NULL && parent->op_targ != OP_LIST)
+                    || (   (ptype == OP_AND || ptype == OP_OR)
+                        && (type != OP_LEAVESUBLV 
+                            && S_vivifies(next_kid->op_type))
+                       )
+                )  {
+                    /*try parent's next sibling */
+                    o = parent;
+                    next_kid =  NULL;
+                }
+            }
+        }
+        else
+            o = o->op_sibparent; /*try parent's next sibling */
+
+    }
+    o = next_kid;
+
+    } /* while */
+
  }
  
  }
  
+
  STATIC bool
  S_scalar_mod_type(const OP *o, I32 type)
  {
  STATIC bool
  S_scalar_mod_type(const OP *o, I32 type)
  {
@@ -4649,104 +4810,143 @@ S_refkids(pTHX_ OP *o, I32 type)
      return o;
  }
  
      return o;
  }
  
+
+/* Apply reference (autovivification) context to the subtree at o.
+ * For example in
+ *     push @{expression}, ....;
+ * o will be the head of 'expression' and type will be OP_RV2AV.
+ * It marks the op o (or a suitable child) as autovivifying, e.g. by
+ * setting  OPf_MOD.
+ * For OP_RV2AV/OP_PADAV and OP_RV2HV/OP_PADHV it sets OPf_REF too if
+ * set_op_ref is true.
+ *
+ * Also calls scalar(o).
+ */
+
  OP *
  Perl_doref(pTHX_ OP *o, I32 type, bool set_op_ref)
  {
      dVAR;
  OP *
  Perl_doref(pTHX_ OP *o, I32 type, bool set_op_ref)
  {
      dVAR;
-    OP *kid;
+    OP * top_op = o;
  
      PERL_ARGS_ASSERT_DOREF;
  
      if (PL_parser && PL_parser->error_count)
         return o;
  
  
      PERL_ARGS_ASSERT_DOREF;
  
      if (PL_parser && PL_parser->error_count)
         return o;
  
-    switch (o->op_type) {
-    case OP_ENTERSUB:
-       if ((type == OP_EXISTS || type == OP_DEFINED) &&
-           !(o->op_flags & OPf_STACKED)) {
-            OpTYPE_set(o, OP_RV2CV);             /* entersub => rv2cv */
-           assert(cUNOPo->op_first->op_type == OP_NULL);
-           op_null(((LISTOP*)cUNOPo->op_first)->op_first);     /* disable pushmark */
-           o->op_flags |= OPf_SPECIAL;
-       }
-       else if (type == OP_RV2SV || type == OP_RV2AV || type == OP_RV2HV){
-           o->op_private |= (type == OP_RV2AV ? OPpDEREF_AV
-                             : type == OP_RV2HV ? OPpDEREF_HV
-                             : OPpDEREF_SV);
-           o->op_flags |= OPf_MOD;
-       }
+    while (1) {
+        switch (o->op_type) {
+        case OP_ENTERSUB:
+            if ((type == OP_EXISTS || type == OP_DEFINED) &&
+                !(o->op_flags & OPf_STACKED)) {
+                OpTYPE_set(o, OP_RV2CV);             /* entersub => rv2cv */
+                assert(cUNOPo->op_first->op_type == OP_NULL);
+                /* disable pushmark */
+                op_null(((LISTOP*)cUNOPo->op_first)->op_first);
+                o->op_flags |= OPf_SPECIAL;
+            }
+            else if (type == OP_RV2SV || type == OP_RV2AV || type == OP_RV2HV){
+                o->op_private |= (type == OP_RV2AV ? OPpDEREF_AV
+                                  : type == OP_RV2HV ? OPpDEREF_HV
+                                  : OPpDEREF_SV);
+                o->op_flags |= OPf_MOD;
+            }
  
  
-       break;
+            break;
  
  
-    case OP_COND_EXPR:
-       for (kid = OpSIBLING(cUNOPo->op_first); kid; kid = OpSIBLING(kid))
-           doref(kid, type, set_op_ref);
-       break;
-    case OP_RV2SV:
-       if (type == OP_DEFINED)
-           o->op_flags |= OPf_SPECIAL;         /* don't create GV */
-       doref(cUNOPo->op_first, o->op_type, set_op_ref);
-       /* FALLTHROUGH */
-    case OP_PADSV:
-       if (type == OP_RV2SV || type == OP_RV2AV || type == OP_RV2HV) {
-           o->op_private |= (type == OP_RV2AV ? OPpDEREF_AV
-                             : type == OP_RV2HV ? OPpDEREF_HV
-                             : OPpDEREF_SV);
-           o->op_flags |= OPf_MOD;
-       }
-       break;
+        case OP_COND_EXPR:
+            o = OpSIBLING(cUNOPo->op_first);
+            continue;
  
  
-    case OP_RV2AV:
-    case OP_RV2HV:
-       if (set_op_ref)
-           o->op_flags |= OPf_REF;
-       /* FALLTHROUGH */
-    case OP_RV2GV:
-       if (type == OP_DEFINED)
-           o->op_flags |= OPf_SPECIAL;         /* don't create GV */
-       doref(cUNOPo->op_first, o->op_type, set_op_ref);
-       break;
+        case OP_RV2SV:
+            if (type == OP_DEFINED)
+                o->op_flags |= OPf_SPECIAL;            /* don't create GV */
+            /* FALLTHROUGH */
+        case OP_PADSV:
+            if (type == OP_RV2SV || type == OP_RV2AV || type == OP_RV2HV) {
+                o->op_private |= (type == OP_RV2AV ? OPpDEREF_AV
+                                  : type == OP_RV2HV ? OPpDEREF_HV
+                                  : OPpDEREF_SV);
+                o->op_flags |= OPf_MOD;
+            }
+            if (o->op_flags & OPf_KIDS) {
+                type = o->op_type;
+                o = cUNOPo->op_first;
+                continue;
+            }
+            break;
  
  
-    case OP_PADAV:
-    case OP_PADHV:
-       if (set_op_ref)
-           o->op_flags |= OPf_REF;
-       break;
+        case OP_RV2AV:
+        case OP_RV2HV:
+            if (set_op_ref)
+                o->op_flags |= OPf_REF;
+            /* FALLTHROUGH */
+        case OP_RV2GV:
+            if (type == OP_DEFINED)
+                o->op_flags |= OPf_SPECIAL;            /* don't create GV */
+            type = o->op_type;
+            o = cUNOPo->op_first;
+            continue;
  
  
-    case OP_SCALAR:
-    case OP_NULL:
-       if (!(o->op_flags & OPf_KIDS) || type == OP_DEFINED)
-           break;
-       doref(cBINOPo->op_first, type, set_op_ref);
-       break;
-    case OP_AELEM:
-    case OP_HELEM:
-       doref(cBINOPo->op_first, o->op_type, set_op_ref);
-       if (type == OP_RV2SV || type == OP_RV2AV || type == OP_RV2HV) {
-           o->op_private |= (type == OP_RV2AV ? OPpDEREF_AV
-                             : type == OP_RV2HV ? OPpDEREF_HV
-                             : OPpDEREF_SV);
-           o->op_flags |= OPf_MOD;
-       }
-       break;
+        case OP_PADAV:
+        case OP_PADHV:
+            if (set_op_ref)
+                o->op_flags |= OPf_REF;
+            break;
  
  
-    case OP_SCOPE:
-    case OP_LEAVE:
-       set_op_ref = FALSE;
-       /* FALLTHROUGH */
-    case OP_ENTER:
-    case OP_LIST:
-       if (!(o->op_flags & OPf_KIDS))
-           break;
-       doref(cLISTOPo->op_last, type, set_op_ref);
-       break;
-    default:
-       break;
-    }
-    return scalar(o);
+        case OP_SCALAR:
+        case OP_NULL:
+            if (!(o->op_flags & OPf_KIDS) || type == OP_DEFINED)
+                break;
+             o = cBINOPo->op_first;
+            continue;
  
  
+        case OP_AELEM:
+        case OP_HELEM:
+            if (type == OP_RV2SV || type == OP_RV2AV || type == OP_RV2HV) {
+                o->op_private |= (type == OP_RV2AV ? OPpDEREF_AV
+                                  : type == OP_RV2HV ? OPpDEREF_HV
+                                  : OPpDEREF_SV);
+                o->op_flags |= OPf_MOD;
+            }
+            type = o->op_type;
+            o = cBINOPo->op_first;
+            continue;;
+
+        case OP_SCOPE:
+        case OP_LEAVE:
+            set_op_ref = FALSE;
+            /* FALLTHROUGH */
+        case OP_ENTER:
+        case OP_LIST:
+            if (!(o->op_flags & OPf_KIDS))
+                break;
+            o = cLISTOPo->op_last;
+            continue;
+
+        default:
+            break;
+        } /* switch */
+
+        while (1) {
+            if (o == top_op)
+                return scalar(top_op); /* at top; no parents/siblings to try */
+            if (OpHAS_SIBLING(o)) {
+                o = o->op_sibparent;
+                /* Normally skip all siblings and go straight to the parent;
+                 * the only op that requires two children to be processed
+                 * is OP_COND_EXPR */
+                if (!OpHAS_SIBLING(o)
+                        && o->op_sibparent->op_type == OP_COND_EXPR)
+                    break;
+                continue;
+            }
+            o = o->op_sibparent; /*try parent's next sibling */
+        }
+    } /* while */
  }
  
  }
  
+
  STATIC OP *
  S_dup_attrlist(pTHX_ OP *o)
  {
  STATIC OP *
  S_dup_attrlist(pTHX_ OP *o)
  {
@@ -5126,7 +5326,7 @@ Perl_my_attrs(pTHX_ OP *o, OP *attrs)
             /* The listop in rops might have a pushmark at the beginning,
                which will mess up list assignment. */
             LISTOP * const lrops = (LISTOP *)rops; /* for brevity */
             /* The listop in rops might have a pushmark at the beginning,
                which will mess up list assignment. */
             LISTOP * const lrops = (LISTOP *)rops; /* for brevity */
-           if (rops->op_type == OP_LIST && 
+           if (rops->op_type == OP_LIST &&
                 lrops->op_first && lrops->op_first->op_type == OP_PUSHMARK)
             {
                 OP * const pushmark = lrops->op_first;
                 lrops->op_first && lrops->op_first->op_type == OP_PUSHMARK)
             {
                 OP * const pushmark = lrops->op_first;
@@ -5268,7 +5468,8 @@ Perl_op_scope(pTHX_ OP *o)
      dVAR;
      if (o) {
         if (o->op_flags & OPf_PARENS || PERLDB_NOOPT || TAINTING_get) {
      dVAR;
      if (o) {
         if (o->op_flags & OPf_PARENS || PERLDB_NOOPT || TAINTING_get) {
-           o = op_prepend_elem(OP_LINESEQ, newOP(OP_ENTER, 0), o);
+           o = op_prepend_elem(OP_LINESEQ,
+                    newOP(OP_ENTER, (o->op_flags & OPf_WANT)), o);
              OpTYPE_set(o, OP_LEAVE);
         }
         else if (o->op_type == OP_LINESEQ) {
              OpTYPE_set(o, OP_LEAVE);
         }
         else if (o->op_type == OP_LINESEQ) {
@@ -6513,25 +6714,44 @@ Perl_newBINOP(pTHX_ I32 type, I32 flags, OP *first, OP *last)
      return fold_constants(op_integerize(op_std_init((OP *)binop)));
  }
  
      return fold_constants(op_integerize(op_std_init((OP *)binop)));
  }
  
-/* Helper function for S_pmtrans(): comparison function to sort an array
- * of codepoint range pairs. Sorts by start point, or if equal, by end
- * point */
-
-static int uvcompare(const void *a, const void *b)
-    __attribute__nonnull__(1)
-    __attribute__nonnull__(2)
-    __attribute__pure__;
-static int uvcompare(const void *a, const void *b)
+void
+Perl_invmap_dump(pTHX_ SV* invlist, UV *map)
  {
  {
-    if (*((const UV *)a) < (*(const UV *)b))
-       return -1;
-    if (*((const UV *)a) > (*(const UV *)b))
-       return 1;
-    if (*((const UV *)a+1) < (*(const UV *)b+1))
-       return -1;
-    if (*((const UV *)a+1) > (*(const UV *)b+1))
-       return 1;
-    return 0;
+    const char indent[] = "    ";
+
+    UV len = _invlist_len(invlist);
+    UV * array = invlist_array(invlist);
+    UV i;
+
+    PERL_ARGS_ASSERT_INVMAP_DUMP;
+
+    for (i = 0; i < len; i++) {
+        UV start = array[i];
+        UV end   = (i + 1 < len) ? array[i+1] - 1 : IV_MAX;
+
+        PerlIO_printf(Perl_debug_log, "%s[%" UVuf "] 0x%04" UVXf, indent, i, start);
+        if (end == IV_MAX) {
+            PerlIO_printf(Perl_debug_log, " .. INFTY");
+       }
+       else if (end != start) {
+            PerlIO_printf(Perl_debug_log, " .. 0x%04" UVXf, end);
+       }
+        else {
+            PerlIO_printf(Perl_debug_log, "            ");
+        }
+
+        PerlIO_printf(Perl_debug_log, "\t");
+
+        if (map[i] == TR_UNLISTED) {
+            PerlIO_printf(Perl_debug_log, "TR_UNLISTED\n");
+        }
+        else if (map[i] == TR_SPECIAL_HANDLING) {
+            PerlIO_printf(Perl_debug_log, "TR_SPECIAL_HANDLING\n");
+        }
+        else {
+            PerlIO_printf(Perl_debug_log, "0x%04" UVXf "\n", map[i]);
+        }
+    }
  }
  
  /* Given an OP_TRANS / OP_TRANSR op o, plus OP_CONST ops expr and repl
  }
  
  /* Given an OP_TRANS / OP_TRANSR op o, plus OP_CONST ops expr and repl
@@ -6543,350 +6763,1073 @@ static int uvcompare(const void *a, const void *b)
   *   OPpTRANS_SQUASH
   *   OPpTRANS_DELETE
   * flags as appropriate; this function may add
   *   OPpTRANS_SQUASH
   *   OPpTRANS_DELETE
   * flags as appropriate; this function may add
- *   OPpTRANS_FROM_UTF
- *   OPpTRANS_TO_UTF
+ *   OPpTRANS_USE_SVOP
+ *   OPpTRANS_CAN_FORCE_UTF8
   *   OPpTRANS_IDENTICAL
   *   OPpTRANS_GROWS
   * flags
   */
  
   *   OPpTRANS_IDENTICAL
   *   OPpTRANS_GROWS
   * flags
   */
  
-static OP *
-S_pmtrans(pTHX_ OP *o, OP *expr, OP *repl)
-{
-    SV * const tstr = ((SVOP*)expr)->op_sv;
-    SV * const rstr = ((SVOP*)repl)->op_sv;
-    STRLEN tlen;
-    STRLEN rlen;
-    const U8 *t = (U8*)SvPV_const(tstr, tlen);
-    const U8 *r = (U8*)SvPV_const(rstr, rlen);
-    Size_t i, j;
-    bool grows = FALSE;
-    OPtrans_map *tbl;
-    SSize_t struct_size; /* malloced size of table struct */
+static OP *
+S_pmtrans(pTHX_ OP *o, OP *expr, OP *repl)
+{
+    /* This function compiles a tr///, from data gathered from toke.c, into a
+     * form suitable for use by do_trans() in doop.c at runtime.
+     *
+     * It first normalizes the data, while discarding extraneous inputs; then
+     * writes out the compiled data.  The normalization allows for complete
+     * analysis, and avoids some false negatives and positives earlier versions
+     * of this code had.
+     *
+     * The normalization form is an inversion map (described below in detail).
+     * This is essentially the compiled form for tr///'s that require UTF-8,
+     * and it's easy to use it to write the 257-byte table for tr///'s that
+     * don't need UTF-8.  That table is identical to what's been in use for
+     * many perl versions, except that it doesn't handle some edge cases that
+     * it used to, involving code points above 255.  The UTF-8 form now handles
+     * these.  (This could be changed with extra coding should it be shown to
+     * be desirable.)
+     *
+     * If the complement (/c) option is specified, the lhs string (tstr) is
+     * parsed into an inversion list.  Complementing these is trivial.  Then a
+     * complemented tstr is built from that, and used thenceforth.  This hides
+     * the fact that it was complemented from almost all successive code.
+     *
+     * One of the important characteristics to know about the input is whether
+     * the transliteration may be done in place, or does a temporary need to be
+     * allocated, then copied.  If the replacement for every character in every
+     * possible string takes up no more bytes than the character it
+     * replaces, then it can be edited in place.  Otherwise the replacement
+     * could "grow", depending on the strings being processed.  Some inputs
+     * won't grow, and might even shrink under /d, but some inputs could grow,
+     * so we have to assume any given one might grow.  On very long inputs, the
+     * temporary could eat up a lot of memory, so we want to avoid it if
+     * possible.  For non-UTF-8 inputs, everything is single-byte, so can be
+     * edited in place, unless there is something in the pattern that could
+     * force it into UTF-8.  The inversion map makes it feasible to determine
+     * this.  Previous versions of this code pretty much punted on determining
+     * if UTF-8 could be edited in place.  Now, this code is rigorous in making
+     * that determination.
+     *
+     * Another characteristic we need to know is whether the lhs and rhs are
+     * identical.  If so, and no other flags are present, the only effect of
+     * the tr/// is to count the characters present in the input that are
+     * mentioned in the lhs string.  The implementation of that is easier and
+     * runs faster than the more general case.  Normalizing here allows for
+     * accurate determination of this.  Previously there were false negatives
+     * possible.
+     *
+     * Instead of 'transliterated', the comments here use 'unmapped' for the
+     * characters that are left unchanged by the operation; otherwise they are
+     * 'mapped'
+     *
+     * The lhs of the tr/// is here referred to as the t side.
+     * The rhs of the tr/// is here referred to as the r side.
+     */
+
+    SV * const tstr = ((SVOP*)expr)->op_sv;
+    SV * const rstr = ((SVOP*)repl)->op_sv;
+    STRLEN tlen;
+    STRLEN rlen;
+    const U8 * t0 = (U8*)SvPV_const(tstr, tlen);
+    const U8 * r0 = (U8*)SvPV_const(rstr, rlen);
+    const U8 * t = t0;
+    const U8 * r = r0;
+    UV t_count = 0, r_count = 0;  /* Number of characters in search and
+                                         replacement lists */
+
+    /* khw thinks some of the private flags for this op are quaintly named.
+     * OPpTRANS_GROWS for example is TRUE if the replacement for some lhs
+     * character when represented in UTF-8 is longer than the original
+     * character's UTF-8 representation */
+    const bool complement = cBOOL(o->op_private & OPpTRANS_COMPLEMENT);
+    const bool squash     = cBOOL(o->op_private & OPpTRANS_SQUASH);
+    const bool del        = cBOOL(o->op_private & OPpTRANS_DELETE);
+
+    /* Set to true if there is some character < 256 in the lhs that maps to >
+     * 255.  If so, a non-UTF-8 match string can be forced into requiring to be
+     * in UTF-8 by a tr/// operation. */
+    bool can_force_utf8 = FALSE;
+
+    /* What is the maximum expansion factor in UTF-8 transliterations.  If a
+     * 2-byte UTF-8 encoded character is to be replaced by a 3-byte one, its
+     * expansion factor is 1.5.  This number is used at runtime to calculate
+     * how much space to allocate for non-inplace transliterations.  Without
+     * this number, the worst case is 14, which is extremely unlikely to happen
+     * in real life, and would require significant memory overhead. */
+    NV max_expansion = 1.;
+
+    UV t_range_count, r_range_count, min_range_count;
+    UV* t_array;
+    SV* t_invlist;
+    UV* r_map;
+    UV r_cp, t_cp;
+    UV t_cp_end = (UV) -1;
+    UV r_cp_end;
+    Size_t len;
+    AV* invmap;
+    UV final_map = TR_UNLISTED;    /* The final character in the replacement
+                                      list, updated as we go along.  Initialize
+                                      to something illegal */
+
+    bool rstr_utf8 = cBOOL(SvUTF8(rstr));
+    bool tstr_utf8 = cBOOL(SvUTF8(tstr));
+
+    const U8* tend = t + tlen;
+    const U8* rend = r + rlen;
+
+    SV * inverted_tstr = NULL;
+
+    Size_t i;
+    unsigned int pass2;
+
+    /* This routine implements detection of a transliteration having a longer
+     * UTF-8 representation than its source, by partitioning all the possible
+     * code points of the platform into equivalence classes of the same UTF-8
+     * byte length in the first pass.  As it constructs the mappings, it carves
+     * these up into smaller chunks, but doesn't merge any together.  This
+     * makes it easy to find the instances it's looking for.  A second pass is
+     * done after this has been determined which merges things together to
+     * shrink the table for runtime.  For ASCII platforms, the table is
+     * trivial, given below, and uses the fundamental characteristics of UTF-8
+     * to construct the values.  For EBCDIC, it isn't so, and we rely on a
+     * table constructed by the perl script that generates these kinds of
+     * things */
+#ifndef EBCDIC
+    UV PL_partition_by_byte_length[] = {
+        0,
+        0x80,
+        (32 * (1UL << (    UTF_ACCUMULATION_SHIFT))),
+        (16 * (1UL << (2 * UTF_ACCUMULATION_SHIFT))),
+        ( 8 * (1UL << (3 * UTF_ACCUMULATION_SHIFT))),
+        ( 4 * (1UL << (4 * UTF_ACCUMULATION_SHIFT))),
+        ( 2 * (1UL << (5 * UTF_ACCUMULATION_SHIFT)))
+
+#  ifdef UV_IS_QUAD
+                                                    ,
+        ( ((UV) 1U << (6 * UTF_ACCUMULATION_SHIFT)))
+#  endif
+
+    };
+
+#endif
+
+    PERL_ARGS_ASSERT_PMTRANS;
+
+    PL_hints |= HINT_BLOCK_SCOPE;
+
+    /* If /c, the search list is sorted and complemented.  This is now done by
+     * creating an inversion list from it, and then trivially inverting that.
+     * The previous implementation used qsort, but creating the list
+     * automatically keeps it sorted as we go along */
+    if (complement) {
+        UV start, end;
+        SV * inverted_tlist = _new_invlist(tlen);
+        Size_t temp_len;
+
+        DEBUG_y(PerlIO_printf(Perl_debug_log,
+                    "%s: %d: tstr before inversion=\n%s\n",
+                    __FILE__, __LINE__, _byte_dump_string(t, tend - t, 0)));
+
+        while (t < tend) {
+
+            /* Non-utf8 strings don't have ranges, so each character is listed
+             * out */
+            if (! tstr_utf8) {
+                inverted_tlist = add_cp_to_invlist(inverted_tlist, *t);
+                t++;
+            }
+            else {  /* But UTF-8 strings have been parsed in toke.c to have
+                 * ranges if appropriate. */
+                UV t_cp;
+                Size_t t_char_len;
+
+                /* Get the first character */
+                t_cp = valid_utf8_to_uvchr(t, &t_char_len);
+                t += t_char_len;
+
+                /* If the next byte indicates that this wasn't the first
+                 * element of a range, the range is just this one */
+                if (t >= tend || *t != RANGE_INDICATOR) {
+                    inverted_tlist = add_cp_to_invlist(inverted_tlist, t_cp);
+                }
+                else { /* Otherwise, ignore the indicator byte, and get the
+                          final element, and add the whole range */
+                    t++;
+                    t_cp_end = valid_utf8_to_uvchr(t, &t_char_len);
+                    t += t_char_len;
+
+                    inverted_tlist = _add_range_to_invlist(inverted_tlist,
+                                                      t_cp, t_cp_end);
+                }
+            }
+        } /* End of parse through tstr */
+
+        /* The inversion list is done; now invert it */
+        _invlist_invert(inverted_tlist);
+
+        /* Now go through the inverted list and create a new tstr for the rest
+         * of the routine to use.  Since the UTF-8 version can have ranges, and
+         * can be much more compact than the non-UTF-8 version, we create the
+         * string in UTF-8 even if not necessary.  (This is just an intermediate
+         * value that gets thrown away anyway.) */
+        invlist_iterinit(inverted_tlist);
+        inverted_tstr = newSVpvs("");
+        while (invlist_iternext(inverted_tlist, &start, &end)) {
+            U8 temp[UTF8_MAXBYTES];
+            U8 * temp_end_pos;
+
+            /* IV_MAX keeps things from going out of bounds */
+            start = MIN(IV_MAX, start);
+            end   = MIN(IV_MAX, end);
+
+            temp_end_pos = uvchr_to_utf8(temp, start);
+            sv_catpvn(inverted_tstr, (char *) temp, temp_end_pos - temp);
+
+            if (start != end) {
+                Perl_sv_catpvf(aTHX_ inverted_tstr, "%c", RANGE_INDICATOR);
+                temp_end_pos = uvchr_to_utf8(temp, end);
+                sv_catpvn(inverted_tstr, (char *) temp, temp_end_pos - temp);
+            }
+        }
+
+        /* Set up so the remainder of the routine uses this complement, instead
+         * of the actual input */
+        t0 = t = (U8*)SvPV_const(inverted_tstr, temp_len);
+        tend = t0 + temp_len;
+        tstr_utf8 = TRUE;
+
+        SvREFCNT_dec_NN(inverted_tlist);
+    }
+
+    /* For non-/d, an empty rhs means to use the lhs */
+    if (rlen == 0 && ! del) {
+        r0 = t0;
+        rend = tend;
+        rstr_utf8  = tstr_utf8;
+    }
+
+    t_invlist = _new_invlist(1);
+
+    /* Parse the (potentially adjusted) input, creating the inversion map.
+     * This is done in two passes.  The first pass is to determine if the
+     * transliteration can be done in place.  The inversion map it creates
+     * could be used, but generally would be larger and slower to run than the
+     * output of the second pass, which starts with a more compact table and
+     * allows more ranges to be merged */
+    for (pass2 = 0; pass2 < 2; pass2++) {
+
+        /* Initialize to a single range */
+        t_invlist = _add_range_to_invlist(t_invlist, 0, UV_MAX);
+
+        /* In the second pass, we just have the single range */
+
+        if (pass2) {
+            len = 1;
+            t_array = invlist_array(t_invlist);
+        }
+        else {
+
+            /* But in the first pass, the lhs is partitioned such that the
+             * number of UTF-8 bytes required to represent a code point in each
+             * partition is the same as the number for any other code point in
+             * that partition.  We copy the pre-compiled partition. */
+            len = C_ARRAY_LENGTH(PL_partition_by_byte_length);
+            invlist_extend(t_invlist, len);
+            t_array = invlist_array(t_invlist);
+            Copy(PL_partition_by_byte_length, t_array, len, UV);
+            invlist_set_len(t_invlist,
+                            len,
+                            *(get_invlist_offset_addr(t_invlist)));
+            Newx(r_map, len + 1, UV);
+        }
+
+        /* And the mapping of each of the ranges is initialized.  Initially,
+         * everything is TR_UNLISTED. */
+        for (i = 0; i < len; i++) {
+            r_map[i] = TR_UNLISTED;
+        }
+
+        t = t0;
+        t_count = 0;
+        r = r0;
+        r_count = 0;
+        t_range_count = r_range_count = 0;
+
+        DEBUG_y(PerlIO_printf(Perl_debug_log, "%s: %d:\ntstr=%s\n",
+                    __FILE__, __LINE__, _byte_dump_string(t, tend - t, 0)));
+        DEBUG_y(PerlIO_printf(Perl_debug_log, "rstr=%s\n",
+                                        _byte_dump_string(r, rend - r, 0)));
+        DEBUG_y(PerlIO_printf(Perl_debug_log, "/c=%d; /s=%d; /d=%d\n",
+                                                  complement, squash, del));
+        DEBUG_y(invmap_dump(t_invlist, r_map));
+
+        /* Now go through the search list constructing an inversion map.  The
+         * input is not necessarily in any particular order.  Making it an
+         * inversion map orders it, potentially simplifying, and makes it easy
+         * to deal with at run time.  This is the only place in core that
+         * generates an inversion map; if others were introduced, it might be
+         * better to create general purpose routines to handle them.
+         * (Inversion maps are created in perl in other places.)
+         *
+         * An inversion map consists of two parallel arrays.  One is
+         * essentially an inversion list: an ordered list of code points such
+         * that each element gives the first code point of a range of
+         * consecutive code points that map to the element in the other array
+         * that has the same index as this one (in other words, the
+         * corresponding element).  Thus the range extends up to (but not
+         * including) the code point given by the next higher element.  In a
+         * true inversion map, the corresponding element in the other array
+         * gives the mapping of the first code point in the range, with the
+         * understanding that the next higher code point in the inversion
+         * list's range will map to the next higher code point in the map.
+         *
+         * So if at element [i], let's say we have:
+         *
+         *     t_invlist  r_map
+         * [i]    A         a
+         *
+         * This means that A => a, B => b, C => c....  Let's say that the
+         * situation is such that:
+         *
+         * [i+1]  L        -1
+         *
+         * This means the sequence that started at [i] stops at K => k.  This
+         * illustrates that you need to look at the next element to find where
+         * a sequence stops.  Except, the highest element in the inversion list
+         * begins a range that is understood to extend to the platform's
+         * infinity.
+         *
+         * This routine modifies traditional inversion maps to reserve two
+         * mappings:
+         *
+         *  TR_UNLISTED (or -1) indicates that no code point in the range
+         *      is listed in the tr/// searchlist.  At runtime, these are
+         *      always passed through unchanged.  In the inversion map, all
+         *      points in the range are mapped to -1, instead of increasing,
+         *      like the 'L' in the example above.
+         *
+         *      We start the parse with every code point mapped to this, and as
+         *      we parse and find ones that are listed in the search list, we
+         *      carve out ranges as we go along that override that.
+         *
+         *  TR_SPECIAL_HANDLING (or -2) indicates that every code point in the
+         *      range needs special handling.  Again, all code points in the
+         *      range are mapped to -2, instead of increasing.
+         *
+         *      Under /d this value means the code point should be deleted from
+         *      the transliteration when encountered.
+         *
+         *      Otherwise, it marks that every code point in the range is to
+         *      map to the final character in the replacement list.  This
+         *      happens only when the replacement list is shorter than the
+         *      search one, so there are things in the search list that have no
+         *      correspondence in the replacement list.  For example, in
+         *      tr/a-z/A/, 'A' is the final value, and the inversion map
+         *      generated for this would be like this:
+         *          \0  =>  -1
+         *          a   =>   A
+         *          b-z =>  -2
+         *          z+1 =>  -1
+         *      'A' appears once, then the remainder of the range maps to -2.
+         *      The use of -2 isn't strictly necessary, as an inversion map is
+         *      capable of representing this situation, but not nearly so
+         *      compactly, and this is actually quite commonly encountered.
+         *      Indeed, the original design of this code used a full inversion
+         *      map for this.  But things like
+         *          tr/\0-\x{FFFF}/A/
+         *      generated huge data structures, slowly, and the execution was
+         *      also slow.  So the current scheme was implemented.
+         *
+         *  So, if the next element in our example is:
+         *
+         * [i+2]  Q        q
+         *
+         * Then all of L, M, N, O, and P map to TR_UNLISTED.  If the next
+         * elements are
+         *
+         * [i+3]  R        z
+         * [i+4]  S       TR_UNLISTED
+         *
+         * Then Q => q; R => z; and S => TR_UNLISTED.  If [i+4] (the 'S') is
+         * the final element in the arrays, every code point from S to infinity
+         * maps to TR_UNLISTED.
+         *
+         */
+                           /* Finish up range started in what otherwise would
+                            * have been the final iteration */
+        while (t < tend || t_range_count > 0) {
+            bool adjacent_to_range_above = FALSE;
+            bool adjacent_to_range_below = FALSE;
+
+            bool merge_with_range_above = FALSE;
+            bool merge_with_range_below = FALSE;
+
+            UV span, invmap_range_length_remaining;
+            SSize_t j;
+            Size_t i;
+
+            /* If we are in the middle of processing a range in the 'target'
+             * side, the previous iteration has set us up.  Otherwise, look at
+             * the next character in the search list */
+            if (t_range_count <= 0) {
+                if (! tstr_utf8) {
+
+                    /* Here, not in the middle of a range, and not UTF-8.  The
+                     * next code point is the single byte where we're at */
+                    t_cp = *t;
+                    t_range_count = 1;
+                    t++;
+                }
+                else {
+                    Size_t t_char_len;
+
+                    /* Here, not in the middle of a range, and is UTF-8.  The
+                     * next code point is the next UTF-8 char in the input.  We
+                     * know the input is valid, because the toker constructed
+                     * it */
+                    t_cp = valid_utf8_to_uvchr(t, &t_char_len);
+                    t += t_char_len;
+
+                    /* UTF-8 strings (only) have been parsed in toke.c to have
+                     * ranges.  See if the next byte indicates that this was
+                     * the first element of a range.  If so, get the final
+                     * element and calculate the range size.  If not, the range
+                     * size is 1 */
+                    if (t < tend && *t == RANGE_INDICATOR) {
+                        t++;
+                        t_range_count = valid_utf8_to_uvchr(t, &t_char_len)
+                                      - t_cp + 1;
+                        t += t_char_len;
+                    }
+                    else {
+                        t_range_count = 1;
+                    }
+                }
+
+                /* Count the total number of listed code points */
+                t_count += t_range_count;
+            }
+
+            /* Similarly, get the next character in the replacement list */
+            if (r_range_count <= 0) {
+                if (r >= rend) {
+
+                    /* But if we've exhausted the rhs, there is nothing to map
+                     * to, except the special handling one, and we make the
+                     * range the same size as the lhs one. */
+                    r_cp = TR_SPECIAL_HANDLING;
+                    r_range_count = t_range_count;
+
+                    if (! del) {
+                        DEBUG_yv(PerlIO_printf(Perl_debug_log,
+                                        "final_map =%" UVXf "\n", final_map));
+                    }
+                }
+                else {
+                    if (! rstr_utf8) {
+                        r_cp = *r;
+                        r_range_count = 1;
+                        r++;
+                    }
+                    else {
+                        Size_t r_char_len;
+
+                        r_cp = valid_utf8_to_uvchr(r, &r_char_len);
+                        r += r_char_len;
+                        if (r < rend && *r == RANGE_INDICATOR) {
+                            r++;
+                            r_range_count = valid_utf8_to_uvchr(r,
+                                                    &r_char_len) - r_cp + 1;
+                            r += r_char_len;
+                        }
+                        else {
+                            r_range_count = 1;
+                        }
+                    }
+
+                    if (r_cp == TR_SPECIAL_HANDLING) {
+                        r_range_count = t_range_count;
+                    }
+
+                    /* This is the final character so far */
+                    final_map = r_cp + r_range_count - 1;
+
+                    r_count += r_range_count;
+                }
+            }
+
+            /* Here, we have the next things ready in both sides.  They are
+             * potentially ranges.  We try to process as big a chunk as
+             * possible at once, but the lhs and rhs must be synchronized, so
+             * things like tr/A-Z/a-ij-z/ will need to be processed in 2 chunks
+             * */
+            min_range_count = MIN(t_range_count, r_range_count);
+
+            /* Search the inversion list for the entry that contains the input
+             * code point <cp>.  The inversion map was initialized to cover the
+             * entire range of possible inputs, so this should not fail.  So
+             * the return value is the index into the list's array of the range
+             * that contains <cp>, that is, 'i' such that array[i] <= cp <
+             * array[i+1] */
+            j = _invlist_search(t_invlist, t_cp);
+            assert(j >= 0);
+            i = j;
+
+            /* Here, the data structure might look like:
+             *
+             * index    t   r     Meaning
+             * [i-1]    J   j   # J-L => j-l
+             * [i]      M  -1   # M => default; as do N, O, P, Q
+             * [i+1]    R   x   # R => x, S => x+1, T => x+2
+             * [i+2]    U   y   # U => y, V => y+1, ...
+             * ...
+             * [-1]     Z  -1   # Z => default; as do Z+1, ... infinity
+             *
+             * where 'x' and 'y' above are not to be taken literally.
+             *
+             * The maximum chunk we can handle in this loop iteration, is the
+             * smallest of the three components: the lhs 't_', the rhs 'r_',
+             * and the remainder of the range in element [i].  (In pass 1, that
+             * range will have everything in it be of the same class; we can't
+             * cross into another class.)  'min_range_count' already contains
+             * the smallest of the first two values.  The final one is
+             * irrelevant if the map is to the special indicator */
+
+            invmap_range_length_remaining = (i + 1 < len)
+                                            ? t_array[i+1] - t_cp
+                                            : IV_MAX - t_cp;
+            span = MAX(1, MIN(min_range_count, invmap_range_length_remaining));
+
+            /* The end point of this chunk is where we are, plus the span, but
+             * never larger than the platform's infinity */
+            t_cp_end = MIN(IV_MAX, t_cp + span - 1);
+
+            if (r_cp == TR_SPECIAL_HANDLING) {
+                r_cp_end = TR_SPECIAL_HANDLING;
+            }
+            else {
+                r_cp_end = MIN(IV_MAX, r_cp + span - 1);
+
+                /* If something on the lhs is below 256, and something on the
+                 * rhs is above, there is a potential mapping here across that
+                 * boundary.  Indeed the only way there isn't is if both sides
+                 * start at the same point.  That means they both cross at the
+                 * same time.  But otherwise one crosses before the other */
+                if (t_cp < 256 && r_cp_end > 255 && r_cp != t_cp) {
+                    can_force_utf8 = TRUE;
+                }
+            }
+
+            /* If a character appears in the search list more than once, the
+             * 2nd and succeeding occurrences are ignored, so only do this
+             * range if haven't already processed this character.  (The range
+             * has been set up so that all members in it will be of the same
+             * ilk) */
+            if (r_map[i] == TR_UNLISTED) {
+                DEBUG_yv(PerlIO_printf(Perl_debug_log,
+                    "Processing %" UVxf "-%" UVxf " => %" UVxf "-%" UVxf "\n",
+                    t_cp, t_cp_end, r_cp, r_cp_end));
+
+                /* This is the first definition for this chunk, hence is valid
+                 * and needs to be processed.  Here and in the comments below,
+                 * we use the above sample data.  The t_cp chunk must be any
+                 * contiguous subset of M, N, O, P, and/or Q.
+                 *
+                 * In the first pass, the t_invlist has been partitioned so
+                 * that all elements in any single range have the same number
+                 * of bytes in their UTF-8 representations.  And the r space is
+                 * either a single byte, or a range of strictly monotonically
+                 * increasing code points.  So the final element in the range
+                 * will be represented by no fewer bytes than the initial one.
+                 * That means that if the final code point in the t range has
+                 * at least as many bytes as the final code point in the r,
+                 * then all code points in the t range have at least as many
+                 * bytes as their corresponding r range element.  But if that's
+                 * not true, the transliteration of at least the final code
+                 * point grows in length.  As an example, suppose we had
+                 *      tr/\x{fff0}-\x{fff1}/\x{ffff}-\x{10000}/
+                 * The UTF-8 for all but 10000 occupies 3 bytes on ASCII
+                 * platforms.  We have deliberately set up the data structure
+                 * so that any range in the lhs gets split into chunks for
+                 * processing, such that every code point in a chunk has the
+                 * same number of UTF-8 bytes.  We only have to check the final
+                 * code point in the rhs against any code point in the lhs. */
+                if ( ! pass2
+                    && r_cp_end != TR_SPECIAL_HANDLING
+                    && UVCHR_SKIP(t_cp_end) < UVCHR_SKIP(r_cp_end))
+                {
+                    /* Consider tr/\xCB/\x{E000}/.  The maximum expansion
+                     * factor is 1 byte going to 3 if the lhs is not UTF-8, but
+                     * 2 bytes going to 3 if it is in UTF-8.  We could pass two
+                     * different values so doop could choose based on the
+                     * UTF-8ness of the target.  But khw thinks (perhaps
+                     * wrongly) that is overkill.  It is used only to make sure
+                     * we malloc enough space.  If no target string can force
+                     * the result to be UTF-8, then we don't have to worry
+                     * about this */
+                    NV t_size = (can_force_utf8 && t_cp < 256)
+                                ? 1
+                                : UVCHR_SKIP(t_cp_end);
+                    NV ratio = UVCHR_SKIP(r_cp_end) / t_size;
+
+                    o->op_private |= OPpTRANS_GROWS;
+
+                    /* Now that we know it grows, we can keep track of the
+                     * largest ratio */
+                    if (ratio > max_expansion) {
+                        max_expansion = ratio;
+                        DEBUG_y(PerlIO_printf(Perl_debug_log,
+                                        "New expansion factor: %" NVgf "\n",
+                                        max_expansion));
+                    }
+                }
+
+                /* The very first range is marked as adjacent to the
+                 * non-existent range below it, as it causes things to "just
+                 * work" (TradeMark)
+                 *
+                 * If the lowest code point in this chunk is M, it adjoins the
+                 * J-L range */
+                if (t_cp == t_array[i]) {
+                    adjacent_to_range_below = TRUE;
+
+                    /* And if the map has the same offset from the beginning of
+                     * the range as does this new code point (or both are for
+                     * TR_SPECIAL_HANDLING), this chunk can be completely
+                     * merged with the range below.  EXCEPT, in the first pass,
+                     * we don't merge ranges whose UTF-8 byte representations
+                     * have different lengths, so that we can more easily
+                     * detect if a replacement is longer than the source, that
+                     * is if it 'grows'.  But in the 2nd pass, there's no
+                     * reason to not merge */
+                    if (   (i > 0 && (   pass2
+                                      || UVCHR_SKIP(t_array[i-1])
+                                                        == UVCHR_SKIP(t_cp)))
+                        && (   (   r_cp == TR_SPECIAL_HANDLING
+                                && r_map[i-1] == TR_SPECIAL_HANDLING)
+                            || (   r_cp != TR_SPECIAL_HANDLING
+                                && r_cp - r_map[i-1] == t_cp - t_array[i-1])))
+                    {
+                        merge_with_range_below = TRUE;
+                    }
+                }
+
+                /* Similarly, if the highest code point in this chunk is 'Q',
+                 * it adjoins the range above, and if the map is suitable, can
+                 * be merged with it */
+                if (    t_cp_end >= IV_MAX - 1
+                    || (   i + 1 < len
+                        && t_cp_end + 1 == t_array[i+1]))
+                {
+                    adjacent_to_range_above = TRUE;
+                    if (i + 1 < len)
+                    if (    (   pass2
+                             || UVCHR_SKIP(t_cp) == UVCHR_SKIP(t_array[i+1]))
+                        && (   (   r_cp == TR_SPECIAL_HANDLING
+                                && r_map[i+1] == (UV) TR_SPECIAL_HANDLING)
+                            || (   r_cp != TR_SPECIAL_HANDLING
+                                && r_cp_end == r_map[i+1] - 1)))
+                    {
+                        merge_with_range_above = TRUE;
+                    }
+                }
+
+                if (merge_with_range_below && merge_with_range_above) {
+
+                    /* Here the new chunk looks like M => m, ... Q => q; and
+                     * the range above is like R => r, ....  Thus, the [i-1]
+                     * and [i+1] ranges should be seamlessly melded so the
+                     * result looks like
+                     *
+                     * [i-1]    J   j   # J-T => j-t
+                     * [i]      U   y   # U => y, V => y+1, ...
+                     * ...
+                     * [-1]     Z  -1   # Z => default; as do Z+1, ... infinity
+                     */
+                    Move(t_array + i + 2, t_array + i, len - i - 2, UV);
+                    Move(r_map   + i + 2, r_map   + i, len - i - 2, UV);
+                    len -= 2;
+                    invlist_set_len(t_invlist,
+                                    len,
+                                    *(get_invlist_offset_addr(t_invlist)));
+                }
+                else if (merge_with_range_below) {
+
+                    /* Here the new chunk looks like M => m, .... But either
+                     * (or both) it doesn't extend all the way up through Q; or
+                     * the range above doesn't start with R => r. */
+                    if (! adjacent_to_range_above) {
+
+                        /* In the first case, let's say the new chunk extends
+                         * through O.  We then want:
+                         *
+                         * [i-1]    J   j   # J-O => j-o
+                         * [i]      P  -1   # P => -1, Q => -1
+                         * [i+1]    R   x   # R => x, S => x+1, T => x+2
+                         * [i+2]    U   y   # U => y, V => y+1, ...
+                         * ...
+                         * [-1]     Z  -1   # Z => default; as do Z+1, ...
+                         *                                            infinity
+                         */
+                        t_array[i] = t_cp_end + 1;
+                        r_map[i] = TR_UNLISTED;
+                    }
+                    else { /* Adjoins the range above, but can't merge with it
+                              (because 'x' is not the next map after q) */
+                        /*
+                         * [i-1]    J   j   # J-Q => j-q
+                         * [i]      R   x   # R => x, S => x+1, T => x+2
+                         * [i+1]    U   y   # U => y, V => y+1, ...
+                         * ...
+                         * [-1]     Z  -1   # Z => default; as do Z+1, ...
+                         *                                          infinity
+                         */
  
  
-    const bool complement = cBOOL(o->op_private & OPpTRANS_COMPLEMENT);
-    const bool squash     = cBOOL(o->op_private & OPpTRANS_SQUASH);
-    const bool del        = cBOOL(o->op_private & OPpTRANS_DELETE);
-    SV* swash;
+                        Move(t_array + i + 1, t_array + i, len - i - 1, UV);
+                        Move(r_map + i + 1, r_map + i, len - i - 1, UV);
+                        len--;
+                        invlist_set_len(t_invlist, len,
+                                        *(get_invlist_offset_addr(t_invlist)));
+                    }
+                }
+                else if (merge_with_range_above) {
+
+                    /* Here the new chunk ends with Q => q, and the range above
+                     * must start with R => r, so the two can be merged. But
+                     * either (or both) the new chunk doesn't extend all the
+                     * way down to M; or the mapping of the final code point
+                     * range below isn't m */
+                    if (! adjacent_to_range_below) {
+
+                        /* In the first case, let's assume the new chunk starts
+                         * with P => p.  Then, because it's merge-able with the
+                         * range above, that range must be R => r.  We want:
+                         *
+                         * [i-1]    J   j   # J-L => j-l
+                         * [i]      M  -1   # M => -1, N => -1
+                         * [i+1]    P   p   # P-T => p-t
+                         * [i+2]    U   y   # U => y, V => y+1, ...
+                         * ...
+                         * [-1]     Z  -1   # Z => default; as do Z+1, ...
+                         *                                          infinity
+                         */
+                        t_array[i+1] = t_cp;
+                        r_map[i+1] = r_cp;
+                    }
+                    else { /* Adjoins the range below, but can't merge with it
+                            */
+                        /*
+                         * [i-1]    J   j   # J-L => j-l
+                         * [i]      M   x   # M-T => x-5 .. x+2
+                         * [i+1]    U   y   # U => y, V => y+1, ...
+                         * ...
+                         * [-1]     Z  -1   # Z => default; as do Z+1, ...
+                         *                                          infinity
+                         */
+                        Move(t_array + i + 1, t_array + i, len - i - 1, UV);
+                        Move(r_map   + i + 1, r_map   + i, len - i - 1, UV);
+                        len--;
+                        t_array[i] = t_cp;
+                        r_map[i] = r_cp;
+                        invlist_set_len(t_invlist, len,
+                                        *(get_invlist_offset_addr(t_invlist)));
+                    }
+                }
+                else if (adjacent_to_range_below && adjacent_to_range_above) {
+                    /* The new chunk completely fills the gap between the
+                     * ranges on either side, but can't merge with either of
+                     * them.
+                     *
+                     * [i-1]    J   j   # J-L => j-l
+                     * [i]      M   z   # M => z, N => z+1 ... Q => z+4
+                     * [i+1]    R   x   # R => x, S => x+1, T => x+2
+                     * [i+2]    U   y   # U => y, V => y+1, ...
+                     * ...
+                     * [-1]     Z  -1   # Z => default; as do Z+1, ... infinity
+                     */
+                    r_map[i] = r_cp;
+                }
+                else if (adjacent_to_range_below) {
+                    /* The new chunk adjoins the range below, but not the range
+                     * above, and can't merge.  Let's assume the chunk ends at
+                     * O.
+                     *
+                     * [i-1]    J   j   # J-L => j-l
+                     * [i]      M   z   # M => z, N => z+1, O => z+2
+                     * [i+1]    P   -1  # P => -1, Q => -1
+                     * [i+2]    R   x   # R => x, S => x+1, T => x+2
+                     * [i+3]    U   y   # U => y, V => y+1, ...
+                     * ...
+                     * [-1]     Z  -1   # Z => default; as do Z+1, ... infinity
+                     */
+                    invlist_extend(t_invlist, len + 1);
+                    t_array = invlist_array(t_invlist);
+                    Renew(r_map, len + 1, UV);
+
+                    Move(t_array + i + 1, t_array + i + 2, len - i - 1, UV);
+                    Move(r_map + i + 1,   r_map   + i + 2, len - i - 1, UV);
+                    r_map[i] = r_cp;
+                    t_array[i+1] = t_cp_end + 1;
+                    r_map[i+1] = TR_UNLISTED;
+                    len++;
+                    invlist_set_len(t_invlist, len,
+                                    *(get_invlist_offset_addr(t_invlist)));
+                }
+                else if (adjacent_to_range_above) {
+                    /* The new chunk adjoins the range above, but not the range
+                     * below, and can't merge.  Let's assume the new chunk
+                     * starts at O
+                     *
+                     * [i-1]    J   j   # J-L => j-l
+                     * [i]      M  -1   # M => default, N => default
+                     * [i+1]    O   z   # O => z, P => z+1, Q => z+2
+                     * [i+2]    R   x   # R => x, S => x+1, T => x+2
+                     * [i+3]    U   y   # U => y, V => y+1, ...
+                     * ...
+                     * [-1]     Z  -1   # Z => default; as do Z+1, ... infinity
+                     */
+                    invlist_extend(t_invlist, len + 1);
+                    t_array = invlist_array(t_invlist);
+                    Renew(r_map, len + 1, UV);
+
+                    Move(t_array + i + 1, t_array + i + 2, len - i - 1, UV);
+                    Move(r_map   + i + 1, r_map   + i + 2, len - i - 1, UV);
+                    t_array[i+1] = t_cp;
+                    r_map[i+1] = r_cp;
+                    len++;
+                    invlist_set_len(t_invlist, len,
+                                    *(get_invlist_offset_addr(t_invlist)));
+                }
+                else {
+                    /* The new chunk adjoins neither the range above, nor the
+                     * range below.  Let's assume it is N..P => n..p
+                     *
+                     * [i-1]    J   j   # J-L => j-l
+                     * [i]      M  -1   # M => default
+                     * [i+1]    N   n   # N..P => n..p
+                     * [i+2]    Q  -1   # Q => default
+                     * [i+3]    R   x   # R => x, S => x+1, T => x+2
+                     * [i+4]    U   y   # U => y, V => y+1, ...
+                     * ...
+                     * [-1]     Z  -1   # Z => default; as do Z+1, ... infinity
+                     */
  
  
-    PERL_ARGS_ASSERT_PMTRANS;
+                    DEBUG_yv(PerlIO_printf(Perl_debug_log,
+                                        "Before fixing up: len=%d, i=%d\n",
+                                        (int) len, (int) i));
+                    DEBUG_yv(invmap_dump(t_invlist, r_map));
  
  
-    PL_hints |= HINT_BLOCK_SCOPE;
+                    invlist_extend(t_invlist, len + 2);
+                    t_array = invlist_array(t_invlist);
+                    Renew(r_map, len + 2, UV);
  
  
-    if (SvUTF8(tstr))
-        o->op_private |= OPpTRANS_FROM_UTF;
+                    Move(t_array + i + 1,
+                         t_array + i + 2 + 1, len - i - (2 - 1), UV);
+                    Move(r_map   + i + 1,
+                         r_map   + i + 2 + 1, len - i - (2 - 1), UV);
  
  
-    if (SvUTF8(rstr))
-        o->op_private |= OPpTRANS_TO_UTF;
+                    len += 2;
+                    invlist_set_len(t_invlist, len,
+                                    *(get_invlist_offset_addr(t_invlist)));
  
  
-    if (o->op_private & (OPpTRANS_FROM_UTF|OPpTRANS_TO_UTF)) {
+                    t_array[i+1] = t_cp;
+                    r_map[i+1] = r_cp;
  
  
-        /* for utf8 translations, op_sv will be set to point to a swash
-         * containing codepoint ranges. This is done by first assembling
-         * a textual representation of the ranges in listsv then compiling
-         * it using swash_init(). For more details of the textual format,
-         * see L<perlunicode.pod/"User-Defined Character Properties"> .
-         */
+                    t_array[i+2] = t_cp_end + 1;
+                    r_map[i+2] = TR_UNLISTED;
+                }
+                DEBUG_yv(PerlIO_printf(Perl_debug_log,
+                          "After iteration: span=%" UVuf ", t_range_count=%"
+                          UVuf " r_range_count=%" UVuf "\n",
+                          span, t_range_count, r_range_count));
+                DEBUG_yv(invmap_dump(t_invlist, r_map));
+            } /* End of this chunk needs to be processed */
+
+            /* Done with this chunk. */
+            t_cp += span;
+            if (t_cp >= IV_MAX) {
+                break;
+            }
+            t_range_count -= span;
+            if (r_cp != TR_SPECIAL_HANDLING) {
+                r_cp += span;
+                r_range_count -= span;
+            }
+            else {
+                r_range_count = 0;
+            }
  
  
-       SV* const listsv = newSVpvs("# comment\n");
-       SV* transv = NULL;
-       const U8* tend = t + tlen;
-       const U8* rend = r + rlen;
-       STRLEN ulen;
-       UV tfirst = 1;
-       UV tlast = 0;
-       IV tdiff;
-       STRLEN tcount = 0;
-       UV rfirst = 1;
-       UV rlast = 0;
-       IV rdiff;
-       STRLEN rcount = 0;
-       IV diff;
-       I32 none = 0;
-       U32 max = 0;
-       I32 bits;
-       I32 havefinal = 0;
-       U32 final = 0;
-       const I32 from_utf  = o->op_private & OPpTRANS_FROM_UTF;
-       const I32 to_utf    = o->op_private & OPpTRANS_TO_UTF;
-       U8* tsave = NULL;
-       U8* rsave = NULL;
-       const U32 flags = UTF8_ALLOW_DEFAULT;
-
-       if (!from_utf) {
-           STRLEN len = tlen;
-           t = tsave = bytes_to_utf8(t, &len);
-           tend = t + len;
-       }
-       if (!to_utf && rlen) {
-           STRLEN len = rlen;
-           r = rsave = bytes_to_utf8(r, &len);
-           rend = r + len;
-       }
+        } /* End of loop through the search list */
  
  
-/* There is a snag with this code on EBCDIC: scan_const() in toke.c has
- * encoded chars in native encoding which makes ranges in the EBCDIC 0..255
- * odd.  */
+        /* We don't need an exact count, but we do need to know if there is
+         * anything left over in the replacement list.  So, just assume it's
+         * one byte per character */
+        if (rend > r) {
+            r_count++;
+        }
+    } /* End of passes */
  
  
-       if (complement) {
-            /* utf8 and /c:
-             * replace t/tlen/tend with a version that has the ranges
-             * complemented
-             */
-           U8 tmpbuf[UTF8_MAXBYTES+1];
-           UV *cp;
-           UV nextmin = 0;
-           Newx(cp, 2*tlen, UV);
-           i = 0;
-           transv = newSVpvs("");
-
-            /* convert search string into array of (start,end) range
-             * codepoint pairs stored in cp[]. Most "ranges" will start
-             * and end at the same char */
-           while (t < tend) {
-               cp[2*i] = utf8n_to_uvchr(t, tend-t, &ulen, flags);
-               t += ulen;
-                /* the toker converts X-Y into (X, ILLEGAL_UTF8_BYTE, Y) */
-               if (t < tend && *t == ILLEGAL_UTF8_BYTE) {
-                   t++;
-                   cp[2*i+1] = utf8n_to_uvchr(t, tend-t, &ulen, flags);
-                   t += ulen;
-               }
-               else {
-                cp[2*i+1] = cp[2*i];
-               }
-               i++;
-           }
+    SvREFCNT_dec(inverted_tstr);
  
  
-            /* sort the ranges */
-           qsort(cp, i, 2*sizeof(UV), uvcompare);
-
-            /* Create a utf8 string containing the complement of the
-             * codepoint ranges. For example if cp[] contains [A,B], [C,D],
-             * then transv will contain the equivalent of:
-             * join '', map chr, 0,     ILLEGAL_UTF8_BYTE, A - 1,
-             *                   B + 1, ILLEGAL_UTF8_BYTE, C - 1,
-             *                   D + 1, ILLEGAL_UTF8_BYTE, 0x7fffffff;
-             * A range of a single char skips the ILLEGAL_UTF8_BYTE and
-             * end cp.
-             */
-           for (j = 0; j < i; j++) {
-               UV  val = cp[2*j];
-               diff = val - nextmin;
-               if (diff > 0) {
-                   t = uvchr_to_utf8(tmpbuf,nextmin);
-                   sv_catpvn(transv, (char*)tmpbuf, t - tmpbuf);
-                   if (diff > 1) {
-                       U8  range_mark = ILLEGAL_UTF8_BYTE;
-                       t = uvchr_to_utf8(tmpbuf, val - 1);
-                       sv_catpvn(transv, (char *)&range_mark, 1);
-                       sv_catpvn(transv, (char*)tmpbuf, t - tmpbuf);
-                   }
-               }
-               val = cp[2*j+1];
-               if (val >= nextmin)
-                   nextmin = val + 1;
-           }
+    DEBUG_y(PerlIO_printf(Perl_debug_log, "After everything: \n"));
+    DEBUG_y(invmap_dump(t_invlist, r_map));
  
  
-           t = uvchr_to_utf8(tmpbuf,nextmin);
-           sv_catpvn(transv, (char*)tmpbuf, t - tmpbuf);
-           {
-               U8 range_mark = ILLEGAL_UTF8_BYTE;
-               sv_catpvn(transv, (char *)&range_mark, 1);
-           }
-           t = uvchr_to_utf8(tmpbuf, 0x7fffffff);
-           sv_catpvn(transv, (char*)tmpbuf, t - tmpbuf);
-           t = (const U8*)SvPVX_const(transv);
-           tlen = SvCUR(transv);
-           tend = t + tlen;
-           Safefree(cp);
-       }
-       else if (!rlen && !del) {
-           r = t; rlen = tlen; rend = tend;
-       }
+    /* We now have normalized the input into an inversion map.
+     *
+     * See if the lhs and rhs are equivalent.  If so, this tr/// is a no-op
+     * except for the count, and streamlined runtime code can be used */
+    if (!del && !squash) {
+
+        /* They are identical if they point to same address, or if everything
+         * maps to UNLISTED or to itself.  This catches things that not looking
+         * at the normalized inversion map doesn't catch, like tr/aa/ab/ or
+         * tr/\x{100}-\x{104}/\x{100}-\x{102}\x{103}-\x{104}  */
+        if (r0 != t0) {
+            for (i = 0; i < len; i++) {
+                if (r_map[i] != TR_UNLISTED && r_map[i] != t_array[i]) {
+                    goto done_identical_check;
+                }
+            }
+        }
  
  
-       if (!squash) {
-               if ((!rlen && !del) || t == r ||
-                   (tlen == rlen && memEQ((char *)t, (char *)r, tlen)))
-               {
-                   o->op_private |= OPpTRANS_IDENTICAL;
-               }
-       }
+        /* Here have gone through entire list, and didn't find any
+         * non-identical mappings */
+        o->op_private |= OPpTRANS_IDENTICAL;
  
  
-        /* extract char ranges from t and r and append them to listsv */
-
-       while (t < tend || tfirst <= tlast) {
-           /* see if we need more "t" chars */
-           if (tfirst > tlast) {
-               tfirst = (I32)utf8n_to_uvchr(t, tend - t, &ulen, flags);
-               t += ulen;
-               if (t < tend && *t == ILLEGAL_UTF8_BYTE) {      /* illegal utf8 val indicates range */
-                   t++;
-                   tlast = (I32)utf8n_to_uvchr(t, tend - t, &ulen, flags);
-                   t += ulen;
-               }
-               else
-                   tlast = tfirst;
-           }
+      done_identical_check: ;
+    }
  
  
-           /* now see if we need more "r" chars */
-           if (rfirst > rlast) {
-               if (r < rend) {
-                   rfirst = (I32)utf8n_to_uvchr(r, rend - r, &ulen, flags);
-                   r += ulen;
-                   if (r < rend && *r == ILLEGAL_UTF8_BYTE) {  /* illegal utf8 val indicates range */
-                       r++;
-                       rlast = (I32)utf8n_to_uvchr(r, rend - r, &ulen, flags);
-                       r += ulen;
-                   }
-                   else
-                       rlast = rfirst;
-               }
-               else {
-                   if (!havefinal++)
-                       final = rlast;
-                   rfirst = rlast = 0xffffffff;
-               }
-           }
+    t_array = invlist_array(t_invlist);
  
  
-           /* now see which range will peter out first, if either. */
-           tdiff = tlast - tfirst;
-           rdiff = rlast - rfirst;
-           tcount += tdiff + 1;
-           rcount += rdiff + 1;
+    /* If has components above 255, we generally need to use the inversion map
+     * implementation */
+    if (   can_force_utf8
+        || (   len > 0
+            && t_array[len-1] > 255
+                 /* If the final range is 0x100-INFINITY and is a special
+                  * mapping, the table implementation can handle it */
+            && ! (   t_array[len-1] == 256
+                  && (   r_map[len-1] == TR_UNLISTED
+                      || r_map[len-1] == TR_SPECIAL_HANDLING))))
+    {
+        SV* r_map_sv;
  
  
-           if (tdiff <= rdiff)
-               diff = tdiff;
-           else
-               diff = rdiff;
+        /* A UTF-8 op is generated, indicated by this flag.  This op is an
+         * sv_op */
+        o->op_private |= OPpTRANS_USE_SVOP;
  
  
-           if (rfirst == 0xffffffff) {
-               diff = tdiff;   /* oops, pretend rdiff is infinite */
-               if (diff > 0)
-                   Perl_sv_catpvf(aTHX_ listsv, "%04lx\t%04lx\tXXXX\n",
-                                  (long)tfirst, (long)tlast);
-               else
-                   Perl_sv_catpvf(aTHX_ listsv, "%04lx\t\tXXXX\n", (long)tfirst);
-           }
-           else {
-               if (diff > 0)
-                   Perl_sv_catpvf(aTHX_ listsv, "%04lx\t%04lx\t%04lx\n",
-                                  (long)tfirst, (long)(tfirst + diff),
-                                  (long)rfirst);
-               else
-                   Perl_sv_catpvf(aTHX_ listsv, "%04lx\t\t%04lx\n",
-                                  (long)tfirst, (long)rfirst);
-
-               if (rfirst + diff > max)
-                   max = rfirst + diff;
-               if (!grows)
-                   grows = (tfirst < rfirst &&
-                            UVCHR_SKIP(tfirst) < UVCHR_SKIP(rfirst + diff));
-               rfirst += diff + 1;
-           }
-           tfirst += diff + 1;
-       }
+        if (can_force_utf8) {
+            o->op_private |= OPpTRANS_CAN_FORCE_UTF8;
+        }
  
  
-        /* compile listsv into a swash and attach to o */
+        /* The inversion map is pushed; first the list. */
+       invmap = MUTABLE_AV(newAV());
+        av_push(invmap, t_invlist);
  
  
-       none = ++max;
-       if (del)
-           ++max;
+        /* 2nd is the mapping */
+        r_map_sv = newSVpvn((char *) r_map, len * sizeof(UV));
+        av_push(invmap, r_map_sv);
  
  
-       if (max > 0xffff)
-           bits = 32;
-       else if (max > 0xff)
-           bits = 16;
-       else
-           bits = 8;
+        /* 3rd is the max possible expansion factor */
+        av_push(invmap, newSVnv(max_expansion));
+
+        /* Characters that are in the search list, but not in the replacement
+         * list are mapped to the final character in the replacement list */
+        if (! del && r_count < t_count) {
+            av_push(invmap, newSVuv(final_map));
+        }
  
  
-       swash = MUTABLE_SV(swash_init("utf8", "", listsv, bits, none));
  #ifdef USE_ITHREADS
  #ifdef USE_ITHREADS
-       cPADOPo->op_padix = pad_alloc(OP_TRANS, SVf_READONLY);
-       SvREFCNT_dec(PAD_SVl(cPADOPo->op_padix));
-       PAD_SETSV(cPADOPo->op_padix, swash);
-       SvPADTMP_on(swash);
-       SvREADONLY_on(swash);
+        cPADOPo->op_padix = pad_alloc(OP_TRANS, SVf_READONLY);
+        SvREFCNT_dec(PAD_SVl(cPADOPo->op_padix));
+        PAD_SETSV(cPADOPo->op_padix, (SV *) invmap);
+        SvPADTMP_on(invmap);
+        SvREADONLY_on(invmap);
  #else
  #else
-       cSVOPo->op_sv = swash;
+        cSVOPo->op_sv = (SV *) invmap;
  #endif
  #endif
-       SvREFCNT_dec(listsv);
-       SvREFCNT_dec(transv);
  
  
-       if (!del && havefinal && rlen)
-           (void)hv_store(MUTABLE_HV(SvRV(swash)), "FINAL", 5,
-                          newSVuv((UV)final), 0);
+    }
+    else {
+        OPtrans_map *tbl;
+        unsigned short i;
+
+        /* The OPtrans_map struct already contains one slot; hence the -1. */
+        SSize_t struct_size = sizeof(OPtrans_map)
+                            + (256 - 1 + 1)*sizeof(short);
+
+        /* Non-utf8 case: set o->op_pv to point to a simple 256+ entry lookup
+        * table. Entries with the value TR_UNMAPPED indicate chars not to be
+        * translated, while TR_DELETE indicates a search char without a
+        * corresponding replacement char under /d.
+        *
+        * In addition, an extra slot at the end is used to store the final
+        * repeating char, or TR_R_EMPTY under an empty replacement list, or
+        * TR_DELETE under /d; which makes the runtime code easier.
+        */
  
  
-       Safefree(tsave);
-       Safefree(rsave);
+        /* Indicate this is an op_pv */
+        o->op_private &= ~OPpTRANS_USE_SVOP;
  
  
-       tlen = tcount;
-       rlen = rcount;
-       if (r < rend)
-           rlen++;
-       else if (rlast == 0xffffffff)
-           rlen = 0;
+        tbl = (OPtrans_map*)PerlMemShared_calloc(struct_size, 1);
+        tbl->size = 256;
+        cPVOPo->op_pv = (char*)tbl;
  
  
-       goto warnins;
-    }
+        for (i = 0; i < len; i++) {
+            STATIC_ASSERT_DECL(TR_SPECIAL_HANDLING == TR_DELETE);
+            short upper = i >= len - 1 ? 256 : (short) t_array[i+1];
+            short to = (short) r_map[i];
+            short j;
+            bool do_increment = TRUE;
  
  
-    /* Non-utf8 case: set o->op_pv to point to a simple 256+ entry lookup
-     * table. Entries with the value -1 indicate chars not to be
-     * translated, while -2 indicates a search char without a
-     * corresponding replacement char under /d.
-     *
-     * Normally, the table has 256 slots. However, in the presence of
-     * /c, the search charlist has an implicit \x{100}-\x{7fffffff}
-     * added, and if there are enough replacement chars to start pairing
-     * with the \x{100},... search chars, then a larger (> 256) table
-     * is allocated.
-     *
-     * In addition, regardless of whether under /c, an extra slot at the
-     * end is used to store the final repeating char, or -3 under an empty
-     * replacement list, or -2 under /d; which makes the runtime code
-     * easier.
-     *
-     * The toker will have already expanded char ranges in t and r.
-     */
+            /* Any code points above our limit should be irrelevant */
+            if (t_array[i] >= tbl->size) break;
  
  
-    /* Initially allocate 257-slot table: 256 for basic (non /c) usage,
-     * plus final slot for repeat/-2/-3. Later we realloc if excess > * 0.
-     * The OPtrans_map struct already contains one slot; hence the -1.
-     */
-    struct_size = sizeof(OPtrans_map) + (256 - 1 + 1)*sizeof(short);
-    tbl = (OPtrans_map*)PerlMemShared_calloc(struct_size, 1);
-    tbl->size = 256;
-    cPVOPo->op_pv = (char*)tbl;
+            /* Set up the map */
+            if (to == (short) TR_SPECIAL_HANDLING && ! del) {
+                to = (short) final_map;
+                do_increment = FALSE;
+            }
+            else if (to < 0) {
+                do_increment = FALSE;
+            }
  
  
-    if (complement) {
-        Size_t excess;
+            /* Create a map for everything in this range.  The value increases
+             * except for the special cases */
+            for (j = (short) t_array[i]; j < upper; j++) {
+                tbl->map[j] = to;
+                if (do_increment) to++;
+            }
+        }
  
  
-        /* in this branch, j is a count of 'consumed' (i.e. paired off
-         * with a search char) replacement chars (so j <= rlen always)
-         */
-       for (i = 0; i < tlen; i++)
-           tbl->map[t[i]] = -1;
-
-       for (i = 0, j = 0; i < 256; i++) {
-           if (!tbl->map[i]) {
-               if (j == rlen) {
-                   if (del)
-                       tbl->map[i] = -2;
-                   else if (rlen)
-                       tbl->map[i] = r[j-1];
-                   else
-                       tbl->map[i] = (short)i;
-               }
-               else {
-                   tbl->map[i] = r[j++];
-               }
-                if (   tbl->map[i] >= 0
-                    &&  UVCHR_IS_INVARIANT((UV)i)
-                    && !UVCHR_IS_INVARIANT((UV)(tbl->map[i]))
-                )
-                    grows = TRUE;
-           }
-       }
+        tbl->map[tbl->size] = del
+                              ? (short) TR_DELETE
+                              : (short) rlen
+                                ? (short) final_map
+                                : (short) TR_R_EMPTY;
+        DEBUG_y(PerlIO_printf(Perl_debug_log,"%s: %d\n", __FILE__, __LINE__));
+        for (i = 0; i < tbl->size; i++) {
+            if (tbl->map[i] < 0) {
+                DEBUG_y(PerlIO_printf(Perl_debug_log," %02x=>%d",
+                                                (unsigned) i, tbl->map[i]));
+            }
+            else {
+                DEBUG_y(PerlIO_printf(Perl_debug_log," %02x=>%02x",
+                                                (unsigned) i, tbl->map[i]));
+            }
+            if ((i+1) % 8 == 0 || i + 1 == (short) tbl->size) {
+                DEBUG_y(PerlIO_printf(Perl_debug_log,"\n"));
+            }
+        }
+        DEBUG_y(PerlIO_printf(Perl_debug_log,"Final map 0x%x=>%02x\n",
+                                (unsigned) tbl->size, tbl->map[tbl->size]));
+
+        SvREFCNT_dec(t_invlist);
+
+#if 0   /* code that added excess above-255 chars at the end of the table, in
+           case we ever want to not use the inversion map implementation for
+           this */
  
          ASSUME(j <= rlen);
          excess = rlen - j;
  
          ASSUME(j <= rlen);
          excess = rlen - j;
@@ -6907,54 +7850,28 @@ S_pmtrans(pTHX_ OP *o, OP *expr, OP *repl)
          }
          else {
              /* no more replacement chars than search chars */
          }
          else {
              /* no more replacement chars than search chars */
-            if (!rlen && !del && !squash)
-                o->op_private |= OPpTRANS_IDENTICAL;
-        }
+#endif
  
  
-        tbl->map[tbl->size] = del ? -2 : rlen ? r[rlen - 1] : -3;
      }
      }
-    else {
-       if (!rlen && !del) {
-           r = t; rlen = tlen;
-           if (!squash)
-               o->op_private |= OPpTRANS_IDENTICAL;
-       }
-       else if (!squash && rlen == tlen && memEQ((char*)t, (char*)r, tlen)) {
-           o->op_private |= OPpTRANS_IDENTICAL;
-       }
  
  
-       for (i = 0; i < 256; i++)
-           tbl->map[i] = -1;
-       for (i = 0, j = 0; i < tlen; i++,j++) {
-           if (j >= rlen) {
-               if (del) {
-                   if (tbl->map[t[i]] == -1)
-                       tbl->map[t[i]] = -2;
-                   continue;
-               }
-               --j;
-           }
-           if (tbl->map[t[i]] == -1) {
-                if (     UVCHR_IS_INVARIANT(t[i])
-                    && ! UVCHR_IS_INVARIANT(r[j]))
-                   grows = TRUE;
-               tbl->map[t[i]] = r[j];
-           }
-       }
-        tbl->map[tbl->size] = del ? -1 : rlen ? -1 : -3;
-    }
+    DEBUG_y(PerlIO_printf(Perl_debug_log,
+            "/d=%d, /s=%d, /c=%d, identical=%d, grows=%d,"
+            " use_svop=%d, can_force_utf8=%d,\nexpansion=%g\n",
+            del, squash, complement,
+            cBOOL(o->op_private & OPpTRANS_IDENTICAL),
+            cBOOL(o->op_private & OPpTRANS_USE_SVOP),
+            cBOOL(o->op_private & OPpTRANS_GROWS),
+            cBOOL(o->op_private & OPpTRANS_CAN_FORCE_UTF8),
+            max_expansion));
  
  
-    /* both non-utf8 and utf8 code paths end up here */
+    Safefree(r_map);
  
  
-  warnins:
-    if(del && rlen == tlen) {
-       Perl_ck_warner(aTHX_ packWARN(WARN_MISC), "Useless use of /d modifier in transliteration operator"); 
-    } else if(rlen > tlen && !complement) {
+    if(del && rlen != 0 && r_count == t_count) {
+       Perl_ck_warner(aTHX_ packWARN(WARN_MISC), "Useless use of /d modifier in transliteration operator");
+    } else if(r_count > t_count) {
         Perl_ck_warner(aTHX_ packWARN(WARN_MISC), "Replacement list is longer than search list");
      }
  
         Perl_ck_warner(aTHX_ packWARN(WARN_MISC), "Replacement list is longer than search list");
      }
  
-    if (grows)
-       o->op_private |= OPpTRANS_GROWS;
      op_free(expr);
      op_free(repl);
  
      op_free(expr);
      op_free(repl);
  
@@ -7061,14 +7978,16 @@ S_set_haseval(pTHX)
   *
   * Flags currently has 2 bits of meaning:
   * 1: isreg indicates that the pattern is part of a regex construct, eg
   *
   * Flags currently has 2 bits of meaning:
   * 1: isreg indicates that the pattern is part of a regex construct, eg
- * $x =~ /pattern/ or split /pattern/, as opposed to $x =~ $pattern or
- * split "pattern", which aren't. In the former case, expr will be a list
- * if the pattern contains more than one term (eg /a$b/).
+ *      $x =~ /pattern/ or split /pattern/, as opposed to $x =~ $pattern or
+ *      split "pattern", which aren't. In the former case, expr will be a list
+ *      if the pattern contains more than one term (eg /a$b/).
   * 2: The pattern is for a split.
   *
   * When the pattern has been compiled within a new anon CV (for
   * qr/(?{...})/ ), then floor indicates the savestack level just before
   * the new sub was created
   * 2: The pattern is for a split.
   *
   * When the pattern has been compiled within a new anon CV (for
   * qr/(?{...})/ ), then floor indicates the savestack level just before
   * the new sub was created
+ *
+ * tr/// is also handled.
   */
  
  OP *
   */
  
  OP *
@@ -7925,9 +8844,16 @@ Perl_newSLICEOP(pTHX_ I32 flags, OP *subscript, OP *listval)
             list(force_list(listval,   1)) );
  }
  
             list(force_list(listval,   1)) );
  }
  
+#define ASSIGN_SCALAR 0
  #define ASSIGN_LIST   1
  #define ASSIGN_REF    2
  
  #define ASSIGN_LIST   1
  #define ASSIGN_REF    2
  
+/* given the optree o on the LHS of an assignment, determine whether it's:
+ *  ASSIGN_SCALAR   $x  = ...
+ *  ASSIGN_LIST    ($x) = ...
+ *  ASSIGN_REF     \$x  = ...
+ */
+
  STATIC I32
  S_assignment_type(pTHX_ const OP *o)
  {
  STATIC I32
  S_assignment_type(pTHX_ const OP *o)
  {
@@ -7936,7 +8862,7 @@ S_assignment_type(pTHX_ const OP *o)
      U8 ret;
  
      if (!o)
      U8 ret;
  
      if (!o)
-       return TRUE;
+       return ASSIGN_LIST;
  
      if (o->op_type == OP_SREFGEN)
      {
  
      if (o->op_type == OP_SREFGEN)
      {
@@ -7953,7 +8879,7 @@ S_assignment_type(pTHX_ const OP *o)
             o = cUNOPo->op_first;
         flags = o->op_flags;
         type = o->op_type;
             o = cUNOPo->op_first;
         flags = o->op_flags;
         type = o->op_type;
-       ret = 0;
+       ret = ASSIGN_SCALAR;
      }
  
      if (type == OP_COND_EXPR) {
      }
  
      if (type == OP_COND_EXPR) {
@@ -7965,7 +8891,7 @@ S_assignment_type(pTHX_ const OP *o)
             return ASSIGN_LIST;
         if ((t == ASSIGN_LIST) ^ (f == ASSIGN_LIST))
             yyerror("Assignment to both a list and a scalar");
             return ASSIGN_LIST;
         if ((t == ASSIGN_LIST) ^ (f == ASSIGN_LIST))
             yyerror("Assignment to both a list and a scalar");
-       return FALSE;
+       return ASSIGN_SCALAR;
      }
  
      if (type == OP_LIST &&
      }
  
      if (type == OP_LIST &&
@@ -7977,10 +8903,10 @@ S_assignment_type(pTHX_ const OP *o)
         type == OP_RV2AV || type == OP_RV2HV ||
         type == OP_ASLICE || type == OP_HSLICE ||
          type == OP_KVASLICE || type == OP_KVHSLICE || type == OP_REFGEN)
         type == OP_RV2AV || type == OP_RV2HV ||
         type == OP_ASLICE || type == OP_HSLICE ||
          type == OP_KVASLICE || type == OP_KVHSLICE || type == OP_REFGEN)
-       return TRUE;
+       return ASSIGN_LIST;
  
      if (type == OP_PADAV || type == OP_PADHV)
  
      if (type == OP_PADAV || type == OP_PADHV)
-       return TRUE;
+       return ASSIGN_LIST;
  
      if (type == OP_RV2SV)
         return ret;
  
      if (type == OP_RV2SV)
         return ret;
@@ -8347,17 +9273,26 @@ Perl_newLOGOP(pTHX_ I32 type, I32 flags, OP *first, OP *other)
      return new_logop(type, flags, &first, &other);
  }
  
      return new_logop(type, flags, &first, &other);
  }
  
+
+/* See if the optree o contains a single OP_CONST (plus possibly
+ * surrounding enter/nextstate/null etc). If so, return it, else return
+ * NULL.
+ */
+
  STATIC OP *
  S_search_const(pTHX_ OP *o)
  {
      PERL_ARGS_ASSERT_SEARCH_CONST;
  
  STATIC OP *
  S_search_const(pTHX_ OP *o)
  {
      PERL_ARGS_ASSERT_SEARCH_CONST;
  
+  redo:
      switch (o->op_type) {
         case OP_CONST:
             return o;
         case OP_NULL:
      switch (o->op_type) {
         case OP_CONST:
             return o;
         case OP_NULL:
-           if (o->op_flags & OPf_KIDS)
-               return search_const(cUNOPo->op_first);
+           if (o->op_flags & OPf_KIDS) {
+               o = cUNOPo->op_first;
+                goto redo;
+            }
             break;
         case OP_LEAVE:
         case OP_SCOPE:
             break;
         case OP_LEAVE:
         case OP_SCOPE:
@@ -8367,6 +9302,7 @@ S_search_const(pTHX_ OP *o)
             if (!(o->op_flags & OPf_KIDS))
                 return NULL;
             kid = cLISTOPo->op_first;
             if (!(o->op_flags & OPf_KIDS))
                 return NULL;
             kid = cLISTOPo->op_first;
+
             do {
                 switch (kid->op_type) {
                     case OP_ENTER:
             do {
                 switch (kid->op_type) {
                     case OP_ENTER:
@@ -8380,16 +9316,19 @@ S_search_const(pTHX_ OP *o)
                         goto last;
                 }
             } while (kid);
                         goto last;
                 }
             } while (kid);
+
             if (!kid)
                 kid = cLISTOPo->op_last;
            last:
             if (!kid)
                 kid = cLISTOPo->op_last;
            last:
-           return search_const(kid);
+            o = kid;
+             goto redo;
         }
      }
  
      return NULL;
  }
  
         }
      }
  
      return NULL;
  }
  
+
  STATIC OP *
  S_new_logop(pTHX_ I32 type, I32 flags, OP** firstp, OP** otherp)
  {
  STATIC OP *
  S_new_logop(pTHX_ I32 type, I32 flags, OP** firstp, OP** otherp)
  {
@@ -9076,10 +10015,14 @@ Perl_newFOROP(pTHX_ I32 flags, OP *sv, OP *expr, OP *block, OP *cont)
      /* for my  $x () sets OPpLVAL_INTRO;
       * for our $x () sets OPpOUR_INTRO */
      loop->op_private = (U8)iterpflags;
      /* for my  $x () sets OPpLVAL_INTRO;
       * for our $x () sets OPpOUR_INTRO */
      loop->op_private = (U8)iterpflags;
+
+    /* upgrade loop from a LISTOP to a LOOPOP;
+     * keep it in-place if there's space */
      if (loop->op_slabbed
      if (loop->op_slabbed
-     && DIFF(loop, OpSLOT(loop)->opslot_next)
-        < SIZE_TO_PSIZE(sizeof(LOOP)))
+        &&    OpSLOT(loop)->opslot_size
+            < SIZE_TO_PSIZE(sizeof(LOOP)) + OPSLOT_HEADER_P)
      {
      {
+        /* no space; allocate new op */
         LOOP *tmp;
         NewOp(1234,tmp,1,LOOP);
         Copy(loop,tmp,1,LISTOP);
         LOOP *tmp;
         NewOp(1234,tmp,1,LOOP);
         Copy(loop,tmp,1,LISTOP);
@@ -9090,6 +10033,7 @@ Perl_newFOROP(pTHX_ I32 flags, OP *sv, OP *expr, OP *block, OP *cont)
      }
      else if (!loop->op_slabbed)
      {
      }
      else if (!loop->op_slabbed)
      {
+        /* loop was malloc()ed */
         loop = (LOOP*)PerlMemShared_realloc(loop, sizeof(LOOP));
          OpLASTSIB_set(loop->op_last, (OP*)loop);
      }
         loop = (LOOP*)PerlMemShared_realloc(loop, sizeof(LOOP));
          OpLASTSIB_set(loop->op_last, (OP*)loop);
      }
@@ -9144,7 +10088,7 @@ Perl_newLOOPEX(pTHX_ I32 type, OP *label)
                                 SvPV_nolen_const(((SVOP*)label)->op_sv)));
             }
      }
                                 SvPV_nolen_const(((SVOP*)label)->op_sv)));
             }
      }
-    
+
      /* If we have already created an op, we do not need the label. */
      if (o)
                 op_free(label);
      /* If we have already created an op, we do not need the label. */
      if (o)
                 op_free(label);
@@ -9239,7 +10183,10 @@ S_newGIVWHENOP(pTHX_ OP *cond, OP *block,
      return o;
  }
  
      return o;
  }
  
-/* Does this look like a boolean operation? For these purposes
+
+/* For the purposes of 'when(implied_smartmatch)'
+ *              versus 'when(boolean_expression)',
+ * does this look like a boolean operation? For these purposes
     a boolean operation is:
       - a subroutine call [*]
       - a logical connective
     a boolean operation is:
       - a subroutine call [*]
       - a logical connective
@@ -9247,7 +10194,7 @@ S_newGIVWHENOP(pTHX_ OP *cond, OP *block,
       - a filetest operator, with the exception of -s -M -A -C
       - defined(), exists() or eof()
       - /$re/ or $foo =~ /$re/
       - a filetest operator, with the exception of -s -M -A -C
       - defined(), exists() or eof()
       - /$re/ or $foo =~ /$re/
-   
+
     [*] possibly surprising
   */
  STATIC bool
     [*] possibly surprising
   */
  STATIC bool
@@ -9287,9 +10234,9 @@ S_looks_like_bool(pTHX_ const OP *o)
  
         case OP_SEQ:    case OP_SNE:    case OP_SLT:
         case OP_SGT:    case OP_SLE:    case OP_SGE:
  
         case OP_SEQ:    case OP_SNE:    case OP_SLT:
         case OP_SGT:    case OP_SLE:    case OP_SGE:
-       
+
         case OP_SMARTMATCH:
         case OP_SMARTMATCH:
-       
+
         case OP_FTRREAD:  case OP_FTRWRITE: case OP_FTREXEC:
         case OP_FTEREAD:  case OP_FTEWRITE: case OP_FTEEXEC:
         case OP_FTIS:     case OP_FTEOWNED: case OP_FTROWNED:
         case OP_FTRREAD:  case OP_FTRWRITE: case OP_FTREXEC:
         case OP_FTEREAD:  case OP_FTEWRITE: case OP_FTEEXEC:
         case OP_FTIS:     case OP_FTEOWNED: case OP_FTROWNED:
@@ -9298,7 +10245,7 @@ S_looks_like_bool(pTHX_ const OP *o)
         case OP_FTPIPE:   case OP_FTLINK:   case OP_FTSUID:
         case OP_FTSGID:   case OP_FTSVTX:   case OP_FTTTY:
         case OP_FTTEXT:   case OP_FTBINARY:
         case OP_FTPIPE:   case OP_FTLINK:   case OP_FTSUID:
         case OP_FTSGID:   case OP_FTSVTX:   case OP_FTTTY:
         case OP_FTTEXT:   case OP_FTBINARY:
-       
+
         case OP_DEFINED: case OP_EXISTS:
         case OP_MATCH:   case OP_EOF:
  
         case OP_DEFINED: case OP_EXISTS:
         case OP_MATCH:   case OP_EOF:
  
@@ -9312,12 +10259,12 @@ S_looks_like_bool(pTHX_ const OP *o)
              if (o->op_private & OPpTRUEBOOL)
                  return TRUE;
              return FALSE;
              if (o->op_private & OPpTRUEBOOL)
                  return TRUE;
              return FALSE;
-       
+
         case OP_CONST:
             /* Detect comparisons that have been optimized away */
             if (cSVOPo->op_sv == &PL_sv_yes
             ||  cSVOPo->op_sv == &PL_sv_no)
         case OP_CONST:
             /* Detect comparisons that have been optimized away */
             if (cSVOPo->op_sv == &PL_sv_yes
             ||  cSVOPo->op_sv == &PL_sv_no)
-           
+
                 return TRUE;
             else
                 return FALSE;
                 return TRUE;
             else
                 return FALSE;
@@ -9327,6 +10274,7 @@ S_looks_like_bool(pTHX_ const OP *o)
      }
  }
  
      }
  }
  
+
  /*
  =for apidoc newGIVENOP
  
  /*
  =for apidoc newGIVENOP
  
@@ -9381,7 +10329,7 @@ Perl_newWHENOP(pTHX_ OP *cond, OP *block)
                 newDEFSVOP(),
                 scalar(ref_array_or_hash(cond)));
      }
                 newDEFSVOP(),
                 scalar(ref_array_or_hash(cond)));
      }
-    
+
      return newGIVWHENOP(cond_op, block, OP_ENTERWHEN, OP_LEAVEWHEN, 0);
  }
  
      return newGIVWHENOP(cond_op, block, OP_ENTERWHEN, OP_LEAVEWHEN, 0);
  }
  
@@ -9793,7 +10741,7 @@ Perl_newMYSUB(pTHX_ I32 floor, OP *o, OP *proto, OP *attrs, OP *block)
         age sub (my sub foo; sub bar { sub foo { ... } }), outcv points to
         the package sub.  So check PadnameOUTER(name) too.
       */
         age sub (my sub foo; sub bar { sub foo { ... } }), outcv points to
         the package sub.  So check PadnameOUTER(name) too.
       */
-    if (outcv == CvOUTSIDE(compcv) && !PadnameOUTER(name)) { 
+    if (outcv == CvOUTSIDE(compcv) && !PadnameOUTER(name)) {
         assert(!CvWEAKOUTSIDE(compcv));
         SvREFCNT_dec(CvOUTSIDE(compcv));
         CvWEAKOUTSIDE_on(compcv);
         assert(!CvWEAKOUTSIDE(compcv));
         SvREFCNT_dec(CvOUTSIDE(compcv));
         CvWEAKOUTSIDE_on(compcv);
@@ -10925,7 +11873,7 @@ Perl_newXS_len_flags(pTHX_ const char *name, STRLEN len,
                  cv = NULL;
              }
          }
                  cv = NULL;
              }
          }
-    
+
          if (cv)                                /* must reuse cv if autoloaded */
              cv_undef(cv);
          else {
          if (cv)                                /* must reuse cv if autoloaded */
              cv_undef(cv);
          else {
@@ -11085,7 +12033,7 @@ OP *
  Perl_newANONATTRSUB(pTHX_ I32 floor, OP *proto, OP *attrs, OP *block)
  {
      SV * const cv = MUTABLE_SV(newATTRSUB(floor, 0, proto, attrs, block));
  Perl_newANONATTRSUB(pTHX_ I32 floor, OP *proto, OP *attrs, OP *block)
  {
      SV * const cv = MUTABLE_SV(newATTRSUB(floor, 0, proto, attrs, block));
-    OP * anoncode = 
+    OP * anoncode =
         newSVOP(OP_ANONCODE, 0,
                 cv);
      if (CvANONCONST(cv))
         newSVOP(OP_ANONCODE, 0,
                 cv);
      if (CvANONCONST(cv))
@@ -11624,8 +12572,10 @@ Perl_ck_eval(pTHX_ OP *o)
      if ((PL_hints & HINT_LOCALIZE_HH) != 0
       && !(o->op_private & OPpEVAL_COPHH) && GvHV(PL_hintgv)) {
         /* Store a copy of %^H that pp_entereval can pick up. */
      if ((PL_hints & HINT_LOCALIZE_HH) != 0
       && !(o->op_private & OPpEVAL_COPHH) && GvHV(PL_hintgv)) {
         /* Store a copy of %^H that pp_entereval can pick up. */
-       OP *hhop = newSVOP(OP_HINTSEVAL, 0,
-                          MUTABLE_SV(hv_copy_hints_hv(GvHV(PL_hintgv))));
+        HV *hh = hv_copy_hints_hv(GvHV(PL_hintgv));
+       OP *hhop;
+        STOREFEATUREBITSHH(hh);
+        hhop = newSVOP(OP_HINTSEVAL, 0, MUTABLE_SV(hh));
          /* append hhop to only child  */
          op_sibling_splice(o, cUNOPo->op_first, 0, hhop);
  
          /* append hhop to only child  */
          op_sibling_splice(o, cUNOPo->op_first, 0, hhop);
  
@@ -11911,7 +12861,7 @@ Perl_ck_fun(pTHX_ OP *o)
                                    PL_op_desc[type]);
  
                 if (kid->op_type == OP_CONST
                                    PL_op_desc[type]);
  
                 if (kid->op_type == OP_CONST
-                     && (  !SvROK(cSVOPx_sv(kid)) 
+                     && (  !SvROK(cSVOPx_sv(kid))
                          || SvTYPE(SvRV(cSVOPx_sv(kid))) != SVt_PVAV  )
                         )
                     bad_type_pv(numargs, "array", o, kid);
                          || SvTYPE(SvRV(cSVOPx_sv(kid))) != SVt_PVAV  )
                         )
                     bad_type_pv(numargs, "array", o, kid);
@@ -12325,7 +13275,7 @@ Perl_ck_smartmatch(pTHX_ OP *o)
      if (0 == (o->op_flags & OPf_SPECIAL)) {
         OP *first  = cBINOPo->op_first;
         OP *second = OpSIBLING(first);
      if (0 == (o->op_flags & OPf_SPECIAL)) {
         OP *first  = cBINOPo->op_first;
         OP *second = OpSIBLING(first);
-       
+
         /* Implicitly take a reference to an array or hash */
  
          /* remove the original two siblings, then add back the
         /* Implicitly take a reference to an array or hash */
  
          /* remove the original two siblings, then add back the
@@ -12337,7 +13287,7 @@ Perl_ck_smartmatch(pTHX_ OP *o)
         second = ref_array_or_hash(second);
          op_sibling_splice(o, NULL, 0, second);
          op_sibling_splice(o, NULL, 0, first);
         second = ref_array_or_hash(second);
          op_sibling_splice(o, NULL, 0, second);
          op_sibling_splice(o, NULL, 0, first);
-       
+
         /* Implicitly take a reference to a regular expression */
         if (first->op_type == OP_MATCH && !(first->op_flags & OPf_STACKED)) {
              OpTYPE_set(first, OP_QR);
         /* Implicitly take a reference to a regular expression */
         if (first->op_type == OP_MATCH && !(first->op_flags & OPf_STACKED)) {
              OpTYPE_set(first, OP_QR);
@@ -12346,7 +13296,7 @@ Perl_ck_smartmatch(pTHX_ OP *o)
              OpTYPE_set(second, OP_QR);
          }
      }
              OpTYPE_set(second, OP_QR);
          }
      }
-    
+
      return o;
  }
  
      return o;
  }
  
@@ -12672,8 +13622,9 @@ Perl_ck_require(pTHX_ OP *o)
              HEK *hek;
  
             if (was_readonly) {
              HEK *hek;
  
             if (was_readonly) {
-                   SvREADONLY_off(sv);
-           }   
+                SvREADONLY_off(sv);
+            }
+
             if (SvIsCOW(sv)) sv_force_normal_flags(sv, 0);
  
             s = SvPVX(sv);
             if (SvIsCOW(sv)) sv_force_normal_flags(sv, 0);
  
             s = SvPVX(sv);
@@ -13101,7 +14052,7 @@ Perl_ck_stringify(pTHX_ OP *o)
      }
      return ck_fun(o);
  }
      }
      return ck_fun(o);
  }
-       
+
  OP *
  Perl_ck_join(pTHX_ OP *o)
  {
  OP *
  Perl_ck_join(pTHX_ OP *o)
  {
@@ -13612,7 +14563,7 @@ Perl_ck_entersub_args_core(pTHX_ OP *entersubop, GV *namegv, SV *protosv)
             yyerror_pv(Perl_form(aTHX_ "Too many arguments for %" SVf,
                 SVfARG(namesv)), SvUTF8(namesv));
         }
             yyerror_pv(Perl_form(aTHX_ "Too many arguments for %" SVf,
                 SVfARG(namesv)), SvUTF8(namesv));
         }
-       
+
         op_free(entersubop);
         switch(cvflags >> 16) {
         case 'F': return newSVOP(OP_CONST, 0,
         op_free(entersubop);
         switch(cvflags >> 16) {
         case 'F': return newSVOP(OP_CONST, 0,
@@ -13641,7 +14592,7 @@ Perl_ck_entersub_args_core(pTHX_ OP *entersubop, GV *namegv, SV *protosv)
              parent = aop;
             aop = cUNOPx(aop)->op_first;
          }
              parent = aop;
             aop = cUNOPx(aop)->op_first;
          }
-       
+
         first = prev = aop;
         aop = OpSIBLING(aop);
          /* find last sibling */
         first = prev = aop;
         aop = OpSIBLING(aop);
          /* find last sibling */
@@ -13669,7 +14620,7 @@ Perl_ck_entersub_args_core(pTHX_ OP *entersubop, GV *namegv, SV *protosv)
  
         if (cvflags == (OP_ENTEREVAL | (1<<16)))
             flags |= OPpEVAL_BYTES <<8;
  
         if (cvflags == (OP_ENTEREVAL | (1<<16)))
             flags |= OPpEVAL_BYTES <<8;
-       
+
         switch (PL_opargs[opnum] & OA_CLASS_MASK) {
         case OA_UNOP:
         case OA_BASEOP_OR_UNOP:
         switch (PL_opargs[opnum] & OA_CLASS_MASK) {
         case OA_UNOP:
         case OA_BASEOP_OR_UNOP:
@@ -14140,9 +15091,9 @@ Perl_ck_length(pTHX_ OP *o)
  
  
  
  
  
  
-/* 
+/*
     ---------------------------------------------------------
     ---------------------------------------------------------
- 
+
     Common vars in list assignment
  
     There now follows some enums and static functions for detecting
     Common vars in list assignment
  
     There now follows some enums and static functions for detecting
@@ -14152,43 +15103,43 @@ Perl_ck_length(pTHX_ OP *o)
     ----
  
     First some random observations:
     ----
  
     First some random observations:
-   
+
     * If a lexical var is an alias of something else, e.g.
         for my $x ($lex, $pkg, $a[0]) {...}
       then the act of aliasing will increase the reference count of the SV
     * If a lexical var is an alias of something else, e.g.
         for my $x ($lex, $pkg, $a[0]) {...}
       then the act of aliasing will increase the reference count of the SV
-   
+
     * If a package var is an alias of something else, it may still have a
       reference count of 1, depending on how the alias was created, e.g.
       in *a = *b, $a may have a refcount of 1 since the GP is shared
       with a single GvSV pointer to the SV. So if it's an alias of another
       package var, then RC may be 1; if it's an alias of another scalar, e.g.
       a lexical var or an array element, then it will have RC > 1.
     * If a package var is an alias of something else, it may still have a
       reference count of 1, depending on how the alias was created, e.g.
       in *a = *b, $a may have a refcount of 1 since the GP is shared
       with a single GvSV pointer to the SV. So if it's an alias of another
       package var, then RC may be 1; if it's an alias of another scalar, e.g.
       a lexical var or an array element, then it will have RC > 1.
-   
+
     * There are many ways to create a package alias; ultimately, XS code
       may quite legally do GvSV(gv) = SvREFCNT_inc(sv) for example, so
       run-time tracing mechanisms are unlikely to be able to catch all cases.
     * There are many ways to create a package alias; ultimately, XS code
       may quite legally do GvSV(gv) = SvREFCNT_inc(sv) for example, so
       run-time tracing mechanisms are unlikely to be able to catch all cases.
-   
+
     * When the LHS is all my declarations, the same vars can't appear directly
       on the RHS, but they can indirectly via closures, aliasing and lvalue
       subs. But those techniques all involve an increase in the lexical
       scalar's ref count.
     * When the LHS is all my declarations, the same vars can't appear directly
       on the RHS, but they can indirectly via closures, aliasing and lvalue
       subs. But those techniques all involve an increase in the lexical
       scalar's ref count.
-   
+
     * When the LHS is all lexical vars (but not necessarily my declarations),
       it is possible for the same lexicals to appear directly on the RHS, and
       without an increased ref count, since the stack isn't refcounted.
       This case can be detected at compile time by scanning for common lex
       vars with PL_generation.
     * When the LHS is all lexical vars (but not necessarily my declarations),
       it is possible for the same lexicals to appear directly on the RHS, and
       without an increased ref count, since the stack isn't refcounted.
       This case can be detected at compile time by scanning for common lex
       vars with PL_generation.
-   
+
     * lvalue subs defeat common var detection, but they do at least
       return vars with a temporary ref count increment. Also, you can't
       tell at compile time whether a sub call is lvalue.
     * lvalue subs defeat common var detection, but they do at least
       return vars with a temporary ref count increment. Also, you can't
       tell at compile time whether a sub call is lvalue.
-   
-    
+
+
     So...
     So...
-         
+
     A: There are a few circumstances where there definitely can't be any
       commonality:
     A: There are a few circumstances where there definitely can't be any
       commonality:
-   
+
         LHS empty:  () = (...);
         RHS empty:  (....) = ();
         RHS contains only constants or other 'can't possibly be shared'
         LHS empty:  () = (...);
         RHS empty:  (....) = ();
         RHS contains only constants or other 'can't possibly be shared'
@@ -14201,165 +15152,165 @@ Perl_ck_length(pTHX_ OP *o)
         RHS contains a single element with no aggregate on LHS: e.g.
             ($a,$b,$c)  = ($x); again, once $a has been modified, its value
             won't be used again.
         RHS contains a single element with no aggregate on LHS: e.g.
             ($a,$b,$c)  = ($x); again, once $a has been modified, its value
             won't be used again.
-   
+
     B: If LHS are all 'my' lexical var declarations (or safe ops, which
       we can ignore):
     B: If LHS are all 'my' lexical var declarations (or safe ops, which
       we can ignore):
-   
+
         my ($a, $b, @c) = ...;
         my ($a, $b, @c) = ...;
-   
+
         Due to closure and goto tricks, these vars may already have content.
         For the same reason, an element on the RHS may be a lexical or package
         alias of one of the vars on the left, or share common elements, for
         example:
         Due to closure and goto tricks, these vars may already have content.
         For the same reason, an element on the RHS may be a lexical or package
         alias of one of the vars on the left, or share common elements, for
         example:
-   
+
             my ($x,$y) = f(); # $x and $y on both sides
             sub f : lvalue { ($x,$y) = (1,2); $y, $x }
             my ($x,$y) = f(); # $x and $y on both sides
             sub f : lvalue { ($x,$y) = (1,2); $y, $x }
-   
+
         and
         and
-   
+
             my $ra = f();
             my @a = @$ra;  # elements of @a on both sides
             sub f { @a = 1..4; \@a }
             my $ra = f();
             my @a = @$ra;  # elements of @a on both sides
             sub f { @a = 1..4; \@a }
-   
-   
+
+
         First, just consider scalar vars on LHS:
         First, just consider scalar vars on LHS:
-   
+
             RHS is safe only if (A), or in addition,
                 * contains only lexical *scalar* vars, where neither side's
             RHS is safe only if (A), or in addition,
                 * contains only lexical *scalar* vars, where neither side's
-                 lexicals have been flagged as aliases 
-   
+                 lexicals have been flagged as aliases
+
             If RHS is not safe, then it's always legal to check LHS vars for
             RC==1, since the only RHS aliases will always be associated
             with an RC bump.
             If RHS is not safe, then it's always legal to check LHS vars for
             RC==1, since the only RHS aliases will always be associated
             with an RC bump.
-   
+
             Note that in particular, RHS is not safe if:
             Note that in particular, RHS is not safe if:
-   
+
                 * it contains package scalar vars; e.g.:
                 * it contains package scalar vars; e.g.:
-   
+
                     f();
                     my ($x, $y) = (2, $x_alias);
                     sub f { $x = 1; *x_alias = \$x; }
                     f();
                     my ($x, $y) = (2, $x_alias);
                     sub f { $x = 1; *x_alias = \$x; }
-   
+
                 * It contains other general elements, such as flattened or
                 * spliced or single array or hash elements, e.g.
                 * It contains other general elements, such as flattened or
                 * spliced or single array or hash elements, e.g.
-   
+
                     f();
                     f();
-                   my ($x,$y) = @a; # or $a[0] or @a{@b} etc 
-   
+                   my ($x,$y) = @a; # or $a[0] or @a{@b} etc
+
                     sub f {
                         ($x, $y) = (1,2);
                         use feature 'refaliasing';
                         \($a[0], $a[1]) = \($y,$x);
                     }
                     sub f {
                         ($x, $y) = (1,2);
                         use feature 'refaliasing';
                         \($a[0], $a[1]) = \($y,$x);
                     }
-   
+
                   It doesn't matter if the array/hash is lexical or package.
                   It doesn't matter if the array/hash is lexical or package.
-   
+
                 * it contains a function call that happens to be an lvalue
                   sub which returns one or more of the above, e.g.
                 * it contains a function call that happens to be an lvalue
                   sub which returns one or more of the above, e.g.
-   
+
                     f();
                     my ($x,$y) = f();
                     f();
                     my ($x,$y) = f();
-   
+
                     sub f : lvalue {
                         ($x, $y) = (1,2);
                         *x1 = \$x;
                         $y, $x1;
                     }
                     sub f : lvalue {
                         ($x, $y) = (1,2);
                         *x1 = \$x;
                         $y, $x1;
                     }
-   
+
                     (so a sub call on the RHS should be treated the same
                     as having a package var on the RHS).
                     (so a sub call on the RHS should be treated the same
                     as having a package var on the RHS).
-   
+
                  * any other "dangerous" thing, such as an op or built-in that
                   returns one of the above, e.g. pp_preinc
                  * any other "dangerous" thing, such as an op or built-in that
                   returns one of the above, e.g. pp_preinc
-   
-   
+
+
             If RHS is not safe, what we can do however is at compile time flag
             that the LHS are all my declarations, and at run time check whether
             all the LHS have RC == 1, and if so skip the full scan.
             If RHS is not safe, what we can do however is at compile time flag
             that the LHS are all my declarations, and at run time check whether
             all the LHS have RC == 1, and if so skip the full scan.
-   
+
         Now consider array and hash vars on LHS: e.g. my (...,@a) = ...;
         Now consider array and hash vars on LHS: e.g. my (...,@a) = ...;
-   
+
             Here the issue is whether there can be elements of @a on the RHS
             which will get prematurely freed when @a is cleared prior to
             assignment. This is only a problem if the aliasing mechanism
             is one which doesn't increase the refcount - only if RC == 1
             will the RHS element be prematurely freed.
             Here the issue is whether there can be elements of @a on the RHS
             which will get prematurely freed when @a is cleared prior to
             assignment. This is only a problem if the aliasing mechanism
             is one which doesn't increase the refcount - only if RC == 1
             will the RHS element be prematurely freed.
-   
+
             Because the array/hash is being INTROed, it or its elements
             can't directly appear on the RHS:
             Because the array/hash is being INTROed, it or its elements
             can't directly appear on the RHS:
-   
+
                 my (@a) = ($a[0], @a, etc) # NOT POSSIBLE
                 my (@a) = ($a[0], @a, etc) # NOT POSSIBLE
-   
+
             but can indirectly, e.g.:
             but can indirectly, e.g.:
-   
+
                 my $r = f();
                 my (@a) = @$r;
                 sub f { @a = 1..3; \@a }
                 my $r = f();
                 my (@a) = @$r;
                 sub f { @a = 1..3; \@a }
-   
+
             So if the RHS isn't safe as defined by (A), we must always
             mortalise and bump the ref count of any remaining RHS elements
             when assigning to a non-empty LHS aggregate.
             So if the RHS isn't safe as defined by (A), we must always
             mortalise and bump the ref count of any remaining RHS elements
             when assigning to a non-empty LHS aggregate.
-   
+
             Lexical scalars on the RHS aren't safe if they've been involved in
             aliasing, e.g.
             Lexical scalars on the RHS aren't safe if they've been involved in
             aliasing, e.g.
-   
+
                 use feature 'refaliasing';
                 use feature 'refaliasing';
-   
+
                 f();
                 \(my $lex) = \$pkg;
                 my @a = ($lex,3); # equivalent to ($a[0],3)
                 f();
                 \(my $lex) = \$pkg;
                 my @a = ($lex,3); # equivalent to ($a[0],3)
-   
+
                 sub f {
                     @a = (1,2);
                     \$pkg = \$a[0];
                 }
                 sub f {
                     @a = (1,2);
                     \$pkg = \$a[0];
                 }
-   
+
             Similarly with lexical arrays and hashes on the RHS:
             Similarly with lexical arrays and hashes on the RHS:
-   
+
                 f();
                 my @b;
                 my @a = (@b);
                 f();
                 my @b;
                 my @a = (@b);
-   
+
                 sub f {
                     @a = (1,2);
                     \$b[0] = \$a[1];
                     \$b[1] = \$a[0];
                 }
                 sub f {
                     @a = (1,2);
                     \$b[0] = \$a[1];
                     \$b[1] = \$a[0];
                 }
-   
-   
-   
+
+
+
     C: As (B), but in addition the LHS may contain non-intro lexicals, e.g.
         my $a; ($a, my $b) = (....);
     C: As (B), but in addition the LHS may contain non-intro lexicals, e.g.
         my $a; ($a, my $b) = (....);
-   
+
         The difference between (B) and (C) is that it is now physically
         possible for the LHS vars to appear on the RHS too, where they
         are not reference counted; but in this case, the compile-time
         PL_generation sweep will detect such common vars.
         The difference between (B) and (C) is that it is now physically
         possible for the LHS vars to appear on the RHS too, where they
         are not reference counted; but in this case, the compile-time
         PL_generation sweep will detect such common vars.
-   
+
         So the rules for (C) differ from (B) in that if common vars are
         detected, the runtime "test RC==1" optimisation can no longer be used,
         and a full mark and sweep is required
         So the rules for (C) differ from (B) in that if common vars are
         detected, the runtime "test RC==1" optimisation can no longer be used,
         and a full mark and sweep is required
-   
+
     D: As (C), but in addition the LHS may contain package vars.
     D: As (C), but in addition the LHS may contain package vars.
-   
+
         Since package vars can be aliased without a corresponding refcount
         increase, all bets are off. It's only safe if (A). E.g.
         Since package vars can be aliased without a corresponding refcount
         increase, all bets are off. It's only safe if (A). E.g.
-   
+
             my ($x, $y) = (1,2);
             my ($x, $y) = (1,2);
-   
+
             for $x_alias ($x) {
                 ($x_alias, $y) = (3, $x); # whoops
             }
             for $x_alias ($x) {
                 ($x_alias, $y) = (3, $x); # whoops
             }
-   
+
         Ditto for LHS aggregate package vars.
         Ditto for LHS aggregate package vars.
-   
+
     E: Any other dangerous ops on LHS, e.g.
             (f(), $a[0], @$r) = (...);
     E: Any other dangerous ops on LHS, e.g.
             (f(), $a[0], @$r) = (...);
-   
+
          this is similar to (D) in that all bets are off. In addition, it's
         impossible to determine at compile time whether the LHS
         contains a scalar or an aggregate, e.g.
          this is similar to (D) in that all bets are off. In addition, it's
         impossible to determine at compile time whether the LHS
         contains a scalar or an aggregate, e.g.
-   
+
             sub f : lvalue { @a }
             (f()) = 1..3;
  
             sub f : lvalue { @a }
             (f()) = 1..3;
  
@@ -14415,7 +15366,6 @@ S_aassign_padcheck(pTHX_ OP* o, bool rhs)
    'rhs' indicates whether we're scanning the LHS or RHS. If the former, we
    set PL_generation on lexical vars; if the latter, we see if
    PL_generation matches.
    'rhs' indicates whether we're scanning the LHS or RHS. If the former, we
    set PL_generation on lexical vars; if the latter, we see if
    PL_generation matches.
-  'top' indicates whether we're recursing or at the top level.
    'scalars_p' is a pointer to a counter of the number of scalar SVs seen.
    This fn will increment it by the number seen. It's not intended to
    be an accurate count (especially as many ops can push a variable
    'scalars_p' is a pointer to a counter of the number of scalar SVs seen.
    This fn will increment it by the number seen. It's not intended to
    be an accurate count (especially as many ops can push a variable
@@ -14424,10 +15374,16 @@ S_aassign_padcheck(pTHX_ OP* o, bool rhs)
  */
  
  static int
  */
  
  static int
-S_aassign_scan(pTHX_ OP* o, bool rhs, bool top, int *scalars_p)
+S_aassign_scan(pTHX_ OP* o, bool rhs, int *scalars_p)
  {
  {
+    OP *top_op           = o;
+    OP *effective_top_op = o;
+    int all_flags = 0;
+
+    while (1) {
+    bool top = o == effective_top_op;
      int flags = 0;
      int flags = 0;
-    bool kid_top = FALSE;
+    OP* next_kid = NULL;
  
      /* first, look for a solitary @_ on the RHS */
      if (   rhs
  
      /* first, look for a solitary @_ on the RHS */
      if (   rhs
@@ -14448,50 +15404,58 @@ S_aassign_scan(pTHX_ OP* o, bool rhs, bool top, int *scalars_p)
              && kid->op_type == OP_GV
              && cGVOPx_gv(kid) == PL_defgv
          )
              && kid->op_type == OP_GV
              && cGVOPx_gv(kid) == PL_defgv
          )
-            flags |= AAS_DEFAV;
+            flags = AAS_DEFAV;
      }
  
      switch (o->op_type) {
      case OP_GVSV:
          (*scalars_p)++;
      }
  
      switch (o->op_type) {
      case OP_GVSV:
          (*scalars_p)++;
-        return AAS_PKG_SCALAR;
+        all_flags |= AAS_PKG_SCALAR;
+        goto do_next;
  
      case OP_PADAV:
      case OP_PADHV:
          (*scalars_p) += 2;
          /* if !top, could be e.g. @a[0,1] */
  
      case OP_PADAV:
      case OP_PADHV:
          (*scalars_p) += 2;
          /* if !top, could be e.g. @a[0,1] */
-        if (top && (o->op_flags & OPf_REF))
-            return (o->op_private & OPpLVAL_INTRO)
-                ? AAS_MY_AGG : AAS_LEX_AGG;
-        return AAS_DANGEROUS;
+        all_flags |=  (top && (o->op_flags & OPf_REF))
+                        ? ((o->op_private & OPpLVAL_INTRO)
+                            ? AAS_MY_AGG : AAS_LEX_AGG)
+                        : AAS_DANGEROUS;
+        goto do_next;
  
      case OP_PADSV:
          {
              int comm = S_aassign_padcheck(aTHX_ o, rhs)
                          ?  AAS_LEX_SCALAR_COMM : 0;
              (*scalars_p)++;
  
      case OP_PADSV:
          {
              int comm = S_aassign_padcheck(aTHX_ o, rhs)
                          ?  AAS_LEX_SCALAR_COMM : 0;
              (*scalars_p)++;
-            return (o->op_private & OPpLVAL_INTRO)
+            all_flags |= (o->op_private & OPpLVAL_INTRO)
                  ? (AAS_MY_SCALAR|comm) : (AAS_LEX_SCALAR|comm);
                  ? (AAS_MY_SCALAR|comm) : (AAS_LEX_SCALAR|comm);
+            goto do_next;
+
          }
  
      case OP_RV2AV:
      case OP_RV2HV:
          (*scalars_p) += 2;
          if (cUNOPx(o)->op_first->op_type != OP_GV)
          }
  
      case OP_RV2AV:
      case OP_RV2HV:
          (*scalars_p) += 2;
          if (cUNOPx(o)->op_first->op_type != OP_GV)
-            return AAS_DANGEROUS; /* @{expr}, %{expr} */
+            all_flags |= AAS_DANGEROUS; /* @{expr}, %{expr} */
          /* @pkg, %pkg */
          /* if !top, could be e.g. @a[0,1] */
          /* @pkg, %pkg */
          /* if !top, could be e.g. @a[0,1] */
-        if (top && (o->op_flags & OPf_REF))
-            return AAS_PKG_AGG;
-        return AAS_DANGEROUS;
+        else if (top && (o->op_flags & OPf_REF))
+            all_flags |= AAS_PKG_AGG;
+        else
+            all_flags |= AAS_DANGEROUS;
+        goto do_next;
  
      case OP_RV2SV:
          (*scalars_p)++;
          if (cUNOPx(o)->op_first->op_type != OP_GV) {
              (*scalars_p) += 2;
  
      case OP_RV2SV:
          (*scalars_p)++;
          if (cUNOPx(o)->op_first->op_type != OP_GV) {
              (*scalars_p) += 2;
-            return AAS_DANGEROUS; /* ${expr} */
+            all_flags |= AAS_DANGEROUS; /* ${expr} */
          }
          }
-        return AAS_PKG_SCALAR; /* $pkg */
+        else
+            all_flags |= AAS_PKG_SCALAR; /* $pkg */
+        goto do_next;
  
      case OP_SPLIT:
          if (o->op_private & OPpSPLIT_ASSIGN) {
  
      case OP_SPLIT:
          if (o->op_private & OPpSPLIT_ASSIGN) {
@@ -14503,23 +15467,25 @@ S_aassign_scan(pTHX_ OP* o, bool rhs, bool top, int *scalars_p)
               *    ... = @a;
               */
  
               *    ... = @a;
               */
  
-            if (o->op_flags & OPf_STACKED)
+            if (o->op_flags & OPf_STACKED) {
                  /* @{expr} = split() - the array expression is tacked
                   * on as an extra child to split - process kid */
                  /* @{expr} = split() - the array expression is tacked
                   * on as an extra child to split - process kid */
-                return S_aassign_scan(aTHX_ cLISTOPo->op_last, rhs,
-                                        top, scalars_p);
+                next_kid = cLISTOPo->op_last;
+                goto do_next;
+            }
  
              /* ... else array is directly attached to split op */
              (*scalars_p) += 2;
  
              /* ... else array is directly attached to split op */
              (*scalars_p) += 2;
-            if (PL_op->op_private & OPpSPLIT_LEX)
-                return (o->op_private & OPpLVAL_INTRO)
-                    ? AAS_MY_AGG : AAS_LEX_AGG;
-            else
-                return AAS_PKG_AGG;
+            all_flags |= (PL_op->op_private & OPpSPLIT_LEX)
+                            ? ((o->op_private & OPpLVAL_INTRO)
+                                ? AAS_MY_AGG : AAS_LEX_AGG)
+                            : AAS_PKG_AGG;
+            goto do_next;
          }
          (*scalars_p)++;
          /* other args of split can't be returned */
          }
          (*scalars_p)++;
          /* other args of split can't be returned */
-        return AAS_SAFE_SCALAR;
+        all_flags |= AAS_SAFE_SCALAR;
+        goto do_next;
  
      case OP_UNDEF:
          /* undef counts as a scalar on the RHS:
  
      case OP_UNDEF:
          /* undef counts as a scalar on the RHS:
@@ -14536,16 +15502,14 @@ S_aassign_scan(pTHX_ OP* o, bool rhs, bool top, int *scalars_p)
          /* these are all no-ops; they don't push a potentially common SV
           * onto the stack, so they are neither AAS_DANGEROUS nor
           * AAS_SAFE_SCALAR */
          /* these are all no-ops; they don't push a potentially common SV
           * onto the stack, so they are neither AAS_DANGEROUS nor
           * AAS_SAFE_SCALAR */
-        return 0;
+        goto do_next;
  
      case OP_PADRANGE: /* Ignore padrange; checking its siblings is enough */
          break;
  
      case OP_NULL:
      case OP_LIST:
  
      case OP_PADRANGE: /* Ignore padrange; checking its siblings is enough */
          break;
  
      case OP_NULL:
      case OP_LIST:
-        /* these do nothing but may have children; but their children
-         * should also be treated as top-level */
-        kid_top = top;
+        /* these do nothing, but may have children */
          break;
  
      default:
          break;
  
      default:
@@ -14559,8 +15523,9 @@ S_aassign_scan(pTHX_ OP* o, bool rhs, bool top, int *scalars_p)
              && (o->op_private & OPpTARGET_MY))
          {
              (*scalars_p)++;
              && (o->op_private & OPpTARGET_MY))
          {
              (*scalars_p)++;
-            return S_aassign_padcheck(aTHX_ o, rhs)
-                ? AAS_LEX_SCALAR_COMM : AAS_LEX_SCALAR;
+            all_flags |= S_aassign_padcheck(aTHX_ o, rhs)
+                            ? AAS_LEX_SCALAR_COMM : AAS_LEX_SCALAR;
+            goto do_next;
          }
  
          /* if it's an unrecognised, non-dangerous op, assume that it
          }
  
          /* if it's an unrecognised, non-dangerous op, assume that it
@@ -14570,17 +15535,46 @@ S_aassign_scan(pTHX_ OP* o, bool rhs, bool top, int *scalars_p)
          break;
      }
  
          break;
      }
  
-    /* XXX this assumes that all other ops are "transparent" - i.e. that
+    all_flags |= flags;
+
+    /* by default, process all kids next
+     * XXX this assumes that all other ops are "transparent" - i.e. that
       * they can return some of their children. While this is true for e.g.
       * sort and grep, it's not true for e.g. map. We really need a
       * 'transparent' flag added to regen/opcodes
       */
      if (o->op_flags & OPf_KIDS) {
       * they can return some of their children. While this is true for e.g.
       * sort and grep, it's not true for e.g. map. We really need a
       * 'transparent' flag added to regen/opcodes
       */
      if (o->op_flags & OPf_KIDS) {
-        OP *kid;
-        for (kid = cUNOPo->op_first; kid; kid = OpSIBLING(kid))
-            flags |= S_aassign_scan(aTHX_ kid, rhs, kid_top, scalars_p);
+        next_kid = cUNOPo->op_first;
+        /* these ops do nothing but may have children; but their
+         * children should also be treated as top-level */
+        if (   o == effective_top_op
+            && (o->op_type == OP_NULL || o->op_type == OP_LIST)
+        )
+            effective_top_op = next_kid;
+    }
+
+
+    /* If next_kid is set, someone in the code above wanted us to process
+     * that kid and all its remaining siblings.  Otherwise, work our way
+     * back up the tree */
+  do_next:
+    while (!next_kid) {
+        if (o == top_op)
+            return all_flags; /* at top; no parents/siblings to try */
+        if (OpHAS_SIBLING(o)) {
+            next_kid = o->op_sibparent;
+            if (o == effective_top_op)
+                effective_top_op = next_kid;
+        }
+        else
+            if (o == effective_top_op)
+                effective_top_op = o->op_sibparent;
+            o = o->op_sibparent; /* try parent's next sibling */
+
      }
      }
-    return flags;
+    o = next_kid;
+    } /* while */
+
  }
  
  
  }
  
  
@@ -15827,8 +16821,17 @@ Perl_rpeep(pTHX_ OP *o)
                this optimisation if the first NEXTSTATE has a label.  */
             if (!CopLABEL((COP*)o) && !PERLDB_NOOPT) {
                 OP *nextop = o->op_next;
                this optimisation if the first NEXTSTATE has a label.  */
             if (!CopLABEL((COP*)o) && !PERLDB_NOOPT) {
                 OP *nextop = o->op_next;
-               while (nextop && nextop->op_type == OP_NULL)
-                   nextop = nextop->op_next;
+               while (nextop) {
+                    switch (nextop->op_type) {
+                        case OP_NULL:
+                        case OP_SCALAR:
+                        case OP_LINESEQ:
+                        case OP_SCOPE:
+                            nextop = nextop->op_next;
+                            continue;
+                    }
+                    break;
+                }
  
                 if (nextop && (nextop->op_type == OP_NEXTSTATE)) {
                     op_null(o);
  
                 if (nextop && (nextop->op_type == OP_NEXTSTATE)) {
                     op_null(o);
@@ -16316,7 +17319,7 @@ Perl_rpeep(pTHX_ OP *o)
             }
  
             break;
             }
  
             break;
-        
+
          case OP_NOT:
              break;
  
          case OP_NOT:
              break;
  
@@ -16346,7 +17349,7 @@ Perl_rpeep(pTHX_ OP *o)
             DEFER(cLOGOP->op_other);
             o->op_opt = 1;
             break;
             DEFER(cLOGOP->op_other);
             o->op_opt = 1;
             break;
-       
+
         case OP_GREPWHILE:
              if ((o->op_flags & OPf_WANT) == OPf_WANT_SCALAR)
                  S_check_for_bool_cxt(o, 1, OPpTRUEBOOL, 0);
         case OP_GREPWHILE:
              if ((o->op_flags & OPf_WANT) == OPf_WANT_SCALAR)
                  S_check_for_bool_cxt(o, 1, OPpTRUEBOOL, 0);
@@ -16490,7 +17493,7 @@ Perl_rpeep(pTHX_ OP *o)
             iter = enter->op_next;
             if (!iter || iter->op_type != OP_ITER)
                 break;
             iter = enter->op_next;
             if (!iter || iter->op_type != OP_ITER)
                 break;
-           
+
             expushmark = enter->op_first;
             if (!expushmark || expushmark->op_type != OP_NULL
                 || expushmark->op_targ != OP_PUSHMARK)
             expushmark = enter->op_first;
             if (!expushmark || expushmark->op_type != OP_NULL
                 || expushmark->op_targ != OP_PUSHMARK)
@@ -16643,10 +17646,10 @@ Perl_rpeep(pTHX_ OP *o)
              PL_generation++;
              /* scan LHS */
              lscalars = 0;
              PL_generation++;
              /* scan LHS */
              lscalars = 0;
-            l = S_aassign_scan(aTHX_ cLISTOPo->op_last,  FALSE, 1, &lscalars);
+            l = S_aassign_scan(aTHX_ cLISTOPo->op_last,  FALSE, &lscalars);
              /* scan RHS */
              rscalars = 0;
              /* scan RHS */
              rscalars = 0;
-            r = S_aassign_scan(aTHX_ cLISTOPo->op_first, TRUE, 1, &rscalars);
+            r = S_aassign_scan(aTHX_ cLISTOPo->op_first, TRUE, &rscalars);
              lr = (l|r);
  
  
              lr = (l|r);
  
  
@@ -16746,13 +17749,13 @@ Perl_rpeep(pTHX_ OP *o)
              break;
  
         case OP_CUSTOM: {
              break;
  
         case OP_CUSTOM: {
-           Perl_cpeep_t cpeep = 
+           Perl_cpeep_t cpeep =
                 XopENTRYCUSTOM(o, xop_peep);
             if (cpeep)
                 cpeep(aTHX_ o, oldop);
             break;
         }
                 XopENTRYCUSTOM(o, xop_peep);
             if (cpeep)
                 cpeep(aTHX_ o, oldop);
             break;
         }
-           
+
         }
          /* did we just null the current op? If so, re-process it to handle
           * eliding "empty" ops from the chain */
         }
          /* did we just null the current op? If so, re-process it to handle
           * eliding "empty" ops from the chain */
@@ -16777,7 +17780,7 @@ Perl_peep(pTHX_ OP *o)
  /*
  =head1 Custom Operators
  
  /*
  =head1 Custom Operators
  
-=for apidoc custom_op_xop
+=for apidoc Perl_custom_op_xop
  Return the XOP structure for a given custom op.  This macro should be
  considered internal to C<OP_NAME> and the other access macros: use them instead.
  This macro does call a function.  Prior
  Return the XOP structure for a given custom op.  This macro should be
  considered internal to C<OP_NAME> and the other access macros: use them instead.
  This macro does call a function.  Prior