Update CPAN-Meta to CPAN version 2.132140

[perl5.git] / pp.c
diff --git a/pp.c b/pp.c

index cf59a84..e47500f 100644 (file)
--- a/pp.c
+++ b/pp.c
@@ -47,6 +47,9 @@ extern Pid_t getpid (void);
      _LIB_VERSION_TYPE _LIB_VERSION = _IEEE_;
  #endif
  
+static const STRLEN small_mu_len = sizeof(GREEK_SMALL_LETTER_MU_UTF8) - 1;
+static const STRLEN capital_iota_len = sizeof(GREEK_CAPITAL_LETTER_IOTA_UTF8) - 1;
+
  /* variations on pp_null */
  
  PP(pp_stub)
@@ -65,8 +68,8 @@ PP(pp_padav)
      dVAR; dSP; dTARGET;
      I32 gimme;
      assert(SvTYPE(TARG) == SVt_PVAV);
-    if (PL_op->op_private & OPpLVAL_INTRO)
-       if (!(PL_op->op_private & OPpPAD_STATE))
+    if (UNLIKELY( PL_op->op_private & OPpLVAL_INTRO ))
+       if (LIKELY( !(PL_op->op_private & OPpPAD_STATE) ))
             SAVECLEARSV(PAD_SVl(PL_op->op_targ));
      EXTEND(SP, 1);
      if (PL_op->op_flags & OPf_REF) {
@@ -115,8 +118,8 @@ PP(pp_padhv)
  
      assert(SvTYPE(TARG) == SVt_PVHV);
      XPUSHs(TARG);
-    if (PL_op->op_private & OPpLVAL_INTRO)
-       if (!(PL_op->op_private & OPpPAD_STATE))
+    if (UNLIKELY( PL_op->op_private & OPpLVAL_INTRO ))
+       if (LIKELY( !(PL_op->op_private & OPpPAD_STATE) ))
             SAVECLEARSV(PAD_SVl(PL_op->op_targ));
      if (PL_op->op_flags & OPf_REF)
         RETURN;
@@ -234,13 +237,15 @@ S_rv2gv(pTHX_ SV *sv, const bool vivify_sv, const bool strict,
                         Perl_croak_no_modify();
                     if (cUNOP->op_targ) {
                         SV * const namesv = PAD_SV(cUNOP->op_targ);
+                       HV *stash = CopSTASH(PL_curcop);
+                       if (SvTYPE(stash) != SVt_PVHV) stash = NULL;
                         gv = MUTABLE_GV(newSV(0));
-                       gv_init_sv(gv, CopSTASH(PL_curcop), namesv, 0);
+                       gv_init_sv(gv, stash, namesv, 0);
                     }
                     else {
                         const char * const name = CopSTASHPV(PL_curcop);
                         gv = newGVgen_flags(name,
-                                        HvNAMEUTF8(CopSTASH(PL_curcop)) ? SVf_UTF8 : 0 );
+                                HvNAMEUTF8(CopSTASH(PL_curcop)) ? SVf_UTF8 : 0 );
                     }
                     prepare_SV_for_RV(sv);
                     SvRV_set(sv, MUTABLE_SV(gv));
@@ -425,7 +430,7 @@ PP(pp_pos)
      dVAR; dSP; dPOPss;
  
      if (PL_op->op_flags & OPf_MOD || LVRET) {
-       SV * const ret = sv_2mortal(newSV_type(SVt_PVLV));  /* Not TARG RT#67838 */
+       SV * const ret = sv_2mortal(newSV_type(SVt_PVLV));/* Not TARG RT#67838 */
         sv_magic(ret, NULL, PERL_MAGIC_pos, NULL, 0);
         LvTYPE(ret) = '.';
         LvTARG(ret) = SvREFCNT_inc_simple(sv);
@@ -433,18 +438,16 @@ PP(pp_pos)
         RETURN;
      }
      else {
-       if (SvTYPE(sv) >= SVt_PVMG && SvMAGIC(sv)) {
-           const MAGIC * const mg = mg_find(sv, PERL_MAGIC_regex_global);
-           if (mg && mg->mg_len >= 0) {
+           const MAGIC * const mg = mg_find_mglob(sv);
+           if (mg && mg->mg_len != -1) {
                 dTARGET;
-               I32 i = mg->mg_len;
+               STRLEN i = mg->mg_len;
                 if (DO_UTF8(sv))
-                   sv_pos_b2u(sv, &i);
-               PUSHi(i);
+                   i = sv_pos_b2u_flags(sv, i, SV_GMAGIC|SV_CONST_RETURN);
+               PUSHu(i);
                 RETURN;
             }
-       }
-       RETPUSHUNDEF;
+           RETPUSHUNDEF;
      }
  }
  
@@ -455,7 +458,8 @@ PP(pp_rv2cv)
      HV *stash_unused;
      const I32 flags = (PL_op->op_flags & OPf_SPECIAL)
         ? GV_ADDMG
-       : ((PL_op->op_private & (OPpLVAL_INTRO|OPpMAY_RETURN_CONSTANT)) == OPpMAY_RETURN_CONSTANT)
+       : ((PL_op->op_private & (OPpLVAL_INTRO|OPpMAY_RETURN_CONSTANT))
+                                                    == OPpMAY_RETURN_CONSTANT)
             ? GV_ADD|GV_NOEXPAND
             : GV_ADD;
      /* We usually try to add a non-existent subroutine in case of AUTOLOAD. */
@@ -486,11 +490,8 @@ PP(pp_prototype)
         if (strnEQ(s, "CORE::", 6)) {
             const int code = keyword(s + 6, SvCUR(TOPs) - 6, 1);
             if (!code || code == -KEY_CORE)
-               DIE(aTHX_ "Can't find an opnumber for \"%"SVf"\"",
-                   SVfARG(newSVpvn_flags(
-                       s+6, SvCUR(TOPs)-6,
-                       (SvFLAGS(TOPs) & SVf_UTF8)|SVs_TEMP
-                   )));
+               DIE(aTHX_ "Can't find an opnumber for \"%"UTF8f"\"",
+                  UTF8fARG(SvFLAGS(TOPs) & SVf_UTF8, SvCUR(TOPs)-6, s+6));
             {
                 SV * const sv = core_prototype(NULL, s + 6, code, NULL);
                 if (sv) ret = sv;
@@ -584,10 +585,8 @@ PP(pp_ref)
      dVAR; dSP; dTARGET;
      SV * const sv = POPs;
  
-    if (sv)
-       SvGETMAGIC(sv);
-
-    if (!sv || !SvROK(sv))
+    SvGETMAGIC(sv);
+    if (!SvROK(sv))
         RETPUSHNO;
  
      (void)sv_ref(TARG,SvRV(sv),TRUE);
@@ -601,8 +600,12 @@ PP(pp_bless)
      HV *stash;
  
      if (MAXARG == 1)
+    {
        curstash:
         stash = CopSTASH(PL_curcop);
+       if (SvTYPE(stash) != SVt_PVHV)
+           Perl_croak(aTHX_ "Attempt to bless into a freed package");
+    }
      else {
         SV * const ssv = POPs;
         STRLEN len;
@@ -968,7 +971,12 @@ PP(pp_undef)
                            "Constant subroutine %"SVf" undefined",
                            SVfARG(CvANON((const CV *)sv)
                               ? newSVpvs_flags("(anonymous)", SVs_TEMP)
-                             : sv_2mortal(newSVhek(GvENAME_HEK(CvGV((const CV *)sv))))));
+                             : sv_2mortal(newSVhek(
+                                CvNAMED(sv)
+                                 ? CvNAME_HEK((CV *)sv)
+                                 : GvENAME_HEK(CvGV((const CV *)sv))
+                               ))
+                           ));
         /* FALLTHROUGH */
      case SVt_PVFM:
         {
@@ -1646,14 +1654,15 @@ PP(pp_repeat)
  
      if (GIMME == G_ARRAY && PL_op->op_private & OPpREPEAT_DOLIST) {
         dMARK;
-       static const char oom_list_extend[] = "Out of memory during list extend";
+       static const char* const oom_list_extend = "Out of memory during list extend";
         const I32 items = SP - MARK;
         const I32 max = items * count;
+       const U8 mod = PL_op->op_flags & OPf_MOD;
  
         MEM_WRAP_CHECK_1(max, SV*, oom_list_extend);
         /* Did the max computation overflow? */
         if (items > 0 && max > 0 && (max < items || max < count))
-          Perl_croak(aTHX_ oom_list_extend);
+          Perl_croak(aTHX_ "%s", oom_list_extend);
         MEXTEND(MARK, max);
         if (count > 1) {
             while (SP > MARK) {
@@ -1682,7 +1691,11 @@ PP(pp_repeat)
                 }
  #else
                 if (*SP)
+                {
+                   if (mod && SvPADTMP(*SP) && !IS_PADGV(*SP))
+                       *SP = sv_mortalcopy(*SP);
                    SvTEMP_off((*SP));
+               }
  #endif
                 SP--;
             }
@@ -1698,7 +1711,7 @@ PP(pp_repeat)
         SV * const tmpstr = POPs;
         STRLEN len;
         bool isutf;
-       static const char oom_string_extend[] =
+       static const char* const oom_string_extend =
           "Out of memory during string extend";
  
         if (TARG != tmpstr)
@@ -1711,7 +1724,7 @@ PP(pp_repeat)
             else {
                 const STRLEN max = (UV)count * len;
                 if (len > MEM_SIZE_MAX / count)
-                    Perl_croak(aTHX_ oom_string_extend);
+                    Perl_croak(aTHX_ "%s", oom_string_extend);
                 MEM_WRAP_CHECK_1(max, char, oom_string_extend);
                 SvGROW(TARG, max + 1);
                 repeatcpy(SvPVX(TARG) + len, SvPVX(TARG), len, count - 1);
@@ -2243,7 +2256,8 @@ PP(pp_negate)
             if (SvIsUV(sv)) {
                 if (SvIVX(sv) == IV_MIN) {
                     /* 2s complement assumption. */
-                   SETi(SvIVX(sv));    /* special case: -((UV)IV_MAX+1) == IV_MIN */
+                    SETi(SvIVX(sv));   /* special case: -((UV)IV_MAX+1) ==
+                                           IV_MIN */
                     RETURN;
                 }
                 else if (SvUVX(sv) <= IV_MAX) {
@@ -3428,15 +3442,6 @@ PP(pp_crypt)
  /* Generally UTF-8 and UTF-EBCDIC are indistinguishable at this level.  So 
   * most comments below say UTF-8, when in fact they mean UTF-EBCDIC as well */
  
-/* Generates code to store a unicode codepoint c that is known to occupy
- * exactly two UTF-8 and UTF-EBCDIC bytes; it is stored into p and p+1,
- * and p is advanced to point to the next available byte after the two bytes */
-#define CAT_UNI_TO_UTF8_TWO_BYTE(p, c)                                     \
-    STMT_START {                                                           \
-       *(p)++ = UTF8_TWO_BYTE_HI(c);                                       \
-       *((p)++) = UTF8_TWO_BYTE_LO(c);                                     \
-    } STMT_END
-
  PP(pp_ucfirst)
  {
      /* Actually is both lcfirst() and ucfirst().  Only the first character
@@ -3546,10 +3551,10 @@ PP(pp_ucfirst)
                       * replace just the first character in place. */
                     inplace = FALSE;
  
-                   /* If the result won't fit in a byte, the entire result will
-                    * have to be in UTF-8.  Assume worst case sizing in
-                    * conversion. (all latin1 characters occupy at most two bytes
-                    * in utf8) */
+                    /* If the result won't fit in a byte, the entire result
+                     * will have to be in UTF-8.  Assume worst case sizing in
+                     * conversion. (all latin1 characters occupy at most two
+                     * bytes in utf8) */
                     if (title_ord > 255) {
                         doing_utf8 = TRUE;
                         convert_source_to_utf8 = TRUE;
@@ -3738,7 +3743,7 @@ PP(pp_uc)
  
      if (DO_UTF8(source)) {
         const U8 *const send = s + len;
-       U8 tmpbuf[UTF8_MAXBYTES+1];
+       U8 tmpbuf[UTF8_MAXBYTES_CASE+1];
         bool tainted = FALSE;
  
         /* All occurrences of these are to be moved to follow any other marks.
@@ -3757,13 +3762,11 @@ PP(pp_uc)
             STRLEN u;
             STRLEN ulen;
             UV uv;
-           if (in_iota_subscript && ! is_utf8_mark(s)) {
+           if (in_iota_subscript && ! _is_utf8_mark(s)) {
  
                 /* A non-mark.  Time to output the iota subscript */
-#define GREEK_CAPITAL_LETTER_IOTA 0x0399
-#define COMBINING_GREEK_YPOGEGRAMMENI 0x0345
-
-               CAT_UNI_TO_UTF8_TWO_BYTE(d, GREEK_CAPITAL_LETTER_IOTA);
+               Copy(GREEK_CAPITAL_LETTER_IOTA_UTF8, d, capital_iota_len, U8);
+                d += capital_iota_len;
                 in_iota_subscript = FALSE;
              }
  
@@ -3773,6 +3776,8 @@ PP(pp_uc)
              u = UTF8SKIP(s);
              uv = _to_utf8_upper_flags(s, tmpbuf, &ulen,
                                       cBOOL(IN_LOCALE_RUNTIME), &tainted);
+#define GREEK_CAPITAL_LETTER_IOTA 0x0399
+#define COMBINING_GREEK_YPOGEGRAMMENI 0x0345
              if (uv == GREEK_CAPITAL_LETTER_IOTA
                  && utf8_to_uvchr_buf(s, send, 0) == COMBINING_GREEK_YPOGEGRAMMENI)
              {
@@ -3798,7 +3803,8 @@ PP(pp_uc)
              s += u;
         }
         if (in_iota_subscript) {
-           CAT_UNI_TO_UTF8_TWO_BYTE(d, GREEK_CAPITAL_LETTER_IOTA);
+            Copy(GREEK_CAPITAL_LETTER_IOTA_UTF8, d, capital_iota_len, U8);
+            d += capital_iota_len;
         }
         SvUTF8_on(dest);
         *d = '\0';
@@ -3830,7 +3836,9 @@ PP(pp_uc)
             else {
                 for (; s < send; d++, s++) {
                     *d = toUPPER_LATIN1_MOD(*s);
-                   if (LIKELY(*d != LATIN_SMALL_LETTER_Y_WITH_DIAERESIS)) continue;
+                   if (LIKELY(*d != LATIN_SMALL_LETTER_Y_WITH_DIAERESIS)) {
+                        continue;
+                    }
  
                     /* The mainstream case is the tight loop above.  To avoid
                      * extra tests in that, all three characters that require
@@ -4138,7 +4146,7 @@ PP(pp_fc)
      const U8 *s;
      const U8 *send;
      U8 *d;
-    U8 tmpbuf[UTF8_MAXBYTES * UTF8_MAX_FOLD_CHAR_EXPAND + 1];
+    U8 tmpbuf[UTF8_MAXBYTES_CASE + 1];
      const bool full_folding = TRUE;
      const U8 flags = ( full_folding      ? FOLD_FLAGS_FULL   : 0 )
                     | ( IN_LOCALE_RUNTIME ? FOLD_FLAGS_LOCALE : 0 );
@@ -4194,35 +4202,30 @@ PP(pp_fc)
         }
      } /* Unflagged string */
      else if (len) {
-        /* For locale, bytes, and nothing, the behavior is supposed to be the
-         * same as lc().
-         */
          if ( IN_LOCALE_RUNTIME ) { /* Under locale */
              TAINT;
              SvTAINTED_on(dest);
              for (; s < send; d++, s++)
-                *d = toLOWER_LC(*s);
+                *d = toFOLD_LC(*s);
          }
          else if ( !IN_UNI_8_BIT ) { /* Under nothing, or bytes */
              for (; s < send; d++, s++)
-                *d = toLOWER(*s);
+                *d = toFOLD(*s);
          }
          else {
-            /* For ASCII and the Latin-1 range, there's only two troublesome folds,
-            * \x{DF} (\N{LATIN SMALL LETTER SHARP S}), which under full casefolding
-            * becomes 'ss', and \x{B5} (\N{MICRO SIGN}), which under any fold becomes
-            * \x{3BC} (\N{GREEK SMALL LETTER MU}) -- For the rest, the casefold is
-            * their lowercase.
-            */
+            /* For ASCII and the Latin-1 range, there's only two troublesome
+             * folds, \x{DF} (\N{LATIN SMALL LETTER SHARP S}), which under full
+             * casefolding becomes 'ss'; and \x{B5} (\N{MICRO SIGN}), which
+             * under any fold becomes \x{3BC} (\N{GREEK SMALL LETTER MU}) --
+             * For the rest, the casefold is their lowercase.  */
              for (; s < send; d++, s++) {
                  if (*s == MICRO_SIGN) {
-                    /* \N{MICRO SIGN}'s casefold is \N{GREEK SMALL LETTER MU}, which
-                    * is outside of the latin-1 range. There's a couple of ways to
-                    * deal with this -- khw discusses them in pp_lc/uc, so go there :)
-                    * What we do here is upgrade what we had already casefolded,
-                    * then enter an inner loop that appends the rest of the characters
-                    * as UTF-8.
-                    */
+                    /* \N{MICRO SIGN}'s casefold is \N{GREEK SMALL LETTER MU},
+                     * which is outside of the latin-1 range. There's a couple
+                     * of ways to deal with this -- khw discusses them in
+                     * pp_lc/uc, so go there :) What we do here is upgrade what
+                     * we had already casefolded, then enter an inner loop that
+                     * appends the rest of the characters as UTF-8. */
                      len = d - (U8*)SvPVX_const(dest);
                      SvCUR_set(dest, len);
                      len = sv_utf8_upgrade_flags_grow(dest,
@@ -4232,13 +4235,16 @@ PP(pp_fc)
                                                  (send -s) * 2 + 1);
                      d = (U8*)SvPVX(dest) + len;
  
-                    CAT_UNI_TO_UTF8_TWO_BYTE(d, GREEK_SMALL_LETTER_MU);
+                    Copy(GREEK_SMALL_LETTER_MU_UTF8, d, small_mu_len, U8);
+                    d += small_mu_len;
                      s++;
                      for (; s < send; s++) {
                          STRLEN ulen;
                          UV fc = _to_uni_fold_flags(*s, tmpbuf, &ulen, flags);
                          if UNI_IS_INVARIANT(fc) {
-                            if ( full_folding && *s == LATIN_SMALL_LETTER_SHARP_S) {
+                            if (full_folding
+                                && *s == LATIN_SMALL_LETTER_SHARP_S)
+                            {
                                  *d++ = 's';
                                  *d++ = 's';
                              }
@@ -4253,9 +4259,8 @@ PP(pp_fc)
                      break;
                  }
                  else if (full_folding && *s == LATIN_SMALL_LETTER_SHARP_S) {
-                    /* Under full casefolding, LATIN SMALL LETTER SHARP S becomes "ss",
-                    * which may require growing the SV.
-                    */
+                    /* Under full casefolding, LATIN SMALL LETTER SHARP S
+                     * becomes "ss", which may require growing the SV. */
                      if (SvLEN(dest) < ++min) {
                          const UV o = d - (U8*)SvPVX_const(dest);
                          SvGROW(dest, min);
@@ -4264,7 +4269,8 @@ PP(pp_fc)
                      *(d)++ = 's';
                      *d = 's';
                  }
-                else { /* If it's not one of those two, the fold is their lower case */
+                else { /* If it's not one of those two, the fold is their lower
+                          case */
                      *d = toLOWER_LATIN1(*s);
                  }
               }
@@ -4378,7 +4384,9 @@ PP(pp_rkeys)
         return (SvTYPE(sv) == SVt_PVHV) ? Perl_do_kv(aTHX) : Perl_pp_akeys(aTHX);
      }
      else {
-       return (SvTYPE(sv) == SVt_PVHV) ? Perl_pp_each(aTHX) : Perl_pp_aeach(aTHX);
+       return (SvTYPE(sv) == SVt_PVHV)
+               ? Perl_pp_each(aTHX)
+               : Perl_pp_aeach(aTHX);
      }
  }
  
@@ -4512,7 +4520,8 @@ S_do_delete_local(pTHX)
                 }
                 else {
                     sv = hv_delete_ent(hv, keysv, 0, 0);
-                   SvREFCNT_inc_simple_void(sv); /* De-mortalize */
+                   if (preeminent)
+                       SvREFCNT_inc_simple_void(sv); /* De-mortalize */
                 }
                 if (preeminent) {
                     if (!sv) DIE(aTHX_ PL_no_helem_sv, SVfARG(keysv));
@@ -4547,7 +4556,8 @@ S_do_delete_local(pTHX)
                     }
                     else {
                         sv = av_delete(av, idx, 0);
-                       SvREFCNT_inc_simple_void(sv); /* De-mortalize */
+                       if (preeminent)
+                          SvREFCNT_inc_simple_void(sv); /* De-mortalize */
                     }
                     if (preeminent) {
                         save_aelem_flags(av, idx, &sv, SAVEf_KEEPOLDELEM);
@@ -4659,7 +4669,7 @@ PP(pp_exists)
      SV *tmpsv;
      HV *hv;
  
-    if (PL_op->op_private & OPpEXISTS_SUB) {
+    if (UNLIKELY( PL_op->op_private & OPpEXISTS_SUB )) {
         GV *gv;
         SV * const sv = POPs;
         CV * const cv = sv_2cv(sv, &hv, &gv, 0);
@@ -4671,7 +4681,7 @@ PP(pp_exists)
      }
      tmpsv = POPs;
      hv = MUTABLE_HV(POPs);
-    if (SvTYPE(hv) == SVt_PVHV) {
+    if (LIKELY( SvTYPE(hv) == SVt_PVHV )) {
         if (hv_exists_ent(hv, tmpsv, 0))
             RETPUSHYES;
      }
@@ -4768,6 +4778,7 @@ PP(pp_lslice)
      SV ** const firstlelem = PL_stack_base + POPMARK + 1;
      SV ** const firstrelem = lastlelem + 1;
      I32 is_something_there = FALSE;
+    const U8 mod = PL_op->op_flags & OPf_MOD;
  
      const I32 max = lastrelem - lastlelem;
      SV **lelem;
@@ -4799,6 +4810,8 @@ PP(pp_lslice)
             is_something_there = TRUE;
             if (!(*lelem = firstrelem[ix]))
                 *lelem = &PL_sv_undef;
+           else if (mod && SvPADTMP(*lelem) && !IS_PADGV(*lelem))
+               *lelem = firstrelem[ix] = sv_mortalcopy(*lelem);
         }
      }
      if (is_something_there)
@@ -4810,10 +4823,10 @@ PP(pp_lslice)
  
  PP(pp_anonlist)
  {
-    dVAR; dSP; dMARK; dORIGMARK;
+    dVAR; dSP; dMARK;
      const I32 items = SP - MARK;
      SV * const av = MUTABLE_SV(av_make(items, MARK+1));
-    SP = ORIGMARK;             /* av_make() might realloc stack_sp */
+    SP = MARK;
      mXPUSHs((PL_op->op_flags & OPf_SPECIAL)
             ? newRV_noinc(av) : av);
      RETURN;
@@ -4822,7 +4835,10 @@ PP(pp_anonlist)
  PP(pp_anonhash)
  {
      dVAR; dSP; dMARK; dORIGMARK;
-    HV* const hv = (HV *)sv_2mortal((SV *)newHV());
+    HV* const hv = newHV();
+    SV* const retval = sv_2mortal( PL_op->op_flags & OPf_SPECIAL
+                                    ? newRV_noinc(MUTABLE_SV(hv))
+                                    : MUTABLE_SV(hv) );
  
      while (MARK < SP) {
         SV * const key =
@@ -4843,9 +4859,7 @@ PP(pp_anonhash)
         (void)hv_store_ent(hv,key,val,0);
      }
      SP = ORIGMARK;
-    if (PL_op->op_flags & OPf_SPECIAL)
-       mXPUSHs(newRV_inc(MUTABLE_SV(hv)));
-    else XPUSHs(MUTABLE_SV(hv));
+    XPUSHs(retval);
      RETURN;
  }
  
@@ -4895,7 +4909,7 @@ PP(pp_splice)
      const MAGIC * const mg = SvTIED_mg((const SV *)ary, PERL_MAGIC_tied);
  
      if (mg) {
-       return Perl_tied_method(aTHX_ "SPLICE", mark - 1, MUTABLE_SV(ary), mg,
+       return Perl_tied_method(aTHX_ SV_CONST(SPLICE), mark - 1, MUTABLE_SV(ary), mg,
                                     GIMME_V | TIED_METHOD_ARGUMENTS_ON_STACK,
                                     sp - mark);
      }
@@ -5093,7 +5107,7 @@ PP(pp_push)
         PUSHMARK(MARK);
         PUTBACK;
         ENTER_with_name("call_PUSH");
-       call_method("PUSH",G_SCALAR|G_DISCARD);
+       call_sv(SV_CONST(PUSH),G_SCALAR|G_DISCARD|G_METHOD_NAMED);
         LEAVE_with_name("call_PUSH");
         SPAGAIN;
      }
@@ -5146,7 +5160,7 @@ PP(pp_unshift)
         PUSHMARK(MARK);
         PUTBACK;
         ENTER_with_name("call_UNSHIFT");
-       call_method("UNSHIFT",G_SCALAR|G_DISCARD);
+       call_sv(SV_CONST(UNSHIFT),G_SCALAR|G_DISCARD|G_METHOD_NAMED);
         LEAVE_with_name("call_UNSHIFT");
         SPAGAIN;
      }
@@ -5307,14 +5321,15 @@ PP(pp_split)
      STRLEN len;
      const char *s = SvPV_const(sv, len);
      const bool do_utf8 = DO_UTF8(sv);
-    const bool skipwhite = PL_op->op_flags & OPf_SPECIAL;
      const char *strend = s + len;
      PMOP *pm;
      REGEXP *rx;
      SV *dstr;
      const char *m;
      I32 iters = 0;
-    const STRLEN slen = do_utf8 ? utf8_length((U8*)s, (U8*)strend) : (STRLEN)(strend - s);
+    const STRLEN slen = do_utf8
+                        ? utf8_length((U8*)s, (U8*)strend)
+                        : (STRLEN)(strend - s);
      I32 maxiters = slen + 10;
      I32 trailing_empty = 0;
      const char *orig;
@@ -5338,9 +5353,7 @@ PP(pp_split)
      rx = PM_GETRE(pm);
  
      TAINT_IF(get_regex_charset(RX_EXTFLAGS(rx)) == REGEX_LOCALE_CHARSET &&
-            (RX_EXTFLAGS(rx) & RXf_WHITE || skipwhite));
-
-    RX_MATCH_UTF8_set(rx, do_utf8);
+             (RX_EXTFLAGS(rx) & (RXf_WHITE | RXf_SKIPWHITE)));
  
  #ifdef USE_ITHREADS
      if (pm->op_pmreplrootu.op_pmtargetoff) {
@@ -5369,7 +5382,7 @@ PP(pp_split)
                 AvREAL_on(ary);
                 AvREIFY_off(ary);
                 for (i = AvFILLp(ary); i >= 0; i--)
-                   AvARRAY(ary)[i] = &PL_sv_undef;     /* don't free mere refs */
+                   AvARRAY(ary)[i] = &PL_sv_undef; /* don't free mere refs */
             }
             /* temporarily switch stacks */
             SAVESWITCHSTACK(PL_curstack, ary);
@@ -5378,9 +5391,9 @@ PP(pp_split)
      }
      base = SP - PL_stack_base;
      orig = s;
-    if (skipwhite) {
+    if (RX_EXTFLAGS(rx) & RXf_SKIPWHITE) {
         if (do_utf8) {
-           while (*s == ' ' || is_utf8_space((U8*)s))
+           while (isSPACE_utf8(s))
                 s += UTF8SKIP(s);
         }
         else if (get_regex_charset(RX_EXTFLAGS(rx)) == REGEX_LOCALE_CHARSET) {
@@ -5400,21 +5413,22 @@ PP(pp_split)
  
      if (!limit)
         limit = maxiters + 2;
-    if (RX_EXTFLAGS(rx) & RXf_WHITE || skipwhite) {
+    if (RX_EXTFLAGS(rx) & RXf_WHITE) {
         while (--limit) {
             m = s;
             /* this one uses 'm' and is a negative test */
             if (do_utf8) {
-               while (m < strend && !( *m == ' ' || is_utf8_space((U8*)m) )) {
+               while (m < strend && ! isSPACE_utf8(m) ) {
                     const int t = UTF8SKIP(m);
-                   /* is_utf8_space returns FALSE for malform utf8 */
+                   /* isSPACE_utf8 returns FALSE for malformed UTF-8 */
                     if (strend - m < t)
                         m = strend;
                     else
                         m += t;
                 }
             }
-           else if (get_regex_charset(RX_EXTFLAGS(rx)) == REGEX_LOCALE_CHARSET) {
+           else if (get_regex_charset(RX_EXTFLAGS(rx)) == REGEX_LOCALE_CHARSET)
+            {
                 while (m < strend && !isSPACE_LC(*m))
                     ++m;
              } else {
@@ -5444,10 +5458,11 @@ PP(pp_split)
  
             /* this one uses 's' and is a positive test */
             if (do_utf8) {
-               while (s < strend && ( *s == ' ' || is_utf8_space((U8*)s) ))
+               while (s < strend && isSPACE_utf8(s) )
                     s +=  UTF8SKIP(s);
             }
-           else if (get_regex_charset(RX_EXTFLAGS(rx)) == REGEX_LOCALE_CHARSET) {
+           else if (get_regex_charset(RX_EXTFLAGS(rx)) == REGEX_LOCALE_CHARSET)
+            {
                 while (s < strend && isSPACE_LC(*s))
                     ++s;
              } else {
@@ -5559,7 +5574,7 @@ PP(pp_split)
                         trailing_empty = 0;
                 } else {
                     dstr = newSVpvn_flags(s, m-s,
-                                         (do_utf8 ? SVf_UTF8 : 0) | make_mortal);
+                                        (do_utf8 ? SVf_UTF8 : 0) | make_mortal);
                     XPUSHs(dstr);
                 }
                 /* The rx->minlen is in characters but we want to step
@@ -5583,7 +5598,7 @@ PP(pp_split)
                         trailing_empty = 0;
                 } else {
                     dstr = newSVpvn_flags(s, m-s,
-                                         (do_utf8 ? SVf_UTF8 : 0) | make_mortal);
+                                        (do_utf8 ? SVf_UTF8 : 0) | make_mortal);
                     XPUSHs(dstr);
                 }
                 /* The rx->minlen is in characters but we want to step
@@ -5601,7 +5616,7 @@ PP(pp_split)
         {
             I32 rex_return;
             PUTBACK;
-           rex_return = CALLREGEXEC(rx, (char*)s, (char*)strend, (char*)orig, 1 ,
+           rex_return = CALLREGEXEC(rx, (char*)s, (char*)strend, (char*)orig, 1,
                                      sv, NULL, 0);
             SPAGAIN;
             if (rex_return == 0)
@@ -5703,7 +5718,7 @@ PP(pp_split)
         else {
             PUTBACK;
             ENTER_with_name("call_PUSH");
-           call_method("PUSH",G_SCALAR|G_DISCARD);
+           call_sv(SV_CONST(PUSH),G_SCALAR|G_DISCARD|G_METHOD_NAMED);
             LEAVE_with_name("call_PUSH");
             SPAGAIN;
             if (gimme == G_ARRAY) {