APItest/t/handy.t: Skip some tests on EBCDIC

[perl5.git] / toke.c
diff --git a/toke.c b/toke.c

index d92723a..f40936b 100644 (file)
--- a/toke.c
+++ b/toke.c
@@ -64,7 +64,6 @@ Individual members of C<PL_parser> have their own documentation.
  #define PL_multi_open          (PL_parser->multi_open)
  #define PL_multi_close         (PL_parser->multi_close)
  #define PL_preambled           (PL_parser->preambled)
-#define PL_sublex_info         (PL_parser->sublex_info)
  #define PL_linestr             (PL_parser->linestr)
  #define PL_expect              (PL_parser->expect)
  #define PL_copline             (PL_parser->copline)
@@ -89,6 +88,11 @@ Individual members of C<PL_parser> have their own documentation.
  #  define PL_nexttype          (PL_parser->nexttype)
  #  define PL_nextval           (PL_parser->nextval)
  
+
+#define SvEVALED(sv) \
+    (SvTYPE(sv) >= SVt_PVNV \
+    && ((XPVIV*)SvANY(sv))->xiv_u.xivu_eval_seen)
+
  static const char* const ident_too_long = "Identifier too long";
  
  #  define NEXTVAL_NEXTTOKE PL_nextval[PL_nexttoke]
@@ -242,7 +246,7 @@ static const char* const lex_state_names[] = {
         if (have_x) PL_expect = x; \
         PL_bufptr = s; \
         PL_last_uni = PL_oldbufptr; \
-       PL_last_lop_op = f; \
+       PL_last_lop_op = (f) < 0 ? -(f) : (f); \
         if (*s == '(') \
             return REPORT( (int)FUNC1 ); \
         s = skipspace(s); \
@@ -409,12 +413,12 @@ S_tokereport(pTHX_ I32 rv, const YYSTYPE* lvalp)
         else if (!rv)
             sv_catpvs(report, "EOF");
         else
-           Perl_sv_catpvf(aTHX_ report, "?? %"IVdf, (IV)rv);
+           Perl_sv_catpvf(aTHX_ report, "?? %" IVdf, (IV)rv);
         switch (type) {
         case TOKENTYPE_NONE:
             break;
         case TOKENTYPE_IVAL:
-           Perl_sv_catpvf(aTHX_ report, "(ival=%"IVdf")", (IV)lvalp->ival);
+           Perl_sv_catpvf(aTHX_ report, "(ival=%" IVdf ")", (IV)lvalp->ival);
             break;
         case TOKENTYPE_OPNUM:
             Perl_sv_catpvf(aTHX_ report, "(ival=op_%s)",
@@ -463,7 +467,7 @@ S_printbuf(pTHX_ const char *const fmt, const char *const s)
  static int
  S_deprecate_commaless_var_list(pTHX) {
      PL_expect = XTERM;
-    deprecate("comma-less variable list");
+    deprecate_fatal_in("5.28", "Use of comma-less variable list is deprecated");
      return REPORT(','); /* grandfather non-comma-format format */
  }
  
@@ -523,20 +527,26 @@ S_no_op(pTHX_ const char *const what, char *s)
         if (is_first)
             Perl_warner(aTHX_ packWARN(WARN_SYNTAX),
                     "\t(Missing semicolon on previous line?)\n");
-       else if (PL_oldoldbufptr && isIDFIRST_lazy_if(PL_oldoldbufptr,UTF)) {
+        else if (PL_oldoldbufptr && isIDFIRST_lazy_if_safe(PL_oldoldbufptr,
+                                                           PL_bufend,
+                                                           UTF))
+        {
             const char *t;
-           for (t = PL_oldoldbufptr; (isWORDCHAR_lazy_if(t,UTF) || *t == ':');
-                                                            t += UTF ? UTF8SKIP(t) : 1)
+           for (t = PL_oldoldbufptr;
+                 (isWORDCHAR_lazy_if_safe(t, PL_bufend, UTF) || *t == ':');
+                 t += UTF ? UTF8SKIP(t) : 1)
+            {
                 NOOP;
+            }
             if (t < PL_bufptr && isSPACE(*t))
                 Perl_warner(aTHX_ packWARN(WARN_SYNTAX),
-                       "\t(Do you need to predeclare %"UTF8f"?)\n",
+                       "\t(Do you need to predeclare %" UTF8f "?)\n",
                       UTF8fARG(UTF, t - PL_oldoldbufptr, PL_oldoldbufptr));
         }
         else {
             assert(s >= oldbp);
             Perl_warner(aTHX_ packWARN(WARN_SYNTAX),
-                   "\t(Missing operator before %"UTF8f"?)\n",
+                   "\t(Missing operator before %" UTF8f "?)\n",
                      UTF8fARG(UTF, s - oldbp, oldbp));
         }
      }
@@ -555,26 +565,39 @@ S_no_op(pTHX_ const char *const what, char *s)
  STATIC void
  S_missingterm(pTHX_ char *s)
  {
-    char tmpbuf[3];
+    char tmpbuf[UTF8_MAXBYTES + 1];
      char q;
+    bool uni = FALSE;
+    SV *sv;
      if (s) {
         char * const nl = strrchr(s,'\n');
         if (nl)
             *nl = '\0';
+       uni = UTF;
      }
-    else if ((U8) PL_multi_close < 32) {
+    else if (PL_multi_close < 32) {
         *tmpbuf = '^';
         tmpbuf[1] = (char)toCTRL(PL_multi_close);
         tmpbuf[2] = '\0';
         s = tmpbuf;
      }
      else {
-       *tmpbuf = (char)PL_multi_close;
-       tmpbuf[1] = '\0';
+       if (LIKELY(PL_multi_close < 256)) {
+           *tmpbuf = (char)PL_multi_close;
+           tmpbuf[1] = '\0';
+       }
+       else {
+           uni = TRUE;
+           *uvchr_to_utf8((U8 *)tmpbuf, PL_multi_close) = 0;
+       }
         s = tmpbuf;
      }
      q = strchr(s,'"') ? '\'' : '"';
-    Perl_croak(aTHX_ "Can't find string terminator %c%s%c anywhere before EOF",q,s,q);
+    sv = sv_2mortal(newSVpv(s,0));
+    if (uni)
+       SvUTF8_on(sv);
+    Perl_croak(aTHX_ "Can't find string terminator %c%" SVf
+                    "%c anywhere before EOF",q,SVfARG(sv),q);
  }
  
  #include "feature.h"
@@ -688,8 +711,8 @@ Perl_lex_start(pTHX_ SV *line, PerlIO *rsfp, U32 flags)
      PL_parser = parser;
  
      parser->stack = NULL;
+    parser->stack_max1 = NULL;
      parser->ps = NULL;
-    parser->stack_size = 0;
  
      /* on scope exit, free this parser and restore any outer one */
      SAVEPARSER(parser);
@@ -761,7 +784,7 @@ Perl_parser_free(pTHX_  const yy_parser *parser)
         PerlIO_close(parser->rsfp);
      SvREFCNT_dec(parser->rsfp_filters);
      SvREFCNT_dec(parser->lex_stuff);
-    SvREFCNT_dec(parser->sublex_info.repl);
+    SvREFCNT_dec(parser->lex_sub_repl);
  
      Safefree(parser->lex_brackstack);
      Safefree(parser->lex_casestack);
@@ -906,10 +929,19 @@ Perl_lex_grow_linestr(pTHX_ STRLEN len)
      char *buf;
      STRLEN bufend_pos, bufptr_pos, oldbufptr_pos, oldoldbufptr_pos;
      STRLEN linestart_pos, last_uni_pos, last_lop_pos, re_eval_start_pos;
+    bool current;
+
      linestr = PL_parser->linestr;
      buf = SvPVX(linestr);
      if (len <= SvLEN(linestr))
         return buf;
+
+    /* Is the lex_shared linestr SV the same as the current linestr SV?
+     * Only in this case does re_eval_start need adjusting, since it
+     * points within lex_shared->ls_linestr's buffer */
+    current = (   !PL_parser->lex_shared->ls_linestr
+               || linestr == PL_parser->lex_shared->ls_linestr);
+
      bufend_pos = PL_parser->bufend - buf;
      bufptr_pos = PL_parser->bufptr - buf;
      oldbufptr_pos = PL_parser->oldbufptr - buf;
@@ -917,7 +949,7 @@ Perl_lex_grow_linestr(pTHX_ STRLEN len)
      linestart_pos = PL_parser->linestart - buf;
      last_uni_pos = PL_parser->last_uni ? PL_parser->last_uni - buf : 0;
      last_lop_pos = PL_parser->last_lop ? PL_parser->last_lop - buf : 0;
-    re_eval_start_pos = PL_parser->lex_shared->re_eval_start ?
+    re_eval_start_pos = (current && PL_parser->lex_shared->re_eval_start) ?
                              PL_parser->lex_shared->re_eval_start - buf : 0;
  
      buf = sv_grow(linestr, len);
@@ -931,7 +963,7 @@ Perl_lex_grow_linestr(pTHX_ STRLEN len)
         PL_parser->last_uni = buf + last_uni_pos;
      if (PL_parser->last_lop)
         PL_parser->last_lop = buf + last_lop_pos;
-    if (PL_parser->lex_shared->re_eval_start)
+    if (current && PL_parser->lex_shared->re_eval_start)
          PL_parser->lex_shared->re_eval_start  = buf + re_eval_start_pos;
      return buf;
  }
@@ -1007,13 +1039,11 @@ Perl_lex_stuff_pvn(pTHX_ const char *pv, STRLEN len, U32 flags)
                 } else if (UTF8_IS_NEXT_CHAR_DOWNGRADEABLE(p, e)) {
                     p++;
                     highhalf++;
-               } else if (! UTF8_IS_INVARIANT(c)) {
-                   /* malformed UTF-8 */
-                   ENTER;
-                   SAVESPTR(PL_warnhook);
-                   PL_warnhook = PERL_WARNHOOK_FATAL;
-                   utf8n_to_uvchr((U8*)p, e-p, NULL, 0);
-                   LEAVE;
+                } else if (! UTF8_IS_INVARIANT(c)) {
+                    _force_out_malformed_utf8_message((U8 *) p, (U8 *) e,
+                                                      0,
+                                                      1 /* 1 means die */ );
+                    NOT_REACHED; /* NOTREACHED */
                 }
             }
             if (!highhalf)
@@ -1263,6 +1293,8 @@ Perl_lex_next_chunk(pTHX_ U32 flags)
      STRLEN linestart_pos, last_uni_pos, last_lop_pos;
      bool got_some_for_debugger = 0;
      bool got_some;
+    const U8* first_bad_char_loc;
+
      if (flags & ~(LEX_KEEP_PREVIOUS|LEX_FAKE_EOF|LEX_NO_TERM))
         Perl_croak(aTHX_ "Lexing code internal error (%s)", "lex_next_chunk");
      if (!(flags & LEX_NO_TERM) && PL_lex_inwhat)
@@ -1301,7 +1333,7 @@ Perl_lex_next_chunk(pTHX_ U32 flags)
         got_some = 0;
      } else {
         if (!SvPOK(linestr))   /* can get undefined by filter_gets */
-           sv_setpvs(linestr, "");
+            SvPVCLEAR(linestr);
         eof:
         /* End of real input.  Close filehandle (unless it was STDIN),
          * then add implicit termination.
@@ -1327,6 +1359,18 @@ Perl_lex_next_chunk(pTHX_ U32 flags)
      new_bufend_pos = SvCUR(linestr);
      PL_parser->bufend = buf + new_bufend_pos;
      PL_parser->bufptr = buf + bufptr_pos;
+
+    if (UTF && ! is_utf8_string_loc((U8 *) PL_parser->bufptr,
+                                    PL_parser->bufend - PL_parser->bufptr,
+                                    &first_bad_char_loc))
+    {
+        _force_out_malformed_utf8_message(first_bad_char_loc,
+                                          (U8 *) PL_parser->bufend,
+                                          0,
+                                          1 /* 1 means die */ );
+        NOT_REACHED; /* NOTREACHED */
+    }
+
      PL_parser->oldbufptr = buf + oldbufptr_pos;
      PL_parser->oldoldbufptr = buf + oldoldbufptr_pos;
      PL_parser->linestart = buf + linestart_pos;
@@ -1403,12 +1447,11 @@ Perl_lex_peek_unichar(pTHX_ U32 flags)
         }
         unichar = utf8n_to_uvchr((U8*)s, bufend-s, &retlen, UTF8_CHECK_ONLY);
         if (retlen == (STRLEN)-1) {
-           /* malformed UTF-8 */
-           ENTER;
-           SAVESPTR(PL_warnhook);
-           PL_warnhook = PERL_WARNHOOK_FATAL;
-           utf8n_to_uvchr((U8*)s, bufend-s, NULL, 0);
-           LEAVE;
+            _force_out_malformed_utf8_message((U8 *) s,
+                                              (U8 *) bufend,
+                                              0,
+                                              1 /* 1 means die */ );
+            NOT_REACHED; /* NOTREACHED */
         }
         return unichar;
      } else {
@@ -1556,7 +1599,7 @@ bool
  Perl_validate_proto(pTHX_ SV *name, SV *proto, bool warn)
  {
      STRLEN len, origlen;
-    char *p = proto ? SvPV(proto, len) : NULL;
+    char *p;
      bool bad_proto = FALSE;
      bool in_brackets = FALSE;
      bool after_slash = FALSE;
@@ -1571,6 +1614,7 @@ Perl_validate_proto(pTHX_ SV *name, SV *proto, bool warn)
      if (!proto)
         return TRUE;
  
+    p = SvPV(proto, len);
      origlen = len;
      for (; len--; p++) {
         if (!isSPACE(*p)) {
@@ -1616,19 +1660,19 @@ Perl_validate_proto(pTHX_ SV *name, SV *proto, bool warn)
  
         if (proto_after_greedy_proto)
             Perl_warner(aTHX_ packWARN(WARN_ILLEGALPROTO),
-                       "Prototype after '%c' for %"SVf" : %s",
+                       "Prototype after '%c' for %" SVf " : %s",
                         greedy_proto, SVfARG(name), p);
         if (in_brackets)
             Perl_warner(aTHX_ packWARN(WARN_ILLEGALPROTO),
-                       "Missing ']' in prototype for %"SVf" : %s",
+                       "Missing ']' in prototype for %" SVf " : %s",
                         SVfARG(name), p);
         if (bad_proto)
             Perl_warner(aTHX_ packWARN(WARN_ILLEGALPROTO),
-                       "Illegal character in prototype for %"SVf" : %s",
+                       "Illegal character in prototype for %" SVf " : %s",
                         SVfARG(name), p);
         if (bad_proto_after_underscore)
             Perl_warner(aTHX_ packWARN(WARN_ILLEGALPROTO),
-                       "Illegal character after '_' in prototype for %"SVf" : %s",
+                       "Illegal character after '_' in prototype for %" SVf " : %s",
                         SVfARG(name), p);
      }
  
@@ -1667,7 +1711,7 @@ S_incline(pTHX_ const char *s)
         return;
      while (SPACE_OR_TAB(*s))
         s++;
-    if (strnEQ(s, "line", 4))
+    if (strEQs(s, "line"))
         s += 4;
      else
         return;
@@ -1767,9 +1811,6 @@ S_incline(pTHX_ const char *s)
      CopLINE_set(PL_curcop, line_num);
  }
  
-#define skipspace(s) skipspace_flags(s, 0)
-
-
  STATIC void
  S_update_debugger_info(pTHX_ SV *orig_sv, const char *const buf, STRLEN len)
  {
@@ -1781,7 +1822,7 @@ S_update_debugger_info(pTHX_ SV *orig_sv, const char *const buf, STRLEN len)
             sv = *av_fetch(av, 0, 1);
             SvUPGRADE(sv, SVt_PVMG);
         }
-       if (!SvPOK(sv)) sv_setpvs(sv,"");
+        if (!SvPOK(sv)) SvPVCLEAR(sv);
         if (orig_sv)
             sv_catsv(sv, orig_sv);
         else
@@ -1796,11 +1837,19 @@ S_update_debugger_info(pTHX_ SV *orig_sv, const char *const buf, STRLEN len)
  }
  
  /*
- * S_skipspace
+ * skipspace
   * Called to gobble the appropriate amount and type of whitespace.
   * Skips comments as well.
+ * Returns the next character after the whitespace that is skipped.
+ *
+ * peekspace
+ * Same thing, but look ahead without incrementing line numbers or
+ * adjusting PL_linestart.
   */
  
+#define skipspace(s) skipspace_flags(s, 0)
+#define peekspace(s) skipspace_flags(s, LEX_NO_INCLINE)
+
  STATIC char *
  S_skipspace_flags(pTHX_ char *s, U32 flags)
  {
@@ -1843,13 +1892,13 @@ S_check_uni(pTHX)
      while (isSPACE(*PL_last_uni))
         PL_last_uni++;
      s = PL_last_uni;
-    while (isWORDCHAR_lazy_if(s,UTF) || *s == '-')
+    while (isWORDCHAR_lazy_if_safe(s, PL_bufend, UTF) || *s == '-')
         s += UTF ? UTF8SKIP(s) : 1;
      if ((t = strchr(s, '(')) && t < PL_bufptr)
         return;
  
      Perl_ck_warner_d(aTHX_ packWARN(WARN_AMBIGUOUS),
-                    "Warning: Use of \"%"UTF8f"\" without parentheses is ambiguous",
+                    "Warning: Use of \"%" UTF8f "\" without parentheses is ambiguous",
                      UTF8fARG(UTF, (int)(s - PL_last_uni), PL_last_uni));
  }
  
@@ -1872,7 +1921,7 @@ S_check_uni(pTHX)
   */
  
  STATIC I32
-S_lop(pTHX_ I32 f, int x, char *s)
+S_lop(pTHX_ I32 f, U8 x, char *s)
  {
      PERL_ARGS_ASSERT_LOP;
  
@@ -1979,10 +2028,10 @@ STATIC SV *
  S_newSV_maybe_utf8(pTHX_ const char *const start, STRLEN len)
  {
      SV * const sv = newSVpvn_utf8(start, len,
-                                 !IN_BYTES
-                                 && UTF
-                                 && !is_invariant_string((const U8*)start, len)
-                                 && is_utf8_string((const U8*)start, len));
+                          !IN_BYTES
+                          && UTF
+                          && !is_utf8_invariant_string((const U8*)start, len)
+                          && is_utf8_string((const U8*)start, len));
      return sv;
  }
  
@@ -2013,14 +2062,14 @@ S_force_word(pTHX_ char *start, int token, int check_keyword, int allow_pack)
  
      start = skipspace(start);
      s = start;
-    if (isIDFIRST_lazy_if(s,UTF)
+    if (   isIDFIRST_lazy_if_safe(s, PL_bufend, UTF)
          || (allow_pack && *s == ':' && s[1] == ':') )
      {
         s = scan_word(s, PL_tokenbuf, sizeof PL_tokenbuf, allow_pack, &len);
         if (check_keyword) {
           char *s2 = PL_tokenbuf;
           STRLEN len2 = len;
-         if (allow_pack && len > 6 && strnEQ(s2, "CORE::", 6))
+         if (allow_pack && len > 6 && strEQs(s2, "CORE::"))
             s2 += 6, len2 -= 6;
           if (keyword(s2, len2, 0))
             return start;
@@ -2034,7 +2083,7 @@ S_force_word(pTHX_ char *start, int token, int check_keyword, int allow_pack)
             }
         }
         NEXTVAL_NEXTTOKE.opval
-           = (OP*)newSVOP(OP_CONST,0,
+            = newSVOP(OP_CONST,0,
                            S_newSV_maybe_utf8(aTHX_ PL_tokenbuf, len));
         NEXTVAL_NEXTTOKE.opval->op_private |= OPpCONST_BARE;
         force_next(token);
@@ -2058,7 +2107,7 @@ S_force_ident(pTHX_ const char *s, int kind)
  
      if (s[0]) {
         const STRLEN len = s[1] ? strlen(s) : 1; /* s = "\"" see yylex */
-       OP* const o = (OP*)newSVOP(OP_CONST, 0, newSVpvn_flags(s, len,
+        OP* const o = newSVOP(OP_CONST, 0, newSVpvn_flags(s, len,
                                                                  UTF ? SVf_UTF8 : 0));
         NEXTVAL_NEXTTOKE.opval = o;
         force_next(BAREWORD);
@@ -2267,12 +2316,12 @@ S_tokeq(pTHX_ SV *sv)
   * Pattern matching will set PL_lex_op to the pattern-matching op to
   * make (we return THING if pl_yylval.ival is OP_NULL, PMFUNC otherwise).
   *
- * OP_CONST and OP_READLINE are easy--just make the new op and return.
+ * OP_CONST is easy--just make the new op and return.
   *
   * Everything else becomes a FUNC.
   *
- * Sets PL_lex_state to LEX_INTERPPUSH unless (ival was OP_NULL or we
- * had an OP_CONST or OP_READLINE).  This just sets us up for a
+ * Sets PL_lex_state to LEX_INTERPPUSH unless ival was OP_NULL or we
+ * had an OP_CONST.  This just sets us up for a
   * call to S_sublex_push().
   */
  
@@ -2299,13 +2348,13 @@ S_sublex_start(pTHX)
             SvREFCNT_dec(sv);
             sv = nsv;
         }
-       pl_yylval.opval = (OP*)newSVOP(op_type, 0, sv);
+        pl_yylval.opval = newSVOP(op_type, 0, sv);
         return THING;
      }
  
-    PL_sublex_info.super_state = PL_lex_state;
-    PL_sublex_info.sub_inwhat = (U16)op_type;
-    PL_sublex_info.sub_op = PL_lex_op;
+    PL_parser->lex_super_state = PL_lex_state;
+    PL_parser->lex_sub_inwhat = (U16)op_type;
+    PL_parser->lex_sub_op = PL_lex_op;
      PL_lex_state = LEX_INTERPPUSH;
  
      PL_expect = XTERM;
@@ -2333,7 +2382,7 @@ S_sublex_push(pTHX)
      const bool is_heredoc = PL_multi_close == '<';
      ENTER;
  
-    PL_lex_state = PL_sublex_info.super_state;
+    PL_lex_state = PL_parser->lex_super_state;
      SAVEI8(PL_lex_dojoin);
      SAVEI32(PL_lex_brackets);
      SAVEI32(PL_lex_allbrackets);
@@ -2352,7 +2401,7 @@ S_sublex_push(pTHX)
         SAVEI32(PL_parser->herelines);
         PL_parser->herelines = 0;
      }
-    SAVEI8(PL_multi_close);
+    SAVEIV(PL_multi_close);
      SAVEPPTR(PL_bufptr);
      SAVEPPTR(PL_bufend);
      SAVEPPTR(PL_oldbufptr);
@@ -2375,16 +2424,16 @@ S_sublex_push(pTHX)
      PL_parser->lex_shared->ls_bufptr  = PL_bufptr;
  
      PL_linestr = PL_lex_stuff;
-    PL_lex_repl = PL_sublex_info.repl;
+    PL_lex_repl = PL_parser->lex_sub_repl;
      PL_lex_stuff = NULL;
-    PL_sublex_info.repl = NULL;
+    PL_parser->lex_sub_repl = NULL;
  
      /* Arrange for PL_lex_stuff to be freed on scope exit, in case it gets
         set for an inner quote-like operator and then an error causes scope-
         popping.  We must not have a PL_lex_stuff value left dangling, as
         that breaks assumptions elsewhere.  See bug #123617.  */
      SAVEGENERICSV(PL_lex_stuff);
-    SAVEGENERICSV(PL_sublex_info.repl);
+    SAVEGENERICSV(PL_parser->lex_sub_repl);
  
      PL_bufend = PL_bufptr = PL_oldbufptr = PL_oldoldbufptr = PL_linestart
         = SvPVX(PL_linestr);
@@ -2406,15 +2455,15 @@ S_sublex_push(pTHX)
      if (is_heredoc)
         CopLINE_set(PL_curcop, (line_t)PL_multi_start);
      PL_copline = NOLINE;
-    
+
      Newxz(shared, 1, LEXSHARED);
      shared->ls_prev = PL_parser->lex_shared;
      PL_parser->lex_shared = shared;
  
-    PL_lex_inwhat = PL_sublex_info.sub_inwhat;
+    PL_lex_inwhat = PL_parser->lex_sub_inwhat;
      if (PL_lex_inwhat == OP_TRANSR) PL_lex_inwhat = OP_TRANS;
      if (PL_lex_inwhat == OP_MATCH || PL_lex_inwhat == OP_QR || PL_lex_inwhat == OP_SUBST)
-       PL_lex_inpat = PL_sublex_info.sub_op;
+       PL_lex_inpat = PL_parser->lex_sub_op;
      else
         PL_lex_inpat = NULL;
  
@@ -2437,7 +2486,7 @@ S_sublex_done(pTHX)
         if (SvUTF8(PL_linestr))
             SvUTF8_on(sv);
         PL_expect = XOPERATOR;
-       pl_yylval.opval = (OP*)newSVOP(OP_CONST, 0, sv);
+        pl_yylval.opval = newSVOP(OP_CONST, 0, sv);
         return THING;
      }
  
@@ -2476,7 +2525,7 @@ S_sublex_done(pTHX)
         }
         if (SvTYPE(PL_linestr) >= SVt_PVNV) {
             CopLINE(PL_curcop) +=
-               ((XPVNV*)SvANY(PL_linestr))->xnv_u.xpad_cop_seq.xlow
+               ((XPVNV*)SvANY(PL_linestr))->xnv_u.xnv_lines
                  + PL_parser->herelines;
             PL_parser->herelines = 0;
         }
@@ -2494,7 +2543,7 @@ S_sublex_done(pTHX)
      }
  }
  
-PERL_STATIC_INLINE SV*
+STATIC SV*
  S_get_and_check_backslash_N_name(pTHX_ const char* s, const char* const e)
  {
      /* <s> points to first character of interior of \N{}, <e> to one beyond the
@@ -2514,8 +2563,7 @@ S_get_and_check_backslash_N_name(pTHX_ const char* s, const char* const e)
      PERL_ARGS_ASSERT_GET_AND_CHECK_BACKSLASH_N_NAME;
  
      if (!SvCUR(res)) {
-        Perl_ck_warner_d(aTHX_ packWARN(WARN_DEPRECATED),
-                       "Unknown charname '' is deprecated");
+        deprecate_fatal_in("5.28", "Unknown charname '' is deprecated");
          return res;
      }
  
@@ -2523,15 +2571,10 @@ S_get_and_check_backslash_N_name(pTHX_ const char* s, const char* const e)
                                       e - backslash_ptr,
                                       &first_bad_char_loc))
      {
-        /* If warnings are on, this will print a more detailed analysis of what
-         * is wrong than the error message below */
-        utf8n_to_uvchr(first_bad_char_loc,
-                       e - ((char *) first_bad_char_loc),
-                       NULL, 0);
-
-        /* We deliberately don't try to print the malformed character, which
-         * might not print very well; it also may be just the first of many
-         * malformations, so don't print what comes after it */
+        _force_out_malformed_utf8_message(first_bad_char_loc,
+                                          (U8 *) PL_parser->bufend,
+                                          0,
+                                          0 /* 0 means don't die */ );
          yyerror_pv(Perl_form(aTHX_
              "Malformed UTF-8 character immediately after '%.*s'",
              (int) (first_bad_char_loc - (U8 *) backslash_ptr), backslash_ptr),
@@ -2664,15 +2707,10 @@ S_get_and_check_backslash_N_name(pTHX_ const char* s, const char* const e)
          STRLEN len;
          const char* const str = SvPV_const(res, len);
          if (! is_utf8_string_loc((U8 *) str, len, &first_bad_char_loc)) {
-            /* If warnings are on, this will print a more detailed analysis of
-             * what is wrong than the error message below */
-            utf8n_to_uvchr(first_bad_char_loc,
-                           (char *) first_bad_char_loc - str,
-                           NULL, 0);
-
-            /* We deliberately don't try to print the malformed character,
-             * which might not print very well; it also may be just the first
-             * of many malformations, so don't print what comes after it */
+            _force_out_malformed_utf8_message(first_bad_char_loc,
+                                              (U8 *) PL_parser->bufend,
+                                              0,
+                                              0 /* 0 means don't die */ );
              yyerror_pv(
                Perl_form(aTHX_
                  "Malformed UTF-8 returned by %.*s immediately after '%.*s'",
@@ -2746,15 +2784,17 @@ S_get_and_check_backslash_N_name(pTHX_ const char* s, const char* const e)
  
    In transliterations:
      characters are VERY literal, except for - not at the start or end
-    of the string, which indicates a range. If the range is in bytes,
+    of the string, which indicates a range.  However some backslash sequences
+    are recognized: \r, \n, and the like
+                    \007 \o{}, \x{}, \N{}
+    If all elements in the transliteration are below 256,
      scan_const expands the range to the full set of intermediate
      characters. If the range is in utf8, the hyphen is replaced with
      a certain range mark which will be handled by pmtrans() in op.c.
  
    In double-quoted strings:
      backslashes:
-      double-quoted style: \r and \n
-      constants: \x31, etc.
+      all those recognized in transliterations
        deprecated backrefs: \1 (in substitution replacements)
        case and quoting: \U \Q \E
      stops on @ and $
@@ -2812,11 +2852,18 @@ S_scan_const(pTHX_ char *start)
      bool didrange = FALSE;              /* did we just finish a range? */
      bool in_charclass = FALSE;          /* within /[...]/ */
      bool has_utf8 = FALSE;              /* Output constant is UTF8 */
+    bool has_above_latin1 = FALSE;      /* does something require special
+                                           handling in tr/// ? */
      bool  this_utf8 = cBOOL(UTF);       /* Is the source string assumed to be
                                             UTF8?  But, this can show as true
                                             when the source isn't utf8, as for
                                             example when it is entirely composed
                                             of hex constants */
+    STRLEN utf8_variant_count = 0;      /* When not in UTF-8, this counts the
+                                           number of characters found so far
+                                           that will expand (into 2 bytes)
+                                           should we have to convert to
+                                           UTF-8) */
      SV *res;                           /* result from charnames */
      STRLEN offset_to_max;   /* The offset in the output to where the range
                                 high-end character is temporarily placed */
@@ -2831,7 +2878,7 @@ S_scan_const(pTHX_ char *start)
       * the needed size, SvGROW() is called.  Its size parameter each time is
       * based on the best guess estimate at the time, namely the length used so
       * far, plus the length the current construct will occupy, plus room for
-     * the trailing NUL, plus one byte for every input byte still unscanned */ 
+     * the trailing NUL, plus one byte for every input byte still unscanned */
  
      UV uv = UV_MAX; /* Initialize to weird value to try to catch any uses
                         before set */
@@ -2844,10 +2891,10 @@ S_scan_const(pTHX_ char *start)
      PERL_ARGS_ASSERT_SCAN_CONST;
  
      assert(PL_lex_inwhat != OP_TRANSR);
-    if (PL_lex_inwhat == OP_TRANS && PL_sublex_info.sub_op) {
+    if (PL_lex_inwhat == OP_TRANS && PL_parser->lex_sub_op) {
         /* If we are doing a trans and we know we want UTF8 set expectation */
-       has_utf8   = PL_sublex_info.sub_op->op_private & (OPpTRANS_FROM_UTF|OPpTRANS_TO_UTF);
-       this_utf8  = PL_sublex_info.sub_op->op_private & (PL_lex_repl ? OPpTRANS_FROM_UTF : OPpTRANS_TO_UTF);
+       has_utf8   = PL_parser->lex_sub_op->op_private & (OPpTRANS_FROM_UTF|OPpTRANS_TO_UTF);
+       this_utf8  = PL_parser->lex_sub_op->op_private & (PL_lex_repl ? OPpTRANS_FROM_UTF : OPpTRANS_TO_UTF);
      }
  
      /* Protect sv from errors and fatal warnings. */
@@ -2872,15 +2919,15 @@ S_scan_const(pTHX_ char *start)
               *     flag is set and we fix up the range.
               *
               * Ranges entirely within Latin1 are expanded out entirely, in
-             * order to avoid the significant overhead of making a swash.
-             * Ranges that extend above Latin1 have to have a swash, so there
-             * is no advantage to abbreviate them here, so they are stored here
-             * as Min, ILLEGAL_UTF8_BYTE, Max.  The illegal byte signifies a
-             * hyphen without any possible ambiguity.  On EBCDIC machines, if
-             * the range is expressed as Unicode, the Latin1 portion is
-             * expanded out even if the entire range extends above Latin1.
-             * This is because each code point in it has to be processed here
-             * individually to get its native translation */
+             * order to make the transliteration a simple table look-up.
+             * Ranges that extend above Latin1 have to be done differently, so
+             * there is no advantage to expanding them here, so they are
+             * stored here as Min, ILLEGAL_UTF8_BYTE, Max.  The illegal byte
+             * signifies a hyphen without any possible ambiguity.  On EBCDIC
+             * machines, if the range is expressed as Unicode, the Latin1
+             * portion is expanded out even if the range extends above
+             * Latin1.  This is because each code point in it has to be
+             * processed here individually to get its native translation */
  
             if (! dorange) {
  
@@ -2899,6 +2946,15 @@ S_scan_const(pTHX_ char *start)
                      non_portable_endpoint = 0;
                      backslash_N = 0;
  #endif
+                    /* The tests here and the following 'else' for being above
+                     * Latin1 suffice to find all such occurences in the
+                     * constant, except those added by a backslash escape
+                     * sequence, like \x{100}.  And all those set
+                     * 'has_above_latin1' as appropriate */
+                    if (this_utf8 && UTF8_IS_ABOVE_LATIN1(*s)) {
+                        has_above_latin1 = TRUE;
+                    }
+
                      /* Drops down to generic code to process current byte */
                  }
                  else {
@@ -2918,6 +2974,10 @@ S_scan_const(pTHX_ char *start)
                       * pointer).  We'll finish processing the range the next
                       * time through the loop */
                      offset_to_max = d - SvPVX_const(sv);
+
+                    if (this_utf8 && UTF8_IS_ABOVE_LATIN1(*s)) {
+                        has_above_latin1 = TRUE;
+                    }
                  }
              }  /* End of not a range */
              else {
@@ -2937,10 +2997,7 @@ S_scan_const(pTHX_ char *start)
                 IV range_max;   /* last character in range */
                  STRLEN save_offset;
                  STRLEN grow;
-#ifndef EBCDIC  /* Not meaningful except in EBCDIC, so initialize to false */
-                const bool convert_unicode = FALSE;
-                const IV real_range_max = 0;
-#else
+#ifdef EBCDIC
                  bool convert_unicode;
                  IV real_range_max = 0;
  #endif
@@ -2965,13 +3022,13 @@ S_scan_const(pTHX_ char *start)
                   * Unicode value (\N{...}), or if the range is a subset of
                   * [A-Z] or [a-z], and both ends are literal characters,
                   * like 'A', and not like \x{C1} */
-                if ((convert_unicode
-                     = cBOOL(backslash_N)   /* \N{} forces Unicode, hence
+                convert_unicode =
+                       cBOOL(backslash_N)   /* \N{} forces Unicode, hence
                                                 portable range */
                        || (   ! non_portable_endpoint
                            && ((  isLOWER_A(range_min) && isLOWER_A(range_max))
-                             || (isUPPER_A(range_min) && isUPPER_A(range_max))))
-                )) {
+                             || (isUPPER_A(range_min) && isUPPER_A(range_max))));
+                if (convert_unicode) {
  
                      /* Special handling is needed for these portable ranges.
                       * They are defined to all be in Unicode terms, which
@@ -2985,12 +3042,14 @@ S_scan_const(pTHX_ char *start)
  #endif
  
                  if (range_min > range_max) {
+#ifdef EBCDIC
                      if (convert_unicode) {
                          /* Need to convert back to native for meaningful
                           * messages for this platform */
                          range_min = UNI_TO_NATIVE(range_min);
                          range_max = UNI_TO_NATIVE(range_max);
                      }
+#endif
  
                      /* Use the characters themselves for the error message if
                       * ASCII printables; otherwise some visible representation
@@ -3000,17 +3059,19 @@ S_scan_const(pTHX_ char *start)
                          "Invalid range \"%c-%c\" in transliteration operator",
                          (char)range_min, (char)range_max);
                      }
+#ifdef EBCDIC
                      else if (convert_unicode) {
                          /* diag_listed_as: Invalid range "%s" in transliteration operator */
                          Perl_croak(aTHX_
-                              "Invalid range \"\\N{U+%04"UVXf"}-\\N{U+%04"UVXf"}\""
+                              "Invalid range \"\\N{U+%04" UVXf "}-\\N{U+%04" UVXf "}\""
                                 " in transliteration operator",
                                range_min, range_max);
                      }
+#endif
                      else {
                          /* diag_listed_as: Invalid range "%s" in transliteration operator */
                          Perl_croak(aTHX_
-                              "Invalid range \"\\x{%04"UVXf"}-\\x{%04"UVXf"}\""
+                              "Invalid range \"\\x{%04" UVXf "}-\\x{%04" UVXf "}\""
                                 " in transliteration operator",
                                range_min, range_max);
                      }
@@ -3018,14 +3079,15 @@ S_scan_const(pTHX_ char *start)
  
                 if (has_utf8) {
  
-                    /* We try to avoid creating a swash.  If the upper end of
-                     * this range is below 256, this range won't force a swash;
-                     * otherwise it does force a swash, and as long as we have
-                     * to have one, we might as well not expand things out.
-                     * But if it's EBCDIC, we may have to look at each
-                     * character below 256 if we have to convert to/from
-                     * Unicode values */
-                    if (range_max > 255
+                    /* If everything in the transliteration is below 256, we
+                     * can avoid special handling later.  A translation table
+                     * of each of those bytes is created.  And so we expand out
+                     * all ranges to their constituent code points.  But if
+                     * we've encountered something above 255, the expanding
+                     * won't help, so skip doing that.  But if it's EBCDIC, we
+                     * may have to look at each character below 256 if we have
+                     * to convert to/from Unicode values */
+                    if (   has_above_latin1
  #ifdef EBCDIC
                         && (range_min > 255 || ! convert_unicode)
  #endif
@@ -3086,12 +3148,10 @@ S_scan_const(pTHX_ char *start)
  
                  /* Subtract 3 for the bytes that were already accounted for
                   * (min, max, and the hyphen) */
-                SvGROW(sv, SvLEN(sv) + grow - 3);
-               d = SvPVX(sv) + save_offset;    /* refresh d after realloc */
+                d = save_offset + SvGROW(sv, SvLEN(sv) + grow - 3);
  
-                /* Here, we expand out the range.  On ASCII platforms, the
-                 * compiler should optimize out the 'convert_unicode==TRUE'
-                 * portion of this */
+#ifdef EBCDIC
+                /* Here, we expand out the range. */
                  if (convert_unicode) {
                      IV i;
  
@@ -3110,7 +3170,10 @@ S_scan_const(pTHX_ char *start)
                          }
                     }
                 }
-                else {
+                else
+#endif
+                /* Always gets run for ASCII, and sometimes for EBCDIC. */
+                {
                      IV i;
  
                      /* Here, no conversions are necessary, which means that the
@@ -3130,8 +3193,8 @@ S_scan_const(pTHX_ char *start)
                     }
                 }
  
-                /* (Compilers should optimize this out for non-EBCDIC).  If the
-                 * original range extended above 255, add in that portion */
+#ifdef EBCDIC
+                /* If the original range extended above 255, add in that portion. */
                  if (real_range_max) {
                      *d++ = (char) UTF8_TWO_BYTE_HI(0x100);
                      *d++ = (char) UTF8_TWO_BYTE_LO(0x100);
@@ -3140,6 +3203,7 @@ S_scan_const(pTHX_ char *start)
                      if (real_range_max > 0x100)
                          d = (char*)uvchr_to_utf8((U8*)d, real_range_max);
                  }
+#endif
  
                range_done:
                 /* mark the range as done, and continue */
@@ -3160,8 +3224,7 @@ S_scan_const(pTHX_ char *start)
             if (!esc)
                 in_charclass = TRUE;
         }
-
-       else if (*s == ']' && PL_lex_inpat &&  in_charclass) {
+       else if (*s == ']' && PL_lex_inpat && in_charclass) {
             char *s1 = s-1;
             int esc = 0;
             while (s1 >= start && *s1-- == '\\')
@@ -3193,7 +3256,7 @@ S_scan_const(pTHX_ char *start)
                   && !in_charclass
                   && ((PMOP*)PL_lex_inpat)->op_pmflags & RXf_PMf_EXTENDED)
          {
-           while (s+1 < send && *s != '\n')
+           while (s < send && *s != '\n')
                 *d++ = *s++;
         }
  
@@ -3205,8 +3268,12 @@ S_scan_const(pTHX_ char *start)
            (@foo, @::foo, @'foo, @{foo}, @$foo, @+, @-)
            */
         else if (*s == '@' && s[1]) {
-           if (UTF ? isIDFIRST_utf8((U8*)s+1) : isWORDCHAR_A(s[1]))
+           if (UTF
+               ? isIDFIRST_utf8_safe(s+1, send)
+               : isWORDCHAR_A(s[1]))
+            {
                 break;
+            }
             if (strchr(":'{$", s[1]))
                 break;
             if (!PL_lex_inpat && (s[1] == '+' || s[1] == '-'))
@@ -3230,6 +3297,11 @@ S_scan_const(pTHX_ char *start)
  
         /* End of else if chain - OP_TRANS rejoin rest */
  
+        if (UNLIKELY(s >= send)) {
+            assert(s == send);
+            break;
+        }
+
         /* backslashes */
         if (*s == '\\' && s+1 < send) {
             char* e;    /* Can be used for ending '}', etc. */
@@ -3350,51 +3422,65 @@ S_scan_const(pTHX_ char *start)
                 }
                 else {
                     if (!has_utf8 && uv > 255) {
-                       /* Might need to recode whatever we have accumulated so
-                        * far if it contains any chars variant in utf8 or
-                        * utf-ebcdic. */
-                         
-                       SvCUR_set(sv, d - SvPVX_const(sv));
-                       SvPOK_on(sv);
-                       *d = '\0';
-                       /* See Note on sizing above.  */
-                       sv_utf8_upgrade_flags_grow(
-                                       sv,
-                                       SV_GMAGIC|SV_FORCE_UTF8_UPGRADE
-                                                  /* Above-latin1 in string
-                                                   * implies no encoding */
-                                                  |SV_UTF8_NO_ENCODING,
-                                       UVCHR_SKIP(uv) + (STRLEN)(send - s) + 1);
-                       d = SvPVX(sv) + SvCUR(sv);
-                       has_utf8 = TRUE;
+
+                        /* Here, 'uv' won't fit unless we convert to UTF-8.
+                         * If we've only seen invariants so far, all we have to
+                         * do is turn on the flag */
+                        if (utf8_variant_count == 0) {
+                            SvUTF8_on(sv);
+                        }
+                        else {
+                            SvCUR_set(sv, d - SvPVX_const(sv));
+                            SvPOK_on(sv);
+                            *d = '\0';
+
+                            sv_utf8_upgrade_flags_grow(
+                                           sv,
+                                           SV_GMAGIC|SV_FORCE_UTF8_UPGRADE,
+
+                                           /* Since we're having to grow here,
+                                            * make sure we have enough room for
+                                            * this escape and a NUL, so the
+                                            * code immediately below won't have
+                                            * to actually grow again */
+                                          UVCHR_SKIP(uv)
+                                        + (STRLEN)(send - s) + 1);
+                            d = SvPVX(sv) + SvCUR(sv);
+                        }
+
+                        has_above_latin1 = TRUE;
+                        has_utf8 = TRUE;
                      }
  
-                    if (has_utf8) {
+                    if (! has_utf8) {
+                       *d++ = (char)uv;
+                        utf8_variant_count++;
+                    }
+                   else {
                         /* Usually, there will already be enough room in 'sv'
                          * since such escapes are likely longer than any UTF-8
                          * sequence they can end up as.  This isn't the case on
                          * EBCDIC where \x{40000000} contains 12 bytes, and the
                          * UTF-8 for it contains 14.  And, we have to allow for
                          * a trailing NUL.  It probably can't happen on ASCII
-                        * platforms, but be safe */
-                        const STRLEN needed = d - SvPVX(sv) + UVCHR_SKIP(uv)
+                        * platforms, but be safe.  See Note on sizing above. */
+                        const STRLEN needed = d - SvPVX(sv)
+                                            + UVCHR_SKIP(uv)
+                                            + (send - s)
                                              + 1;
                          if (UNLIKELY(needed > SvLEN(sv))) {
                              SvCUR_set(sv, d - SvPVX_const(sv));
-                            d = sv_grow(sv, needed) + SvCUR(sv);
+                            d = SvCUR(sv) + SvGROW(sv, needed);
                          }
  
                         d = (char*)uvchr_to_utf8((U8*)d, uv);
                         if (PL_lex_inwhat == OP_TRANS
-                            && PL_sublex_info.sub_op)
+                            && PL_parser->lex_sub_op)
                          {
-                           PL_sublex_info.sub_op->op_private |=
+                           PL_parser->lex_sub_op->op_private |=
                                 (PL_lex_repl ? OPpTRANS_FROM_UTF
                                              : OPpTRANS_TO_UTF);
                         }
-                    }
-                   else {
-                       *d++ = (char)uv;
                     }
                 }
  #ifdef EBCDIC
@@ -3442,7 +3528,7 @@ S_scan_const(pTHX_ char *start)
                   * braces */
                 s++;
                 if (*s != '{') {
-                   yyerror("Missing braces on \\N{}"); 
+                   yyerror("Missing braces on \\N{}");
                     continue;
                 }
                 s++;
@@ -3508,20 +3594,31 @@ S_scan_const(pTHX_ char *start)
                         if (! has_utf8 && (   uv > 0xFF
                                             || PL_lex_inwhat != OP_TRANS))
                          {
+                           /* See Note on sizing above.  */
+                            const STRLEN extra = OFFUNISKIP(uv) + (send - e) + 1;
+
                             SvCUR_set(sv, d - SvPVX_const(sv));
                             SvPOK_on(sv);
                             *d = '\0';
-                           /* See Note on sizing above.  */
-                           sv_utf8_upgrade_flags_grow(
-                                    sv,
-                                    SV_GMAGIC|SV_FORCE_UTF8_UPGRADE,
-                                   UVCHR_SKIP(uv) + (STRLEN)(send - e) + 1);
-                           d = SvPVX(sv) + SvCUR(sv);
+
+                            if (utf8_variant_count == 0) {
+                                SvUTF8_on(sv);
+                                d = SvCUR(sv) + SvGROW(sv, SvCUR(sv) + extra);
+                            }
+                            else {
+                                sv_utf8_upgrade_flags_grow(
+                                               sv,
+                                               SV_GMAGIC|SV_FORCE_UTF8_UPGRADE,
+                                               extra);
+                                d = SvPVX(sv) + SvCUR(sv);
+                            }
+
                             has_utf8 = TRUE;
+                            has_above_latin1 = TRUE;
                         }
  
                          /* Add the (Unicode) code point to the output. */
-                       if (OFFUNI_IS_INVARIANT(uv)) {
+                       if (! has_utf8 || OFFUNI_IS_INVARIANT(uv)) {
                             *d++ = (char) LATIN1_TO_NATIVE(uv);
                         }
                         else {
@@ -3662,34 +3759,49 @@ S_scan_const(pTHX_ char *start)
                                      (int) (e + 1 - start), start));
                                  goto end_backslash_N;
                              }
+
+                            if (SvUTF8(res) && UTF8_IS_ABOVE_LATIN1(*str)) {
+                                has_above_latin1 = TRUE;
+                            }
+
                          }
                          else if (! SvUTF8(res)) {
                              /* Make sure \N{} return is UTF-8.  This is because
-                            * \N{} implies Unicode semantics, and scalars have to
-                            * be in utf8 to guarantee those semantics; but not
-                            * needed in tr/// */
-                            sv_utf8_upgrade_flags(res, SV_UTF8_NO_ENCODING);
+                             * \N{} implies Unicode semantics, and scalars have
+                             * to be in utf8 to guarantee those semantics; but
+                             * not needed in tr/// */
+                            sv_utf8_upgrade_flags(res, 0);
                              str = SvPV_const(res, len);
                          }
  
                           /* Upgrade destination to be utf8 if this new
                            * component is */
                         if (! has_utf8 && SvUTF8(res)) {
+                           /* See Note on sizing above.  */
+                            const STRLEN extra = len + (send - s) + 1;
+
                             SvCUR_set(sv, d - SvPVX_const(sv));
                             SvPOK_on(sv);
                             *d = '\0';
-                           /* See Note on sizing above.  */
-                           sv_utf8_upgrade_flags_grow(sv,
+
+                            if (utf8_variant_count == 0) {
+                                SvUTF8_on(sv);
+                                d = SvCUR(sv) + SvGROW(sv, SvCUR(sv) + extra);
+                            }
+                            else {
+                                sv_utf8_upgrade_flags_grow(sv,
                                                 SV_GMAGIC|SV_FORCE_UTF8_UPGRADE,
-                                               len + (STRLEN)(send - s) + 1);
-                           d = SvPVX(sv) + SvCUR(sv);
+                                               extra);
+                                d = SvPVX(sv) + SvCUR(sv);
+                            }
                             has_utf8 = TRUE;
                         } else if (len > (STRLEN)(e - s + 4)) { /* I _guess_ 4 is \N{} --jhi */
  
                             /* See Note on sizing above.  (NOTE: SvCUR() is not
                              * set correctly here). */
+                            const STRLEN extra = len + (send - e) + 1;
                             const STRLEN off = d - SvPVX_const(sv);
-                           d = off + SvGROW(sv, off + len + (STRLEN)(send - s) + 1);
+                           d = off + SvGROW(sv, off + extra);
                         }
                         Copy(str, d, len, char);
                         d += len;
@@ -3749,60 +3861,84 @@ S_scan_const(pTHX_ char *start)
         } /* end if (backslash) */
  
      default_action:
-       /* If we started with encoded form, or already know we want it,
-          then encode the next character */
-       if (! NATIVE_BYTE_IS_INVARIANT((U8)(*s)) && (this_utf8 || has_utf8)) {
-           STRLEN len  = 1;
-
-           /* One might think that it is wasted effort in the case of the
-            * source being utf8 (this_utf8 == TRUE) to take the next character
-            * in the source, convert it to an unsigned value, and then convert
-            * it back again.  But the source has not been validated here.  The
-            * routine that does the conversion checks for errors like
-            * malformed utf8 */
+        /* Just copy the input to the output, though we may have to convert
+         * to/from UTF-8.
+         *
+         * If the input has the same representation in UTF-8 as not, it will be
+         * a single byte, and we don't care about UTF8ness; just copy the byte */
+        if (NATIVE_BYTE_IS_INVARIANT((U8)(*s))) {
+           *d++ = *s++;
+        }
+        else if (! this_utf8 && ! has_utf8) {
+            /* If neither source nor output is UTF-8, is also a single byte,
+             * just copy it; but this byte counts should we later have to
+             * convert to UTF-8 */
+           *d++ = *s++;
+            utf8_variant_count++;
+        }
+        else if (this_utf8 && has_utf8) {   /* Both UTF-8, can just copy */
+           const STRLEN len = UTF8SKIP(s);
  
+            /* We expect the source to have already been checked for
+             * malformedness */
+            assert(isUTF8_CHAR((U8 *) s, (U8 *) send));
+
+            Copy(s, d, len, U8);
+            d += len;
+            s += len;
+        }
+        else { /* UTF8ness matters and doesn't match, need to convert */
+           STRLEN len = 1;
             const UV nextuv   = (this_utf8)
                                  ? utf8n_to_uvchr((U8*)s, send - s, &len, 0)
                                  : (UV) ((U8) *s);
-           const STRLEN need = UVCHR_SKIP(nextuv);
+           STRLEN need = UVCHR_SKIP(nextuv);
+
             if (!has_utf8) {
                 SvCUR_set(sv, d - SvPVX_const(sv));
                 SvPOK_on(sv);
                 *d = '\0';
-               /* See Note on sizing above.  */
-               sv_utf8_upgrade_flags_grow(sv,
-                                       SV_GMAGIC|SV_FORCE_UTF8_UPGRADE,
-                                       need + (STRLEN)(send - s) + 1);
-               d = SvPVX(sv) + SvCUR(sv);
+
+                /* See Note on sizing above. */
+                need += (STRLEN)(send - s) + 1;
+
+                if (utf8_variant_count == 0) {
+                    SvUTF8_on(sv);
+                    d = SvCUR(sv) + SvGROW(sv, SvCUR(sv) + need);
+                }
+                else {
+                    sv_utf8_upgrade_flags_grow(sv,
+                                               SV_GMAGIC|SV_FORCE_UTF8_UPGRADE,
+                                               need);
+                    d = SvPVX(sv) + SvCUR(sv);
+                }
                 has_utf8 = TRUE;
             } else if (need > len) {
                 /* encoded value larger than old, may need extra space (NOTE:
                  * SvCUR() is not set correctly here).   See Note on sizing
                  * above.  */
+                const STRLEN extra = need + (send - s) + 1;
                 const STRLEN off = d - SvPVX_const(sv);
-               d = SvGROW(sv, off + need + (STRLEN)(send - s) + 1) + off;
+               d = off + SvGROW(sv, off + extra);
             }
             s += len;
  
             d = (char*)uvchr_to_utf8((U8*)d, nextuv);
         }
-       else {
-           *d++ = *s++;
-       }
      } /* while loop to process each character */
  
      /* terminate the string and set up the sv */
      *d = '\0';
      SvCUR_set(sv, d - SvPVX_const(sv));
      if (SvCUR(sv) >= SvLEN(sv))
-       Perl_croak(aTHX_ "panic: constant overflowed allocated space, %"UVuf
-                  " >= %"UVuf, (UV)SvCUR(sv), (UV)SvLEN(sv));
+       Perl_croak(aTHX_ "panic: constant overflowed allocated space, %" UVuf
+                  " >= %" UVuf, (UV)SvCUR(sv), (UV)SvLEN(sv));
  
      SvPOK_on(sv);
      if (has_utf8) {
         SvUTF8_on(sv);
-       if (PL_lex_inwhat == OP_TRANS && PL_sublex_info.sub_op) {
-           PL_sublex_info.sub_op->op_private |=
+       if (PL_lex_inwhat == OP_TRANS && PL_parser->lex_sub_op) {
+           PL_parser->lex_sub_op->op_private |=
                     (PL_lex_repl ? OPpTRANS_FROM_UTF : OPpTRANS_TO_UTF);
         }
      }
@@ -3845,7 +3981,7 @@ S_scan_const(pTHX_ char *start)
             sv = S_new_constant(aTHX_ start, s - start, key, keylen, sv, NULL,
                                 type, typelen);
         }
-       pl_yylval.opval = (OP*)newSVOP(OP_CONST, 0, sv);
+        pl_yylval.opval = newSVOP(OP_CONST, 0, sv);
      }
      LEAVE_with_name("scan_const");
      return s;
@@ -3937,7 +4073,7 @@ S_intuit_more(pTHX_ char *s)
             case '&':
             case '$':
                 weight -= seen[un_char] * 10;
-               if (isWORDCHAR_lazy_if(s+1,UTF)) {
+               if (isWORDCHAR_lazy_if_safe(s+1, PL_bufend, UTF)) {
                     int len;
                      char *tmp = PL_bufend;
                      PL_bufend = (char*)send;
@@ -4084,8 +4220,11 @@ S_intuit_method(pTHX_ char *start, SV *ioname, CV *cv)
             tmpbuf[len] = '\0';
             goto bare_package;
         }
-       indirgv = gv_fetchpvn_flags(tmpbuf, len, ( UTF ? SVf_UTF8 : 0 ), SVt_PVCV);
-       if (indirgv && GvCVu(indirgv))
+       indirgv = gv_fetchpvn_flags(tmpbuf, len,
+                                   GV_NOADD_NOINIT|( UTF ? SVf_UTF8 : 0 ),
+                                   SVt_PVCV);
+       if (indirgv && SvTYPE(indirgv) != SVt_NULL
+        && (!isGV(indirgv) || GvCVu(indirgv)))
             return 0;
         /* filehandle or package name makes it a method */
         if (!cv || GvIO(indirgv) || gv_stashpvn(tmpbuf, len, UTF ? SVf_UTF8 : 0)) {
@@ -4093,7 +4232,7 @@ S_intuit_method(pTHX_ char *start, SV *ioname, CV *cv)
             if ((PL_bufend - s) >= 2 && *s == '=' && *(s+1) == '>')
                 return 0;       /* no assumptions -- "=>" quotes bareword */
        bare_package:
-           NEXTVAL_NEXTTOKE.opval = (OP*)newSVOP(OP_CONST, 0,
+            NEXTVAL_NEXTTOKE.opval = newSVOP(OP_CONST, 0,
                                                   S_newSV_maybe_utf8(aTHX_ tmpbuf, len));
             NEXTVAL_NEXTTOKE.opval->op_private = OPpCONST_BARE;
             PL_expect = XTERM;
@@ -4165,7 +4304,7 @@ Perl_filter_add(pTHX_ filter_t funcp, SV *datasv)
                 STRLEN const last_lop_pos =
                     PL_parser->last_lop ? PL_parser->last_lop - buf : 0;
                 av_push(PL_rsfp_filters, linestr);
-               PL_parser->linestr = 
+               PL_parser->linestr =
                     newSVpvn(SvPVX(linestr), ++s-SvPVX(linestr));
                 buf = SvPVX(PL_parser->linestr);
                 PL_parser->bufend = buf + SvCUR(PL_parser->linestr);
@@ -4391,7 +4530,7 @@ S_tokenize_use(pTHX_ int is_use, char *s) {
      static const char* const exp_name[] =
         { "OPERATOR", "TERM", "REF", "STATE", "BLOCK", "ATTRBLOCK",
           "ATTRTERM", "TERMBLOCK", "XBLOCKTERM", "POSTDEREF",
-         "TERMORDORDOR"
+         "SIGVAR", "TERMORDORDOR"
         };
  #endif
  
@@ -4409,12 +4548,18 @@ static void
  S_check_scalar_slice(pTHX_ char *s)
  {
      s++;
-    while (*s == ' ' || *s == '\t') s++;
-    if (*s == 'q' && s[1] == 'w'
-     && !isWORDCHAR_lazy_if(s+2,UTF))
+    while (SPACE_OR_TAB(*s)) s++;
+    if (*s == 'q' && s[1] == 'w' && !isWORDCHAR_lazy_if_safe(s+2,
+                                                             PL_bufend,
+                                                             UTF))
+    {
         return;
-    while (*s && (isWORDCHAR_lazy_if(s,UTF) || strchr(" \t$#+-'\"", *s)))
-       s += UTF ? UTF8SKIP(s) : 1;
+    }
+    while (    isWORDCHAR_lazy_if_safe(s, PL_bufend, UTF)
+           || (*s && strchr(" \t$#+-'\"", *s)))
+    {
+        s += UTF ? UTF8SKIP(s) : 1;
+    }
      if (*s == '}' || *s == ']')
         pl_yylval.ival = OPpSLICEWARNING;
  }
@@ -4505,7 +4650,7 @@ Perl_yylex(pTHX)
  
      DEBUG_T( {
         SV* tmp = newSVpvs("");
-       PerlIO_printf(Perl_debug_log, "### %"IVdf":LEX_%s/X%s %s\n",
+       PerlIO_printf(Perl_debug_log, "### %" IVdf ":LEX_%s/X%s %s\n",
             (IV)CopLINE(PL_curcop),
             lex_state_names[PL_lex_state],
             exp_name[PL_expect],
@@ -4592,9 +4737,7 @@ Perl_yylex(pTHX)
                  if (strnEQ(s, "L\\u", 3) || strnEQ(s, "U\\l", 3))
                      tmp = *s, *s = s[2], s[2] = (char)tmp;     /* misordered... */
                 if ((*s == 'L' || *s == 'U' || *s == 'F')
-                    && (strchr(PL_lex_casestack, 'L')
-                        || strchr(PL_lex_casestack, 'U')
-                        || strchr(PL_lex_casestack, 'F')))
+                    && (strpbrk(PL_lex_casestack, "LUF")))
                  {
                     PL_lex_casestack[--PL_lex_casemods] = '\0';
                     PL_lex_allbrackets--;
@@ -4726,7 +4869,7 @@ Perl_yylex(pTHX)
             else sv = newSVpvn(PL_parser->lex_shared->re_eval_start,
                          PL_bufptr - PL_parser->lex_shared->re_eval_start);
             NEXTVAL_NEXTTOKE.opval =
-                   (OP*)newSVOP(OP_CONST, 0,
+                    newSVOP(OP_CONST, 0,
                                  sv);
             force_next(THING);
             PL_parser->lex_shared->re_eval_start = NULL;
@@ -4748,7 +4891,7 @@ Perl_yylex(pTHX)
         if (SvIVX(PL_linestr) == '\'' && !PL_lex_inpat) {
             SV *sv = newSVsv(PL_linestr);
             sv = tokeq(sv);
-           pl_yylval.opval = (OP*)newSVOP(OP_CONST, 0, sv);
+            pl_yylval.opval = newSVOP(OP_CONST, 0, sv);
             s = PL_bufend;
         }
         else {
@@ -4795,18 +4938,79 @@ Perl_yylex(pTHX)
      PL_oldbufptr = s;
      PL_parser->saw_infix_sigil = 0;
  
+    if (PL_in_my == KEY_sigvar) {
+        /* we expect the sigil and optional var name part of a
+         * signature element here. Since a '$' is not necessarily
+         * followed by a var name, handle it specially here; the general
+         * yylex code would otherwise try to interpret whatever follows
+         * as a var; e.g. ($, ...) would be seen as the var '$,'
+         */
+
+        char sigil;
+
+        s = skipspace(s);
+        sigil = *s++;
+        PL_bufptr = s; /* for error reporting */
+        switch (sigil) {
+        case '$':
+        case '@':
+        case '%':
+            /* spot stuff that looks like an prototype */
+            if (strchr("$:@%&*;\\[]", *s)) {
+                yyerror("Illegal character following sigil in a subroutine signature");
+                break;
+            }
+            /* '$#' is banned, while '$ # comment' isn't */
+            if (*s == '#') {
+                yyerror("'#' not allowed immediately following a sigil in a subroutine signature");
+                break;
+            }
+            s = skipspace(s);
+            if (isIDFIRST_lazy_if_safe(s, PL_bufend, UTF)) {
+                char *dest = PL_tokenbuf + 1;
+                /* read var name, including sigil, into PL_tokenbuf */
+                PL_tokenbuf[0] = sigil;
+                parse_ident(&s, &dest, dest + sizeof(PL_tokenbuf) - 1,
+                    0, cBOOL(UTF), FALSE);
+                *dest = '\0';
+                assert(PL_tokenbuf[1]); /* we have a variable name */
+                NEXTVAL_NEXTTOKE.ival = sigil;
+                force_next('p'); /* force a signature pending identifier */
+            }
+            else
+                PL_in_my = 0;
+            PL_expect = XOPERATOR;
+            break;
+
+        case ')':
+            PL_expect = XBLOCK;
+            break;
+        case ',': /* handle ($a,,$b) */
+            break;
+
+        default:
+            PL_in_my = 0;
+            yyerror("A signature parameter must start with '$', '@' or '%'");
+            /* very crude error recovery: skip to likely next signature
+             * element */
+            while (*s && *s != '$' && *s != '@' && *s != '%' && *s != ')')
+                s++;
+            break;
+        }
+        TOKEN(sigil);
+    }
+
    retry:
      switch (*s) {
      default:
         if (UTF) {
              if (! isUTF8_CHAR((U8 *) s, (U8 *) PL_bufend)) {
-                ENTER;
-                SAVESPTR(PL_warnhook);
-                PL_warnhook = PERL_WARNHOOK_FATAL;
-                utf8n_to_uvchr((U8*)s, PL_bufend-s, NULL, 0);
-                LEAVE;
+                _force_out_malformed_utf8_message((U8 *) s, (U8 *) PL_bufend,
+                                                  0,
+                                                  1 /* 1 means die */ );
+                NOT_REACHED; /* NOTREACHED */
              }
-            if (isIDFIRST_utf8((U8*)s)) {
+            if (isIDFIRST_utf8_safe(s, PL_bufend)) {
                  goto keylookup;
              }
          }
@@ -4815,18 +5019,25 @@ Perl_yylex(pTHX)
         }
      {
          SV *dsv = newSVpvs_flags("", SVs_TEMP);
-        const char *c = UTF ? sv_uni_display(dsv, newSVpvn_flags(s,
-                                                    UTF8SKIP(s),
-                                                    SVs_TEMP | SVf_UTF8),
-                                            10, UNI_DISPLAY_ISPRINT)
-                            : Perl_form(aTHX_ "\\x%02X", (unsigned char)*s);
+        const char *c;
+        if (UTF) {
+            STRLEN skiplen = UTF8SKIP(s);
+            STRLEN stravail = PL_bufend - s;
+            c = sv_uni_display(dsv, newSVpvn_flags(s,
+                                                   skiplen > stravail ? stravail : skiplen,
+                                                   SVs_TEMP | SVf_UTF8),
+                               10, UNI_DISPLAY_ISPRINT);
+        }
+        else {
+            c = Perl_form(aTHX_ "\\x%02X", (unsigned char)*s);
+        }
          len = UTF ? Perl_utf8_length(aTHX_ (U8 *) PL_linestart, (U8 *) s) : (STRLEN) (s - PL_linestart);
          if (len > UNRECOGNIZED_PRECEDE_COUNT) {
-            d = UTF ? (char *) utf8_hop((U8 *) s, -UNRECOGNIZED_PRECEDE_COUNT) : s - UNRECOGNIZED_PRECEDE_COUNT;
+            d = UTF ? (char *) utf8_hop_back((U8 *) s, -UNRECOGNIZED_PRECEDE_COUNT, (U8 *)PL_linestart) : s - UNRECOGNIZED_PRECEDE_COUNT;
          } else {
              d = PL_linestart;
          }
-        Perl_croak(aTHX_  "Unrecognized character %s; marked by <-- HERE after %"UTF8f"<-- HERE near column %d", c,
+        Perl_croak(aTHX_  "Unrecognized character %s; marked by <-- HERE after %" UTF8f "<-- HERE near column %d", c,
                            UTF8fARG(UTF, (s - d), d),
                           (int) len + 1);
      }
@@ -4873,7 +5084,7 @@ Perl_yylex(pTHX)
                 }
                 PL_parser->preambling = CopLINE(PL_curcop);
             } else
-               sv_setpvs(PL_linestr,"");
+                SvPVCLEAR(PL_linestr);
             if (PL_preambleav) {
                 SV **svp = AvARRAY(PL_preambleav);
                 SV **const end = svp + AvFILLp(PL_preambleav);
@@ -4965,8 +5176,8 @@ Perl_yylex(pTHX)
             }
             if (PL_parser->in_pod) {
                 /* Incest with pod. */
-               if (*s == '=' && strnEQ(s, "=cut", 4) && !isALPHA(s[4])) {
-                   sv_setpvs(PL_linestr, "");
+               if (*s == '=' && strEQs(s, "=cut") && !isALPHA(s[4])) {
+                    SvPVCLEAR(PL_linestr);
                     PL_oldoldbufptr = PL_oldbufptr = s = PL_linestart = SvPVX(PL_linestr);
                     PL_bufend = SvPVX(PL_linestr) + SvCUR(PL_linestr);
                     PL_last_lop = PL_last_uni = NULL;
@@ -5163,7 +5374,7 @@ Perl_yylex(pTHX)
                               /* if we have already added "LINE: while (<>) {",
                                  we must not do it again */
                         {
-                           sv_setpvs(PL_linestr, "");
+                            SvPVCLEAR(PL_linestr);
                             PL_oldoldbufptr = PL_oldbufptr = s = PL_linestart = SvPVX(PL_linestr);
                             PL_bufend = SvPVX(PL_linestr) + SvCUR(PL_linestr);
                             PL_last_lop = PL_last_uni = NULL;
@@ -5251,7 +5462,7 @@ Perl_yylex(pTHX)
             while (s < PL_bufend && SPACE_OR_TAB(*s))
                 s++;
  
-           if (strnEQ(s,"=>",2)) {
+           if (strEQs(s,"=>")) {
                 s = force_word(PL_bufptr,BAREWORD,FALSE,FALSE);
                 DEBUG_T( { printbuf("### Saw unary minus before =>, forcing word %s\n", s); } );
                 OPERATOR('-');          /* unary minus */
@@ -5332,7 +5543,7 @@ Perl_yylex(pTHX)
                     PL_expect = XPOSTDEREF;
                     TOKEN(ARROW);
                 }
-               if (isIDFIRST_lazy_if(s,UTF)) {
+               if (isIDFIRST_lazy_if_safe(s, PL_bufend, UTF)) {
                     s = force_word(s,METHOD,FALSE,TRUE);
                     TOKEN(ARROW);
                 }
@@ -5517,7 +5728,7 @@ Perl_yylex(pTHX)
          grabattrs:
             s = skipspace(s);
             attrs = NULL;
-           while (isIDFIRST_lazy_if(s,UTF)) {
+            while (isIDFIRST_lazy_if_safe(s, PL_bufend, UTF)) {
                 I32 tmp;
                 SV *sv;
                 d = scan_word(s, PL_tokenbuf, sizeof PL_tokenbuf, FALSE, &len);
@@ -5540,18 +5751,13 @@ Perl_yylex(pTHX)
                 sv = newSVpvn_flags(s, len, UTF ? SVf_UTF8 : 0);
                 if (*d == '(') {
                     d = scan_str(d,TRUE,TRUE,FALSE,NULL);
-                   COPLINE_SET_FROM_MULTI_END;
                     if (!d) {
-                       /* MUST advance bufptr here to avoid bogus
-                          "at end of line" context messages from yyerror().
-                        */
-                       PL_bufptr = s + len;
-                       yyerror("Unterminated attribute parameter in attribute list");
                         if (attrs)
                             op_free(attrs);
                         sv_free(sv);
-                       return REPORT(0);       /* EOF indicator */
+                        Perl_croak(aTHX_ "Unterminated attribute parameter in attribute list");
                     }
+                   COPLINE_SET_FROM_MULTI_END;
                 }
                 if (PL_lex_stuff) {
                     sv_catsv(sv, PL_lex_stuff);
@@ -5564,7 +5770,8 @@ Perl_yylex(pTHX)
                     if (len == 6 && strnEQ(SvPVX(sv), "unique", len)) {
                         sv_free(sv);
                         if (PL_in_my == KEY_our) {
-                           deprecate(":unique");
+                            deprecate_disappears_in("5.28",
+                                "Attribute \"unique\" is deprecated");
                         }
                         else
                             Perl_croak(aTHX_ "The 'unique' attribute may only be applied to 'our' variables");
@@ -5578,7 +5785,8 @@ Perl_yylex(pTHX)
                     }
                     else if (!PL_in_my && len == 6 && strnEQ(SvPVX(sv), "locked", len)) {
                         sv_free(sv);
-                       deprecate(":locked");
+                        deprecate_disappears_in("5.28",
+                            "Attribute \"locked\" is deprecated");
                     }
                     else if (!PL_in_my && len == 6 && strnEQ(SvPVX(sv), "method", len)) {
                         sv_free(sv);
@@ -5728,7 +5936,7 @@ Perl_yylex(pTHX)
                 while (d < PL_bufend && SPACE_OR_TAB(*d))
                     d++;
             }
-           if (d < PL_bufend && isIDFIRST_lazy_if(d,UTF)) {
+            if (d < PL_bufend && isIDFIRST_lazy_if_safe(d, PL_bufend, UTF)) {
                 d = scan_word(d, PL_tokenbuf + 1, sizeof PL_tokenbuf - 1,
                               FALSE, &len);
                 while (d < PL_bufend && SPACE_OR_TAB(*d))
@@ -5848,13 +6056,19 @@ Perl_yylex(pTHX)
                     }
                     else
                         /* skip plain q word */
-                       while (t < PL_bufend && isWORDCHAR_lazy_if(t,UTF))
+                       while (   t < PL_bufend
+                               && isWORDCHAR_lazy_if_safe(t, PL_bufend, UTF))
+                        {
                             t += UTF ? UTF8SKIP(t) : 1;
+                        }
                 }
-               else if (isWORDCHAR_lazy_if(t,UTF)) {
+               else if (isWORDCHAR_lazy_if_safe(t, PL_bufend, UTF)) {
                     t += UTF ? UTF8SKIP(t) : 1;
-                   while (t < PL_bufend && isWORDCHAR_lazy_if(t,UTF))
+                   while (   t < PL_bufend
+                           && isWORDCHAR_lazy_if_safe(t, PL_bufend, UTF))
+                    {
                         t += UTF ? UTF8SKIP(t) : 1;
+                    }
                 }
                 while (t < PL_bufend && isSPACE(*t))
                     t++;
@@ -5876,7 +6090,7 @@ Perl_yylex(pTHX)
                         PL_expect = XTERM;
                         break;
                     }
-                   if (strnEQ(s, "sub", 3)) {
+                   if (strEQs(s, "sub")) {
                         d = s + 3;
                         d = skipspace(d);
                         if (*d == ':') {
@@ -5949,8 +6163,9 @@ Perl_yylex(pTHX)
         }
         s--;
         if (PL_expect == XOPERATOR) {
-           if (PL_bufptr == PL_linestart && ckWARN(WARN_SEMICOLON)
-               && isIDFIRST_lazy_if(s,UTF))
+           if (   PL_bufptr == PL_linestart
+                && ckWARN(WARN_SEMICOLON)
+               && isIDFIRST_lazy_if_safe(s, PL_bufend, UTF))
             {
                 CopLINE_dec(PL_curcop);
                 Perl_warner(aTHX_ packWARN(WARN_SEMICOLON), "%s", PL_warn_nosemi);
@@ -6009,7 +6224,7 @@ Perl_yylex(pTHX)
         {
             const char tmp = *s++;
             if (tmp == '=') {
-               if ((s == PL_linestart+2 || s[-3] == '\n') && strnEQ(s, "=====", 5)) {
+               if ((s == PL_linestart+2 || s[-3] == '\n') && strEQs(s, "=====")) {
                     s = vcs_conflict_marker(s + 5);
                     goto retry;
                 }
@@ -6047,7 +6262,7 @@ Perl_yylex(pTHX)
                      while (s < d) {
                          if (*s++ == '\n') {
                              incline(s);
-                            if (strnEQ(s,"=cut",4)) {
+                            if (strEQs(s,"=cut")) {
                                  s = strchr(s,'\n');
                                  if (s)
                                      s++;
@@ -6128,7 +6343,7 @@ Perl_yylex(pTHX)
             if (s[1] != '<' && !strchr(s,'>'))
                 check_uni();
             if (s[1] == '<' && s[2] != '>') {
-               if ((s == PL_linestart || s[-1] == '\n') && strnEQ(s+2, "<<<<<", 5)) {
+               if ((s == PL_linestart || s[-1] == '\n') && strEQs(s+2, "<<<<<")) {
                     s = vcs_conflict_marker(s + 7);
                     goto retry;
                 }
@@ -6143,7 +6358,7 @@ Perl_yylex(pTHX)
         {
             char tmp = *s++;
             if (tmp == '<') {
-               if ((s == PL_linestart+2 || s[-3] == '\n') && strnEQ(s, "<<<<<", 5)) {
+               if ((s == PL_linestart+2 || s[-3] == '\n') && strEQs(s, "<<<<<")) {
                      s = vcs_conflict_marker(s + 5);
                     goto retry;
                 }
@@ -6187,7 +6402,7 @@ Perl_yylex(pTHX)
         {
             const char tmp = *s++;
             if (tmp == '>') {
-               if ((s == PL_linestart+2 || s[-3] == '\n') && strnEQ(s, ">>>>>", 5)) {
+               if ((s == PL_linestart+2 || s[-3] == '\n') && strEQs(s, ">>>>>")) {
                     s = vcs_conflict_marker(s + 5);
                     goto retry;
                 }
@@ -6232,7 +6447,10 @@ Perl_yylex(pTHX)
             POSTDEREF('$');
         }
  
-       if (s[1] == '#' && (isIDFIRST_lazy_if(s+2,UTF) || strchr("{$:+-@", s[2]))) {
+       if (   s[1] == '#'
+            && (   isIDFIRST_lazy_if_safe(s+2, PL_bufend, UTF)
+                || strchr("{$:+-@", s[2])))
+        {
             PL_tokenbuf[0] = '@';
             s = scan_ident(s + 1, PL_tokenbuf + 1,
                            sizeof PL_tokenbuf - 1, FALSE);
@@ -6281,14 +6499,18 @@ Perl_yylex(pTHX)
                     if (ckWARN(WARN_SYNTAX)) {
                         char *t = s+1;
  
-                       while (isSPACE(*t) || isWORDCHAR_lazy_if(t,UTF) || *t == '$')
+                        while (   isSPACE(*t)
+                               || isWORDCHAR_lazy_if_safe(t, PL_bufend, UTF)
+                               || *t == '$')
+                        {
                             t += UTF ? UTF8SKIP(t) : 1;
+                        }
                         if (*t++ == ',') {
                             PL_bufptr = skipspace(PL_bufptr); /* XXX can realloc */
                             while (t < PL_bufend && *t != ']')
                                 t++;
                             Perl_warner(aTHX_ packWARN(WARN_SYNTAX),
-                                       "Multidimensional syntax %"UTF8f" not supported",
+                                       "Multidimensional syntax %" UTF8f " not supported",
                                          UTF8fARG(UTF,(int)((t - PL_bufptr) + 1), PL_bufptr));
                         }
                     }
@@ -6303,17 +6525,21 @@ Perl_yylex(pTHX)
                             do {
                                 t++;
                             } while (isSPACE(*t));
-                           if (isIDFIRST_lazy_if(t,UTF)) {
+                           if (isIDFIRST_lazy_if_safe(t, PL_bufend, UTF)) {
                                 STRLEN len;
                                 t = scan_word(t, tmpbuf, sizeof tmpbuf, TRUE,
                                               &len);
                                 while (isSPACE(*t))
                                     t++;
-                               if (*t == ';'
-                                       && get_cvn_flags(tmpbuf, len, UTF ? SVf_UTF8 : 0))
+                                if (  *t == ';'
+                                    && get_cvn_flags(tmpbuf, len, UTF
+                                                                  ? SVf_UTF8
+                                                                  : 0))
+                                {
                                     Perl_warner(aTHX_ packWARN(WARN_SYNTAX),
-                                       "You need to quote \"%"UTF8f"\"",
+                                       "You need to quote \"%" UTF8f "\"",
                                          UTF8fARG(UTF, len, tmpbuf));
+                                }
                             }
                         }
                 }
@@ -6326,9 +6552,12 @@ Perl_yylex(pTHX)
                     PL_expect = XOPERATOR;
                 else if (strchr("$@\"'`q", *s))
                     PL_expect = XTERM;          /* e.g. print $fh "foo" */
-               else if (strchr("&*<%", *s) && isIDFIRST_lazy_if(s+1,UTF))
+               else if (   strchr("&*<%", *s)
+                         && isIDFIRST_lazy_if_safe(s+1, PL_bufend, UTF))
+                {
                     PL_expect = XTERM;          /* e.g. print $fh &sub */
-               else if (isIDFIRST_lazy_if(s,UTF)) {
+                }
+               else if (isIDFIRST_lazy_if_safe(s, PL_bufend, UTF)) {
                     char tmpbuf[sizeof PL_tokenbuf];
                     int t2;
                     scan_word(s, tmpbuf, sizeof tmpbuf, TRUE, &len);
@@ -6427,10 +6656,10 @@ Perl_yylex(pTHX)
          }
         else {
             /* Disable warning on "study /blah/" */
-           if (PL_oldoldbufptr == PL_last_uni
-            && (*PL_last_uni != 's' || s - PL_last_uni < 5
-                || memNE(PL_last_uni, "study", 5)
-                || isWORDCHAR_lazy_if(PL_last_uni+5,UTF)
+           if (    PL_oldoldbufptr == PL_last_uni
+                && (   *PL_last_uni != 's' || s - PL_last_uni < 5
+                    || memNE(PL_last_uni, "study", 5)
+                    || isWORDCHAR_lazy_if_safe(PL_last_uni+5, PL_bufend, UTF)
              ))
                 check_uni();
             s = scan_pat(s,OP_MATCH);
@@ -6677,7 +6906,7 @@ Perl_yylex(pTHX)
           fat_arrow:
             CLINE;
             pl_yylval.opval
-               = (OP*)newSVOP(OP_CONST, 0,
+                = newSVOP(OP_CONST, 0,
                                S_newSV_maybe_utf8(aTHX_ PL_tokenbuf, len));
             pl_yylval.opval->op_private = OPpCONST_BARE;
             TERM(BAREWORD);
@@ -6800,8 +7029,10 @@ Perl_yylex(pTHX)
             else {                      /* no override */
                 tmp = -tmp;
                 if (tmp == KEY_dump) {
-                   Perl_ck_warner(aTHX_ packWARN(WARN_MISC),
-                                  "dump() better written as CORE::dump()");
+                   Perl_ck_warner_d(aTHX_ packWARN2(WARN_MISC,WARN_DEPRECATED),
+                                    "dump() better written as CORE::dump(). "
+                                     "dump() will no longer be available " 
+                                     "in Perl 5.30");
                 }
                 gv = NULL;
                 gvp = 0;
@@ -6820,7 +7051,7 @@ Perl_yylex(pTHX)
             bool arrow;
             STRLEN bufoff = PL_bufptr - SvPVX(PL_linestr);
             STRLEN   soff = s         - SvPVX(PL_linestr);
-           s = skipspace_flags(s, LEX_NO_INCLINE);
+           s = peekspace(s);
             arrow = *s == '=' && s[1] == '>';
             PL_bufptr = SvPVX(PL_linestr) + bufoff;
             s         = SvPVX(PL_linestr) +   soff;
@@ -6831,12 +7062,10 @@ Perl_yylex(pTHX)
        reserved_word:
         switch (tmp) {
  
-       default:                        /* not a keyword */
             /* Trade off - by using this evil construction we can pull the
                variable gv into the block labelled keylookup. If not, then
                we have to give it function scope so that the goto from the
                earlier ':' case doesn't bypass the initialisation.  */
-           if (0) {
             just_a_word_zero_gv:
                 sv = NULL;
                 cv = NULL;
@@ -6846,7 +7075,7 @@ Perl_yylex(pTHX)
                 orig_keyword = 0;
                 lex = 0;
                 off = 0;
-           }
+       default:                        /* not a keyword */
           just_a_word: {
                 int pkgname = 0;
                 const char lastchar = (PL_bufptr == PL_oldoldbufptr ? 0 : PL_bufptr[-1]);
@@ -6860,7 +7089,7 @@ Perl_yylex(pTHX)
                     s = scan_word(s, PL_tokenbuf + len, sizeof PL_tokenbuf - len,
                                   TRUE, &morelen);
                     if (!morelen)
-                       Perl_croak(aTHX_ "Bad name after %"UTF8f"%s",
+                       Perl_croak(aTHX_ "Bad name after %" UTF8f "%s",
                                 UTF8fARG(UTF, len, PL_tokenbuf),
                                 *s == '\'' ? "'" : "::");
                     len += morelen;
@@ -6888,8 +7117,9 @@ Perl_yylex(pTHX)
                     if (ckWARN(WARN_BAREWORD)
                         && ! gv_fetchpvn_flags(PL_tokenbuf, len, UTF ? SVf_UTF8 : 0, SVt_PVHV))
                         Perl_warner(aTHX_ packWARN(WARN_BAREWORD),
-                         "Bareword \"%"UTF8f"\" refers to nonexistent package",
-                          UTF8fARG(UTF, len, PL_tokenbuf));
+                                    "Bareword \"%" UTF8f
+                                    "\" refers to nonexistent package",
+                                    UTF8fARG(UTF, len, PL_tokenbuf));
                     len -= 2;
                     PL_tokenbuf[len] = '\0';
                     gv = NULL;
@@ -6915,7 +7145,7 @@ Perl_yylex(pTHX)
  
                 /* Presume this is going to be a bareword of some sort. */
                 CLINE;
-               pl_yylval.opval = (OP*)newSVOP(OP_CONST, 0, sv);
+                pl_yylval.opval = newSVOP(OP_CONST, 0, sv);
                 pl_yylval.opval->op_private = OPpCONST_BARE;
  
                 /* And if "Foo::", then that's what it certainly is. */
@@ -6958,8 +7188,8 @@ Perl_yylex(pTHX)
                     s = skipspace(s);
  
                     /* Two barewords in a row may indicate method call. */
-
-                   if ((isIDFIRST_lazy_if(s,UTF) || *s == '$')
+                   if (   (   isIDFIRST_lazy_if_safe(s, PL_bufend, UTF)
+                            || *s == '$')
                          && (tmp = intuit_method(s, lex ? NULL : sv, cv)))
                      {
                         goto method;
@@ -7044,9 +7274,11 @@ Perl_yylex(pTHX)
  
                 /* If followed by a bareword, see if it looks like indir obj. */
  
-               if (tmp == 1 && !orig_keyword
-                       && (isIDFIRST_lazy_if(s,UTF) || *s == '$')
-                       && (tmp = intuit_method(s, lex ? NULL : sv, cv))) {
+               if (   tmp == 1
+                    && !orig_keyword
+                    && (isIDFIRST_lazy_if_safe(s, PL_bufend, UTF) || *s == '$')
+                    && (tmp = intuit_method(s, lex ? NULL : sv, cv)))
+                {
                   method:
                     if (lex && !off) {
                         assert(cSVOPx(pl_yylval.opval)->op_sv == sv);
@@ -7088,7 +7320,7 @@ Perl_yylex(pTHX)
  
                     op_free(pl_yylval.opval);
                     pl_yylval.opval =
-                       off ? (OP *)newCVREF(0, rv2cv_op) : rv2cv_op;
+                        off ? newCVREF(0, rv2cv_op) : rv2cv_op;
                     pl_yylval.opval->op_private |= OPpENTERSUB_NOPAREN;
                     PL_last_lop = PL_oldbufptr;
                     PL_last_lop_op = OP_ENTERSUB;
@@ -7190,7 +7422,7 @@ Perl_yylex(pTHX)
                 if ((lastchar == '*' || lastchar == '%' || lastchar == '&')
                  && saw_infix_sigil) {
                     Perl_ck_warner_d(aTHX_ packWARN(WARN_AMBIGUOUS),
-                                    "Operator or semicolon missing before %c%"UTF8f,
+                                    "Operator or semicolon missing before %c%" UTF8f,
                                      lastchar,
                                      UTF8fARG(UTF, strlen(PL_tokenbuf),
                                               PL_tokenbuf));
@@ -7203,18 +7435,18 @@ Perl_yylex(pTHX)
  
         case KEY___FILE__:
             FUN0OP(
-               (OP*)newSVOP(OP_CONST, 0, newSVpv(CopFILE(PL_curcop),0))
+                newSVOP(OP_CONST, 0, newSVpv(CopFILE(PL_curcop),0))
             );
  
         case KEY___LINE__:
             FUN0OP(
-               (OP*)newSVOP(OP_CONST, 0,
-                   Perl_newSVpvf(aTHX_ "%"IVdf, (IV)CopLINE(PL_curcop)))
+                newSVOP(OP_CONST, 0,
+                   Perl_newSVpvf(aTHX_ "%" IVdf, (IV)CopLINE(PL_curcop)))
             );
  
         case KEY___PACKAGE__:
             FUN0OP(
-               (OP*)newSVOP(OP_CONST, 0,
+                newSVOP(OP_CONST, 0,
                                         (PL_curstash
                                          ? newSVhek(HvNAME_HEK(PL_curstash))
                                          : &PL_sv_undef))
@@ -7314,7 +7546,7 @@ Perl_yylex(pTHX)
                     goto just_a_word;
                 }
                 if (!tmp)
-                   Perl_croak(aTHX_ "CORE::%"UTF8f" is not a keyword",
+                   Perl_croak(aTHX_ "CORE::%" UTF8f " is not a keyword",
                                       UTF8fARG(UTF, len, PL_tokenbuf));
                 if (tmp < 0)
                     tmp = -tmp;
@@ -7428,7 +7660,9 @@ Perl_yylex(pTHX)
                               1, &len);
                 if (len && (len != 4 || strNE(PL_tokenbuf+1, "CORE"))
                  && !keyword(PL_tokenbuf + 1, len, 0)) {
+                    SSize_t off = s-SvPVX(PL_linestr);
                     d = skipspace(d);
+                    s = SvPVX(PL_linestr)+off;
                     if (*d == '(') {
                         force_ident_maybe_lex('&');
                         s = d;
@@ -7538,20 +7772,22 @@ Perl_yylex(pTHX)
                 return REPORT(0);
             pl_yylval.ival = CopLINE(PL_curcop);
             s = skipspace(s);
-           if (PL_expect == XSTATE && isIDFIRST_lazy_if(s,UTF)) {
+            if (   PL_expect == XSTATE
+                && isIDFIRST_lazy_if_safe(s, PL_bufend, UTF))
+            {
                 char *p = s;
  
                 if ((PL_bufend - p) >= 3
-                    && strnEQ(p, "my", 2) && isSPACE(*(p + 2)))
+                    && strEQs(p, "my") && isSPACE(*(p + 2)))
                  {
                     p += 2;
                  }
                 else if ((PL_bufend - p) >= 4
-                         && strnEQ(p, "our", 3) && isSPACE(*(p + 3)))
+                         && strEQs(p, "our") && isSPACE(*(p + 3)))
                     p += 3;
                 p = skipspace(p);
                  /* skip optional package name, as in "for my abc $x (..)" */
-               if (isIDFIRST_lazy_if(p,UTF)) {
+               if (isIDFIRST_lazy_if_safe(p, PL_bufend, UTF)) {
                     p = scan_word(p, PL_tokenbuf, sizeof PL_tokenbuf, TRUE, &len);
                     p = skipspace(p);
                 }
@@ -7794,9 +8030,9 @@ Perl_yylex(pTHX)
             }
             PL_in_my = (U16)tmp;
             s = skipspace(s);
-           if (isIDFIRST_lazy_if(s,UTF)) {
+            if (isIDFIRST_lazy_if_safe(s, PL_bufend, UTF)) {
                 s = scan_word(s, PL_tokenbuf, sizeof PL_tokenbuf, TRUE, &len);
-               if (len == 3 && strnEQ(PL_tokenbuf, "sub", 3))
+               if (len == 3 && strEQs(PL_tokenbuf, "sub"))
                     goto really_sub;
                 PL_in_my_stash = find_in_my_stash(PL_tokenbuf, len);
                 if (!PL_in_my_stash) {
@@ -7844,10 +8080,10 @@ Perl_yylex(pTHX)
  
         case KEY_open:
             s = skipspace(s);
-           if (isIDFIRST_lazy_if(s,UTF)) {
-          const char *t;
-          d = scan_word(s, PL_tokenbuf, sizeof PL_tokenbuf, FALSE,
-              &len);
+            if (isIDFIRST_lazy_if_safe(s, PL_bufend, UTF)) {
+                const char *t;
+                d = scan_word(s, PL_tokenbuf, sizeof PL_tokenbuf, FALSE,
+                              &len);
                 for (t=d; isSPACE(*t);)
                     t++;
                 if ( *t && strchr("|&*+-=!?:.", *t) && ckWARN_d(WARN_PRECEDENCE)
@@ -7857,7 +8093,7 @@ Perl_yylex(pTHX)
                     && !keyword(s, d-s, 0)
                 ) {
                     Perl_warner(aTHX_ packWARN(WARN_PRECEDENCE),
-                      "Precedence problem: open %"UTF8f" should be open(%"UTF8f")",
+                      "Precedence problem: open %" UTF8f " should be open(%" UTF8f ")",
                         UTF8fARG(UTF, d-s, s), UTF8fARG(UTF, d-s, s));
                 }
             }
@@ -8004,9 +8240,13 @@ Perl_yylex(pTHX)
             {
                 *PL_tokenbuf = '\0';
                 s = force_word(s,BAREWORD,TRUE,TRUE);
-               if (isIDFIRST_lazy_if(PL_tokenbuf,UTF))
+                if (isIDFIRST_lazy_if_safe(PL_tokenbuf,
+                                           PL_tokenbuf + sizeof(PL_tokenbuf),
+                                           UTF))
+                {
                     gv_stashpvn(PL_tokenbuf, strlen(PL_tokenbuf),
                                  GV_ADD | (UTF ? SVf_UTF8 : 0));
+                }
                 else if (*s == '<')
                     yyerror("<> at require-statement should be quotes");
             }
@@ -8014,7 +8254,7 @@ Perl_yylex(pTHX)
                 orig_keyword = 0;
                 pl_yylval.ival = 1;
             }
-           else 
+           else
                 pl_yylval.ival = 0;
             PL_expect = PL_nexttoke ? XOPERATOR : XTERM;
             PL_bufptr = s;
@@ -8204,10 +8444,11 @@ Perl_yylex(pTHX)
                 const int key = tmp;
                  SV *format_name = NULL;
  
-               d = s;
+                SSize_t off = s-SvPVX(PL_linestr);
                 s = skipspace(s);
+                d = SvPVX(PL_linestr)+off;
  
-               if (isIDFIRST_lazy_if(s,UTF)
+                if (   isIDFIRST_lazy_if_safe(s, PL_bufend, UTF)
                      || *s == '\''
                      || (*s == ':' && s[1] == ':'))
                 {
@@ -8253,7 +8494,7 @@ Perl_yylex(pTHX)
                 if (key == KEY_format) {
                     if (format_name) {
                          NEXTVAL_NEXTTOKE.opval
-                            = (OP*)newSVOP(OP_CONST,0, format_name);
+                            = newSVOP(OP_CONST,0, format_name);
                          NEXTVAL_NEXTTOKE.opval->op_private |= OPpCONST_BARE;
                          force_next(BAREWORD);
                      }
@@ -8286,12 +8527,12 @@ Perl_yylex(pTHX)
                     if (!have_name)
                         Perl_croak(aTHX_ "Illegal declaration of anonymous subroutine");
                     else if (*s != ';' && *s != '}')
-                       Perl_croak(aTHX_ "Illegal declaration of subroutine %"SVf, SVfARG(PL_subname));
+                       Perl_croak(aTHX_ "Illegal declaration of subroutine %" SVf, SVfARG(PL_subname));
                 }
  
                 if (have_proto) {
                     NEXTVAL_NEXTTOKE.opval =
-                       (OP*)newSVOP(OP_CONST, 0, PL_lex_stuff);
+                        newSVOP(OP_CONST, 0, PL_lex_stuff);
                     PL_lex_stuff = NULL;
                     force_next(THING);
                 }
@@ -8462,6 +8703,9 @@ Perl_yylex(pTHX)
  
    Looks up an identifier in the pad or in a package
  
+  is_sig indicates that this is a subroutine signature variable
+  rather than a plain pad var.
+
    Returns:
      PRIVATEREF if this is a lexical name.
      BAREWORD   if this belongs to a package.
@@ -8504,6 +8748,7 @@ S_pending_ident(pTHX)
              tmp = allocmy(PL_tokenbuf, tokenbuf_len, UTF ? SVf_UTF8 : 0);
          }
          else {
+            OP *o;
              if (has_colon) {
                  /* "my" variable %s can't be in a package */
                  /* PL_no_myglob is constant */
@@ -8516,9 +8761,29 @@ S_pending_ident(pTHX)
                  GCC_DIAG_RESTORE;
              }
  
-            pl_yylval.opval = newOP(OP_PADANY, 0);
-            pl_yylval.opval->op_targ = allocmy(PL_tokenbuf, tokenbuf_len,
+            if (PL_in_my == KEY_sigvar) {
+                /* A signature 'padop' needs in addition, an op_first to
+                 * point to a child sigdefelem, and an extra field to hold
+                 * the signature index. We can achieve both by using an
+                 * UNOP_AUX and (ab)using the op_aux field to hold the
+                 * index. If we ever need more fields, use a real malloced
+                 * aux strut instead.
+                 */
+                o = newUNOP_AUX(OP_ARGELEM, 0, NULL,
+                                    INT2PTR(UNOP_AUX_item *,
+                                        (PL_parser->sig_elems)));
+                o->op_private |= (  PL_tokenbuf[0] == '$' ? OPpARGELEM_SV
+                                  : PL_tokenbuf[0] == '@' ? OPpARGELEM_AV
+                                  :                         OPpARGELEM_HV);
+            }
+            else
+                o = newOP(OP_PADANY, 0);
+            o->op_targ = allocmy(PL_tokenbuf, tokenbuf_len,
                                                          UTF ? SVf_UTF8 : 0);
+            if (PL_in_my == KEY_sigvar)
+                PL_in_my = 0;
+
+            pl_yylval.opval = o;
             return PRIVATEREF;
          }
      }
@@ -8540,7 +8805,7 @@ S_pending_ident(pTHX)
                 SV *  const sym = newSVhek(stashname);
                  sv_catpvs(sym, "::");
                  sv_catpvn_flags(sym, PL_tokenbuf+1, tokenbuf_len - 1, (UTF ? SV_CATUTF8 : SV_CATBYTES ));
-                pl_yylval.opval = (OP*)newSVOP(OP_CONST, 0, sym);
+                pl_yylval.opval = newSVOP(OP_CONST, 0, sym);
                  pl_yylval.opval->op_private = OPpCONST_ENTERED;
                  if (pit != '&')
                    gv_fetchsv(sym,
@@ -8558,8 +8823,8 @@ S_pending_ident(pTHX)
      }
  
      /*
-       Whine if they've said @foo in a doublequoted string,
-       and @foo isn't a variable we can find in the symbol
+       Whine if they've said @foo or @foo{key} in a doublequoted string,
+       and @foo (or %foo) isn't a variable we can find in the symbol
         table.
      */
      if (ckWARN(WARN_AMBIGUOUS)
@@ -8568,23 +8833,21 @@ S_pending_ident(pTHX)
          && !PL_lex_brackets)
      {
          GV *const gv = gv_fetchpvn_flags(PL_tokenbuf + 1, tokenbuf_len - 1,
-                                        ( UTF ? SVf_UTF8 : 0 ), SVt_PVAV);
+                                         ( UTF ? SVf_UTF8 : 0 ) | GV_ADDMG,
+                                         SVt_PVAV);
          if ((!gv || ((PL_tokenbuf[0] == '@') ? !GvAV(gv) : !GvHV(gv)))
-               /* DO NOT warn for @- and @+ */
-               && !( PL_tokenbuf[2] == '\0'
-                      && ( PL_tokenbuf[1] == '-' || PL_tokenbuf[1] == '+' ))
            )
          {
              /* Downgraded from fatal to warning 20000522 mjd */
              Perl_warner(aTHX_ packWARN(WARN_AMBIGUOUS),
-                       "Possible unintended interpolation of %"UTF8f
+                       "Possible unintended interpolation of %" UTF8f
                         " in string",
                         UTF8fARG(UTF, tokenbuf_len, PL_tokenbuf));
          }
      }
  
      /* build ops for a bareword */
-    pl_yylval.opval = (OP*)newSVOP(OP_CONST, 0,
+    pl_yylval.opval = newSVOP(OP_CONST, 0,
                                    newSVpvn_flags(PL_tokenbuf + 1,
                                                       tokenbuf_len - 1,
                                                        UTF ? SVf_UTF8 : 0 ));
@@ -8631,10 +8894,10 @@ S_checkcomma(pTHX_ const char *s, const char *name, const char *what)
         s++;
      while (s < PL_bufend && isSPACE(*s))
         s++;
-    if (isIDFIRST_lazy_if(s,UTF)) {
+    if (isIDFIRST_lazy_if_safe(s, PL_bufend, UTF)) {
         const char * const w = s;
          s += UTF ? UTF8SKIP(s) : 1;
-       while (isWORDCHAR_lazy_if(s,UTF))
+       while (isWORDCHAR_lazy_if_safe(s, PL_bufend, UTF))
             s += UTF ? UTF8SKIP(s) : 1;
         while (s < PL_bufend && isSPACE(*s))
             s++;
@@ -8807,21 +9070,23 @@ S_new_constant(pTHX_ const char *s, STRLEN len, const char *key, STRLEN keylen,
  
  PERL_STATIC_INLINE void
  S_parse_ident(pTHX_ char **s, char **d, char * const e, int allow_package,
-                    bool is_utf8, bool check_dollar) {
+                    bool is_utf8, bool check_dollar)
+{
      PERL_ARGS_ASSERT_PARSE_IDENT;
  
-    for (;;) {
+    while (*s < PL_bufend) {
          if (*d >= e)
              Perl_croak(aTHX_ "%s", ident_too_long);
-        if (is_utf8 && isIDFIRST_utf8((U8*)*s)) {
+        if (is_utf8 && isIDFIRST_utf8_safe(*s, PL_bufend)) {
               /* The UTF-8 case must come first, otherwise things
               * like c\N{COMBINING TILDE} would start failing, as the
               * isWORDCHAR_A case below would gobble the 'c' up.
               */
  
              char *t = *s + UTF8SKIP(*s);
-            while (isIDCONT_utf8((U8*)t))
+            while (isIDCONT_utf8_safe((const U8*) t, (const U8*) PL_bufend)) {
                  t += UTF8SKIP(t);
+            }
              if (*d + (t - *s) > e)
                  Perl_croak(aTHX_ "%s", ident_too_long);
              Copy(*s, *d, t - *s, char);
@@ -8833,7 +9098,10 @@ S_parse_ident(pTHX_ char **s, char **d, char * const e, int allow_package,
                  *(*d)++ = *(*s)++;
              } while (isWORDCHAR_A(**s) && *d < e);
          }
-        else if (allow_package && **s == '\'' && isIDFIRST_lazy_if(*s+1,is_utf8)) {
+        else if (   allow_package
+                 && **s == '\''
+                 && isIDFIRST_lazy_if_safe((*s)+1, PL_bufend, is_utf8))
+        {
              *(*d)++ = ':';
              *(*d)++ = ':';
              (*s)++;
@@ -8884,10 +9152,10 @@ S_scan_word(pTHX_ char *s, char *dest, STRLEN destlen, int allow_package, STRLEN
   *      Because all ASCII characters have the same representation whether
   *      encoded in UTF-8 or not, we can use the foo_A macros below and '\0' and
   *      '{' without knowing if is UTF-8 or not. */
-#define VALID_LEN_ONE_IDENT(s, is_utf8)                                       \
-    (isGRAPH_A(*(s)) || ((is_utf8)                                            \
-                         ? isIDFIRST_utf8((U8*) (s))                          \
-                         : (isGRAPH_L1(*s)                                    \
+#define VALID_LEN_ONE_IDENT(s, e, is_utf8)                                  \
+    (isGRAPH_A(*(s)) || ((is_utf8)                                          \
+                         ? isIDFIRST_utf8_safe(s, e)                        \
+                         : (isGRAPH_L1(*s)                                  \
                              && LIKELY((U8) *(s) != LATIN1_TO_NATIVE(0xAD)))))
  
  STATIC char *
@@ -8928,11 +9196,11 @@ S_scan_ident(pTHX_ char *s, char *dest, STRLEN destlen, I32 ck_uni)
      /* Here, it is not a run-of-the-mill identifier name */
  
      if (*s == '$' && s[1]
-        && (isIDFIRST_lazy_if(s+1,is_utf8)
+        && (   isIDFIRST_lazy_if_safe(s+1, PL_bufend, is_utf8)
              || isDIGIT_A((U8)s[1])
              || s[1] == '$'
              || s[1] == '{'
-            || strnEQ(s+1,"::",2)) )
+            || strEQs(s+1,"::")) )
      {
          /* Dereferencing a value in a scalar variable.
             The alternatives are different syntaxes for a scalar variable.
@@ -8951,7 +9219,7 @@ S_scan_ident(pTHX_ char *s, char *dest, STRLEN destlen, I32 ck_uni)
      if ((s <= PL_bufend - (is_utf8)
                            ? UTF8SKIP(s)
                            : 1)
-        && VALID_LEN_ONE_IDENT(s, is_utf8))
+        && VALID_LEN_ONE_IDENT(s, PL_bufend, is_utf8))
      {
          if (is_utf8) {
              const STRLEN skip = UTF8SKIP(s);
@@ -8976,8 +9244,10 @@ S_scan_ident(pTHX_ char *s, char *dest, STRLEN destlen, I32 ck_uni)
      else if (ck_uni && bracket == -1)
         check_uni();
      if (bracket != -1) {
+        bool skip;
+        char *s2;
          /* If we were processing {...} notation then...  */
-       if (isIDFIRST_lazy_if(d,is_utf8)) {
+        if (isIDFIRST_lazy_if_safe(d, e, is_utf8)) {
              /* if it starts as a valid identifier, assume that it is one.
                 (the later check for } being at the expected point will trap
                 cases where this doesn't pan out.)  */
@@ -9024,13 +9294,19 @@ S_scan_ident(pTHX_ char *s, char *dest, STRLEN destlen, I32 ck_uni)
  
          if ( !tmp_copline )
              tmp_copline = CopLINE(PL_curcop);
-        if (s < PL_bufend && isSPACE(*s)) {
-            s = skipspace(s);
-        }
-           
+        if ((skip = s < PL_bufend && isSPACE(*s)))
+            /* Avoid incrementing line numbers or resetting PL_linestart,
+               in case we have to back up.  */
+            s2 = peekspace(s);
+        else
+            s2 = s;
+
          /* Expect to find a closing } after consuming any trailing whitespace.
           */
-       if (*s == '}') {
+        if (*s2 == '}') {
+            /* Now increment line numbers if applicable.  */
+            if (skip)
+                s = skipspace(s);
             s++;
             if (PL_lex_state == LEX_INTERPNORMAL && !PL_lex_brackets) {
                 PL_lex_state = LEX_INTERPEND;
@@ -9050,7 +9326,7 @@ S_scan_ident(pTHX_ char *s, char *dest, STRLEN destlen, I32 ck_uni)
                      orig_copline = CopLINE(PL_curcop);
                      CopLINE_set(PL_curcop, tmp_copline);
                     Perl_warner(aTHX_ packWARN(WARN_AMBIGUOUS),
-                       "Ambiguous use of %c{%"SVf"} resolved to %c%"SVf,
+                       "Ambiguous use of %c{%" SVf "} resolved to %c%" SVf,
                         funny, SVfARG(tmp), funny, SVfARG(tmp));
                      CopLINE_set(PL_curcop, orig_copline);
                 }
@@ -9087,7 +9363,7 @@ S_pmflag(pTHX_ const char* const valid_flags, U32 * pmfl, char** s, char* charse
      STRLEN charlen = UTF ? UTF8SKIP(*s) : 1;
  
      if ( charlen != 1 || ! strchr(valid_flags, c) ) {
-        if (isWORDCHAR_lazy_if(*s, UTF)) {
+        if (isWORDCHAR_lazy_if_safe( *s, PL_bufend, UTF)) {
              yyerror_pv(Perl_form(aTHX_ "Unknown regexp modifier \"/%.*s\"", (int)charlen, *s),
                         UTF ? SVf_UTF8 : 0);
              (*s) += charlen;
@@ -9231,14 +9507,10 @@ S_scan_pat(pTHX_ char *start, I32 type)
      /* issue a warning if /c is specified,but /g is not */
      if ((pm->op_pmflags & PMf_CONTINUE) && !(pm->op_pmflags & PMf_GLOBAL))
      {
-        Perl_ck_warner(aTHX_ packWARN(WARN_REGEXP), 
+        Perl_ck_warner(aTHX_ packWARN(WARN_REGEXP),
                        "Use of /c modifier is meaningless without /g" );
      }
  
-    if (UNLIKELY((x_mod_count) > 1)) {
-        yyerror("Only one /x regex modifier is allowed");
-    }
-
      PL_lex_op = (OP*)pm;
      pl_yylval.ival = OP_MATCH;
      return s;
@@ -9251,6 +9523,7 @@ S_scan_subst(pTHX_ char *start)
      PMOP *pm;
      I32 first_start;
      line_t first_line;
+    line_t linediff = 0;
      I32 es = 0;
      char charset = '\0';    /* character set modifier */
      unsigned int x_mod_count = 0;
@@ -9292,10 +9565,6 @@ S_scan_subst(pTHX_ char *start)
         }
      }
  
-    if (UNLIKELY((x_mod_count) > 1)) {
-        yyerror("Only one /x regex modifier is allowed");
-    }
-
      if ((pm->op_pmflags & PMf_CONTINUE)) {
          Perl_ck_warner(aTHX_ packWARN(WARN_REGEXP), "Use of /c modifier is meaningless in s///" );
      }
@@ -9312,17 +9581,26 @@ S_scan_subst(pTHX_ char *start)
                 sv_catpvs(repl, "do ");
         }
         sv_catpvs(repl, "{");
-       sv_catsv(repl, PL_sublex_info.repl);
+       sv_catsv(repl, PL_parser->lex_sub_repl);
         sv_catpvs(repl, "}");
-       SvEVALED_on(repl);
-       SvREFCNT_dec(PL_sublex_info.repl);
-       PL_sublex_info.repl = repl;
-    }
-    if (CopLINE(PL_curcop) != first_line) {
-       sv_upgrade(PL_sublex_info.repl, SVt_PVNV);
-       ((XPVNV*)SvANY(PL_sublex_info.repl))->xnv_u.xpad_cop_seq.xlow =
-           CopLINE(PL_curcop) - first_line;
+       SvREFCNT_dec(PL_parser->lex_sub_repl);
+       PL_parser->lex_sub_repl = repl;
+        es = 1;
+    }
+
+
+    linediff = CopLINE(PL_curcop) - first_line;
+    if (linediff)
         CopLINE_set(PL_curcop, first_line);
+
+    if (linediff || es) {
+        /* the IVX field indicates that the replacement string is a s///e;
+         * the NVX field indicates how many src code lines the replacement
+         * spreads over */
+        sv_upgrade(PL_parser->lex_sub_repl, SVt_PVNV);
+        ((XPVNV*)SvANY(PL_parser->lex_sub_repl))->xnv_u.xnv_lines = 0;
+        ((XPVIV*)SvANY(PL_parser->lex_sub_repl))->xiv_u.xivu_eval_seen =
+                                                                    cBOOL(es);
      }
  
      PL_lex_op = (OP*)pm;
@@ -9384,7 +9662,7 @@ S_scan_trans(pTHX_ char *start)
      o->op_private &= ~OPpTRANS_ALL;
      o->op_private |= del|squash|complement|
        (DO_UTF8(PL_lex_stuff)? OPpTRANS_FROM_UTF : 0)|
-      (DO_UTF8(PL_sublex_info.repl) ? OPpTRANS_TO_UTF   : 0);
+      (DO_UTF8(PL_parser->lex_sub_repl) ? OPpTRANS_TO_UTF   : 0);
  
      PL_lex_op = o;
      pl_yylval.ival = nondestruct ? OP_TRANSR : OP_TRANS;
@@ -9427,6 +9705,9 @@ S_scan_heredoc(pTHX_ char *s)
      char *d;
      char *e;
      char *peek;
+    char *indent = 0;
+    I32 indent_len = 0;
+    bool indented = FALSE;
      const bool infile = PL_rsfp || PL_parser->filtered;
      const line_t origline = CopLINE(PL_curcop);
      LEXSHARED *shared = PL_parser->lex_shared;
@@ -9438,6 +9719,10 @@ S_scan_heredoc(pTHX_ char *s)
      e = PL_tokenbuf + sizeof PL_tokenbuf - 1;
      *PL_tokenbuf = '\n';
      peek = s;
+    if (*peek == '~') {
+       indented = TRUE;
+       peek++; s++;
+    }
      while (SPACE_OR_TAB(*peek))
         peek++;
      if (*peek == '`' || *peek == '\'' || *peek =='"') {
@@ -9455,10 +9740,12 @@ S_scan_heredoc(pTHX_ char *s)
             s++, term = '\'';
         else
             term = '"';
-       if (!isWORDCHAR_lazy_if(s,UTF))
-           deprecate("bare << to mean <<\"\"");
+       if (! isWORDCHAR_lazy_if_safe(s, PL_bufend, UTF))
+           deprecate_fatal_in("5.28", "Use of bare << to mean <<\"\" is deprecated");
         peek = s;
-       while (isWORDCHAR_lazy_if(peek,UTF)) {
+        while (
+               isWORDCHAR_lazy_if_safe(peek, PL_bufend, UTF))
+        {
             peek += UTF ? UTF8SKIP(peek) : 1;
         }
         len = (peek - s >= e - d) ? (e - d) : (peek - s);
@@ -9539,7 +9826,9 @@ S_scan_heredoc(pTHX_ char *s)
                might think.  Odd syntax errors like s;@{<<; can gobble up
                the implicit semicolon at the end of a flie, causing the
                file handle to be closed even when we are not in a string
-              eval.  So shared may be null in that case.  */
+              eval.  So shared may be null in that case.
+               (Closing '}' here to balance the earlier open brace for
+               editors that look for matched pairs.) */
             if (UNLIKELY(!shared))
                 goto interminable;
             /* A LEXSHARED struct with a null ls_prev pointer is the outer-
@@ -9558,12 +9847,45 @@ S_scan_heredoc(pTHX_ char *s)
         linestr = shared->ls_linestr;
         bufend = SvEND(linestr);
         d = s;
-       while (s < bufend - len + 1
-               && memNE(s,PL_tokenbuf,len) )
-        {
-           if (*s++ == '\n')
-               ++PL_parser->herelines;
+       if (indented) {
+           char *myolds = s;
+
+           while (s < bufend - len + 1) {
+               if (*s++ == '\n')
+                   ++PL_parser->herelines;
+
+               if (memEQ(s, PL_tokenbuf + 1, len - 1)) {
+                   char *backup = s;
+                   indent_len = 0;
+
+                   /* Only valid if it's preceded by whitespace only */
+                   while (backup != myolds && --backup >= myolds) {
+                       if (! SPACE_OR_TAB(*backup)) {
+                           break;
+                       }
+
+                       indent_len++;
+                   }
+
+                   /* No whitespace or all! */
+                   if (backup == s || *backup == '\n') {
+                       Newxz(indent, indent_len + 1, char);
+                       memcpy(indent, backup + 1, indent_len);
+                       s--; /* before our delimiter */
+                       PL_parser->herelines--; /* this line doesn't count */
+                       break;
+                   }
+               }
+           }
+       } else {
+           while (s < bufend - len + 1
+                  && memNE(s,PL_tokenbuf,len) )
+           {
+               if (*s++ == '\n')
+                   ++PL_parser->herelines;
+           }
         }
+
         if (s >= bufend - len + 1) {
             goto interminable;
         }
@@ -9595,7 +9917,7 @@ S_scan_heredoc(pTHX_ char *s)
              && cx->blk_eval.cur_text == linestr)
          {
             cx->blk_eval.cur_text = newSVsv(linestr);
-           SvSCREAM_on(cx->blk_eval.cur_text);
+           cx->blk_u16 |= 0x40; /* indicate cur_text is ref counted */
         }
         /* Copy everything from s onwards back to d. */
         Move(s,d,bufend-s + 1,char);
@@ -9610,13 +9932,15 @@ S_scan_heredoc(pTHX_ char *s)
      {
        SV *linestr_save;
        char *oldbufptr_save;
+      char *oldoldbufptr_save;
       streaming:
-      sv_setpvs(tmpstr,"");   /* avoid "uninitialized" warning */
+      SvPVCLEAR(tmpstr);   /* avoid "uninitialized" warning */
        term = PL_tokenbuf[1];
        len--;
        linestr_save = PL_linestr; /* must restore this afterwards */
        d = s;                    /* and this */
        oldbufptr_save = PL_oldbufptr;
+      oldoldbufptr_save = PL_oldoldbufptr;
        PL_linestr = newSVpvs("");
        PL_bufend = SvPVX(PL_linestr);
        while (1) {
@@ -9634,6 +9958,7 @@ S_scan_heredoc(pTHX_ char *s)
             SvREFCNT_dec_NN(PL_linestr);
             PL_linestr = linestr_save;
              PL_oldbufptr = oldbufptr_save;
+            PL_oldoldbufptr = oldoldbufptr_save;
             goto interminable;
         }
         CopLINE_set(PL_curcop, origline);
@@ -9662,22 +9987,101 @@ S_scan_heredoc(pTHX_ char *s)
         else if (PL_bufend - PL_linestart == 1 && PL_bufend[-1] == '\r')
             PL_bufend[-1] = '\n';
  #endif
-       if (*s == term && PL_bufend-s >= len
-        && memEQ(s,PL_tokenbuf + 1,len)) {
-           SvREFCNT_dec(PL_linestr);
-           PL_linestr = linestr_save;
-           PL_linestart = SvPVX(linestr_save);
-           PL_bufend = SvPVX(PL_linestr) + SvCUR(PL_linestr);
-            PL_oldbufptr = oldbufptr_save;
-           s = d;
-           break;
-       }
-       else {
+       if (indented && (PL_bufend-s) >= len) {
+           char * found = ninstr(s, PL_bufend, (PL_tokenbuf + 1), (PL_tokenbuf +1 + len));
+
+           if (found) {
+               char *backup = found;
+               indent_len = 0;
+
+               /* Only valid if it's preceded by whitespace only */
+               while (backup != s && --backup >= s) {
+                   if (! SPACE_OR_TAB(*backup)) {
+                       break;
+                   }
+                   indent_len++;
+               }
+
+               /* All whitespace or none! */
+               if (backup == found || SPACE_OR_TAB(*backup)) {
+                   Newxz(indent, indent_len + 1, char);
+                   memcpy(indent, backup, indent_len);
+                   SvREFCNT_dec(PL_linestr);
+                   PL_linestr = linestr_save;
+                   PL_linestart = SvPVX(linestr_save);
+                   PL_bufend = SvPVX(PL_linestr) + SvCUR(PL_linestr);
+                   PL_oldbufptr = oldbufptr_save;
+                   PL_oldoldbufptr = oldoldbufptr_save;
+                   s = d;
+                   break;
+               }
+           }
+
+           /* Didn't find it */
             sv_catsv(tmpstr,PL_linestr);
+       } else {
+           if (*s == term && PL_bufend-s >= len
+               && memEQ(s,PL_tokenbuf + 1,len))
+           {
+               SvREFCNT_dec(PL_linestr);
+               PL_linestr = linestr_save;
+               PL_linestart = SvPVX(linestr_save);
+               PL_bufend = SvPVX(PL_linestr) + SvCUR(PL_linestr);
+               PL_oldbufptr = oldbufptr_save;
+               PL_oldoldbufptr = oldoldbufptr_save;
+               s = d;
+               break;
+           } else {
+               sv_catsv(tmpstr,PL_linestr);
+           }
         }
        }
      }
      PL_multi_end = origline + PL_parser->herelines;
+    if (indented && indent) {
+       STRLEN linecount = 1;
+       STRLEN herelen = SvCUR(tmpstr);
+       char *ss = SvPVX(tmpstr);
+       char *se = ss + herelen;
+        SV *newstr = newSV(herelen+1);
+        SvPOK_on(newstr);
+
+       /* Trim leading whitespace */
+       while (ss < se) {
+           /* newline only? Copy and move on */
+           if (*ss == '\n') {
+               sv_catpv(newstr,"\n");
+               ss++;
+               linecount++;
+
+           /* Found our indentation? Strip it */
+           } else if (se - ss >= indent_len
+                      && memEQ(ss, indent, indent_len))
+           {
+               STRLEN le = 0;
+
+               ss += indent_len;
+
+               while ((ss + le) < se && *(ss + le) != '\n')
+                   le++;
+
+               sv_catpvn(newstr, ss, le);
+
+               ss += le;
+
+           /* Line doesn't begin with our indentation? Croak */
+           } else {
+               Perl_croak(aTHX_
+                   "Indentation on line %d of here-doc doesn't match delimiter",
+                   (int)linecount
+               );
+           }
+       }
+        /* avoid sv_setsv() as we dont wan't to COW here */
+        sv_setpvn(tmpstr,SvPVX(newstr),SvCUR(newstr));
+       Safefree(indent);
+       SvREFCNT_dec_NN(newstr);
+    }
      if (SvCUR(tmpstr) + 5 < SvLEN(tmpstr)) {
         SvPV_shrink_to_cur(tmpstr);
      }
@@ -9696,8 +10100,9 @@ S_scan_heredoc(pTHX_ char *s)
  }
  
  /* scan_inputsymbol
-   takes: current position in input buffer
-   returns: new position in input buffer
+   takes: position of first '<' in input buffer
+   returns: position of first char following the matching '>' in
+           input buffer
     side-effects: pl_yylval and lex_op are set.
  
     This code handles:
@@ -9757,8 +10162,9 @@ S_scan_inputsymbol(pTHX_ char *start)
      if (*d == '$' && d[1]) d++;
  
      /* allow <Pkg'VALUE> or <Pkg::VALUE> */
-    while (*d && (isWORDCHAR_lazy_if(d,UTF) || *d == '\'' || *d == ':'))
+    while (isWORDCHAR_lazy_if_safe(d, e, UTF) || *d == '\'' || *d == ':') {
         d += UTF ? UTF8SKIP(d) : 1;
+    }
  
      /* If we've tried to read what we allow filehandles to look like, and
         there's still text left, then it must be a glob() and not a getline.
@@ -9809,10 +10215,10 @@ S_scan_inputsymbol(pTHX_ char *start)
                     OP * const o = newOP(OP_PADSV, 0);
                     o->op_targ = tmp;
                     PL_lex_op = readline_overriden
-                       ? (OP*)newUNOP(OP_ENTERSUB, OPf_STACKED,
+                        ? newUNOP(OP_ENTERSUB, OPf_STACKED,
                                 op_append_elem(OP_LIST, o,
                                     newCVREF(0, newGVOP(OP_GV,0,gv_readline))))
-                       : (OP*)newUNOP(OP_READLINE, 0, o);
+                        : newUNOP(OP_READLINE, 0, o);
                 }
             }
             else {
@@ -9823,11 +10229,11 @@ S_scan_inputsymbol(pTHX_ char *start)
                                 GV_ADDMULTI | ( UTF ? SVf_UTF8 : 0 ),
                                 SVt_PV);
                 PL_lex_op = readline_overriden
-                   ? (OP*)newUNOP(OP_ENTERSUB, OPf_STACKED,
+                    ? newUNOP(OP_ENTERSUB, OPf_STACKED,
                             op_append_elem(OP_LIST,
                                 newUNOP(OP_RV2SV, 0, newGVOP(OP_GV, 0, gv)),
                                 newCVREF(0, newGVOP(OP_GV, 0, gv_readline))))
-                   : (OP*)newUNOP(OP_READLINE, 0,
+                    : newUNOP(OP_READLINE, 0,
                             newUNOP(OP_RV2SV, 0,
                                 newGVOP(OP_GV, 0, gv)));
             }
@@ -9840,11 +10246,11 @@ S_scan_inputsymbol(pTHX_ char *start)
         else {
             GV * const gv = gv_fetchpv(d, GV_ADD | ( UTF ? SVf_UTF8 : 0 ), SVt_PVIO);
             PL_lex_op = readline_overriden
-               ? (OP*)newUNOP(OP_ENTERSUB, OPf_STACKED,
+                ? newUNOP(OP_ENTERSUB, OPf_STACKED,
                         op_append_elem(OP_LIST,
                             newGVOP(OP_GV, 0, gv),
                             newCVREF(0, newGVOP(OP_GV, 0, gv_readline))))
-               : (OP*)newUNOP(OP_READLINE, nomagicopen ? OPf_SPECIAL : 0, newGVOP(OP_GV, 0, gv));
+                : newUNOP(OP_READLINE, nomagicopen ? OPf_SPECIAL : 0, newGVOP(OP_GV, 0, gv));
             pl_yylval.ival = OP_NULL;
         }
      }
@@ -9917,11 +10323,23 @@ S_scan_str(pTHX_ char *start, int keep_bracketed_quoted, int keep_delims, int re
      char *to;                  /* current position in the sv's data */
      I32 brackets = 1;          /* bracket nesting level */
      bool has_utf8 = FALSE;     /* is there any utf8 content? */
-    I32 termcode;              /* terminating char. code */
+    IV termcode;               /* terminating char. code */
      U8 termstr[UTF8_MAXBYTES]; /* terminating string */
      STRLEN termlen;            /* length of terminating string */
      line_t herelines;
  
+    /* The delimiters that have a mirror-image closing one */
+    const char * opening_delims = "([{<";
+    const char * closing_delims = ")]}>";
+
+    const char * non_grapheme_msg = "Use of unassigned code point or"
+                                    " non-standalone grapheme for a delimiter"
+                                    " will be a fatal error starting in Perl"
+                                    " v5.30";
+    /* The only non-UTF character that isn't a stand alone grapheme is
+     * white-space, hence can't be a delimiter.  So can skip for non-UTF-8 */
+    bool check_grapheme = UTF && ckWARN_d(WARN_DEPRECATED);
+
      PERL_ARGS_ASSERT_SCAN_STR;
  
      /* skip space before the delimiter */
@@ -9934,27 +10352,48 @@ S_scan_str(pTHX_ char *start, int keep_bracketed_quoted, int keep_delims, int re
  
      /* after skipping whitespace, the next character is the terminator */
      term = *s;
-    if (!UTF) {
+    if (!UTF || UTF8_IS_INVARIANT(term)) {
         termcode = termstr[0] = term;
         termlen = 1;
      }
      else {
         termcode = utf8_to_uvchr_buf((U8*)s, (U8*)PL_bufend, &termlen);
+        if (check_grapheme) {
+            if (   UNLIKELY(UNICODE_IS_SUPER(termcode))
+                || UNLIKELY(UNICODE_IS_NONCHAR(termcode)))
+            {
+                /* These are considered graphemes, and since the ending
+                 * delimiter will be the same, we don't have to check the other
+                 * end */
+                check_grapheme = FALSE;
+            }
+            else if (UNLIKELY(! _is_grapheme((U8 *) start,
+                                             (U8 *) s,
+                                             (U8 *) PL_bufend,
+                                             termcode)))
+            {
+                Perl_warner(aTHX_ packWARN(WARN_DEPRECATED), "%s", non_grapheme_msg);
+
+                /* Don't have to check the other end, as have already warned at
+                 * this one */
+                check_grapheme = FALSE;
+            }
+        }
+
         Copy(s, termstr, termlen, U8);
-       if (!UTF8_IS_INVARIANT(term))
-           has_utf8 = TRUE;
      }
  
      /* mark where we are */
      PL_multi_start = CopLINE(PL_curcop);
-    PL_multi_open = term;
+    PL_multi_open = termcode;
      herelines = PL_parser->herelines;
  
-    /* find corresponding closing delimiter */
-    if (term && (tmps = strchr("([{< )]}> )]}>",term)))
-       termcode = termstr[0] = term = tmps[5];
+    /* If the delimiter has a mirror-image closing one, get it */
+    if (term && (tmps = strchr(opening_delims, term))) {
+        termcode = termstr[0] = term = closing_delims[tmps - opening_delims];
+    }
  
-    PL_multi_close = term;
+    PL_multi_close = termcode;
  
      if (PL_multi_open == PL_multi_close) {
          keep_bracketed_quoted = FALSE;
@@ -9999,6 +10438,15 @@ S_scan_str(pTHX_ char *start, int keep_bracketed_quoted, int keep_delims, int re
                     if (termlen == 1)
                         break;
                     if (s+termlen <= PL_bufend && memEQ(s, (char*)termstr, termlen))
+                        if (   check_grapheme
+                            && UNLIKELY(! _is_grapheme((U8 *) start,
+                                                              (U8 *) s,
+                                                              (U8 *) PL_bufend,
+                                                              termcode)))
+                        {
+                            Perl_warner(aTHX_ packWARN(WARN_DEPRECATED),
+                                        "%s", non_grapheme_msg);
+                        }
                         break;
                 }
                 else if (!has_utf8 && !UTF8_IS_INVARIANT((U8)*s) && UTF)
@@ -10075,7 +10523,7 @@ S_scan_str(pTHX_ char *start, int keep_bracketed_quoted, int keep_delims, int re
             CopLINE_set(PL_curcop, (line_t)PL_multi_start);
             return NULL;
         }
-       s = PL_bufptr;
+       s = start = PL_bufptr;
      }
  
      /* at this point, we have successfully read the delimited string */
@@ -10102,7 +10550,7 @@ S_scan_str(pTHX_ char *start, int keep_bracketed_quoted, int keep_delims, int re
      */
  
      if (PL_lex_stuff)
-       PL_sublex_info.repl = sv;
+       PL_parser->lex_sub_repl = sv;
      else
         PL_lex_stuff = sv;
      if (delimp) *delimp = PL_multi_open == PL_multi_close ? s-termlen : s;
@@ -10143,6 +10591,15 @@ Perl_scan_num(pTHX_ const char *start, YYSTYPE* lvalp)
      bool floatit;                      /* boolean: int or float? */
      const char *lastub = NULL;         /* position of last underbar */
      static const char* const number_too_long = "Number too long";
+    bool warned_about_underscore = 0;
+#define WARN_ABOUT_UNDERSCORE() \
+       do { \
+           if (!warned_about_underscore) { \
+               warned_about_underscore = 1; \
+               Perl_ck_warner(aTHX_ packWARN(WARN_SYNTAX), \
+                              "Misplaced _ in number"); \
+           } \
+       } while(0)
      /* Hexadecimal floating point.
       *
       * In many places (where we have quads and NV is IEEE 754 double)
@@ -10227,8 +10684,7 @@ Perl_scan_num(pTHX_ const char *start, YYSTYPE* lvalp)
             }
  
             if (*s == '_') {
-               Perl_ck_warner(aTHX_ packWARN(WARN_SYNTAX),
-                              "Misplaced _ in number");
+               WARN_ABOUT_UNDERSCORE();
                lastub = s++;
             }
  
@@ -10251,8 +10707,7 @@ Perl_scan_num(pTHX_ const char *start, YYSTYPE* lvalp)
                 /* _ are ignored -- but warned about if consecutive */
                 case '_':
                     if (lastub && s == lastub + 1)
-                       Perl_ck_warner(aTHX_ packWARN(WARN_SYNTAX),
-                                      "Misplaced _ in number");
+                       WARN_ABOUT_UNDERSCORE();
                     lastub = s++;
                     break;
  
@@ -10337,9 +10792,8 @@ Perl_scan_num(pTHX_ const char *start, YYSTYPE* lvalp)
           out:
  
             /* final misplaced underbar check */
-           if (s[-1] == '_') {
-               Perl_ck_warner(aTHX_ packWARN(WARN_SYNTAX), "Misplaced _ in number");
-           }
+           if (s[-1] == '_')
+               WARN_ABOUT_UNDERSCORE();
  
              if (UNLIKELY(HEXFP_PEEK(s))) {
                  /* Do sloppy (on the underbars) but quick detection
@@ -10461,6 +10915,14 @@ Perl_scan_num(pTHX_ const char *start, YYSTYPE* lvalp)
  #ifdef NV_MIN_EXP
                                  if (negexp
                                      && -hexfp_exp < NV_MIN_EXP - 1) {
+                                    /* NOTE: this means that the exponent
+                                     * underflow warning happens for
+                                     * the IEEE 754 subnormals (denormals),
+                                     * because DBL_MIN_EXP etc are the lowest
+                                     * possible binary (or, rather, DBL_RADIX-base)
+                                     * exponent for normals, not subnormals.
+                                     *
+                                     * This may or may not be a good thing. */
                                      Perl_ck_warner(aTHX_ packWARN(WARN_OVERFLOW),
                                                     "Hexadecimal float: exponent underflow");
                                      break;
@@ -10482,7 +10944,7 @@ Perl_scan_num(pTHX_ const char *start, YYSTYPE* lvalp)
  #ifdef HEXFP_UQUAD
                          hexfp_exp -= hexfp_frac_bits;
  #endif
-                        hexfp_mult = pow(2.0, hexfp_exp);
+                        hexfp_mult = Perl_pow(2.0, hexfp_exp);
                          hexfp = TRUE;
                          goto decimal;
                      }
@@ -10540,8 +11002,7 @@ Perl_scan_num(pTHX_ const char *start, YYSTYPE* lvalp)
             */
             if (*s == '_') {
                 if (lastub && s == lastub + 1)
-                   Perl_ck_warner(aTHX_ packWARN(WARN_SYNTAX),
-                                  "Misplaced _ in number");
+                   WARN_ABOUT_UNDERSCORE();
                 lastub = s++;
             }
             else {
@@ -10554,9 +11015,8 @@ Perl_scan_num(pTHX_ const char *start, YYSTYPE* lvalp)
         }
  
         /* final misplaced underbar check */
-       if (lastub && s == lastub + 1) {
-           Perl_ck_warner(aTHX_ packWARN(WARN_SYNTAX), "Misplaced _ in number");
-       }
+       if (lastub && s == lastub + 1)
+           WARN_ABOUT_UNDERSCORE();
  
         /* read a decimal portion if there is one.  avoid
            3..5 being interpreted as the number 3. followed
@@ -10567,8 +11027,7 @@ Perl_scan_num(pTHX_ const char *start, YYSTYPE* lvalp)
             *d++ = *s++;
  
             if (*s == '_') {
-               Perl_ck_warner(aTHX_ packWARN(WARN_SYNTAX),
-                              "Misplaced _ in number");
+               WARN_ABOUT_UNDERSCORE();
                 lastub = s;
             }
  
@@ -10584,18 +11043,15 @@ Perl_scan_num(pTHX_ const char *start, YYSTYPE* lvalp)
                     Perl_croak(aTHX_ "%s", number_too_long);
                 if (*s == '_') {
                    if (lastub && s == lastub + 1)
-                      Perl_ck_warner(aTHX_ packWARN(WARN_SYNTAX),
-                                     "Misplaced _ in number");
+                       WARN_ABOUT_UNDERSCORE();
                    lastub = s;
                 }
                 else
                     *d++ = *s;
             }
             /* fractional part ending in underbar? */
-           if (s[-1] == '_') {
-               Perl_ck_warner(aTHX_ packWARN(WARN_SYNTAX),
-                              "Misplaced _ in number");
-           }
+           if (s[-1] == '_')
+               WARN_ABOUT_UNDERSCORE();
             if (*s == '.' && isDIGIT(s[1])) {
                 /* oops, it's really a v-string, but without the "v" */
                 s = start;
@@ -10625,8 +11081,7 @@ Perl_scan_num(pTHX_ const char *start, YYSTYPE* lvalp)
  
             /* stray preinitial _ */
             if (*s == '_') {
-               Perl_ck_warner(aTHX_ packWARN(WARN_SYNTAX),
-                              "Misplaced _ in number");
+               WARN_ABOUT_UNDERSCORE();
                 lastub = s++;
             }
  
@@ -10636,8 +11091,7 @@ Perl_scan_num(pTHX_ const char *start, YYSTYPE* lvalp)
  
             /* stray initial _ */
             if (*s == '_') {
-               Perl_ck_warner(aTHX_ packWARN(WARN_SYNTAX),
-                              "Misplaced _ in number");
+               WARN_ABOUT_UNDERSCORE();
                 lastub = s++;
             }
  
@@ -10651,8 +11105,7 @@ Perl_scan_num(pTHX_ const char *start, YYSTYPE* lvalp)
                 else {
                    if (((lastub && s == lastub + 1)
                          || (!isDIGIT(s[1]) && s[1] != '_')))
-                      Perl_ck_warner(aTHX_ packWARN(WARN_SYNTAX),
-                                     "Misplaced _ in number");
+                       WARN_ABOUT_UNDERSCORE();
                    lastub = s++;
                 }
             }
@@ -10807,8 +11260,7 @@ S_scan_formline(pTHX_ char *s)
         PL_expect = XSTATE;
         if (needargs) {
             const char *s2 = s;
-           while (*s2 == '\r' || *s2 == ' ' || *s2 == '\t' || *s2 == '\f'
-               || *s2 == '\v')
+           while (isSPACE(*s2) && *s2 != '\n')
                 s2++;
             if (*s2 == '{') {
                 PL_expect = XTERMBLOCK;
@@ -10822,7 +11274,7 @@ S_scan_formline(pTHX_ char *s)
             if (UTF && is_utf8_string((U8*)SvPVX_const(stuff), SvCUR(stuff)))
                 SvUTF8_on(stuff);
         }
-       NEXTVAL_NEXTTOKE.opval = (OP*)newSVOP(OP_CONST, 0, stuff);
+        NEXTVAL_NEXTTOKE.opval = newSVOP(OP_CONST, 0, stuff);
         force_next(THING);
      }
      else {
@@ -10953,32 +11405,32 @@ Perl_yyerror_pvn(pTHX_ const char *const s, STRLEN len, U32 flags)
             Perl_sv_catpvf(aTHX_ where_sv, "\\%03o", yychar & 255);
      }
      msg = newSVpvn_flags(s, len, (flags & SVf_UTF8) | SVs_TEMP);
-    Perl_sv_catpvf(aTHX_ msg, " at %s line %"IVdf", ",
+    Perl_sv_catpvf(aTHX_ msg, " at %s line %" IVdf ", ",
          OutCopFILE(PL_curcop),
          (IV)(PL_parser->preambling == NOLINE
                 ? CopLINE(PL_curcop)
                 : PL_parser->preambling));
      if (context)
-       Perl_sv_catpvf(aTHX_ msg, "near \"%"UTF8f"\"\n",
+       Perl_sv_catpvf(aTHX_ msg, "near \"%" UTF8f "\"\n",
                              UTF8fARG(UTF, contlen, context));
      else
-       Perl_sv_catpvf(aTHX_ msg, "%"SVf"\n", SVfARG(where_sv));
+       Perl_sv_catpvf(aTHX_ msg, "%" SVf "\n", SVfARG(where_sv));
      if (PL_multi_start < PL_multi_end && (U32)(CopLINE(PL_curcop) - PL_multi_end) <= 1) {
          Perl_sv_catpvf(aTHX_ msg,
-        "  (Might be a runaway multi-line %c%c string starting on line %"IVdf")\n",
+        "  (Might be a runaway multi-line %c%c string starting on line %" IVdf ")\n",
                  (int)PL_multi_open,(int)PL_multi_close,(IV)PL_multi_start);
          PL_multi_end = 0;
      }
      if (PL_in_eval & EVAL_WARNONLY) {
         PL_in_eval &= ~EVAL_WARNONLY;
-       Perl_ck_warner_d(aTHX_ packWARN(WARN_SYNTAX), "%"SVf, SVfARG(msg));
+       Perl_ck_warner_d(aTHX_ packWARN(WARN_SYNTAX), "%" SVf, SVfARG(msg));
      }
      else
         qerror(msg);
      if (PL_error_count >= 10) {
         SV * errsv;
         if (PL_in_eval && ((errsv = ERRSV), SvCUR(errsv)))
-           Perl_croak(aTHX_ "%"SVf"%s has too many errors.\n",
+           Perl_croak(aTHX_ "%" SVf "%s has too many errors.\n",
                        SVfARG(errsv), OutCopFILE(PL_curcop));
         else
             Perl_croak(aTHX_ "%s has too many errors.\n",
@@ -11101,10 +11553,10 @@ S_utf16_textfilter(pTHX_ int idx, SV *sv, int maxlen)
         Perl_croak(aTHX_ "panic: utf16_textfilter called in block mode (for %d characters)", maxlen);
      }
      if (status < 0) {
-       Perl_croak(aTHX_ "panic: utf16_textfilter called after error (status=%"IVdf")", status);
+       Perl_croak(aTHX_ "panic: utf16_textfilter called after error (status=%" IVdf ")", status);
      }
      DEBUG_P(PerlIO_printf(Perl_debug_log,
-                         "utf16_textfilter(%p,%ce): idx=%d maxlen=%d status=%"IVdf" utf16=%"UVuf" utf8=%"UVuf"\n",
+                         "utf16_textfilter(%p,%ce): idx=%d maxlen=%d status=%" IVdf " utf16=%" UVuf " utf8=%" UVuf "\n",
                           FPTR2DPTR(void *, S_utf16_textfilter),
                           reverse ? 'l' : 'b', idx, maxlen, status,
                           (UV)SvCUR(utf16_buffer), (UV)SvCUR(utf8_buffer)));
@@ -11159,7 +11611,7 @@ S_utf16_textfilter(pTHX_ int idx, SV *sv, int maxlen)
  
             status = FILTER_READ(idx + 1, utf16_buffer,
                                  160 + (SvCUR(utf16_buffer) & 1));
-           DEBUG_P(PerlIO_printf(Perl_debug_log, "utf16_textfilter status=%"IVdf" SvCUR(sv)=%"UVuf"\n", status, (UV)SvCUR(utf16_buffer)));
+           DEBUG_P(PerlIO_printf(Perl_debug_log, "utf16_textfilter status=%" IVdf " SvCUR(sv)=%" UVuf "\n", status, (UV)SvCUR(utf16_buffer)));
             DEBUG_P({ sv_dump(utf16_buffer); sv_dump(utf8_buffer);});
             if (status < 0) {
                 /* Error */
@@ -11195,7 +11647,7 @@ S_utf16_textfilter(pTHX_ int idx, SV *sv, int maxlen)
         }
      }
      DEBUG_P(PerlIO_printf(Perl_debug_log,
-                         "utf16_textfilter: returns, status=%"IVdf" utf16=%"UVuf" utf8=%"UVuf"\n",
+                         "utf16_textfilter: returns, status=%" IVdf " utf16=%" UVuf " utf8=%" UVuf "\n",
                           status,
                           (UV)SvCUR(utf16_buffer), (UV)SvCUR(utf8_buffer)));
      DEBUG_P({ sv_dump(utf8_buffer); sv_dump(sv);});
@@ -11210,7 +11662,7 @@ S_add_utf16_textfilter(pTHX_ U8 *const s, bool reversed)
      PERL_ARGS_ASSERT_ADD_UTF16_TEXTFILTER;
  
      IoTOP_GV(filter) = MUTABLE_GV(newSVpvn((char *)s, PL_bufend - (char*)s));
-    sv_setpvs(filter, "");
+    SvPVCLEAR(filter);
      IoLINES(filter) = reversed;
      IoPAGE(filter) = 1; /* Not EOF */
  
@@ -11276,7 +11728,7 @@ Perl_scan_vstring(pTHX_ const char *s, const char *const e, SV *sv)
         if (*s == 'v')
             s++;  /* get past 'v' */
  
-       sv_setpvs(sv, "");
+        SvPVCLEAR(sv);
  
         for (;;) {
             /* this is atoi() that tolerates underscores */
@@ -11619,7 +12071,7 @@ Perl_parse_label(pTHX_ U32 flags)
         STRLEN wlen, bufptr_pos;
         lex_read_space(0);
         t = s = PL_bufptr;
-        if (!isIDFIRST_lazy_if(s, UTF))
+        if (!isIDFIRST_lazy_if_safe(s, PL_bufend, UTF))
             goto no_label;
         t = scan_word(s, PL_tokenbuf, sizeof PL_tokenbuf, FALSE, &wlen);
         if (word_takes_any_delimiter(s, wlen))
@@ -11726,219 +12178,6 @@ Perl_parse_stmtseq(pTHX_ U32 flags)
      return stmtseqop;
  }
  
-#define parse_opt_lexvar() S_parse_opt_lexvar(aTHX)
-static OP *
-S_parse_opt_lexvar(pTHX)
-{
-    I32 sigil, c;
-    char *s, *d;
-    OP *var;
-    lex_token_boundary();
-    sigil = lex_read_unichar(0);
-    if (lex_peek_unichar(0) == '#') {
-       qerror(Perl_mess(aTHX_ "Parse error"));
-       return NULL;
-    }
-    lex_read_space(0);
-    c = lex_peek_unichar(0);
-    if (c == -1 || !(UTF ? isIDFIRST_uni(c) : isIDFIRST_A(c)))
-       return NULL;
-    s = PL_bufptr;
-    d = PL_tokenbuf + 1;
-    PL_tokenbuf[0] = (char)sigil;
-    parse_ident(&s, &d, PL_tokenbuf + sizeof(PL_tokenbuf) - 1, 0,
-               cBOOL(UTF), FALSE);
-    PL_bufptr = s;
-    if (d == PL_tokenbuf+1)
-       return NULL;
-    var = newOP(sigil == '$' ? OP_PADSV : sigil == '@' ? OP_PADAV : OP_PADHV,
-               OPf_MOD | (OPpLVAL_INTRO<<8));
-    var->op_targ = allocmy(PL_tokenbuf, d - PL_tokenbuf, UTF ? SVf_UTF8 : 0);
-    return var;
-}
-
-OP *
-Perl_parse_subsignature(pTHX)
-{
-    I32 c;
-    int prev_type = 0, pos = 0, min_arity = 0, max_arity = 0;
-    OP *initops = NULL;
-    lex_read_space(0);
-    c = lex_peek_unichar(0);
-    while (c != /*(*/')') {
-       switch (c) {
-           case '$': {
-               OP *var, *expr;
-               if (prev_type == 2)
-                   qerror(Perl_mess(aTHX_ "Slurpy parameter not last"));
-               var = parse_opt_lexvar();
-               expr = var ?
-                   newBINOP(OP_AELEM, 0,
-                       ref(newUNOP(OP_RV2AV, 0, newGVOP(OP_GV, 0, PL_defgv)),
-                           OP_RV2AV),
-                       newSVOP(OP_CONST, 0, newSViv(pos))) :
-                   NULL;
-               lex_read_space(0);
-               c = lex_peek_unichar(0);
-               if (c == '=') {
-                   lex_token_boundary();
-                   lex_read_unichar(0);
-                   lex_read_space(0);
-                   c = lex_peek_unichar(0);
-                   if (c == ',' || c == /*(*/')') {
-                       if (var)
-                           qerror(Perl_mess(aTHX_ "Optional parameter "
-                                   "lacks default expression"));
-                   } else {
-                       OP *defexpr = parse_termexpr(0);
-                       if (defexpr->op_type == OP_UNDEF
-                            && !(defexpr->op_flags & OPf_KIDS))
-                        {
-                           op_free(defexpr);
-                       } else {
-                           OP *ifop = 
-                               newBINOP(OP_GE, 0,
-                                   scalar(newUNOP(OP_RV2AV, 0,
-                                           newGVOP(OP_GV, 0, PL_defgv))),
-                                   newSVOP(OP_CONST, 0, newSViv(pos+1)));
-                           expr = var ?
-                               newCONDOP(0, ifop, expr, defexpr) :
-                               newLOGOP(OP_OR, 0, ifop, defexpr);
-                       }
-                   }
-                   prev_type = 1;
-               } else {
-                   if (prev_type == 1)
-                       qerror(Perl_mess(aTHX_ "Mandatory parameter "
-                               "follows optional parameter"));
-                   prev_type = 0;
-                   min_arity = pos + 1;
-               }
-               if (var) expr = newASSIGNOP(OPf_STACKED, var, 0, expr);
-               if (expr)
-                   initops = op_append_list(OP_LINESEQ, initops,
-                               newSTATEOP(0, NULL, expr));
-               max_arity = ++pos;
-           } break;
-           case '@':
-           case '%': {
-               OP *var;
-               if (prev_type == 2)
-                   qerror(Perl_mess(aTHX_ "Slurpy parameter not last"));
-               var = parse_opt_lexvar();
-               if (c == '%') {
-                   OP *chkop = newLOGOP((pos & 1) ? OP_OR : OP_AND, 0,
-                           newBINOP(OP_BIT_AND, 0,
-                               scalar(newUNOP(OP_RV2AV, 0,
-                                   newGVOP(OP_GV, 0, PL_defgv))),
-                               newSVOP(OP_CONST, 0, newSViv(1))),
-                           op_convert_list(OP_DIE, 0,
-                               op_convert_list(OP_SPRINTF, 0,
-                                   op_append_list(OP_LIST,
-                                       newSVOP(OP_CONST, 0,
-                                           newSVpvs("Odd name/value argument for subroutine at %s line %d.\n")),
-                                       newSLICEOP(0,
-                                           op_append_list(OP_LIST,
-                                               newSVOP(OP_CONST, 0, newSViv(1)),
-                                               newSVOP(OP_CONST, 0, newSViv(2))),
-                                           newOP(OP_CALLER, 0))))));
-                   if (pos != min_arity)
-                       chkop = newLOGOP(OP_AND, 0,
-                                   newBINOP(OP_GT, 0,
-                                       scalar(newUNOP(OP_RV2AV, 0,
-                                           newGVOP(OP_GV, 0, PL_defgv))),
-                                       newSVOP(OP_CONST, 0, newSViv(pos))),
-                                   chkop);
-                   initops = op_append_list(OP_LINESEQ,
-                               newSTATEOP(0, NULL, chkop),
-                               initops);
-               }
-               if (var) {
-                   OP *slice = pos ?
-                       op_prepend_elem(OP_ASLICE,
-                           newOP(OP_PUSHMARK, 0),
-                           newLISTOP(OP_ASLICE, 0,
-                               list(newRANGE(0,
-                                   newSVOP(OP_CONST, 0, newSViv(pos)),
-                                   newUNOP(OP_AV2ARYLEN, 0,
-                                       ref(newUNOP(OP_RV2AV, 0,
-                                               newGVOP(OP_GV, 0, PL_defgv)),
-                                           OP_AV2ARYLEN)))),
-                               ref(newUNOP(OP_RV2AV, 0,
-                                       newGVOP(OP_GV, 0, PL_defgv)),
-                                   OP_ASLICE))) :
-                       newUNOP(OP_RV2AV, 0, newGVOP(OP_GV, 0, PL_defgv));
-                   initops = op_append_list(OP_LINESEQ, initops,
-                       newSTATEOP(0, NULL,
-                           newASSIGNOP(OPf_STACKED, var, 0, slice)));
-               }
-               prev_type = 2;
-               max_arity = -1;
-           } break;
-           default:
-               parse_error:
-               qerror(Perl_mess(aTHX_ "Parse error"));
-               return NULL;
-       }
-       lex_read_space(0);
-       c = lex_peek_unichar(0);
-       switch (c) {
-           case /*(*/')': break;
-           case ',':
-               do {
-                   lex_token_boundary();
-                   lex_read_unichar(0);
-                   lex_read_space(0);
-                   c = lex_peek_unichar(0);
-               } while (c == ',');
-               break;
-           default:
-               goto parse_error;
-       }
-    }
-    if (min_arity != 0) {
-       initops = op_append_list(OP_LINESEQ,
-           newSTATEOP(0, NULL,
-               newLOGOP(OP_OR, 0,
-                   newBINOP(OP_GE, 0,
-                       scalar(newUNOP(OP_RV2AV, 0,
-                           newGVOP(OP_GV, 0, PL_defgv))),
-                       newSVOP(OP_CONST, 0, newSViv(min_arity))),
-                   op_convert_list(OP_DIE, 0,
-                       op_convert_list(OP_SPRINTF, 0,
-                           op_append_list(OP_LIST,
-                               newSVOP(OP_CONST, 0,
-                                   newSVpvs("Too few arguments for subroutine at %s line %d.\n")),
-                               newSLICEOP(0,
-                                   op_append_list(OP_LIST,
-                                       newSVOP(OP_CONST, 0, newSViv(1)),
-                                       newSVOP(OP_CONST, 0, newSViv(2))),
-                                   newOP(OP_CALLER, 0))))))),
-           initops);
-    }
-    if (max_arity != -1) {
-       initops = op_append_list(OP_LINESEQ,
-           newSTATEOP(0, NULL,
-               newLOGOP(OP_OR, 0,
-                   newBINOP(OP_LE, 0,
-                       scalar(newUNOP(OP_RV2AV, 0,
-                           newGVOP(OP_GV, 0, PL_defgv))),
-                       newSVOP(OP_CONST, 0, newSViv(max_arity))),
-                   op_convert_list(OP_DIE, 0,
-                       op_convert_list(OP_SPRINTF, 0,
-                           op_append_list(OP_LIST,
-                               newSVOP(OP_CONST, 0,
-                                   newSVpvs("Too many arguments for subroutine at %s line %d.\n")),
-                               newSLICEOP(0,
-                                   op_append_list(OP_LIST,
-                                       newSVOP(OP_CONST, 0, newSViv(1)),
-                                       newSVOP(OP_CONST, 0, newSViv(2))),
-                                   newOP(OP_CALLER, 0))))))),
-           initops);
-    }
-    return initops;
-}
-
  /*
   * ex: set ts=8 sts=4 sw=4 et:
   */