function to parse isolated label

[perl5.git] / toke.c
diff --git a/toke.c b/toke.c

index d7d5d4d..a30f60b 100644 (file)
--- a/toke.c
+++ b/toke.c
@@ -39,15 +39,13 @@ Individual members of C<PL_parser> have their own documentation.
  #include "EXTERN.h"
  #define PERL_IN_TOKE_C
  #include "perl.h"
+#include "dquote_static.c"
  
  #define new_constant(a,b,c,d,e,f,g)    \
         S_new_constant(aTHX_ a,b,STR_WITH_LEN(c),d,e,f, g)
  
  #define pl_yylval      (PL_parser->yylval)
  
-/* YYINITDEPTH -- initial size of the parser's stacks.  */
-#define YYINITDEPTH 200
-
  /* XXX temporary backwards compatibility */
  #define PL_lex_brackets                (PL_parser->lex_brackets)
  #define PL_lex_brackstack      (PL_parser->lex_brackstack)
@@ -126,8 +124,9 @@ static const char ident_too_long[] = "Identifier too long";
  #  define NEXTVAL_NEXTTOKE PL_nextval[PL_nexttoke]
  #endif
  
-#define XFAKEBRACK 128
-#define XENUMMASK 127
+#define XENUMMASK  0x3f
+#define XFAKEEOF   0x40
+#define XFAKEBRACK 0x80
  
  #ifdef USE_UTF8_SCRIPTS
  #   define UTF (!IN_BYTES)
@@ -645,29 +644,39 @@ S_cr_textfilter(pTHX_ int idx, SV *sv, int maxlen)
  }
  #endif
  
-
-
  /*
- * Perl_lex_start
- *
- * Create a parser object and initialise its parser and lexer fields
- *
- * rsfp       is the opened file handle to read from (if any),
- *
- * line       holds any initial content already read from the file (or in
- *            the case of no file, such as an eval, the whole contents);
- *
- * new_filter indicates that this is a new file and it shouldn't inherit
- *            the filters from the current parser (ie require).
- */
+=for apidoc Amx|void|lex_start|SV *line|PerlIO *rsfp|U32 flags
+
+Creates and initialises a new lexer/parser state object, supplying
+a context in which to lex and parse from a new source of Perl code.
+A pointer to the new state object is placed in L</PL_parser>.  An entry
+is made on the save stack so that upon unwinding the new state object
+will be destroyed and the former value of L</PL_parser> will be restored.
+Nothing else need be done to clean up the parsing context.
+
+The code to be parsed comes from I<line> and I<rsfp>.  I<line>, if
+non-null, provides a string (in SV form) containing code to be parsed.
+A copy of the string is made, so subsequent modification of I<line>
+does not affect parsing.  I<rsfp>, if non-null, provides an input stream
+from which code will be read to be parsed.  If both are non-null, the
+code in I<line> comes first and must consist of complete lines of input,
+and I<rsfp> supplies the remainder of the source.
+
+The I<flags> parameter is reserved for future use, and must always
+be zero.
+
+=cut
+*/
  
  void
-Perl_lex_start(pTHX_ SV *line, PerlIO *rsfp, bool new_filter)
+Perl_lex_start(pTHX_ SV *line, PerlIO *rsfp, U32 flags)
  {
      dVAR;
      const char *s = NULL;
      STRLEN len;
      yy_parser *parser, *oparser;
+    if (flags)
+       Perl_croak(aTHX_ "Lexing code internal error (%s)", "lex_start");
  
      /* create and initialise a parser */
  
@@ -675,13 +684,9 @@ Perl_lex_start(pTHX_ SV *line, PerlIO *rsfp, bool new_filter)
      parser->old_parser = oparser = PL_parser;
      PL_parser = parser;
  
-    Newx(parser->stack, YYINITDEPTH, yy_stack_frame);
-    parser->ps = parser->stack;
-    parser->stack_size = YYINITDEPTH;
-
-    parser->stack->state = 0;
-    parser->yyerrstatus = 0;
-    parser->yychar = YYEMPTY;          /* Cause a token to be read.  */
+    parser->stack = NULL;
+    parser->ps = NULL;
+    parser->stack_size = 0;
  
      /* on scope exit, free this parser and restore any outer one */
      SAVEPARSER(parser);
@@ -699,8 +704,7 @@ Perl_lex_start(pTHX_ SV *line, PerlIO *rsfp, bool new_filter)
      parser->lex_state = LEX_NORMAL;
      parser->expect = XSTATE;
      parser->rsfp = rsfp;
-    parser->rsfp_filters = (new_filter || !oparser) ? newAV()
-               : MUTABLE_AV(SvREFCNT_inc(oparser->rsfp_filters));
+    parser->rsfp_filters = newAV();
  
      Newx(parser->lex_brackstack, 120, char);
      Newx(parser->lex_casestack, 12, char);
@@ -714,14 +718,10 @@ Perl_lex_start(pTHX_ SV *line, PerlIO *rsfp, bool new_filter)
  
      if (!len) {
         parser->linestr = newSVpvs("\n;");
-    } else if (SvREADONLY(line) || s[len-1] != ';') {
-       parser->linestr = newSVsv(line);
+    } else {
+       parser->linestr = newSVpvn_flags(s, len, SvUTF8(line));
         if (s[len-1] != ';')
             sv_catpvs(parser->linestr, "\n;");
-    } else {
-       SvTEMP_off(line);
-       SvREFCNT_inc_simple_void_NN(line);
-       parser->linestr = line;
      }
      parser->oldoldbufptr =
         parser->oldbufptr =
@@ -729,6 +729,8 @@ Perl_lex_start(pTHX_ SV *line, PerlIO *rsfp, bool new_filter)
         parser->linestart = SvPVX(parser->linestr);
      parser->bufend = parser->bufptr + SvCUR(parser->linestr);
      parser->last_lop = parser->last_uni = NULL;
+
+    parser->in_pod = 0;
  }
  
  
@@ -749,7 +751,6 @@ Perl_parser_free(pTHX_  const yy_parser *parser)
         PerlIO_close(parser->rsfp);
      SvREFCNT_dec(parser->rsfp_filters);
  
-    Safefree(parser->stack);
      Safefree(parser->lex_brackstack);
      Safefree(parser->lex_casestack);
      PL_parser = parser->old_parser;
@@ -758,19 +759,6 @@ Perl_parser_free(pTHX_  const yy_parser *parser)
  
  
  /*
- * Perl_lex_end
- * Finalizer for lexing operations.  Must be called when the parser is
- * done with the lexer.
- */
-
-void
-Perl_lex_end(pTHX)
-{
-    dVAR;
-    PL_doextract = FALSE;
-}
-
-/*
  =for apidoc AmxU|SV *|PL_parser-E<gt>linestr
  
  Buffer scalar containing the chunk currently under consideration of the
@@ -929,7 +917,7 @@ at I<pv>.  These octets are interpreted as either UTF-8 or Latin-1,
  according to whether the C<LEX_STUFF_UTF8> flag is set in I<flags>.
  The characters are recoded for the lexer buffer, according to how the
  buffer is currently being interpreted (L</lex_bufutf8>).  If a string
-to be interpreted is available as a Perl scalar, the L</lex_stuff_sv>
+to be inserted is available as a Perl scalar, the L</lex_stuff_sv>
  function is more convenient.
  
  =cut
@@ -1021,6 +1009,35 @@ Perl_lex_stuff_pvn(pTHX_ const char *pv, STRLEN len, U32 flags)
  }
  
  /*
+=for apidoc Amx|void|lex_stuff_pv|const char *pv|U32 flags
+
+Insert characters into the lexer buffer (L</PL_parser-E<gt>linestr>),
+immediately after the current lexing point (L</PL_parser-E<gt>bufptr>),
+reallocating the buffer if necessary.  This means that lexing code that
+runs later will see the characters as if they had appeared in the input.
+It is not recommended to do this as part of normal parsing, and most
+uses of this facility run the risk of the inserted characters being
+interpreted in an unintended manner.
+
+The string to be inserted is represented by octets starting at I<pv>
+and continuing to the first nul.  These octets are interpreted as either
+UTF-8 or Latin-1, according to whether the C<LEX_STUFF_UTF8> flag is set
+in I<flags>.  The characters are recoded for the lexer buffer, according
+to how the buffer is currently being interpreted (L</lex_bufutf8>).
+If it is not convenient to nul-terminate a string to be inserted, the
+L</lex_stuff_pvn> function is more appropriate.
+
+=cut
+*/
+
+void
+Perl_lex_stuff_pv(pTHX_ const char *pv, U32 flags)
+{
+    PERL_ARGS_ASSERT_LEX_STUFF_PV;
+    lex_stuff_pvn(pv, strlen(pv), flags);
+}
+
+/*
  =for apidoc Amx|void|lex_stuff_sv|SV *sv|U32 flags
  
  Insert characters into the lexer buffer (L</PL_parser-E<gt>linestr>),
@@ -1033,7 +1050,7 @@ interpreted in an unintended manner.
  
  The string to be inserted is the string value of I<sv>.  The characters
  are recoded for the lexer buffer, according to how the buffer is currently
-being interpreted (L</lex_bufutf8>).  If a string to be interpreted is
+being interpreted (L</lex_bufutf8>).  If a string to be inserted is
  not already a Perl scalar, the L</lex_stuff_pvn> function avoids the
  need to construct a scalar.
  
@@ -1248,7 +1265,7 @@ Perl_lex_next_chunk(pTHX_ U32 flags)
         else if (PL_parser->rsfp)
             (void)PerlIO_close(PL_parser->rsfp);
         PL_parser->rsfp = NULL;
-       PL_doextract = FALSE;
+       PL_parser->in_pod = 0;
  #ifdef PERL_MAD
         if (PL_madskills && !PL_in_eval && (PL_minus_p || PL_minus_n))
             PL_faketokens = 1;
@@ -1928,6 +1945,24 @@ S_force_next(pTHX_ I32 type)
  #endif
  }
  
+void
+Perl_yyunlex(pTHX)
+{
+    int yyc = PL_parser->yychar;
+    if (yyc != YYEMPTY) {
+       if (yyc) {
+           start_force(-1);
+           NEXTVAL_NEXTTOKE = PL_parser->yylval;
+           if (yyc == '{'/*}*/ || yyc == HASHBRACK || yyc == '['/*]*/) {
+               PL_lex_brackets--;
+               yyc |= (1<<24) | (PL_lex_brackstack[PL_lex_brackets] << 16);
+           }
+           force_next(yyc);
+       }
+       PL_parser->yychar = YYEMPTY;
+    }
+}
+
  STATIC SV *
  S_newSV_maybe_utf8(pTHX_ const char *const start, STRLEN len)
  {
@@ -2218,7 +2253,8 @@ S_tokeq(pTHX_ SV *sv)
      if (SvTYPE(sv) >= SVt_PVIV && SvIVX(sv) == -1)
         goto finish;
      send = s + len;
-    while (s < send && *s != '\\')
+    /* This is relying on the SV being "well formed" with a trailing '\0'  */
+    while (s < send && !(*s == '\\' && s[1] == '\\'))
         s++;
      if (s == send)
         goto finish;
@@ -2811,7 +2847,8 @@ S_scan_const(pTHX_ char *start)
  
             s++;
  
-           /* deprecate \1 in strings and substitution replacements */
+           /* warn on \1 - \9 in substitution replacements, but note that \11
+            * is an octal; and \19 is \1 followed by '9' */
             if (PL_lex_inwhat == OP_SUBST && !PL_lex_inpat &&
                 isDIGIT(*s) && *s != '0' && !isDIGIT(s[1]))
             {
@@ -2866,7 +2903,7 @@ S_scan_const(pTHX_ char *start)
                     goto default_action;
                 }
  
-           /* eg. \132 indicates the octal constant 0x132 */
+           /* eg. \132 indicates the octal constant 0132 */
             case '0': case '1': case '2': case '3':
             case '4': case '5': case '6': case '7':
                 {
@@ -2877,6 +2914,21 @@ S_scan_const(pTHX_ char *start)
                 }
                 goto NUM_ESCAPE_INSERT;
  
+           /* eg. \o{24} indicates the octal constant \024 */
+           case 'o':
+               {
+                   STRLEN len;
+                   const char* error;
+
+                   bool valid = grok_bslash_o(s, &uv, &len, &error, 1);
+                   s += len;
+                   if (! valid) {
+                       yyerror(error);
+                       continue;
+                   }
+                   goto NUM_ESCAPE_INSERT;
+               }
+
             /* eg. \x24 indicates the hex constant 0x24 */
             case 'x':
                 ++s;
@@ -3463,19 +3515,10 @@ S_intuit_more(pTHX_ register char *s)
  
      /* In a pattern, so maybe we have {n,m}. */
      if (*s == '{') {
-       s++;
-       if (!isDIGIT(*s))
-           return TRUE;
-       while (isDIGIT(*s))
-           s++;
-       if (*s == ',')
-           s++;
-       while (isDIGIT(*s))
-           s++;
-       if (*s == '}')
+       if (regcurly(s)) {
             return FALSE;
+       }
         return TRUE;
-       
      }
  
      /* On the other hand, maybe we have a character class */
@@ -3756,8 +3799,6 @@ Perl_filter_del(pTHX_ filter_t funcp)
      /* if filter is on top of stack (usual case) just pop it off */
      datasv = FILTER_DATA(AvFILLp(PL_rsfp_filters));
      if (IoANY(datasv) == FPTR2DPTR(void *, funcp)) {
-       IoFLAGS(datasv) &= ~IOf_FAKE_DIRP;
-       IoANY(datasv) = (void *)NULL;
         sv_free(av_pop(PL_rsfp_filters));
  
          return;
@@ -3913,7 +3954,7 @@ S_readpipe_override(pTHX)
              && GvCVu(gv_readpipe) && GvIMPORTED_CV(gv_readpipe)))
      {
         PL_lex_op = (OP*)newUNOP(OP_ENTERSUB, OPf_STACKED,
-           append_elem(OP_LIST,
+           op_append_elem(OP_LIST,
                 newSVOP(OP_CONST, 0, &PL_sv_undef), /* value will be read later */
                 newCVREF(0, newGVOP(OP_GV, 0, gv_readpipe))));
      }
@@ -3938,7 +3979,7 @@ Perl_madlex(pTHX)
      PL_thismad = 0;
  
      /* just do what yylex would do on pending identifier; leave PL_thiswhite alone */
-    if (PL_pending_ident)
+    if (PL_lex_state != LEX_KNOWNEXT && PL_pending_ident)
          return S_pending_ident(aTHX);
  
      /* previous token ate up our whitespace? */
@@ -4141,6 +4182,16 @@ S_tokenize_use(pTHX_ int is_use, char *s) {
         };
  #endif
  
+#define word_takes_any_delimeter(p,l) S_word_takes_any_delimeter(p,l)
+STATIC bool
+S_word_takes_any_delimeter(char *p, STRLEN len)
+{
+    return (len == 1 && strchr("msyq", p[0])) ||
+          (len == 2 && (
+           (p[0] == 't' && p[1] == 'r') ||
+           (p[0] == 'q' && strchr("qwxr", p[1]))));
+}
+
  /*
    yylex
  
@@ -4197,7 +4248,7 @@ Perl_yylex(pTHX)
         SvREFCNT_dec(tmp);
      } );
      /* check if there's an identifier for us to look at */
-    if (PL_pending_ident)
+    if (PL_lex_state != LEX_KNOWNEXT && PL_pending_ident)
          return REPORT(S_pending_ident(aTHX));
  
      /* no identifier pending identification */
@@ -4240,12 +4291,26 @@ Perl_yylex(pTHX)
             PL_lex_defer = LEX_NORMAL;
         }
  #endif
+       {
+           I32 next_type;
+#ifdef PERL_MAD
+           next_type = PL_nexttoke[PL_lasttoke].next_type;
+#else
+           next_type = PL_nexttype[PL_nexttoke];
+#endif
+           if (next_type & (1<<24)) {
+               if (PL_lex_brackets > 100)
+                   Renew(PL_lex_brackstack, PL_lex_brackets + 10, char);
+               PL_lex_brackstack[PL_lex_brackets++] = (next_type >> 16) & 0xff;
+               next_type &= 0xffff;
+           }
  #ifdef PERL_MAD
-       /* FIXME - can these be merged?  */
-       return(PL_nexttoke[PL_lasttoke].next_type);
+           /* FIXME - can these be merged?  */
+           return next_type;
  #else
-       return REPORT(PL_nexttype[PL_nexttoke]);
+           return REPORT(next_type);
  #endif
+       }
  
      /* interpolated case modifiers like \L \U, including \Q and \E.
         when we get here, PL_bufptr is at the \
@@ -4535,7 +4600,8 @@ Perl_yylex(pTHX)
         if (!PL_rsfp) {
             PL_last_uni = 0;
             PL_last_lop = 0;
-           if (PL_lex_brackets) {
+           if (PL_lex_brackets &&
+                   PL_lex_brackstack[PL_lex_brackets-1] != XFAKEEOF) {
                 yyerror((const char *)
                         (PL_lex_formbrack
                          ? "Format not terminated"
@@ -4658,7 +4724,7 @@ Perl_yylex(pTHX)
                     s = swallow_bom((U8*)s);
                 }
             }
-           if (PL_doextract) {
+           if (PL_parser->in_pod) {
                 /* Incest with pod. */
  #ifdef PERL_MAD
                 if (PL_madskills)
@@ -4669,12 +4735,12 @@ Perl_yylex(pTHX)
                     PL_oldoldbufptr = PL_oldbufptr = s = PL_linestart = SvPVX(PL_linestr);
                     PL_bufend = SvPVX(PL_linestr) + SvCUR(PL_linestr);
                     PL_last_lop = PL_last_uni = NULL;
-                   PL_doextract = FALSE;
+                   PL_parser->in_pod = 0;
                 }
             }
             if (PL_rsfp)
                 incline(s);
-       } while (PL_doextract);
+       } while (PL_parser->in_pod);
         PL_oldoldbufptr = PL_oldbufptr = PL_bufptr = PL_linestart = s;
         PL_bufend = SvPVX(PL_linestr) + SvCUR(PL_linestr);
         PL_last_lop = PL_last_uni = NULL;
@@ -5124,7 +5190,9 @@ Perl_yylex(pTHX)
         s++;
         BOop(OP_BIT_XOR);
      case '[':
-       PL_lex_brackets++;
+       if (PL_lex_brackets > 100)
+           Renew(PL_lex_brackstack, PL_lex_brackets + 10, char);
+       PL_lex_brackstack[PL_lex_brackets++] = 0;
         {
             const char tmp = *s++;
             OPERATOR(tmp);
@@ -5208,7 +5276,7 @@ Perl_yylex(pTHX)
                 }
                 if (PL_lex_stuff) {
                     sv_catsv(sv, PL_lex_stuff);
-                   attrs = append_elem(OP_LIST, attrs,
+                   attrs = op_append_elem(OP_LIST, attrs,
                                         newSVOP(OP_CONST, 0, sv));
                     SvREFCNT_dec(PL_lex_stuff);
                     PL_lex_stuff = NULL;
@@ -5248,7 +5316,7 @@ Perl_yylex(pTHX)
                        justified by the performance win for the common case
                        of applying only built-in attributes.) */
                     else
-                       attrs = append_elem(OP_LIST, attrs,
+                       attrs = op_append_elem(OP_LIST, attrs,
                                             newSVOP(OP_CONST, 0,
                                                     sv));
                 }
@@ -5324,6 +5392,8 @@ Perl_yylex(pTHX)
             TERM(tmp);
         }
      case ']':
+       if (PL_lex_brackets && PL_lex_brackstack[PL_lex_brackets-1] == XFAKEEOF)
+           TOKEN(0);
         s++;
         if (PL_lex_brackets <= 0)
             yyerror("Unmatched right square bracket");
@@ -5501,6 +5571,8 @@ Perl_yylex(pTHX)
             PL_copline = NOLINE;   /* invalidate current command line number */
         TOKEN('{');
      case '}':
+       if (PL_lex_brackets && PL_lex_brackstack[PL_lex_brackets-1] == XFAKEEOF)
+           TOKEN(0);
        rightbracket:
         s++;
         if (PL_lex_brackets <= 0)
@@ -5623,7 +5695,7 @@ Perl_yylex(pTHX)
                     }
  #endif
                     s = PL_bufend;
-                   PL_doextract = TRUE;
+                   PL_parser->in_pod = 1;
                     goto retry;
                 }
         }
@@ -6087,10 +6159,7 @@ Perl_yylex(pTHX)
         s = scan_word(s, PL_tokenbuf, sizeof PL_tokenbuf, FALSE, &len);
  
         /* Some keywords can be followed by any delimiter, including ':' */
-       anydelim = ((len == 1 && strchr("msyq", PL_tokenbuf[0])) ||
-              (len == 2 && ((PL_tokenbuf[0] == 't' && PL_tokenbuf[1] == 'r') ||
-                            (PL_tokenbuf[0] == 'q' &&
-                             strchr("qwxr", PL_tokenbuf[1])))));
+       anydelim = word_takes_any_delimeter(PL_tokenbuf, len);
  
         /* x::* is just a word, unless x is "CORE" */
         if (!anydelim && *s == ':' && s[1] == ':' && strNE(PL_tokenbuf, "CORE"))
@@ -6116,7 +6185,7 @@ Perl_yylex(pTHX)
             int result;
             char *saved_bufptr = PL_bufptr;
             PL_bufptr = s;
-           result = CALL_FPTR(PL_keyword_plugin)(aTHX_ PL_tokenbuf, len, &o);
+           result = PL_keyword_plugin(aTHX_ PL_tokenbuf, len, &o);
             s = PL_bufptr;
             if (result == KEYWORD_PLUGIN_DECLINE) {
                 /* not a plugged-in keyword */
@@ -6190,8 +6259,9 @@ Perl_yylex(pTHX)
                 gvp = 0;
                 if (hgv && tmp != KEY_x && tmp != KEY_CORE)     /* never ambiguous */
                     Perl_ck_warner(aTHX_ packWARN(WARN_AMBIGUOUS),
-                                  "Ambiguous call resolved as CORE::%s(), %s",
-                                  GvENAME(hgv), "qualify as such or use &");
+                                  "Ambiguous call resolved as CORE::%s(), "
+                                  "qualify as such or use &",
+                                  GvENAME(hgv));
             }
         }
  
@@ -6274,16 +6344,15 @@ Perl_yylex(pTHX)
  
                 /* if we saw a global override before, get the right name */
  
+               sv = S_newSV_maybe_utf8(aTHX_ PL_tokenbuf,
+                   len ? len : strlen(PL_tokenbuf));
                 if (gvp) {
+                   SV * const tmp_sv = sv;
                     sv = newSVpvs("CORE::GLOBAL::");
-                   sv_catpv(sv,PL_tokenbuf);
-               }
-               else {
-                   /* If len is 0, newSVpv does strlen(), which is correct.
-                      If len is non-zero, then it will be the true length,
-                      and so the scalar will be created correctly.  */
-                   sv = newSVpv(PL_tokenbuf,len);
+                   sv_catsv(sv, tmp_sv);
+                   SvREFCNT_dec(tmp_sv);
                 }
+
  #ifdef PERL_MAD
                 if (PL_madskills && !PL_thistoken) {
                     char *start = SvPVX(PL_linestr) + PL_realtokenstart;
@@ -6293,43 +6362,20 @@ Perl_yylex(pTHX)
  #endif
  
                 /* Presume this is going to be a bareword of some sort. */
-
                 CLINE;
                 pl_yylval.opval = (OP*)newSVOP(OP_CONST, 0, sv);
                 pl_yylval.opval->op_private = OPpCONST_BARE;
-               /* UTF-8 package name? */
-               if (UTF && !IN_BYTES &&
-                   is_utf8_string((U8*)SvPVX_const(sv), SvCUR(sv)))
-                   SvUTF8_on(sv);
  
                 /* And if "Foo::", then that's what it certainly is. */
-
                 if (len)
                     goto safe_bareword;
  
-               cv = NULL;
                 {
                     OP *const_op = newSVOP(OP_CONST, 0, SvREFCNT_inc(sv));
                     const_op->op_private = OPpCONST_BARE;
                     rv2cv_op = newCVREF(0, const_op);
                 }
-               if (rv2cv_op->op_type == OP_RV2CV &&
-                       (rv2cv_op->op_flags & OPf_KIDS)) {
-                   OP *rv_op = cUNOPx(rv2cv_op)->op_first;
-                   switch (rv_op->op_type) {
-                       case OP_CONST: {
-                           SV *sv = cSVOPx_sv(rv_op);
-                           if (SvROK(sv) && SvTYPE(SvRV(sv)) == SVt_PVCV)
-                               cv = (CV*)SvRV(sv);
-                       } break;
-                       case OP_GV: {
-                           GV *gv = cGVOPx_gv(rv_op);
-                           CV *maybe_cv = GvCVu(gv);
-                           if (maybe_cv && SvTYPE((SV*)maybe_cv) == SVt_PVCV)
-                               cv = maybe_cv;
-                       } break;
-                   }
-               }
+               cv = rv2cv_op_cv(rv2cv_op, 0);
  
                 /* See if it's the indirect object for a list operator. */
  
@@ -6479,10 +6525,27 @@ Perl_yylex(pTHX)
                         const char *proto = SvPV_const(MUTABLE_SV(cv), protolen);
                         if (!protolen)
                             TERM(FUNC0SUB);
-                       if ((*proto == '$' || *proto == '_') && proto[1] == '\0')
-                           OPERATOR(UNIOPSUB);
                         while (*proto == ';')
                             proto++;
+                       if (
+                           (
+                               (
+                                   *proto == '$' || *proto == '_'
+                                || *proto == '*' || *proto == '+'
+                               )
+                            && proto[1] == '\0'
+                           )
+                        || (
+                            *proto == '\\' && proto[1] && proto[2] == '\0'
+                           )
+                       )
+                           OPERATOR(UNIOPSUB);
+                       if (*proto == '\\' && proto[1] == '[') {
+                           const char *p = proto + 2;
+                           while(*p && *p != ']')
+                               ++p;
+                           if(*p == ']' && !p[1]) OPERATOR(UNIOPSUB);
+                       }
                         if (*proto == '&' && *s == '{') {
                             if (PL_curstash)
                                 sv_setpvs(PL_subname, "__ANON__");
@@ -6864,7 +6927,13 @@ Perl_yylex(pTHX)
             UNI(OP_DELETE);
  
         case KEY_dbmopen:
-           gv_fetchpvs("AnyDBM_File::ISA", GV_ADDMULTI, SVt_PVAV);
+           Perl_populate_isa(aTHX_ STR_WITH_LEN("AnyDBM_File::ISA"),
+                             STR_WITH_LEN("NDBM_File::"),
+                             STR_WITH_LEN("DB_File::"),
+                             STR_WITH_LEN("GDBM_File::"),
+                             STR_WITH_LEN("SDBM_File::"),
+                             STR_WITH_LEN("ODBM_File::"),
+                             NULL);
             LOP(OP_DBMOPEN,XTERM);
  
         case KEY_dbmclose:
@@ -7290,14 +7359,13 @@ Perl_yylex(pTHX)
         case KEY_quotemeta:
             UNI(OP_QUOTEMETA);
  
-       case KEY_qw:
+       case KEY_qw: {
+           OP *words = NULL;
             s = scan_str(s,!!PL_madskills,FALSE);
             if (!s)
                 missingterm(NULL);
             PL_expect = XOPERATOR;
-           force_next(')');
             if (SvCUR(PL_lex_stuff)) {
-               OP *words = NULL;
                 int warned = 0;
                 d = SvPV_force(PL_lex_stuff, len);
                 while (len) {
@@ -7325,22 +7393,21 @@ Perl_yylex(pTHX)
                                 /**/;
                         }
                         sv = newSVpvn_utf8(b, d-b, DO_UTF8(PL_lex_stuff));
-                       words = append_elem(OP_LIST, words,
+                       words = op_append_elem(OP_LIST, words,
                                             newSVOP(OP_CONST, 0, tokeq(sv)));
                     }
                 }
-               if (words) {
-                   start_force(PL_curforce);
-                   NEXTVAL_NEXTTOKE.opval = words;
-                   force_next(THING);
-               }
             }
+           if (!words)
+               words = newNULLLIST();
             if (PL_lex_stuff) {
                 SvREFCNT_dec(PL_lex_stuff);
                 PL_lex_stuff = NULL;
             }
-           PL_expect = XTERM;
-           TOKEN('(');
+           PL_expect = XOPERATOR;
+           pl_yylval.opval = sawparens(words);
+           TOKEN(QWLIST);
+       }
  
         case KEY_qq:
             s = scan_str(s,!!PL_madskills,FALSE);
@@ -7676,7 +7743,7 @@ Perl_yylex(pTHX)
                             if (warnillegalproto) {
                                 if (must_be_last)
                                     proto_after_greedy_proto = TRUE;
-                               if (!strchr("$@%*;[]&\\_", *p)) {
+                               if (!strchr("$@%*;[]&\\_+", *p)) {
                                     bad_proto = TRUE;
                                 }
                                 else {
@@ -11973,8 +12040,14 @@ S_scan_subst(pTHX_ char *start)
         }
         else if (strchr(S_PAT_MODS, *s))
             pm->op_pmflags = S_pmflag(pm->op_pmflags, *s++);
-       else
+       else {
+           if (isALNUM(*s)) {
+               Perl_ck_warner_d(aTHX_ packWARN(WARN_SYNTAX),
+                   "Having no space between pattern and following word is deprecated");
+
+           }
             break;
+       }
      }
  
  #ifdef PERL_MAD
@@ -12487,7 +12560,7 @@ S_scan_inputsymbol(pTHX_ char *start)
                     o->op_targ = tmp;
                     PL_lex_op = readline_overriden
                         ? (OP*)newUNOP(OP_ENTERSUB, OPf_STACKED,
-                               append_elem(OP_LIST, o,
+                               op_append_elem(OP_LIST, o,
                                     newCVREF(0, newGVOP(OP_GV,0,gv_readline))))
                         : (OP*)newUNOP(OP_READLINE, 0, o);
                 }
@@ -12503,7 +12576,7 @@ intro_sym:
                                 SVt_PV);
                 PL_lex_op = readline_overriden
                     ? (OP*)newUNOP(OP_ENTERSUB, OPf_STACKED,
-                           append_elem(OP_LIST,
+                           op_append_elem(OP_LIST,
                                 newUNOP(OP_RV2SV, 0, newGVOP(OP_GV, 0, gv)),
                                 newCVREF(0, newGVOP(OP_GV, 0, gv_readline))))
                     : (OP*)newUNOP(OP_READLINE, 0,
@@ -12522,7 +12595,7 @@ intro_sym:
             GV * const gv = gv_fetchpv(d, GV_ADD, SVt_PVIO);
             PL_lex_op = readline_overriden
                 ? (OP*)newUNOP(OP_ENTERSUB, OPf_STACKED,
-                       append_elem(OP_LIST,
+                       op_append_elem(OP_LIST,
                             newGVOP(OP_GV, 0, gv),
                             newCVREF(0, newGVOP(OP_GV, 0, gv_readline))))
                 : (OP*)newUNOP(OP_READLINE, 0, newGVOP(OP_GV, 0, gv));
@@ -12972,11 +13045,11 @@ Perl_scan_num(pTHX_ const char *start, YYSTYPE* lvalp)
             const char *base, *Base, *max;
  
             /* check for hex */
-           if (s[1] == 'x') {
+           if (s[1] == 'x' || s[1] == 'X') {
                 shift = 4;
                 s += 2;
                 just_zero = FALSE;
-           } else if (s[1] == 'b') {
+           } else if (s[1] == 'b' || s[1] == 'B') {
                 shift = 1;
                 s += 2;
                 just_zero = FALSE;
@@ -13907,6 +13980,282 @@ Perl_keyword_plugin_standard(pTHX_
      return KEYWORD_PLUGIN_DECLINE;
  }
  
+#define parse_recdescent(g) S_parse_recdescent(aTHX_ g)
+static void
+S_parse_recdescent(pTHX_ int gramtype)
+{
+    SAVEI32(PL_lex_brackets);
+    if (PL_lex_brackets > 100)
+       Renew(PL_lex_brackstack, PL_lex_brackets + 10, char);
+    PL_lex_brackstack[PL_lex_brackets++] = XFAKEEOF;
+    if(yyparse(gramtype) && !PL_parser->error_count)
+       qerror(Perl_mess(aTHX_ "Parse error"));
+}
+
+#define parse_recdescent_for_op(g) S_parse_recdescent_for_op(aTHX_ g)
+static OP *
+S_parse_recdescent_for_op(pTHX_ int gramtype)
+{
+    OP *o;
+    ENTER;
+    SAVEVPTR(PL_eval_root);
+    PL_eval_root = NULL;
+    parse_recdescent(gramtype);
+    o = PL_eval_root;
+    LEAVE;
+    return o;
+}
+
+/*
+=for apidoc Amx|OP *|parse_block|U32 flags
+
+Parse a single complete Perl code block.  This consists of an opening
+brace, a sequence of statements, and a closing brace.  The block
+constitutes a lexical scope, so C<my> variables and various compile-time
+effects can be contained within it.  It is up to the caller to ensure
+that the dynamic parser state (L</PL_parser> et al) is correctly set to
+reflect the source of the code to be parsed and the lexical context for
+the statement.
+
+The op tree representing the code block is returned.  This is always a
+real op, never a null pointer.  It will normally be a C<lineseq> list,
+including C<nextstate> or equivalent ops.  No ops to construct any kind
+of runtime scope are included by virtue of it being a block.
+
+If an error occurs in parsing or compilation, in most cases a valid op
+tree (most likely null) is returned anyway.  The error is reflected in
+the parser state, normally resulting in a single exception at the top
+level of parsing which covers all the compilation errors that occurred.
+Some compilation errors, however, will throw an exception immediately.
+
+The I<flags> parameter is reserved for future use, and must always
+be zero.
+
+=cut
+*/
+
+OP *
+Perl_parse_block(pTHX_ U32 flags)
+{
+    if (flags)
+       Perl_croak(aTHX_ "Parsing code internal error (%s)", "parse_block");
+    return parse_recdescent_for_op(GRAMBLOCK);
+}
+
+/*
+=for apidoc Amx|OP *|parse_barestmt|U32 flags
+
+Parse a single unadorned Perl statement.  This may be a normal imperative
+statement or a declaration that has compile-time effect.  It does not
+include any label or other affixture.  It is up to the caller to ensure
+that the dynamic parser state (L</PL_parser> et al) is correctly set to
+reflect the source of the code to be parsed and the lexical context for
+the statement.
+
+The op tree representing the statement is returned.  This may be a
+null pointer if the statement is null, for example if it was actually
+a subroutine definition (which has compile-time side effects).  If not
+null, it will be ops directly implementing the statement, suitable to
+pass to L</newSTATEOP>.  It will not normally include a C<nextstate> or
+equivalent op (except for those embedded in a scope contained entirely
+within the statement).
+
+If an error occurs in parsing or compilation, in most cases a valid op
+tree (most likely null) is returned anyway.  The error is reflected in
+the parser state, normally resulting in a single exception at the top
+level of parsing which covers all the compilation errors that occurred.
+Some compilation errors, however, will throw an exception immediately.
+
+The I<flags> parameter is reserved for future use, and must always
+be zero.
+
+=cut
+*/
+
+OP *
+Perl_parse_barestmt(pTHX_ U32 flags)
+{
+    if (flags)
+       Perl_croak(aTHX_ "Parsing code internal error (%s)", "parse_barestmt");
+    return parse_recdescent_for_op(GRAMBARESTMT);
+}
+
+/*
+=for apidoc Amx|SV *|parse_label|U32 flags
+
+Parse a single label, possibly optional, of the type that may prefix a
+Perl statement.  It is up to the caller to ensure that the dynamic parser
+state (L</PL_parser> et al) is correctly set to reflect the source of
+the code to be parsed.  If I<flags> includes C<PARSE_OPTIONAL> then the
+label is optional, otherwise it is mandatory.
+
+The name of the label is returned in the form of a fresh scalar.  If an
+optional label is absent, a null pointer is returned.
+
+If an error occurs in parsing, which can only occur if the label is
+mandatory, a valid label is returned anyway.  The error is reflected in
+the parser state, normally resulting in a single exception at the top
+level of parsing which covers all the compilation errors that occurred.
+
+=cut
+*/
+
+SV *
+Perl_parse_label(pTHX_ U32 flags)
+{
+    if (flags & ~PARSE_OPTIONAL)
+       Perl_croak(aTHX_ "Parsing code internal error (%s)", "parse_label");
+    if (PL_lex_state == LEX_KNOWNEXT) {
+       PL_parser->yychar = yylex();
+       if (PL_parser->yychar == LABEL) {
+           char *lpv = pl_yylval.pval;
+           STRLEN llen = strlen(lpv);
+           SV *lsv;
+           PL_parser->yychar = YYEMPTY;
+           lsv = newSV_type(SVt_PV);
+           SvPV_set(lsv, lpv);
+           SvCUR_set(lsv, llen);
+           SvLEN_set(lsv, llen+1);
+           SvPOK_on(lsv);
+           return lsv;
+       } else {
+           yyunlex();
+           goto no_label;
+       }
+    } else {
+       char *s, *t;
+       U8 c;
+       STRLEN wlen, bufptr_pos;
+       lex_read_space(0);
+       t = s = PL_bufptr;
+       c = (U8)*s;
+       if (!isIDFIRST_A(c))
+           goto no_label;
+       do {
+           c = (U8)*++t;
+       } while(isWORDCHAR_A(c));
+       wlen = t - s;
+       if (word_takes_any_delimeter(s, wlen))
+           goto no_label;
+       bufptr_pos = s - SvPVX(PL_linestr);
+       PL_bufptr = t;
+       lex_read_space(LEX_KEEP_PREVIOUS);
+       t = PL_bufptr;
+       s = SvPVX(PL_linestr) + bufptr_pos;
+       if (t[0] == ':' && t[1] != ':') {
+           PL_oldoldbufptr = PL_oldbufptr;
+           PL_oldbufptr = s;
+           PL_bufptr = t+1;
+           return newSVpvn(s, wlen);
+       } else {
+           PL_bufptr = s;
+           no_label:
+           if (flags & PARSE_OPTIONAL) {
+               return NULL;
+           } else {
+               qerror(Perl_mess(aTHX_ "Parse error"));
+               return newSVpvs("x");
+           }
+       }
+    }
+}
+
+/*
+=for apidoc Amx|OP *|parse_fullstmt|U32 flags
+
+Parse a single complete Perl statement.  This may be a normal imperative
+statement or a declaration that has compile-time effect, and may include
+an optional label.  It is up to the caller to ensure that the dynamic
+parser state (L</PL_parser> et al) is correctly set to reflect the source
+of the code to be parsed and the lexical context for the statement.
+
+The op tree representing the statement is returned.  This may be a
+null pointer if the statement is null, for example if it was actually
+a subroutine definition (which has compile-time side effects).  If not
+null, it will be the result of a L</newSTATEOP> call, normally including
+a C<nextstate> or equivalent op.
+
+If an error occurs in parsing or compilation, in most cases a valid op
+tree (most likely null) is returned anyway.  The error is reflected in
+the parser state, normally resulting in a single exception at the top
+level of parsing which covers all the compilation errors that occurred.
+Some compilation errors, however, will throw an exception immediately.
+
+The I<flags> parameter is reserved for future use, and must always
+be zero.
+
+=cut
+*/
+
+OP *
+Perl_parse_fullstmt(pTHX_ U32 flags)
+{
+    if (flags)
+       Perl_croak(aTHX_ "Parsing code internal error (%s)", "parse_fullstmt");
+    return parse_recdescent_for_op(GRAMFULLSTMT);
+}
+
+/*
+=for apidoc Amx|OP *|parse_stmtseq|U32 flags
+
+Parse a sequence of zero or more Perl statements.  These may be normal
+imperative statements, including optional labels, or declarations
+that have compile-time effect, or any mixture thereof.  The statement
+sequence ends when a closing brace or end-of-file is encountered in a
+place where a new statement could have validly started.  It is up to
+the caller to ensure that the dynamic parser state (L</PL_parser> et al)
+is correctly set to reflect the source of the code to be parsed and the
+lexical context for the statements.
+
+The op tree representing the statement sequence is returned.  This may
+be a null pointer if the statements were all null, for example if there
+were no statements or if there were only subroutine definitions (which
+have compile-time side effects).  If not null, it will be a C<lineseq>
+list, normally including C<nextstate> or equivalent ops.
+
+If an error occurs in parsing or compilation, in most cases a valid op
+tree is returned anyway.  The error is reflected in the parser state,
+normally resulting in a single exception at the top level of parsing
+which covers all the compilation errors that occurred.  Some compilation
+errors, however, will throw an exception immediately.
+
+The I<flags> parameter is reserved for future use, and must always
+be zero.
+
+=cut
+*/
+
+OP *
+Perl_parse_stmtseq(pTHX_ U32 flags)
+{
+    OP *stmtseqop;
+    I32 c;
+    if (flags)
+       Perl_croak(aTHX_ "Parsing code internal error (%s)", "parse_fullstmt");
+    stmtseqop = parse_recdescent_for_op(GRAMSTMTSEQ);
+    c = lex_peek_unichar(0);
+    if (c != -1 && c != /*{*/'}')
+       qerror(Perl_mess(aTHX_ "Parse error"));
+    return stmtseqop;
+}
+
+void
+Perl_munge_qwlist_to_paren_list(pTHX_ OP *qwlist)
+{
+    PERL_ARGS_ASSERT_MUNGE_QWLIST_TO_PAREN_LIST;
+    deprecate("qw(...) as parentheses");
+    force_next(')');
+    if (qwlist->op_type == OP_STUB) {
+       op_free(qwlist);
+    }
+    else {
+       start_force(PL_curforce);
+       NEXTVAL_NEXTTOKE.opval = qwlist;
+       force_next(THING);
+    }
+    force_next('(');
+}
+
  /*
   * Local variables:
   * c-indentation-style: bsd