This is a live mirror of the Perl 5 development currently hosted at https://github.com/perl/perl5
update Changes, patchlevel etc.
[perl5.git] / toke.c
CommitLineData
a0d0e21e 1/* toke.c
a687059c 2 *
4eb8286e 3 * Copyright (c) 1991-1999, Larry Wall
a687059c 4 *
d48672a2
LW
5 * You may distribute under the terms of either the GNU General Public
6 * License or the Artistic License, as specified in the README file.
378cc40b 7 *
a0d0e21e
LW
8 */
9
10/*
11 * "It all comes from here, the stench and the peril." --Frodo
378cc40b
LW
12 */
13
9cbb5ea2
GS
14/*
15 * This file is the lexer for Perl. It's closely linked to the
ffb4593c
NT
16 * parser, perly.y.
17 *
18 * The main routine is yylex(), which returns the next token.
19 */
20
378cc40b 21#include "EXTERN.h"
864dbfa3 22#define PERL_IN_TOKE_C
378cc40b 23#include "perl.h"
378cc40b 24
d3b6f988
GS
25#define yychar PL_yychar
26#define yylval PL_yylval
27
fc36a67e 28static char ident_too_long[] = "Identifier too long";
8903cb82 29
51371543
GS
30static void restore_rsfp(pTHXo_ void *f);
31static void restore_expect(pTHXo_ void *e);
32static void restore_lex_expect(pTHXo_ void *e);
33
a0ed51b3 34#define UTF (PL_hints & HINT_UTF8)
834a4ddd
LW
35/*
36 * Note: we try to be careful never to call the isXXX_utf8() functions
37 * unless we're pretty sure we've seen the beginning of a UTF-8 character
38 * (that is, the two high bits are set). Otherwise we risk loading in the
39 * heavy-duty SWASHINIT and SWASHGET routines unnecessarily.
40 */
/*
 * isIDFIRST_lazy(p) / isALNUM_lazy(p)
 *   p points at the first byte of a character.  When UTF is off, or the
 *   byte is below 0xc0, the plain single-byte classifier is applied to
 *   *p; otherwise the *_utf8 classifier is applied to the pointer.
 *   The argument is fully parenthesized so that any pointer expression
 *   (not just a simple identifier) is cast and dereferenced as a whole.
 *   Note that p is evaluated more than once.
 */
#define isIDFIRST_lazy(p) ((!UTF || (*((U8*)(p)) < 0xc0)) \
                                ? isIDFIRST(*(p)) \
                                : isIDFIRST_utf8((U8*)(p)))
#define isALNUM_lazy(p) ((!UTF || (*((U8*)(p)) < 0xc0)) \
                                ? isALNUM(*(p)) \
                                : isALNUM_utf8((U8*)(p)))
a0ed51b3 47
2b92dfce
GS
/* In variable names of the form $^X, these are the legal values for X.
 * 1999-02-27 mjd-perl-patch@plover.com
 *
 * The explicit NUL test matters: strchr() treats the terminating '\0'
 * as part of the string it searches, so without the test a NUL byte
 * would be reported as a legal control-variable character.
 * Note that x is evaluated more than once. */
#define isCONTROLVAR(x) (isUPPER(x) || ((x) != '\0' && strchr("[\\]^_?", (x))))
51
ffb4593c
NT
52/* LEX_* are values for PL_lex_state, the state of the lexer.
53 * They are arranged oddly so that the guard on the switch statement
79072805
LW
54 * can get by with a single comparison (if the compiler is smart enough).
55 */
56
fb73857a 57/* #define LEX_NOTPARSING 11 is done in perl.h. */
58
55497cff 59#define LEX_NORMAL 10
60#define LEX_INTERPNORMAL 9
61#define LEX_INTERPCASEMOD 8
62#define LEX_INTERPPUSH 7
63#define LEX_INTERPSTART 6
64#define LEX_INTERPEND 5
65#define LEX_INTERPENDMAYBE 4
66#define LEX_INTERPCONCAT 3
67#define LEX_INTERPCONST 2
68#define LEX_FORMLINE 1
69#define LEX_KNOWNEXT 0
79072805 70
395c3793
LW
71#ifdef I_FCNTL
72#include <fcntl.h>
73#endif
fe14fcc3
LW
74#ifdef I_SYS_FILE
75#include <sys/file.h>
76#endif
395c3793 77
a790bc05 78/* XXX If this causes problems, set i_unistd=undef in the hint file. */
79#ifdef I_UNISTD
80# include <unistd.h> /* Needed for execv() */
81#endif
82
83
79072805
LW
84#ifdef ff_next
85#undef ff_next
d48672a2
LW
86#endif
87
a1a0e61e
TD
88#ifdef USE_PURE_BISON
89YYSTYPE* yylval_pointer = NULL;
90int* yychar_pointer = NULL;
22c35a8c
GS
91# undef yylval
92# undef yychar
e4bfbdd4
JH
93# define yylval (*yylval_pointer)
94# define yychar (*yychar_pointer)
95# define PERL_YYLEX_PARAM yylval_pointer,yychar_pointer
cea2e8a9
GS
96# undef yylex
97# define yylex() Perl_yylex(aTHX_ yylval_pointer, yychar_pointer)
a1a0e61e
TD
98#endif
99
79072805 100#include "keywords.h"
fe14fcc3 101
ffb4593c
NT
102/* CLINE is a macro that ensures PL_copline has a sane value */
103
ae986130
LW
104#ifdef CLINE
105#undef CLINE
106#endif
3280af22
NIS
107#define CLINE (PL_copline = (PL_curcop->cop_line < PL_copline ? PL_curcop->cop_line : PL_copline))
108
ffb4593c
NT
109/*
110 * Convenience functions to return different tokens and prime the
9cbb5ea2 111 * lexer for the next token. They all take an argument.
ffb4593c
NT
112 *
113 * TOKEN : generic token (used for '(', DOLSHARP, etc)
114 * OPERATOR : generic operator
115 * AOPERATOR : assignment operator
116 * PREBLOCK : beginning the block after an if, while, foreach, ...
117 * PRETERMBLOCK : beginning a non-code-defining {} block (eg, hash ref)
118 * PREREF : *EXPR where EXPR is not a simple identifier
119 * TERM : expression term
120 * LOOPX : loop exiting command (goto, last, dump, etc)
121 * FTST : file test operator
122 * FUN0 : zero-argument function
2d2e263d 123 * FUN1 : not used, except for not, which isn't a UNIOP
ffb4593c
NT
124 * BOop : bitwise or or xor
125 * BAop : bitwise and
126 * SHop : shift operator
127 * PWop : power operator
9cbb5ea2 128 * PMop : pattern-matching operator
ffb4593c
NT
129 * Aop : addition-level operator
130 * Mop : multiplication-level operator
131 * Eop : equality-testing operator
132 * Rop : relational operator <= != gt
133 *
134 * Also see LOP and lop() below.
135 */
136
3280af22
NIS
137#define TOKEN(retval) return (PL_bufptr = s,(int)retval)
138#define OPERATOR(retval) return (PL_expect = XTERM,PL_bufptr = s,(int)retval)
139#define AOPERATOR(retval) return ao((PL_expect = XTERM,PL_bufptr = s,(int)retval))
140#define PREBLOCK(retval) return (PL_expect = XBLOCK,PL_bufptr = s,(int)retval)
141#define PRETERMBLOCK(retval) return (PL_expect = XTERMBLOCK,PL_bufptr = s,(int)retval)
142#define PREREF(retval) return (PL_expect = XREF,PL_bufptr = s,(int)retval)
143#define TERM(retval) return (CLINE, PL_expect = XOPERATOR,PL_bufptr = s,(int)retval)
144#define LOOPX(f) return(yylval.ival=f,PL_expect = XTERM,PL_bufptr = s,(int)LOOPEX)
145#define FTST(f) return(yylval.ival=f,PL_expect = XTERM,PL_bufptr = s,(int)UNIOP)
146#define FUN0(f) return(yylval.ival = f,PL_expect = XOPERATOR,PL_bufptr = s,(int)FUNC0)
147#define FUN1(f) return(yylval.ival = f,PL_expect = XOPERATOR,PL_bufptr = s,(int)FUNC1)
148#define BOop(f) return ao((yylval.ival=f,PL_expect = XTERM,PL_bufptr = s,(int)BITOROP))
149#define BAop(f) return ao((yylval.ival=f,PL_expect = XTERM,PL_bufptr = s,(int)BITANDOP))
150#define SHop(f) return ao((yylval.ival=f,PL_expect = XTERM,PL_bufptr = s,(int)SHIFTOP))
151#define PWop(f) return ao((yylval.ival=f,PL_expect = XTERM,PL_bufptr = s,(int)POWOP))
152#define PMop(f) return(yylval.ival=f,PL_expect = XTERM,PL_bufptr = s,(int)MATCHOP)
153#define Aop(f) return ao((yylval.ival=f,PL_expect = XTERM,PL_bufptr = s,(int)ADDOP))
154#define Mop(f) return ao((yylval.ival=f,PL_expect = XTERM,PL_bufptr = s,(int)MULOP))
155#define Eop(f) return(yylval.ival=f,PL_expect = XTERM,PL_bufptr = s,(int)EQOP)
156#define Rop(f) return(yylval.ival=f,PL_expect = XTERM,PL_bufptr = s,(int)RELOP)
2f3197b3 157
a687059c
LW
158/* This bit of chicanery makes a unary function followed by
159 * a parenthesis into a function with one argument, highest precedence.
160 */
2f3197b3 161#define UNI(f) return(yylval.ival = f, \
3280af22
NIS
162 PL_expect = XTERM, \
163 PL_bufptr = s, \
164 PL_last_uni = PL_oldbufptr, \
165 PL_last_lop_op = f, \
a687059c
LW
166 (*s == '(' || (s = skipspace(s), *s == '(') ? (int)FUNC1 : (int)UNIOP) )
167
79072805 168#define UNIBRACK(f) return(yylval.ival = f, \
3280af22
NIS
169 PL_bufptr = s, \
170 PL_last_uni = PL_oldbufptr, \
79072805
LW
171 (*s == '(' || (s = skipspace(s), *s == '(') ? (int)FUNC1 : (int)UNIOP) )
172
9f68db38 173/* grandfather return to old style */
3280af22 174#define OLDLOP(f) return(yylval.ival=f,PL_expect = XTERM,PL_bufptr = s,(int)LSTOP)
79072805 175
ffb4593c
NT
176/*
177 * S_ao
178 *
179 * This subroutine detects &&= and ||= and turns an ANDAND or OROR
180 * into an OP_ANDASSIGN or OP_ORASSIGN
181 */
182
76e3520e 183STATIC int
cea2e8a9 184S_ao(pTHX_ int toketype)
a0d0e21e 185{
3280af22
NIS
186 if (*PL_bufptr == '=') {
187 PL_bufptr++;
a0d0e21e
LW
188 if (toketype == ANDAND)
189 yylval.ival = OP_ANDASSIGN;
190 else if (toketype == OROR)
191 yylval.ival = OP_ORASSIGN;
192 toketype = ASSIGNOP;
193 }
194 return toketype;
195}
196
ffb4593c
NT
197/*
198 * S_no_op
199 * When Perl expects an operator and finds something else, no_op
200 * prints the warning. It always prints "<something> found where
201 * operator expected". It prints "Missing semicolon on previous line?"
202 * if the surprise occurs at the start of the line. "do you need to
203 * predeclare ..." is printed out for code like "sub bar; foo bar $x"
204 * where the compiler doesn't know if foo is a method call or a function.
205 * It prints "Missing operator before end of line" if there's nothing
206 * after the missing operator, or "... before <...>" if there is something
207 * after the missing operator.
208 */
209
76e3520e 210STATIC void
cea2e8a9 211S_no_op(pTHX_ char *what, char *s)
463ee0b2 212{
3280af22
NIS
213 char *oldbp = PL_bufptr;
214 bool is_first = (PL_oldbufptr == PL_linestart);
68dc0745 215
1189a94a
GS
216 if (!s)
217 s = oldbp;
218 else {
219 assert(s >= oldbp);
220 PL_bufptr = s;
221 }
cea2e8a9 222 yywarn(Perl_form(aTHX_ "%s found where operator expected", what));
748a9306 223 if (is_first)
cea2e8a9 224 Perl_warn(aTHX_ "\t(Missing semicolon on previous line?)\n");
834a4ddd 225 else if (PL_oldoldbufptr && isIDFIRST_lazy(PL_oldoldbufptr)) {
748a9306 226 char *t;
834a4ddd 227 for (t = PL_oldoldbufptr; *t && (isALNUM_lazy(t) || *t == ':'); t++) ;
3280af22 228 if (t < PL_bufptr && isSPACE(*t))
cea2e8a9 229 Perl_warn(aTHX_ "\t(Do you need to predeclare %.*s?)\n",
3280af22 230 t - PL_oldoldbufptr, PL_oldoldbufptr);
748a9306
LW
231 }
232 else
cea2e8a9 233 Perl_warn(aTHX_ "\t(Missing operator before %.*s?)\n", s - oldbp, oldbp);
3280af22 234 PL_bufptr = oldbp;
8990e307
LW
235}
236
ffb4593c
NT
237/*
238 * S_missingterm
239 * Complain about missing quote/regexp/heredoc terminator.
240 * If it's called with a non-NULL string, that string is cut at its last newline.
241 * If we're in a delimited string and the delimiter is a control
242 * character, it's reformatted into a two-char sequence like ^C.
243 * This is fatal.
244 */
245
76e3520e 246STATIC void
cea2e8a9 247S_missingterm(pTHX_ char *s)
8990e307
LW
248{
249 char tmpbuf[3];
250 char q;
251 if (s) {
252 char *nl = strrchr(s,'\n');
d2719217 253 if (nl)
8990e307
LW
254 *nl = '\0';
255 }
9d116dd7
JH
256 else if (
257#ifdef EBCDIC
258 iscntrl(PL_multi_close)
259#else
260 PL_multi_close < 32 || PL_multi_close == 127
261#endif
262 ) {
8990e307 263 *tmpbuf = '^';
3280af22 264 tmpbuf[1] = toCTRL(PL_multi_close);
8990e307
LW
265 s = "\\n";
266 tmpbuf[2] = '\0';
267 s = tmpbuf;
268 }
269 else {
3280af22 270 *tmpbuf = PL_multi_close;
8990e307
LW
271 tmpbuf[1] = '\0';
272 s = tmpbuf;
273 }
274 q = strchr(s,'"') ? '\'' : '"';
cea2e8a9 275 Perl_croak(aTHX_ "Can't find string terminator %c%s%c anywhere before EOF",q,s,q);
463ee0b2 276}
79072805 277
ffb4593c
NT
278/*
279 * Perl_deprecate
ffb4593c
NT
280 */
281
79072805 282void
864dbfa3 283Perl_deprecate(pTHX_ char *s)
a0d0e21e 284{
d008e5eb 285 dTHR;
599cee73 286 if (ckWARN(WARN_DEPRECATED))
cea2e8a9 287 Perl_warner(aTHX_ WARN_DEPRECATED, "Use of %s is deprecated", s);
a0d0e21e
LW
288}
289
ffb4593c
NT
290/*
291 * depcom
9cbb5ea2 292 * Deprecate a comma-less variable list.
ffb4593c
NT
293 */
294
76e3520e 295STATIC void
cea2e8a9 296S_depcom(pTHX)
a0d0e21e
LW
297{
298 deprecate("comma-less variable list");
299}
300
ffb4593c 301/*
9cbb5ea2
GS
302 * experimental text filters for win32 carriage-returns, utf16-to-utf8 and
303 * utf16-to-utf8-reversed.
ffb4593c
NT
304 */
305
a868473f
NIS
#ifdef WIN32

/* Source filter: pulls data from the next filter in the chain (idx+1)
 * and, when the read produced something and maxlen is zero, passes the
 * SV through win32_strip_return().  Returns the FILTER_READ() result
 * unchanged. */
STATIC I32
S_win32_textfilter(pTHX_ int idx, SV *sv, int maxlen)
{
    const I32 nread = FILTER_READ(idx + 1, sv, maxlen);

    if (maxlen == 0 && nread > 0)
        win32_strip_return(sv);
    return nread;
}
#endif
317
a0ed51b3 318STATIC I32
cea2e8a9 319S_utf16_textfilter(pTHX_ int idx, SV *sv, int maxlen)
a0ed51b3
LW
320{
321 I32 count = FILTER_READ(idx+1, sv, maxlen);
322 if (count) {
dfe13c55
GS
323 U8* tmps;
324 U8* tend;
325 New(898, tmps, SvCUR(sv) * 3 / 2 + 1, U8);
a0ed51b3 326 tend = utf16_to_utf8((U16*)SvPVX(sv), tmps, SvCUR(sv));
dfe13c55 327 sv_usepvn(sv, (char*)tmps, tend - tmps);
a0ed51b3
LW
328
329 }
330 return count;
331}
332
333STATIC I32
cea2e8a9 334S_utf16rev_textfilter(pTHX_ int idx, SV *sv, int maxlen)
a0ed51b3
LW
335{
336 I32 count = FILTER_READ(idx+1, sv, maxlen);
337 if (count) {
dfe13c55
GS
338 U8* tmps;
339 U8* tend;
340 New(898, tmps, SvCUR(sv) * 3 / 2 + 1, U8);
a0ed51b3 341 tend = utf16_to_utf8_reversed((U16*)SvPVX(sv), tmps, SvCUR(sv));
dfe13c55 342 sv_usepvn(sv, (char*)tmps, tend - tmps);
a0ed51b3
LW
343
344 }
345 return count;
346}
a868473f 347
ffb4593c
NT
348/*
349 * Perl_lex_start
9cbb5ea2
GS
350 * Initialize variables. Uses the Perl save_stack to save its state (for
351 * recursive calls to the parser).
ffb4593c
NT
352 */
353
a0d0e21e 354void
864dbfa3 355Perl_lex_start(pTHX_ SV *line)
79072805 356{
0f15f207 357 dTHR;
8990e307
LW
358 char *s;
359 STRLEN len;
360
3280af22
NIS
361 SAVEI32(PL_lex_dojoin);
362 SAVEI32(PL_lex_brackets);
363 SAVEI32(PL_lex_fakebrack);
364 SAVEI32(PL_lex_casemods);
365 SAVEI32(PL_lex_starts);
366 SAVEI32(PL_lex_state);
367 SAVESPTR(PL_lex_inpat);
368 SAVEI32(PL_lex_inwhat);
369 SAVEI16(PL_curcop->cop_line);
370 SAVEPPTR(PL_bufptr);
371 SAVEPPTR(PL_bufend);
372 SAVEPPTR(PL_oldbufptr);
373 SAVEPPTR(PL_oldoldbufptr);
374 SAVEPPTR(PL_linestart);
375 SAVESPTR(PL_linestr);
376 SAVEPPTR(PL_lex_brackstack);
377 SAVEPPTR(PL_lex_casestack);
c76ac1ee 378 SAVEDESTRUCTOR_X(restore_rsfp, PL_rsfp);
3280af22
NIS
379 SAVESPTR(PL_lex_stuff);
380 SAVEI32(PL_lex_defer);
09bef843 381 SAVEI32(PL_sublex_info.sub_inwhat);
3280af22 382 SAVESPTR(PL_lex_repl);
c76ac1ee
GS
383 SAVEDESTRUCTOR_X(restore_expect, PL_tokenbuf + PL_expect); /* encode as pointer */
384 SAVEDESTRUCTOR_X(restore_lex_expect, PL_tokenbuf + PL_expect);
3280af22
NIS
385
386 PL_lex_state = LEX_NORMAL;
387 PL_lex_defer = 0;
388 PL_expect = XSTATE;
389 PL_lex_brackets = 0;
390 PL_lex_fakebrack = 0;
391 New(899, PL_lex_brackstack, 120, char);
392 New(899, PL_lex_casestack, 12, char);
393 SAVEFREEPV(PL_lex_brackstack);
394 SAVEFREEPV(PL_lex_casestack);
395 PL_lex_casemods = 0;
396 *PL_lex_casestack = '\0';
397 PL_lex_dojoin = 0;
398 PL_lex_starts = 0;
399 PL_lex_stuff = Nullsv;
400 PL_lex_repl = Nullsv;
401 PL_lex_inpat = 0;
402 PL_lex_inwhat = 0;
09bef843 403 PL_sublex_info.sub_inwhat = 0;
3280af22
NIS
404 PL_linestr = line;
405 if (SvREADONLY(PL_linestr))
406 PL_linestr = sv_2mortal(newSVsv(PL_linestr));
407 s = SvPV(PL_linestr, len);
8990e307 408 if (len && s[len-1] != ';') {
3280af22
NIS
409 if (!(SvFLAGS(PL_linestr) & SVs_TEMP))
410 PL_linestr = sv_2mortal(newSVsv(PL_linestr));
411 sv_catpvn(PL_linestr, "\n;", 2);
8990e307 412 }
3280af22
NIS
413 SvTEMP_off(PL_linestr);
414 PL_oldoldbufptr = PL_oldbufptr = PL_bufptr = PL_linestart = SvPVX(PL_linestr);
415 PL_bufend = PL_bufptr + SvCUR(PL_linestr);
416 SvREFCNT_dec(PL_rs);
79cb57f6 417 PL_rs = newSVpvn("\n", 1);
3280af22 418 PL_rsfp = 0;
79072805 419}
a687059c 420
ffb4593c
NT
421/*
422 * Perl_lex_end
9cbb5ea2
GS
423 * Finalizer for lexing operations. Must be called when the parser is
424 * done with the lexer.
ffb4593c
NT
425 */
426
463ee0b2 427void
864dbfa3 428Perl_lex_end(pTHX)
463ee0b2 429{
3280af22 430 PL_doextract = FALSE;
463ee0b2
LW
431}
432
ffb4593c
NT
433/*
434 * S_incline
435 * This subroutine has nothing to do with tilting, whether at windmills
436 * or pinball tables. Its name is short for "increment line". It
437 * increments the current line number in PL_curcop->cop_line and checks
438 * to see whether the line starts with a comment of the form
9cbb5ea2
GS
439 * # line 500 "foo.pm"
440 * If so, it sets the current line number and file to the values in the comment.
ffb4593c
NT
441 */
442
76e3520e 443STATIC void
cea2e8a9 444S_incline(pTHX_ char *s)
463ee0b2 445{
0f15f207 446 dTHR;
463ee0b2
LW
447 char *t;
448 char *n;
449 char ch;
450 int sawline = 0;
451
3280af22 452 PL_curcop->cop_line++;
463ee0b2
LW
453 if (*s++ != '#')
454 return;
455 while (*s == ' ' || *s == '\t') s++;
456 if (strnEQ(s, "line ", 5)) {
457 s += 5;
458 sawline = 1;
459 }
460 if (!isDIGIT(*s))
461 return;
462 n = s;
463 while (isDIGIT(*s))
464 s++;
465 while (*s == ' ' || *s == '\t')
466 s++;
467 if (*s == '"' && (t = strchr(s+1, '"')))
468 s++;
469 else {
470 if (!sawline)
471 return; /* false alarm */
472 for (t = s; !isSPACE(*t); t++) ;
473 }
474 ch = *t;
475 *t = '\0';
476 if (t - s > 0)
3280af22 477 PL_curcop->cop_filegv = gv_fetchfile(s);
463ee0b2 478 else
3280af22 479 PL_curcop->cop_filegv = gv_fetchfile(PL_origfilename);
463ee0b2 480 *t = ch;
3280af22 481 PL_curcop->cop_line = atoi(n)-1;
463ee0b2
LW
482}
483
ffb4593c
NT
484/*
485 * S_skipspace
486 * Called to gobble the appropriate amount and type of whitespace.
487 * Skips comments as well.
488 */
489
76e3520e 490STATIC char *
cea2e8a9 491S_skipspace(pTHX_ register char *s)
a687059c 492{
11343788 493 dTHR;
3280af22
NIS
494 if (PL_lex_formbrack && PL_lex_brackets <= PL_lex_formbrack) {
495 while (s < PL_bufend && (*s == ' ' || *s == '\t'))
463ee0b2
LW
496 s++;
497 return s;
498 }
499 for (;;) {
fd049845 500 STRLEN prevlen;
09bef843
SB
501 SSize_t oldprevlen, oldoldprevlen;
502 SSize_t oldloplen, oldunilen;
60e6418e
GS
503 while (s < PL_bufend && isSPACE(*s)) {
504 if (*s++ == '\n' && PL_in_eval && !PL_rsfp)
505 incline(s);
506 }
ffb4593c
NT
507
508 /* comment */
3280af22
NIS
509 if (s < PL_bufend && *s == '#') {
510 while (s < PL_bufend && *s != '\n')
463ee0b2 511 s++;
60e6418e 512 if (s < PL_bufend) {
463ee0b2 513 s++;
60e6418e
GS
514 if (PL_in_eval && !PL_rsfp) {
515 incline(s);
516 continue;
517 }
518 }
463ee0b2 519 }
ffb4593c
NT
520
521 /* only continue to recharge the buffer if we're at the end
522 * of the buffer, we're not reading from a source filter, and
523 * we're in normal lexing mode
524 */
09bef843
SB
525 if (s < PL_bufend || !PL_rsfp || PL_sublex_info.sub_inwhat ||
526 PL_lex_state == LEX_FORMLINE)
463ee0b2 527 return s;
ffb4593c
NT
528
529 /* try to recharge the buffer */
9cbb5ea2
GS
530 if ((s = filter_gets(PL_linestr, PL_rsfp,
531 (prevlen = SvCUR(PL_linestr)))) == Nullch)
532 {
533 /* end of file. Add on the -p or -n magic */
3280af22
NIS
534 if (PL_minus_n || PL_minus_p) {
535 sv_setpv(PL_linestr,PL_minus_p ?
08e9d68e
DD
536 ";}continue{print or die qq(-p destination: $!\\n)" :
537 "");
3280af22
NIS
538 sv_catpv(PL_linestr,";}");
539 PL_minus_n = PL_minus_p = 0;
a0d0e21e
LW
540 }
541 else
3280af22 542 sv_setpv(PL_linestr,";");
ffb4593c
NT
543
544 /* reset variables for next time we lex */
9cbb5ea2
GS
545 PL_oldoldbufptr = PL_oldbufptr = PL_bufptr = s = PL_linestart
546 = SvPVX(PL_linestr);
3280af22 547 PL_bufend = SvPVX(PL_linestr) + SvCUR(PL_linestr);
ffb4593c
NT
548
549 /* Close the filehandle. Could be from -P preprocessor,
550 * STDIN, or a regular file. If we were reading code from
551 * STDIN (because the commandline held no -e or filename)
552 * then we don't close it, we reset it so the code can
553 * read from STDIN too.
554 */
555
3280af22
NIS
556 if (PL_preprocess && !PL_in_eval)
557 (void)PerlProc_pclose(PL_rsfp);
558 else if ((PerlIO*)PL_rsfp == PerlIO_stdin())
559 PerlIO_clearerr(PL_rsfp);
8990e307 560 else
3280af22
NIS
561 (void)PerlIO_close(PL_rsfp);
562 PL_rsfp = Nullfp;
463ee0b2
LW
563 return s;
564 }
ffb4593c
NT
565
566 /* not at end of file, so we only read another line */
09bef843
SB
567 /* make corresponding updates to old pointers, for yyerror() */
568 oldprevlen = PL_oldbufptr - PL_bufend;
569 oldoldprevlen = PL_oldoldbufptr - PL_bufend;
570 if (PL_last_uni)
571 oldunilen = PL_last_uni - PL_bufend;
572 if (PL_last_lop)
573 oldloplen = PL_last_lop - PL_bufend;
3280af22
NIS
574 PL_linestart = PL_bufptr = s + prevlen;
575 PL_bufend = s + SvCUR(PL_linestr);
576 s = PL_bufptr;
09bef843
SB
577 PL_oldbufptr = s + oldprevlen;
578 PL_oldoldbufptr = s + oldoldprevlen;
579 if (PL_last_uni)
580 PL_last_uni = s + oldunilen;
581 if (PL_last_lop)
582 PL_last_lop = s + oldloplen;
a0d0e21e 583 incline(s);
ffb4593c
NT
584
585 /* debugger active and we're not compiling the debugger code,
586 * so store the line into the debugger's array of lines
587 */
3280af22 588 if (PERLDB_LINE && PL_curstash != PL_debstash) {
8990e307
LW
589 SV *sv = NEWSV(85,0);
590
591 sv_upgrade(sv, SVt_PVMG);
3280af22
NIS
592 sv_setpvn(sv,PL_bufptr,PL_bufend-PL_bufptr);
593 av_store(GvAV(PL_curcop->cop_filegv),(I32)PL_curcop->cop_line,sv);
8990e307 594 }
463ee0b2 595 }
a687059c 596}
378cc40b 597
ffb4593c
NT
598/*
599 * S_check_uni
600 * Check the unary operators to ensure there's no ambiguity in how they're
601 * used. An ambiguous piece of code would be:
602 * rand + 5
603 * This doesn't mean rand() + 5. Because rand() is a unary operator,
604 * the +5 is its argument.
605 */
606
76e3520e 607STATIC void
cea2e8a9 608S_check_uni(pTHX)
ba106d47 609{
2f3197b3 610 char *s;
a0d0e21e 611 char *t;
0453d815 612 dTHR;
2f3197b3 613
3280af22 614 if (PL_oldoldbufptr != PL_last_uni)
2f3197b3 615 return;
3280af22
NIS
616 while (isSPACE(*PL_last_uni))
617 PL_last_uni++;
834a4ddd 618 for (s = PL_last_uni; isALNUM_lazy(s) || *s == '-'; s++) ;
3280af22 619 if ((t = strchr(s, '(')) && t < PL_bufptr)
a0d0e21e 620 return;
0453d815 621 if (ckWARN_d(WARN_AMBIGUOUS)){
f248d071 622 char ch = *s;
0453d815
PM
623 *s = '\0';
624 Perl_warner(aTHX_ WARN_AMBIGUOUS,
625 "Warning: Use of \"%s\" without parens is ambiguous",
626 PL_last_uni);
627 *s = ch;
628 }
2f3197b3
LW
629}
630
ffb4593c
NT
631/* workaround to replace the UNI() macro with a function. Only the
632 * hints/uts.sh file mentions this. Other comments elsewhere in the
633 * source indicate Microport Unix might need it too.
634 */
635
ffed7fef
LW
#ifdef CRIPPLED_CC

#undef UNI
#define UNI(f) return uni(f,s)

/* Function form of the UNI() macro: records operator f as the last
 * unary operator and returns FUNC1 when the next non-space character is
 * an opening parenthesis, UNIOP otherwise. */
STATIC int
S_uni(pTHX_ I32 f, char *s)
{
    yylval.ival = f;
    PL_expect = XTERM;
    PL_bufptr = s;
    PL_last_uni = PL_oldbufptr;
    PL_last_lop_op = f;

    /* Only skip whitespace when the paren is not already right here. */
    if (*s != '(')
        s = skipspace(s);
    return (*s == '(') ? FUNC1 : UNIOP;
}

#endif /* CRIPPLED_CC */
659
ffb4593c
NT
660/*
661 * LOP : macro to build a list operator. Its behaviour has been replaced
662 * with a subroutine, S_lop() for which LOP is just another name.
663 */
664
a0d0e21e
LW
665#define LOP(f,x) return lop(f,x,s)
666
ffb4593c
NT
667/*
668 * S_lop
669 * Build a list operator (or something that might be one). The rules:
670 * - if we have a next token, then it's a list operator [why?]
671 * - if the next thing is an opening paren, then it's a function
672 * - else it's a list operator
673 */
674
76e3520e 675STATIC I32
cea2e8a9 676S_lop(pTHX_ I32 f, expectation x, char *s)
ffed7fef 677{
0f15f207 678 dTHR;
79072805 679 yylval.ival = f;
35c8bce7 680 CLINE;
3280af22
NIS
681 PL_expect = x;
682 PL_bufptr = s;
683 PL_last_lop = PL_oldbufptr;
684 PL_last_lop_op = f;
685 if (PL_nexttoke)
a0d0e21e 686 return LSTOP;
79072805
LW
687 if (*s == '(')
688 return FUNC;
689 s = skipspace(s);
690 if (*s == '(')
691 return FUNC;
692 else
693 return LSTOP;
694}
695
ffb4593c
NT
696/*
697 * S_force_next
9cbb5ea2 698 * When the lexer realizes it knows the next token (for instance,
ffb4593c 699 * it is reordering tokens for the parser) then it can call S_force_next
9cbb5ea2
GS
700 * to know what token to return the next time the lexer is called. Caller
701 * will need to set PL_nextval[], and possibly PL_expect to ensure the lexer
702 * handles the token correctly.
ffb4593c
NT
703 */
704
76e3520e 705STATIC void
cea2e8a9 706S_force_next(pTHX_ I32 type)
79072805 707{
3280af22
NIS
708 PL_nexttype[PL_nexttoke] = type;
709 PL_nexttoke++;
710 if (PL_lex_state != LEX_KNOWNEXT) {
711 PL_lex_defer = PL_lex_state;
712 PL_lex_expect = PL_expect;
713 PL_lex_state = LEX_KNOWNEXT;
79072805
LW
714 }
715}
716
ffb4593c
NT
717/*
718 * S_force_word
719 * When the lexer knows the next thing is a word (for instance, it has
720 * just seen -> and it knows that the next char is a word char, then
721 * it calls S_force_word to stick the next word into the PL_next lookahead.
722 *
723 * Arguments:
b1b65b59 724 * char *start : buffer position (must be within PL_linestr)
ffb4593c
NT
725 * int token : PL_next will be this type of bare word (e.g., METHOD,WORD)
726 * int check_keyword : if true, Perl checks to make sure the word isn't
727 * a keyword (do this if the word is a label, e.g. goto FOO)
728 * int allow_pack : if true, : characters will also be allowed (require,
729 * use, etc. do this)
9cbb5ea2 730 * int allow_initial_tick : used by the "sub" lexer only.
ffb4593c
NT
731 */
732
76e3520e 733STATIC char *
cea2e8a9 734S_force_word(pTHX_ register char *start, int token, int check_keyword, int allow_pack, int allow_initial_tick)
79072805 735{
463ee0b2
LW
736 register char *s;
737 STRLEN len;
738
739 start = skipspace(start);
740 s = start;
834a4ddd 741 if (isIDFIRST_lazy(s) ||
a0d0e21e 742 (allow_pack && *s == ':') ||
15f0808c 743 (allow_initial_tick && *s == '\'') )
a0d0e21e 744 {
3280af22
NIS
745 s = scan_word(s, PL_tokenbuf, sizeof PL_tokenbuf, allow_pack, &len);
746 if (check_keyword && keyword(PL_tokenbuf, len))
463ee0b2
LW
747 return start;
748 if (token == METHOD) {
749 s = skipspace(s);
750 if (*s == '(')
3280af22 751 PL_expect = XTERM;
463ee0b2 752 else {
3280af22 753 PL_expect = XOPERATOR;
463ee0b2 754 }
79072805 755 }
3280af22
NIS
756 PL_nextval[PL_nexttoke].opval = (OP*)newSVOP(OP_CONST,0, newSVpv(PL_tokenbuf,0));
757 PL_nextval[PL_nexttoke].opval->op_private |= OPpCONST_BARE;
79072805
LW
758 force_next(token);
759 }
760 return s;
761}
762
ffb4593c
NT
763/*
764 * S_force_ident
9cbb5ea2 765 * Called when the lexer wants $foo *foo &foo etc, but the program
ffb4593c
NT
766 * text only contains the "foo" portion. The first argument is a pointer
767 * to the "foo", and the second argument is the type symbol to prefix.
768 * Forces the next token to be a "WORD".
9cbb5ea2 769 * Creates the symbol if it didn't already exist (via gv_fetchpv()).
ffb4593c
NT
770 */
771
76e3520e 772STATIC void
cea2e8a9 773S_force_ident(pTHX_ register char *s, int kind)
79072805
LW
774{
775 if (s && *s) {
11343788 776 OP* o = (OP*)newSVOP(OP_CONST, 0, newSVpv(s,0));
3280af22 777 PL_nextval[PL_nexttoke].opval = o;
79072805 778 force_next(WORD);
748a9306 779 if (kind) {
e858de61 780 dTHR; /* just for in_eval */
11343788 781 o->op_private = OPpCONST_ENTERED;
55497cff 782 /* XXX see note in pp_entereval() for why we forgo typo
783 warnings if the symbol must be introduced in an eval.
784 GSAR 96-10-12 */
3280af22 785 gv_fetchpv(s, PL_in_eval ? (GV_ADDMULTI | GV_ADDINEVAL) : TRUE,
a0d0e21e
LW
786 kind == '$' ? SVt_PV :
787 kind == '@' ? SVt_PVAV :
788 kind == '%' ? SVt_PVHV :
789 SVt_PVGV
790 );
748a9306 791 }
79072805
LW
792 }
793}
794
ffb4593c
NT
795/*
796 * S_force_version
797 * Forces the next token to be a version number.
798 */
799
76e3520e 800STATIC char *
cea2e8a9 801S_force_version(pTHX_ char *s)
89bfa8cd 802{
803 OP *version = Nullop;
804
805 s = skipspace(s);
806
807 /* default VERSION number -- GBARR */
808
809 if(isDIGIT(*s)) {
810 char *d;
811 int c;
55497cff 812 for( d=s, c = 1; isDIGIT(*d) || *d == '_' || (*d == '.' && c--); d++);
89bfa8cd 813 if((*d == ';' || isSPACE(*d)) && *(skipspace(d)) != ',') {
814 s = scan_num(s);
815 /* real VERSION number -- GBARR */
816 version = yylval.opval;
817 }
818 }
819
820 /* NOTE: The parser sees the package name and the VERSION swapped */
3280af22 821 PL_nextval[PL_nexttoke].opval = version;
89bfa8cd 822 force_next(WORD);
823
824 return (s);
825}
826
ffb4593c
NT
827/*
828 * S_tokeq
829 * Tokenize a quoted string passed in as an SV. It finds the next
830 * chunk, up to end of string or a backslash. It may make a new
831 * SV containing that chunk (if HINT_NEW_STRING is on). It also
832 * turns \\ into \.
833 */
834
76e3520e 835STATIC SV *
cea2e8a9 836S_tokeq(pTHX_ SV *sv)
79072805
LW
837{
838 register char *s;
839 register char *send;
840 register char *d;
b3ac6de7
IZ
841 STRLEN len = 0;
842 SV *pv = sv;
79072805
LW
843
844 if (!SvLEN(sv))
b3ac6de7 845 goto finish;
79072805 846
a0d0e21e 847 s = SvPV_force(sv, len);
748a9306 848 if (SvIVX(sv) == -1)
b3ac6de7 849 goto finish;
463ee0b2 850 send = s + len;
79072805
LW
851 while (s < send && *s != '\\')
852 s++;
853 if (s == send)
b3ac6de7 854 goto finish;
79072805 855 d = s;
3280af22 856 if ( PL_hints & HINT_NEW_STRING )
79cb57f6 857 pv = sv_2mortal(newSVpvn(SvPVX(pv), len));
79072805
LW
858 while (s < send) {
859 if (*s == '\\') {
a0d0e21e 860 if (s + 1 < send && (s[1] == '\\'))
79072805
LW
861 s++; /* all that, just for this */
862 }
863 *d++ = *s++;
864 }
865 *d = '\0';
463ee0b2 866 SvCUR_set(sv, d - SvPVX(sv));
b3ac6de7 867 finish:
3280af22 868 if ( PL_hints & HINT_NEW_STRING )
b3ac6de7 869 return new_constant(NULL, 0, "q", sv, pv, "q");
79072805
LW
870 return sv;
871}
872
ffb4593c
NT
873/*
874 * Now come three functions related to double-quote context,
875 * S_sublex_start, S_sublex_push, and S_sublex_done. They're used when
876 * converting things like "\u\Lgnat" into ucfirst(lc("gnat")). They
877 * interact with PL_lex_state, and create fake ( ... ) argument lists
878 * to handle functions and concatenation.
879 * They assume that whoever calls them will be setting up a fake
880 * join call, because each subthing puts a ',' after it. This lets
881 * "lower \luPpEr"
882 * become
883 * join($, , 'lower ', lcfirst( 'uPpEr', ) ,)
884 *
885 * (I'm not sure whether the spurious commas at the end of lcfirst's
886 * arguments and join's arguments are created or not).
887 */
888
889/*
890 * S_sublex_start
891 * Assumes that yylval.ival is the op we're creating (e.g. OP_LCFIRST).
892 *
893 * Pattern matching will set PL_lex_op to the pattern-matching op to
894 * make (we return THING if yylval.ival is OP_NULL, PMFUNC otherwise).
895 *
896 * OP_CONST and OP_READLINE are easy--just make the new op and return.
897 *
898 * Everything else becomes a FUNC.
899 *
900 * Sets PL_lex_state to LEX_INTERPPUSH unless (ival was OP_NULL or we
901 * had an OP_CONST or OP_READLINE). This just sets us up for a
902 * call to S_sublex_push().
903 */
904
76e3520e 905STATIC I32
cea2e8a9 906S_sublex_start(pTHX)
79072805
LW
907{
908 register I32 op_type = yylval.ival;
79072805
LW
909
910 if (op_type == OP_NULL) {
3280af22
NIS
911 yylval.opval = PL_lex_op;
912 PL_lex_op = Nullop;
79072805
LW
913 return THING;
914 }
915 if (op_type == OP_CONST || op_type == OP_READLINE) {
3280af22 916 SV *sv = tokeq(PL_lex_stuff);
b3ac6de7
IZ
917
918 if (SvTYPE(sv) == SVt_PVIV) {
919 /* Overloaded constants, nothing fancy: Convert to SVt_PV: */
920 STRLEN len;
921 char *p;
922 SV *nsv;
923
924 p = SvPV(sv, len);
79cb57f6 925 nsv = newSVpvn(p, len);
b3ac6de7
IZ
926 SvREFCNT_dec(sv);
927 sv = nsv;
928 }
929 yylval.opval = (OP*)newSVOP(op_type, 0, sv);
3280af22 930 PL_lex_stuff = Nullsv;
79072805
LW
931 return THING;
932 }
933
3280af22
NIS
934 PL_sublex_info.super_state = PL_lex_state;
935 PL_sublex_info.sub_inwhat = op_type;
936 PL_sublex_info.sub_op = PL_lex_op;
937 PL_lex_state = LEX_INTERPPUSH;
55497cff 938
3280af22
NIS
939 PL_expect = XTERM;
940 if (PL_lex_op) {
941 yylval.opval = PL_lex_op;
942 PL_lex_op = Nullop;
55497cff 943 return PMFUNC;
944 }
945 else
946 return FUNC;
947}
948
ffb4593c
NT
949/*
950 * S_sublex_push
951 * Create a new scope to save the lexing state. The scope will be
952 * ended in S_sublex_done. Returns a '(', starting the function arguments
953 * to the uc, lc, etc. found before.
954 * Sets PL_lex_state to LEX_INTERPCONCAT.
955 */
956
76e3520e 957STATIC I32
cea2e8a9 958S_sublex_push(pTHX)
55497cff 959{
0f15f207 960 dTHR;
f46d017c 961 ENTER;
55497cff 962
3280af22
NIS
963 PL_lex_state = PL_sublex_info.super_state;
964 SAVEI32(PL_lex_dojoin);
965 SAVEI32(PL_lex_brackets);
966 SAVEI32(PL_lex_fakebrack);
967 SAVEI32(PL_lex_casemods);
968 SAVEI32(PL_lex_starts);
969 SAVEI32(PL_lex_state);
970 SAVESPTR(PL_lex_inpat);
971 SAVEI32(PL_lex_inwhat);
972 SAVEI16(PL_curcop->cop_line);
973 SAVEPPTR(PL_bufptr);
974 SAVEPPTR(PL_oldbufptr);
975 SAVEPPTR(PL_oldoldbufptr);
976 SAVEPPTR(PL_linestart);
977 SAVESPTR(PL_linestr);
978 SAVEPPTR(PL_lex_brackstack);
979 SAVEPPTR(PL_lex_casestack);
980
981 PL_linestr = PL_lex_stuff;
982 PL_lex_stuff = Nullsv;
983
9cbb5ea2
GS
984 PL_bufend = PL_bufptr = PL_oldbufptr = PL_oldoldbufptr = PL_linestart
985 = SvPVX(PL_linestr);
3280af22
NIS
986 PL_bufend += SvCUR(PL_linestr);
987 SAVEFREESV(PL_linestr);
988
989 PL_lex_dojoin = FALSE;
990 PL_lex_brackets = 0;
991 PL_lex_fakebrack = 0;
992 New(899, PL_lex_brackstack, 120, char);
993 New(899, PL_lex_casestack, 12, char);
994 SAVEFREEPV(PL_lex_brackstack);
995 SAVEFREEPV(PL_lex_casestack);
996 PL_lex_casemods = 0;
997 *PL_lex_casestack = '\0';
998 PL_lex_starts = 0;
999 PL_lex_state = LEX_INTERPCONCAT;
1000 PL_curcop->cop_line = PL_multi_start;
1001
1002 PL_lex_inwhat = PL_sublex_info.sub_inwhat;
1003 if (PL_lex_inwhat == OP_MATCH || PL_lex_inwhat == OP_QR || PL_lex_inwhat == OP_SUBST)
1004 PL_lex_inpat = PL_sublex_info.sub_op;
79072805 1005 else
3280af22 1006 PL_lex_inpat = Nullop;
79072805 1007
55497cff 1008 return '(';
79072805
LW
1009}
1010
ffb4593c
NT
1011/*
1012 * S_sublex_done
1013 * Restores lexer state after a S_sublex_push.
1014 */
1015
76e3520e 1016STATIC I32
cea2e8a9 1017S_sublex_done(pTHX)
79072805 1018{
3280af22
NIS
1019 if (!PL_lex_starts++) {
1020 PL_expect = XOPERATOR;
79cb57f6 1021 yylval.opval = (OP*)newSVOP(OP_CONST, 0, newSVpvn("",0));
79072805
LW
1022 return THING;
1023 }
1024
3280af22
NIS
1025 if (PL_lex_casemods) { /* oops, we've got some unbalanced parens */
1026 PL_lex_state = LEX_INTERPCASEMOD;
cea2e8a9 1027 return yylex();
79072805
LW
1028 }
1029
ffb4593c 1030 /* Is there a right-hand side to take care of? (s//RHS/ or tr//RHS/) */
3280af22
NIS
1031 if (PL_lex_repl && (PL_lex_inwhat == OP_SUBST || PL_lex_inwhat == OP_TRANS)) {
1032 PL_linestr = PL_lex_repl;
1033 PL_lex_inpat = 0;
1034 PL_bufend = PL_bufptr = PL_oldbufptr = PL_oldoldbufptr = PL_linestart = SvPVX(PL_linestr);
1035 PL_bufend += SvCUR(PL_linestr);
1036 SAVEFREESV(PL_linestr);
1037 PL_lex_dojoin = FALSE;
1038 PL_lex_brackets = 0;
1039 PL_lex_fakebrack = 0;
1040 PL_lex_casemods = 0;
1041 *PL_lex_casestack = '\0';
1042 PL_lex_starts = 0;
25da4f38 1043 if (SvEVALED(PL_lex_repl)) {
3280af22
NIS
1044 PL_lex_state = LEX_INTERPNORMAL;
1045 PL_lex_starts++;
e9fa98b2
HS
1046 /* we don't clear PL_lex_repl here, so that we can check later
1047 whether this is an evalled subst; that means we rely on the
1048 logic to ensure sublex_done() is called again only via the
1049 branch (in yylex()) that clears PL_lex_repl, else we'll loop */
79072805 1050 }
e9fa98b2 1051 else {
3280af22 1052 PL_lex_state = LEX_INTERPCONCAT;
e9fa98b2
HS
1053 PL_lex_repl = Nullsv;
1054 }
79072805 1055 return ',';
ffed7fef
LW
1056 }
1057 else {
f46d017c 1058 LEAVE;
3280af22
NIS
1059 PL_bufend = SvPVX(PL_linestr);
1060 PL_bufend += SvCUR(PL_linestr);
1061 PL_expect = XOPERATOR;
09bef843 1062 PL_sublex_info.sub_inwhat = 0;
79072805 1063 return ')';
ffed7fef
LW
1064 }
1065}
1066
02aa26ce
NT
1067/*
1068 scan_const
1069
1070 Extracts a pattern, double-quoted string, or transliteration. This
1071 is terrifying code.
1072
3280af22
NIS
1073 It looks at lex_inwhat and PL_lex_inpat to find out whether it's
1074 processing a pattern (PL_lex_inpat is true), a transliteration
02aa26ce
NT
1075 (PL_lex_inwhat == OP_TRANS), or a double-quoted string.
1076
9b599b2a
GS
1077 Returns a pointer to the character scanned up to. Iff this is
1078 advanced from the start pointer supplied (ie if anything was
1079 successfully parsed), will leave an OP for the substring scanned
1080 in yylval. Caller must intuit reason for not parsing further
1081 by looking at the next characters herself.
1082
02aa26ce
NT
1083 In patterns:
1084 backslashes:
1085 double-quoted style: \r and \n
1086 regexp special ones: \D \s
1087 constants: \x3
1088 backrefs: \1 (deprecated in substitution replacements)
1089 case and quoting: \U \Q \E
1090 stops on @ and $, but not for $ as tail anchor
1091
1092 In transliterations:
1093 characters are VERY literal, except for - not at the start or end
1094 of the string, which indicates a range. scan_const expands the
1095 range to the full set of intermediate characters.
1096
1097 In double-quoted strings:
1098 backslashes:
1099 double-quoted style: \r and \n
1100 constants: \x3
1101 backrefs: \1 (deprecated)
1102 case and quoting: \U \Q \E
1103 stops on @ and $
1104
1105 scan_const does *not* construct ops to handle interpolated strings.
1106 It stops processing as soon as it finds an embedded $ or @ variable
1107 and leaves it to the caller to work out what's going on.
1108
1109 @ in pattern could be: @foo, @{foo}, @$foo, @'foo, @:foo.
1110
1111 $ in pattern could be $foo or could be tail anchor. Assumption:
1112 it's a tail anchor if $ is the last thing in the string, or if it's
1113 followed by one of ")| \n\t"
1114
1115 \1 (backreferences) are turned into $1
1116
1117 The structure of the code is
1118 while (there's a character to process) {
1119 handle transliteration ranges
1120 skip regexp comments
1121 skip # initiated comments in //x patterns
1122 check for embedded @foo
1123 check for embedded scalars
1124 if (backslash) {
1125 leave intact backslashes listed in leaveit (below)
1126 deprecate \1 in strings and sub replacements
1127 handle string-changing backslashes \l \U \Q \E, etc.
1128 switch (what was escaped) {
1129 handle - in a transliteration (becomes a literal -)
1130 handle \132 octal characters
1131 handle \x15 hex characters
1132 handle \cV (control V)
1133 handle printf backslashes (\f, \r, \n, etc)
1134 } (end switch)
1135 } (end if backslash)
1136 } (end while character to read)
1137
1138*/
1139
76e3520e 1140STATIC char *
cea2e8a9 1141S_scan_const(pTHX_ char *start)
79072805 1142{
3280af22 1143 register char *send = PL_bufend; /* end of the constant */
02aa26ce
NT
1144 SV *sv = NEWSV(93, send - start); /* sv for the constant */
1145 register char *s = start; /* start of the constant */
1146 register char *d = SvPVX(sv); /* destination for copies */
1147 bool dorange = FALSE; /* are we in a translit range? */
1148 I32 len; /* ? */
ac2262e3 1149 I32 utf = (PL_lex_inwhat == OP_TRANS && PL_sublex_info.sub_op)
a0ed51b3
LW
1150 ? (PL_sublex_info.sub_op->op_private & (OPpTRANS_FROM_UTF|OPpTRANS_TO_UTF))
1151 : UTF;
ac2262e3 1152 I32 thisutf = (PL_lex_inwhat == OP_TRANS && PL_sublex_info.sub_op)
9cbb5ea2
GS
1153 ? (PL_sublex_info.sub_op->op_private & (PL_lex_repl ?
1154 OPpTRANS_FROM_UTF : OPpTRANS_TO_UTF))
a0ed51b3 1155 : UTF;
9cbb5ea2 1156 char *leaveit = /* set of acceptably-backslashed characters */
3280af22 1157 PL_lex_inpat
4a2d328f 1158 ? "\\.^$@AGZdDwWsSbBpPXC+*?|()-nrtfeaxcz0123456789[{]} \t\n\r\f\v#"
9b599b2a 1159 : "";
79072805
LW
1160
1161 while (s < send || dorange) {
02aa26ce 1162 /* get transliterations out of the way (they're most literal) */
3280af22 1163 if (PL_lex_inwhat == OP_TRANS) {
02aa26ce 1164 /* expand a range A-Z to the full set of characters. AIE! */
79072805 1165 if (dorange) {
02aa26ce 1166 I32 i; /* current expanded character */
8ada0baa 1167 I32 min; /* first character in range */
02aa26ce
NT
1168 I32 max; /* last character in range */
1169
1170 i = d - SvPVX(sv); /* remember current offset */
9cbb5ea2
GS
1171 SvGROW(sv, SvLEN(sv) + 256); /* never more than 256 chars in a range */
1172 d = SvPVX(sv) + i; /* refresh d after realloc */
02aa26ce
NT
1173 d -= 2; /* eat the first char and the - */
1174
8ada0baa
JH
1175 min = (U8)*d; /* first char in range */
1176 max = (U8)d[1]; /* last char in range */
1177
1178#ifndef ASCIIish
1179 if ((isLOWER(min) && isLOWER(max)) ||
1180 (isUPPER(min) && isUPPER(max))) {
1181 if (isLOWER(min)) {
1182 for (i = min; i <= max; i++)
1183 if (isLOWER(i))
1184 *d++ = i;
1185 } else {
1186 for (i = min; i <= max; i++)
1187 if (isUPPER(i))
1188 *d++ = i;
1189 }
1190 }
1191 else
1192#endif
1193 for (i = min; i <= max; i++)
1194 *d++ = i;
02aa26ce
NT
1195
1196 /* mark the range as done, and continue */
79072805
LW
1197 dorange = FALSE;
1198 continue;
1199 }
02aa26ce
NT
1200
1201 /* range begins (ignore - as first or last char) */
79072805 1202 else if (*s == '-' && s+1 < send && s != start) {
a0ed51b3 1203 if (utf) {
a176fa2a 1204 *d++ = (char)0xff; /* use illegal utf8 byte--see pmtrans */
a0ed51b3
LW
1205 s++;
1206 continue;
1207 }
79072805
LW
1208 dorange = TRUE;
1209 s++;
1210 }
1211 }
02aa26ce
NT
1212
1213 /* if we get here, we're not doing a transliteration */
1214
0f5d15d6
IZ
1215 /* skip for regexp comments /(?#comment)/ and code /(?{code})/,
1216 except for the last char, which will be done separately. */
3280af22 1217 else if (*s == '(' && PL_lex_inpat && s[1] == '?') {
cc6b7395
IZ
1218 if (s[2] == '#') {
1219 while (s < send && *s != ')')
1220 *d++ = *s++;
0f5d15d6
IZ
1221 } else if (s[2] == '{'
1222 || s[2] == 'p' && s[3] == '{') { /* This should march regcomp.c */
cc6b7395 1223 I32 count = 1;
0f5d15d6 1224 char *regparse = s + (s[2] == '{' ? 3 : 4);
cc6b7395
IZ
1225 char c;
1226
d9f97599
GS
1227 while (count && (c = *regparse)) {
1228 if (c == '\\' && regparse[1])
1229 regparse++;
cc6b7395
IZ
1230 else if (c == '{')
1231 count++;
1232 else if (c == '}')
1233 count--;
d9f97599 1234 regparse++;
cc6b7395 1235 }
5bdf89e7
IZ
1236 if (*regparse != ')') {
1237 regparse--; /* Leave one char for continuation. */
cc6b7395 1238 yyerror("Sequence (?{...}) not terminated or not {}-balanced");
5bdf89e7 1239 }
0f5d15d6 1240 while (s < regparse)
cc6b7395
IZ
1241 *d++ = *s++;
1242 }
748a9306 1243 }
02aa26ce
NT
1244
1245 /* likewise skip #-initiated comments in //x patterns */
3280af22
NIS
1246 else if (*s == '#' && PL_lex_inpat &&
1247 ((PMOP*)PL_lex_inpat)->op_pmflags & PMf_EXTENDED) {
748a9306
LW
1248 while (s+1 < send && *s != '\n')
1249 *d++ = *s++;
1250 }
02aa26ce
NT
1251
1252 /* check for embedded arrays (@foo, @:foo, @'foo, @{foo}, @$foo) */
834a4ddd 1253 else if (*s == '@' && s[1] && (isALNUM_lazy(s+1) || strchr(":'{$", s[1])))
79072805 1254 break;
02aa26ce
NT
1255
1256 /* check for embedded scalars. only stop if we're sure it's a
1257 variable.
1258 */
79072805 1259 else if (*s == '$') {
3280af22 1260 if (!PL_lex_inpat) /* not a regexp, so $ must be var */
79072805 1261 break;
c277df42 1262 if (s + 1 < send && !strchr("()| \n\t", s[1]))
79072805
LW
1263 break; /* in regexp, $ might be tail anchor */
1264 }
02aa26ce 1265
a0ed51b3
LW
1266 /* (now in tr/// code again) */
1267
d008e5eb
GS
1268 if (*s & 0x80 && thisutf) {
1269 dTHR; /* only for ckWARN */
1270 if (ckWARN(WARN_UTF8)) {
dfe13c55 1271 (void)utf8_to_uv((U8*)s, &len); /* could cvt latin-1 to utf8 here... */
d008e5eb
GS
1272 if (len) {
1273 while (len--)
1274 *d++ = *s++;
1275 continue;
1276 }
a0ed51b3
LW
1277 }
1278 }
1279
02aa26ce 1280 /* backslashes */
79072805
LW
1281 if (*s == '\\' && s+1 < send) {
1282 s++;
02aa26ce
NT
1283
1284 /* some backslashes we leave behind */
c9f97d15 1285 if (*leaveit && *s && strchr(leaveit, *s)) {
79072805
LW
1286 *d++ = '\\';
1287 *d++ = *s++;
1288 continue;
1289 }
02aa26ce
NT
1290
1291 /* deprecate \1 in strings and substitution replacements */
3280af22 1292 if (PL_lex_inwhat == OP_SUBST && !PL_lex_inpat &&
a0d0e21e 1293 isDIGIT(*s) && *s != '0' && !isDIGIT(s[1]))
79072805 1294 {
d008e5eb 1295 dTHR; /* only for ckWARN */
599cee73 1296 if (ckWARN(WARN_SYNTAX))
cea2e8a9 1297 Perl_warner(aTHX_ WARN_SYNTAX, "\\%c better written as $%c", *s, *s);
79072805
LW
1298 *--s = '$';
1299 break;
1300 }
02aa26ce
NT
1301
1302 /* string-change backslash escapes */
3280af22 1303 if (PL_lex_inwhat != OP_TRANS && *s && strchr("lLuUEQ", *s)) {
79072805
LW
1304 --s;
1305 break;
1306 }
02aa26ce
NT
1307
1308 /* if we get here, it's either a quoted -, or a digit */
79072805 1309 switch (*s) {
02aa26ce
NT
1310
1311 /* quoted - in transliterations */
79072805 1312 case '-':
3280af22 1313 if (PL_lex_inwhat == OP_TRANS) {
79072805
LW
1314 *d++ = *s++;
1315 continue;
1316 }
1317 /* FALL THROUGH */
1318 default:
11b8faa4
JH
1319 {
1320 dTHR;
1321 if (ckWARN(WARN_UNSAFE) && isALPHA(*s))
cea2e8a9 1322 Perl_warner(aTHX_ WARN_UNSAFE,
11b8faa4
JH
1323 "Unrecognized escape \\%c passed through",
1324 *s);
1325 /* default action is to copy the quoted character */
1326 *d++ = *s++;
1327 continue;
1328 }
02aa26ce
NT
1329
1330 /* \132 indicates an octal constant */
79072805
LW
1331 case '0': case '1': case '2': case '3':
1332 case '4': case '5': case '6': case '7':
1333 *d++ = scan_oct(s, 3, &len);
1334 s += len;
1335 continue;
02aa26ce
NT
1336
1337 /* \x24 indicates a hex constant */
79072805 1338 case 'x':
a0ed51b3
LW
1339 ++s;
1340 if (*s == '{') {
1341 char* e = strchr(s, '}');
1342
adaeee49 1343 if (!e) {
a0ed51b3 1344 yyerror("Missing right brace on \\x{}");
adaeee49
GA
1345 e = s;
1346 }
d008e5eb
GS
1347 if (!utf) {
1348 dTHR;
1349 if (ckWARN(WARN_UTF8))
cea2e8a9 1350 Perl_warner(aTHX_ WARN_UTF8,
d008e5eb
GS
1351 "Use of \\x{} without utf8 declaration");
1352 }
a0ed51b3 1353 /* note: utf always shorter than hex */
dfe13c55
GS
1354 d = (char*)uv_to_utf8((U8*)d,
1355 scan_hex(s + 1, e - s - 1, &len));
a0ed51b3 1356 s = e + 1;
a0ed51b3
LW
1357 }
1358 else {
1359 UV uv = (UV)scan_hex(s, 2, &len);
1360 if (utf && PL_lex_inwhat == OP_TRANS &&
1361 utf != (OPpTRANS_FROM_UTF|OPpTRANS_TO_UTF))
1362 {
dfe13c55 1363 d = (char*)uv_to_utf8((U8*)d, uv); /* doing a CU or UC */
a0ed51b3
LW
1364 }
1365 else {
d008e5eb
GS
1366 if (uv >= 127 && UTF) {
1367 dTHR;
1368 if (ckWARN(WARN_UTF8))
cea2e8a9 1369 Perl_warner(aTHX_ WARN_UTF8,
d008e5eb
GS
1370 "\\x%.*s will produce malformed UTF-8 character; use \\x{%.*s} for that",
1371 len,s,len,s);
1372 }
a0ed51b3
LW
1373 *d++ = (char)uv;
1374 }
1375 s += len;
1376 }
79072805 1377 continue;
02aa26ce 1378
4a2d328f
IZ
1379 /* \N{latin small letter a} is a named character */
1380 case 'N':
423cee85
JH
1381 ++s;
1382 if (*s == '{') {
1383 char* e = strchr(s, '}');
1384 HV *hv;
1385 SV **svp;
1386 SV *res, *cv;
1387 STRLEN len;
1388 char *str;
1389 char *why = Nullch;
1390
1391 if (!e) {
5777a3f7 1392 yyerror("Missing right brace on \\N{}");
423cee85
JH
1393 e = s - 1;
1394 goto cont_scan;
1395 }
1396 res = newSVpvn(s + 1, e - s - 1);
1397 res = new_constant( Nullch, 0, "charnames",
5777a3f7 1398 res, Nullsv, "\\N{...}" );
423cee85
JH
1399 str = SvPV(res,len);
1400 if (len > e - s + 4) {
1401 char *odest = SvPVX(sv);
1402
1403 SvGROW(sv, (SvCUR(sv) + len - (e - s + 4)));
1404 d = SvPVX(sv) + (d - odest);
1405 }
1406 Copy(str, d, len, char);
1407 d += len;
1408 SvREFCNT_dec(res);
1409 cont_scan:
1410 s = e + 1;
1411 }
1412 else
5777a3f7 1413 yyerror("Missing braces on \\N{}");
423cee85
JH
1414 continue;
1415
02aa26ce 1416 /* \c is a control character */
79072805
LW
1417 case 'c':
1418 s++;
9d116dd7
JH
1419#ifdef EBCDIC
1420 *d = *s++;
1421 if (isLOWER(*d))
1422 *d = toUPPER(*d);
1423 *d++ = toCTRL(*d);
1424#else
bbce6d69 1425 len = *s++;
1426 *d++ = toCTRL(len);
9d116dd7 1427#endif
79072805 1428 continue;
02aa26ce
NT
1429
1430 /* printf-style backslashes, formfeeds, newlines, etc */
79072805
LW
1431 case 'b':
1432 *d++ = '\b';
1433 break;
1434 case 'n':
1435 *d++ = '\n';
1436 break;
1437 case 'r':
1438 *d++ = '\r';
1439 break;
1440 case 'f':
1441 *d++ = '\f';
1442 break;
1443 case 't':
1444 *d++ = '\t';
1445 break;
34a3fe2a
PP
1446#ifdef EBCDIC
1447 case 'e':
1448 *d++ = '\047'; /* CP 1047 */
1449 break;
1450 case 'a':
1451 *d++ = '\057'; /* CP 1047 */
1452 break;
1453#else
79072805
LW
1454 case 'e':
1455 *d++ = '\033';
1456 break;
1457 case 'a':
1458 *d++ = '\007';
1459 break;
34a3fe2a 1460#endif
02aa26ce
NT
1461 } /* end switch */
1462
79072805
LW
1463 s++;
1464 continue;
02aa26ce
NT
1465 } /* end if (backslash) */
1466
79072805 1467 *d++ = *s++;
02aa26ce
NT
1468 } /* while loop to process each character */
1469
1470 /* terminate the string and set up the sv */
79072805 1471 *d = '\0';
463ee0b2 1472 SvCUR_set(sv, d - SvPVX(sv));
79072805
LW
1473 SvPOK_on(sv);
1474
02aa26ce 1475 /* shrink the sv if we allocated more than we used */
79072805
LW
1476 if (SvCUR(sv) + 5 < SvLEN(sv)) {
1477 SvLEN_set(sv, SvCUR(sv) + 1);
463ee0b2 1478 Renew(SvPVX(sv), SvLEN(sv), char);
79072805 1479 }
02aa26ce 1480
9b599b2a 1481 /* return the substring (via yylval) only if we parsed anything */
3280af22
NIS
1482 if (s > PL_bufptr) {
1483 if ( PL_hints & ( PL_lex_inpat ? HINT_NEW_RE : HINT_NEW_STRING ) )
1484 sv = new_constant(start, s - start, (PL_lex_inpat ? "qr" : "q"),
b3ac6de7 1485 sv, Nullsv,
3280af22 1486 ( PL_lex_inwhat == OP_TRANS
b3ac6de7 1487 ? "tr"
3280af22 1488 : ( (PL_lex_inwhat == OP_SUBST && !PL_lex_inpat)
b3ac6de7
IZ
1489 ? "s"
1490 : "qq")));
79072805 1491 yylval.opval = (OP*)newSVOP(OP_CONST, 0, sv);
b3ac6de7 1492 } else
8990e307 1493 SvREFCNT_dec(sv);
79072805
LW
1494 return s;
1495}
1496
ffb4593c
NT
1497/* S_intuit_more
1498 * Returns TRUE if there's more to the expression (e.g., a subscript),
1499 * FALSE otherwise.
ffb4593c
NT
1500 *
1501 * It deals with "$foo[3]" and /$foo[3]/ and /$foo[0123456789$]+/
1502 *
1503 * ->[ and ->{ return TRUE
1504 * { and [ outside a pattern are always subscripts, so return TRUE
1505 * if we're outside a pattern and it's not { or [, then return FALSE
1506 * if we're in a pattern and the first char is a {
1507 * {4,5} (any digits around the comma) returns FALSE
1508 * if we're in a pattern and the first char is a [
1509 * [] returns FALSE
1510 * [SOMETHING] has a funky algorithm to decide whether it's a
1511 * character class or not. It has to deal with things like
1512 * /$foo[-3]/ and /$foo[$bar]/ as well as /$foo[$\d]+/
1513 * anything else returns TRUE
1514 */
1515
9cbb5ea2
GS
1516/* This is the one truly awful dwimmer necessary to conflate C and sed. */
1517
76e3520e 1518STATIC int
cea2e8a9 1519S_intuit_more(pTHX_ register char *s)
79072805 1520{
3280af22 1521 if (PL_lex_brackets)
79072805
LW
1522 return TRUE;
1523 if (*s == '-' && s[1] == '>' && (s[2] == '[' || s[2] == '{'))
1524 return TRUE;
1525 if (*s != '{' && *s != '[')
1526 return FALSE;
3280af22 1527 if (!PL_lex_inpat)
79072805
LW
1528 return TRUE;
1529
1530 /* In a pattern, so maybe we have {n,m}. */
1531 if (*s == '{') {
1532 s++;
1533 if (!isDIGIT(*s))
1534 return TRUE;
1535 while (isDIGIT(*s))
1536 s++;
1537 if (*s == ',')
1538 s++;
1539 while (isDIGIT(*s))
1540 s++;
1541 if (*s == '}')
1542 return FALSE;
1543 return TRUE;
1544
1545 }
1546
1547 /* On the other hand, maybe we have a character class */
1548
1549 s++;
1550 if (*s == ']' || *s == '^')
1551 return FALSE;
1552 else {
ffb4593c 1553 /* this is terrifying, and it works */
79072805
LW
1554 int weight = 2; /* let's weigh the evidence */
1555 char seen[256];
f27ffc4a 1556 unsigned char un_char = 255, last_un_char;
93a17b20 1557 char *send = strchr(s,']');
3280af22 1558 char tmpbuf[sizeof PL_tokenbuf * 4];
79072805
LW
1559
1560 if (!send) /* has to be an expression */
1561 return TRUE;
1562
1563 Zero(seen,256,char);
1564 if (*s == '$')
1565 weight -= 3;
1566 else if (isDIGIT(*s)) {
1567 if (s[1] != ']') {
1568 if (isDIGIT(s[1]) && s[2] == ']')
1569 weight -= 10;
1570 }
1571 else
1572 weight -= 100;
1573 }
1574 for (; s < send; s++) {
1575 last_un_char = un_char;
1576 un_char = (unsigned char)*s;
1577 switch (*s) {
1578 case '@':
1579 case '&':
1580 case '$':
1581 weight -= seen[un_char] * 10;
834a4ddd 1582 if (isALNUM_lazy(s+1)) {
8903cb82 1583 scan_ident(s, send, tmpbuf, sizeof tmpbuf, FALSE);
a0d0e21e 1584 if ((int)strlen(tmpbuf) > 1 && gv_fetchpv(tmpbuf,FALSE, SVt_PV))
79072805
LW
1585 weight -= 100;
1586 else
1587 weight -= 10;
1588 }
1589 else if (*s == '$' && s[1] &&
93a17b20
LW
1590 strchr("[#!%*<>()-=",s[1])) {
1591 if (/*{*/ strchr("])} =",s[2]))
79072805
LW
1592 weight -= 10;
1593 else
1594 weight -= 1;
1595 }
1596 break;
1597 case '\\':
1598 un_char = 254;
1599 if (s[1]) {
93a17b20 1600 if (strchr("wds]",s[1]))
79072805
LW
1601 weight += 100;
1602 else if (seen['\''] || seen['"'])
1603 weight += 1;
93a17b20 1604 else if (strchr("rnftbxcav",s[1]))
79072805
LW
1605 weight += 40;
1606 else if (isDIGIT(s[1])) {
1607 weight += 40;
1608 while (s[1] && isDIGIT(s[1]))
1609 s++;
1610 }
1611 }
1612 else
1613 weight += 100;
1614 break;
1615 case '-':
1616 if (s[1] == '\\')
1617 weight += 50;
93a17b20 1618 if (strchr("aA01! ",last_un_char))
79072805 1619 weight += 30;
93a17b20 1620 if (strchr("zZ79~",s[1]))
79072805 1621 weight += 30;
f27ffc4a
GS
1622 if (last_un_char == 255 && (isDIGIT(s[1]) || s[1] == '$'))
1623 weight -= 5; /* cope with negative subscript */
79072805
LW
1624 break;
1625 default:
93a17b20 1626 if (!isALNUM(last_un_char) && !strchr("$@&",last_un_char) &&
79072805
LW
1627 isALPHA(*s) && s[1] && isALPHA(s[1])) {
1628 char *d = tmpbuf;
1629 while (isALPHA(*s))
1630 *d++ = *s++;
1631 *d = '\0';
1632 if (keyword(tmpbuf, d - tmpbuf))
1633 weight -= 150;
1634 }
1635 if (un_char == last_un_char + 1)
1636 weight += 5;
1637 weight -= seen[un_char];
1638 break;
1639 }
1640 seen[un_char]++;
1641 }
1642 if (weight >= 0) /* probably a character class */
1643 return FALSE;
1644 }
1645
1646 return TRUE;
1647}
ffed7fef 1648
ffb4593c
NT
1649/*
1650 * S_intuit_method
1651 *
1652 * Does all the checking to disambiguate
1653 * foo bar
1654 * between foo(bar) and bar->foo. Returns 0 if not a method, otherwise
1655 * FUNCMETH (bar->foo(args)) or METHOD (bar->foo args).
1656 *
1657 * First argument is the stuff after the first token, e.g. "bar".
1658 *
1659 * Not a method if bar is a filehandle.
1660 * Not a method if foo is a subroutine prototyped to take a filehandle.
1661 * Not a method if it's really "Foo $bar"
1662 * Method if it's "foo $bar"
1663 * Not a method if it's really "print foo $bar"
1664 * Method if it's really "foo package::" (interpreted as package->foo)
1665 * Not a method if bar is known to be a subroutne ("sub bar; foo bar")
1666 * Not a method if bar is a filehandle or package, but is quotd with
1667 * =>
1668 */
1669
76e3520e 1670STATIC int
cea2e8a9 1671S_intuit_method(pTHX_ char *start, GV *gv)
a0d0e21e
LW
1672{
1673 char *s = start + (*start == '$');
3280af22 1674 char tmpbuf[sizeof PL_tokenbuf];
a0d0e21e
LW
1675 STRLEN len;
1676 GV* indirgv;
1677
1678 if (gv) {
b6c543e3 1679 CV *cv;
a0d0e21e
LW
1680 if (GvIO(gv))
1681 return 0;
b6c543e3
IZ
1682 if ((cv = GvCVu(gv))) {
1683 char *proto = SvPVX(cv);
1684 if (proto) {
1685 if (*proto == ';')
1686 proto++;
1687 if (*proto == '*')
1688 return 0;
1689 }
1690 } else
a0d0e21e
LW
1691 gv = 0;
1692 }
8903cb82 1693 s = scan_word(s, tmpbuf, sizeof tmpbuf, TRUE, &len);
ffb4593c
NT
1694 /* start is the beginning of the possible filehandle/object,
1695 * and s is the end of it
1696 * tmpbuf is a copy of it
1697 */
1698
a0d0e21e 1699 if (*start == '$') {
3280af22 1700 if (gv || PL_last_lop_op == OP_PRINT || isUPPER(*PL_tokenbuf))
a0d0e21e
LW
1701 return 0;
1702 s = skipspace(s);
3280af22
NIS
1703 PL_bufptr = start;
1704 PL_expect = XREF;
a0d0e21e
LW
1705 return *s == '(' ? FUNCMETH : METHOD;
1706 }
1707 if (!keyword(tmpbuf, len)) {
c3e0f903
GS
1708 if (len > 2 && tmpbuf[len - 2] == ':' && tmpbuf[len - 1] == ':') {
1709 len -= 2;
1710 tmpbuf[len] = '\0';
1711 goto bare_package;
1712 }
1713 indirgv = gv_fetchpv(tmpbuf, FALSE, SVt_PVCV);
8ebc5c01 1714 if (indirgv && GvCVu(indirgv))
a0d0e21e
LW
1715 return 0;
1716 /* filehandle or package name makes it a method */
89bfa8cd 1717 if (!gv || GvIO(indirgv) || gv_stashpvn(tmpbuf, len, FALSE)) {
a0d0e21e 1718 s = skipspace(s);
3280af22 1719 if ((PL_bufend - s) >= 2 && *s == '=' && *(s+1) == '>')
55497cff 1720 return 0; /* no assumptions -- "=>" quotes bearword */
c3e0f903 1721 bare_package:
3280af22 1722 PL_nextval[PL_nexttoke].opval = (OP*)newSVOP(OP_CONST, 0,
79cb57f6 1723 newSVpvn(tmpbuf,len));
3280af22
NIS
1724 PL_nextval[PL_nexttoke].opval->op_private = OPpCONST_BARE;
1725 PL_expect = XTERM;
a0d0e21e 1726 force_next(WORD);
3280af22 1727 PL_bufptr = s;
a0d0e21e
LW
1728 return *s == '(' ? FUNCMETH : METHOD;
1729 }
1730 }
1731 return 0;
1732}
1733
ffb4593c
NT
1734/*
1735 * S_incl_perldb
1736 * Return a string of Perl code to load the debugger. If PERL5DB
1737 * is set, it will return the contents of that, otherwise a
1738 * compile-time require of perl5db.pl.
1739 */
1740
76e3520e 1741STATIC char*
cea2e8a9 1742S_incl_perldb(pTHX)
a0d0e21e 1743{
3280af22 1744 if (PL_perldb) {
76e3520e 1745 char *pdb = PerlEnv_getenv("PERL5DB");
a0d0e21e
LW
1746
1747 if (pdb)
1748 return pdb;
61bb5906 1749 SETERRNO(0,SS$_NORMAL);
a0d0e21e
LW
1750 return "BEGIN { require 'perl5db.pl' }";
1751 }
1752 return "";
1753}
1754
1755
16d20bd9
AD
1756/* Encoded script support. filter_add() effectively inserts a
1757 * 'pre-processing' function into the current source input stream.
1758 * Note that the filter function only applies to the current source file
1759 * (e.g., it will not affect files 'require'd or 'use'd by this one).
1760 *
1761 * The datasv parameter (which may be NULL) can be used to pass
1762 * private data to this instance of the filter. The filter function
1763 * can recover the SV using the FILTER_DATA macro and use it to
1764 * store private buffers and state information.
1765 *
1766 * The supplied datasv parameter is upgraded to a PVIO type
1767 * and the IoDIRP field is used to store the function pointer.
1768 * Note that IoTOP_NAME, IoFMT_NAME, IoBOTTOM_NAME, if set for
1769 * private use must be set using malloc'd pointers.
1770 */
16d20bd9
AD
1771
1772SV *
864dbfa3 1773Perl_filter_add(pTHX_ filter_t funcp, SV *datasv)
16d20bd9
AD
1774{
1775 if (!funcp){ /* temporary handy debugging hack to be deleted */
80252599 1776 PL_filter_debug = atoi((char*)datasv);
16d20bd9
AD
1777 return NULL;
1778 }
3280af22
NIS
1779 if (!PL_rsfp_filters)
1780 PL_rsfp_filters = newAV();
16d20bd9 1781 if (!datasv)
8c52afec 1782 datasv = NEWSV(255,0);
16d20bd9 1783 if (!SvUPGRADE(datasv, SVt_PVIO))
cea2e8a9 1784 Perl_die(aTHX_ "Can't upgrade filter_add data to SVt_PVIO");
16d20bd9 1785 IoDIRP(datasv) = (DIR*)funcp; /* stash funcp into spare field */
0453d815 1786#ifdef DEBUGGING
80252599 1787 if (PL_filter_debug) {
2d8e6c8d 1788 STRLEN n_a;
cea2e8a9 1789 Perl_warn(aTHX_ "filter_add func %p (%s)", funcp, SvPV(datasv, n_a));
2d8e6c8d 1790 }
0453d815 1791#endif /* DEBUGGING */
3280af22
NIS
1792 av_unshift(PL_rsfp_filters, 1);
1793 av_store(PL_rsfp_filters, 0, datasv) ;
16d20bd9
AD
1794 return(datasv);
1795}
1796
1797
1798/* Delete most recently added instance of this filter function. */
a0d0e21e 1799void
864dbfa3 1800Perl_filter_del(pTHX_ filter_t funcp)
16d20bd9 1801{
0453d815 1802#ifdef DEBUGGING
80252599 1803 if (PL_filter_debug)
cea2e8a9 1804 Perl_warn(aTHX_ "filter_del func %p", funcp);
0453d815 1805#endif /* DEBUGGING */
3280af22 1806 if (!PL_rsfp_filters || AvFILLp(PL_rsfp_filters)<0)
16d20bd9
AD
1807 return;
1808 /* if filter is on top of stack (usual case) just pop it off */
677ca527 1809 if (IoDIRP(FILTER_DATA(AvFILLp(PL_rsfp_filters))) == (DIR*)funcp){
a6c40364 1810 IoDIRP(FILTER_DATA(AvFILLp(PL_rsfp_filters))) = NULL;
3280af22 1811 sv_free(av_pop(PL_rsfp_filters));
e50aee73 1812
16d20bd9
AD
1813 return;
1814 }
1815 /* we need to search for the correct entry and clear it */
cea2e8a9 1816 Perl_die(aTHX_ "filter_del can only delete in reverse order (currently)");
16d20bd9
AD
1817}
1818
1819
1820/* Invoke the n'th filter function for the current rsfp. */
1821I32
864dbfa3 1822Perl_filter_read(pTHX_ int idx, SV *buf_sv, int maxlen)
8ac85365
NIS
1823
1824
1825 /* 0 = read one text line */
a0d0e21e 1826{
16d20bd9
AD
1827 filter_t funcp;
1828 SV *datasv = NULL;
e50aee73 1829
3280af22 1830 if (!PL_rsfp_filters)
16d20bd9 1831 return -1;
3280af22 1832 if (idx > AvFILLp(PL_rsfp_filters)){ /* Any more filters? */
16d20bd9
AD
1833 /* Provide a default input filter to make life easy. */
1834 /* Note that we append to the line. This is handy. */
0453d815 1835#ifdef DEBUGGING
80252599 1836 if (PL_filter_debug)
cea2e8a9 1837 Perl_warn(aTHX_ "filter_read %d: from rsfp\n", idx);
0453d815 1838#endif /* DEBUGGING */
16d20bd9
AD
1839 if (maxlen) {
1840 /* Want a block */
1841 int len ;
1842 int old_len = SvCUR(buf_sv) ;
1843
1844 /* ensure buf_sv is large enough */
1845 SvGROW(buf_sv, old_len + maxlen) ;
3280af22
NIS
1846 if ((len = PerlIO_read(PL_rsfp, SvPVX(buf_sv) + old_len, maxlen)) <= 0){
1847 if (PerlIO_error(PL_rsfp))
37120919
AD
1848 return -1; /* error */
1849 else
1850 return 0 ; /* end of file */
1851 }
16d20bd9
AD
1852 SvCUR_set(buf_sv, old_len + len) ;
1853 } else {
1854 /* Want a line */
3280af22
NIS
1855 if (sv_gets(buf_sv, PL_rsfp, SvCUR(buf_sv)) == NULL) {
1856 if (PerlIO_error(PL_rsfp))
37120919
AD
1857 return -1; /* error */
1858 else
1859 return 0 ; /* end of file */
1860 }
16d20bd9
AD
1861 }
1862 return SvCUR(buf_sv);
1863 }
1864 /* Skip this filter slot if filter has been deleted */
3280af22 1865 if ( (datasv = FILTER_DATA(idx)) == &PL_sv_undef){
0453d815 1866#ifdef DEBUGGING
80252599 1867 if (PL_filter_debug)
cea2e8a9 1868 Perl_warn(aTHX_ "filter_read %d: skipped (filter deleted)\n", idx);
0453d815 1869#endif /* DEBUGGING */
16d20bd9
AD
1870 return FILTER_READ(idx+1, buf_sv, maxlen); /* recurse */
1871 }
1872 /* Get function pointer hidden within datasv */
1873 funcp = (filter_t)IoDIRP(datasv);
0453d815 1874#ifdef DEBUGGING
80252599 1875 if (PL_filter_debug) {
2d8e6c8d 1876 STRLEN n_a;
cea2e8a9 1877 Perl_warn(aTHX_ "filter_read %d: via function %p (%s)\n",
2d8e6c8d
GS
1878 idx, funcp, SvPV(datasv,n_a));
1879 }
0453d815 1880#endif /* DEBUGGING */
16d20bd9
AD
1881 /* Call function. The function is expected to */
1882 /* call "FILTER_READ(idx+1, buf_sv)" first. */
37120919 1883 /* Return: <0:error, =0:eof, >0:not eof */
0cb96387 1884 return (*funcp)(aTHXo_ idx, buf_sv, maxlen);
16d20bd9
AD
1885}
1886
76e3520e 1887STATIC char *
cea2e8a9 1888S_filter_gets(pTHX_ register SV *sv, register PerlIO *fp, STRLEN append)
16d20bd9 1889{
a868473f 1890#ifdef WIN32FILTER
3280af22 1891 if (!PL_rsfp_filters) {
a868473f
NIS
1892 filter_add(win32_textfilter,NULL);
1893 }
1894#endif
3280af22 1895 if (PL_rsfp_filters) {
16d20bd9 1896
55497cff 1897 if (!append)
1898 SvCUR_set(sv, 0); /* start with empty line */
16d20bd9
AD
1899 if (FILTER_READ(0, sv, 0) > 0)
1900 return ( SvPVX(sv) ) ;
1901 else
1902 return Nullch ;
1903 }
9d116dd7 1904 else
fd049845 1905 return (sv_gets(sv, fp, append));
a0d0e21e
LW
1906}
1907
1908
748a9306
LW
#ifdef DEBUGGING
    /* Printable names for debugging output.
     * NOTE(review): presumably indexed by the PL_expect value
     * (XOPERATOR, XTERM, XREF, ...) -- confirm the order against the
     * declaration of those constants. */
    static char* exp_name[] = {
	"OPERATOR",
	"TERM",
	"REF",
	"STATE",
	"BLOCK",
	"ATTRBLOCK",
	"ATTRTERM",
	"TERMBLOCK"
    };
#endif
463ee0b2 1915
02aa26ce
NT
1916/*
1917 yylex
1918
1919 Works out what to call the token just pulled out of the input
1920 stream. The yacc parser takes care of taking the ops we return and
1921 stitching them into a tree.
1922
1923 Returns:
1924 PRIVATEREF
1925
1926 Structure:
1927 if read an identifier
1928 if we're in a my declaration
1929 croak if they tried to say my($foo::bar)
1930 build the ops for a my() declaration
1931 if it's an access to a my() variable
1932 are we in a sort block?
1933 croak if my($a); $a <=> $b
1934 build ops for access to a my() variable
1935 if in a dq string, and they've said @foo and we can't find @foo
1936 croak
1937 build ops for a bareword
1938 if we already built the token before, use it.
1939*/
1940
864dbfa3
GS
1941int
1942#ifdef USE_PURE_BISON
cea2e8a9 1943Perl_yylex(pTHX_ YYSTYPE *lvalp, int *lcharp)
864dbfa3 1944#else
cea2e8a9 1945Perl_yylex(pTHX)
864dbfa3 1946#endif
378cc40b 1947{
11343788 1948 dTHR;
79072805 1949 register char *s;
378cc40b 1950 register char *d;
79072805 1951 register I32 tmp;
463ee0b2 1952 STRLEN len;
161b471a
NIS
1953 GV *gv = Nullgv;
1954 GV **gvp = 0;
a687059c 1955
a1a0e61e
TD
1956#ifdef USE_PURE_BISON
1957 yylval_pointer = lvalp;
1958 yychar_pointer = lcharp;
1959#endif
1960
02aa26ce 1961 /* check if there's an identifier for us to look at */
3280af22 1962 if (PL_pending_ident) {
02aa26ce 1963 /* pit holds the identifier we read and pending_ident is reset */
3280af22
NIS
1964 char pit = PL_pending_ident;
1965 PL_pending_ident = 0;
bbce6d69 1966
02aa26ce
NT
1967 /* if we're in a my(), we can't allow dynamics here.
1968 $foo'bar has already been turned into $foo::bar, so
1969 just check for colons.
1970
1971 if it's a legal name, the OP is a PADANY.
1972 */
3280af22 1973 if (PL_in_my) {
77ca0c92
LW
1974 if (PL_in_my == KEY_our) { /* "our" is merely analogous to "my" */
1975 tmp = pad_allocmy(PL_tokenbuf);
1976 }
1977 else {
1978 if (strchr(PL_tokenbuf,':'))
1979 yyerror(Perl_form(aTHX_ PL_no_myglob,PL_tokenbuf));
02aa26ce 1980
77ca0c92
LW
1981 yylval.opval = newOP(OP_PADANY, 0);
1982 yylval.opval->op_targ = pad_allocmy(PL_tokenbuf);
1983 return PRIVATEREF;
1984 }
bbce6d69 1985 }
1986
02aa26ce
NT
1987 /*
1988 build the ops for accesses to a my() variable.
1989
1990 Deny my($a) or my($b) in a sort block, *if* $a or $b is
1991 then used in a comparison. This catches most, but not
1992 all cases. For instance, it catches
1993 sort { my($a); $a <=> $b }
1994 but not
1995 sort { my($a); $a < $b ? -1 : $a == $b ? 0 : 1; }
1996 (although why you'd do that is anyone's guess).
1997 */
1998
3280af22 1999 if (!strchr(PL_tokenbuf,':')) {
a863c7d1 2000#ifdef USE_THREADS
54b9620d 2001 /* Check for single character per-thread SVs */
3280af22
NIS
2002 if (PL_tokenbuf[0] == '$' && PL_tokenbuf[2] == '\0'
2003 && !isALPHA(PL_tokenbuf[1]) /* Rule out obvious non-threadsvs */
2004 && (tmp = find_threadsv(&PL_tokenbuf[1])) != NOT_IN_PAD)
554b3eca 2005 {
2faa37cc 2006 yylval.opval = newOP(OP_THREADSV, 0);
a863c7d1
MB
2007 yylval.opval->op_targ = tmp;
2008 return PRIVATEREF;
2009 }
2010#endif /* USE_THREADS */
3280af22 2011 if ((tmp = pad_findmy(PL_tokenbuf)) != NOT_IN_PAD) {
77ca0c92
LW
2012 /* might be an "our" variable */
2013 if (SvFLAGS(AvARRAY(PL_comppad_name)[tmp]) & SVpad_OUR) {
2014 /* build ops for a bareword */
2015 yylval.opval = (OP*)newSVOP(OP_CONST, 0, newSVpv(PL_tokenbuf+1, 0));
2016 yylval.opval->op_private = OPpCONST_ENTERED;
2017 gv_fetchpv(PL_tokenbuf+1,
2018 (PL_in_eval
2019 ? (GV_ADDMULTI | GV_ADDINEVAL | GV_ADDOUR)
2020 : GV_ADDOUR
2021 ),
2022 ((PL_tokenbuf[0] == '$') ? SVt_PV
2023 : (PL_tokenbuf[0] == '@') ? SVt_PVAV
2024 : SVt_PVHV));
2025 return WORD;
2026 }
2027
02aa26ce 2028 /* if it's a sort block and they're naming $a or $b */
3280af22
NIS
2029 if (PL_last_lop_op == OP_SORT &&
2030 PL_tokenbuf[0] == '$' &&
2031 (PL_tokenbuf[1] == 'a' || PL_tokenbuf[1] == 'b')
2032 && !PL_tokenbuf[2])
bbce6d69 2033 {
3280af22
NIS
2034 for (d = PL_in_eval ? PL_oldoldbufptr : PL_linestart;
2035 d < PL_bufend && *d != '\n';
a863c7d1
MB
2036 d++)
2037 {
2038 if (strnEQ(d,"<=>",3) || strnEQ(d,"cmp",3)) {
cea2e8a9 2039 Perl_croak(aTHX_ "Can't use \"my %s\" in sort comparison",
3280af22 2040 PL_tokenbuf);
a863c7d1 2041 }
bbce6d69 2042 }
2043 }
bbce6d69 2044
a863c7d1
MB
2045 yylval.opval = newOP(OP_PADANY, 0);
2046 yylval.opval->op_targ = tmp;
2047 return PRIVATEREF;
2048 }
bbce6d69 2049 }
2050
02aa26ce
NT
2051 /*
2052 Whine if they've said @foo in a doublequoted string,
2053 and @foo isn't a variable we can find in the symbol
2054 table.
2055 */
3280af22
NIS
2056 if (pit == '@' && PL_lex_state != LEX_NORMAL && !PL_lex_brackets) {
2057 GV *gv = gv_fetchpv(PL_tokenbuf+1, FALSE, SVt_PVAV);
2058 if (!gv || ((PL_tokenbuf[0] == '@') ? !GvAV(gv) : !GvHV(gv)))
cea2e8a9 2059 yyerror(Perl_form(aTHX_ "In string, %s now must be written as \\%s",
3280af22 2060 PL_tokenbuf, PL_tokenbuf));
bbce6d69 2061 }
2062
02aa26ce 2063 /* build ops for a bareword */
3280af22 2064 yylval.opval = (OP*)newSVOP(OP_CONST, 0, newSVpv(PL_tokenbuf+1, 0));
bbce6d69 2065 yylval.opval->op_private = OPpCONST_ENTERED;
3280af22
NIS
2066 gv_fetchpv(PL_tokenbuf+1, PL_in_eval ? (GV_ADDMULTI | GV_ADDINEVAL) : TRUE,
2067 ((PL_tokenbuf[0] == '$') ? SVt_PV
2068 : (PL_tokenbuf[0] == '@') ? SVt_PVAV
bbce6d69 2069 : SVt_PVHV));
2070 return WORD;
2071 }
2072
02aa26ce
NT
2073 /* no identifier pending identification */
2074
3280af22 2075 switch (PL_lex_state) {
79072805
LW
2076#ifdef COMMENTARY
2077 case LEX_NORMAL: /* Some compilers will produce faster */
2078 case LEX_INTERPNORMAL: /* code if we comment these out. */
2079 break;
2080#endif
2081
09bef843 2082 /* when we've already built the next token, just pull it out of the queue */
79072805 2083 case LEX_KNOWNEXT:
3280af22
NIS
2084 PL_nexttoke--;
2085 yylval = PL_nextval[PL_nexttoke];
2086 if (!PL_nexttoke) {
2087 PL_lex_state = PL_lex_defer;
2088 PL_expect = PL_lex_expect;
2089 PL_lex_defer = LEX_NORMAL;
463ee0b2 2090 }
3280af22 2091 return(PL_nexttype[PL_nexttoke]);
79072805 2092
02aa26ce 2093 /* interpolated case modifiers like \L \U, including \Q and \E.
3280af22 2094 when we get here, PL_bufptr is at the \
02aa26ce 2095 */
79072805
LW
2096 case LEX_INTERPCASEMOD:
2097#ifdef DEBUGGING
3280af22 2098 if (PL_bufptr != PL_bufend && *PL_bufptr != '\\')
cea2e8a9 2099 Perl_croak(aTHX_ "panic: INTERPCASEMOD");
79072805 2100#endif
02aa26ce 2101 /* handle \E or end of string */
3280af22 2102 if (PL_bufptr == PL_bufend || PL_bufptr[1] == 'E') {
a0d0e21e 2103 char oldmod;
02aa26ce
NT
2104
2105 /* if at a \E */
3280af22
NIS
2106 if (PL_lex_casemods) {
2107 oldmod = PL_lex_casestack[--PL_lex_casemods];
2108 PL_lex_casestack[PL_lex_casemods] = '\0';
02aa26ce 2109
3280af22
NIS
2110 if (PL_bufptr != PL_bufend && strchr("LUQ", oldmod)) {
2111 PL_bufptr += 2;
2112 PL_lex_state = LEX_INTERPCONCAT;
a0d0e21e 2113 }
79072805
LW
2114 return ')';
2115 }
3280af22
NIS
2116 if (PL_bufptr != PL_bufend)
2117 PL_bufptr += 2;
2118 PL_lex_state = LEX_INTERPCONCAT;
cea2e8a9 2119 return yylex();
79072805
LW
2120 }
2121 else {
3280af22 2122 s = PL_bufptr + 1;
79072805
LW
2123 if (strnEQ(s, "L\\u", 3) || strnEQ(s, "U\\l", 3))
2124 tmp = *s, *s = s[2], s[2] = tmp; /* misordered... */
a0d0e21e 2125 if (strchr("LU", *s) &&
3280af22 2126 (strchr(PL_lex_casestack, 'L') || strchr(PL_lex_casestack, 'U')))
a0d0e21e 2127 {
3280af22 2128 PL_lex_casestack[--PL_lex_casemods] = '\0';
a0d0e21e
LW
2129 return ')';
2130 }
3280af22
NIS
2131 if (PL_lex_casemods > 10) {
2132 char* newlb = Renew(PL_lex_casestack, PL_lex_casemods + 2, char);
2133 if (newlb != PL_lex_casestack) {
a0d0e21e 2134 SAVEFREEPV(newlb);
3280af22 2135 PL_lex_casestack = newlb;
a0d0e21e
LW
2136 }
2137 }
3280af22
NIS
2138 PL_lex_casestack[PL_lex_casemods++] = *s;
2139 PL_lex_casestack[PL_lex_casemods] = '\0';
2140 PL_lex_state = LEX_INTERPCONCAT;
2141 PL_nextval[PL_nexttoke].ival = 0;
79072805
LW
2142 force_next('(');
2143 if (*s == 'l')
3280af22 2144 PL_nextval[PL_nexttoke].ival = OP_LCFIRST;
79072805 2145 else if (*s == 'u')
3280af22 2146 PL_nextval[PL_nexttoke].ival = OP_UCFIRST;
79072805 2147 else if (*s == 'L')
3280af22 2148 PL_nextval[PL_nexttoke].ival = OP_LC;
79072805 2149 else if (*s == 'U')
3280af22 2150 PL_nextval[PL_nexttoke].ival = OP_UC;
a0d0e21e 2151 else if (*s == 'Q')
3280af22 2152 PL_nextval[PL_nexttoke].ival = OP_QUOTEMETA;
79072805 2153 else
cea2e8a9 2154 Perl_croak(aTHX_ "panic: yylex");
3280af22 2155 PL_bufptr = s + 1;
79072805 2156 force_next(FUNC);
3280af22
NIS
2157 if (PL_lex_starts) {
2158 s = PL_bufptr;
2159 PL_lex_starts = 0;
79072805
LW
2160 Aop(OP_CONCAT);
2161 }
2162 else
cea2e8a9 2163 return yylex();
79072805
LW
2164 }
2165
55497cff 2166 case LEX_INTERPPUSH:
2167 return sublex_push();
2168
79072805 2169 case LEX_INTERPSTART:
3280af22 2170 if (PL_bufptr == PL_bufend)
79072805 2171 return sublex_done();
3280af22
NIS
2172 PL_expect = XTERM;
2173 PL_lex_dojoin = (*PL_bufptr == '@');
2174 PL_lex_state = LEX_INTERPNORMAL;
2175 if (PL_lex_dojoin) {
2176 PL_nextval[PL_nexttoke].ival = 0;
79072805 2177 force_next(',');
554b3eca 2178#ifdef USE_THREADS
533c011a
NIS
2179 PL_nextval[PL_nexttoke].opval = newOP(OP_THREADSV, 0);
2180 PL_nextval[PL_nexttoke].opval->op_targ = find_threadsv("\"");
554b3eca
MB
2181 force_next(PRIVATEREF);
2182#else
a0d0e21e 2183 force_ident("\"", '$');
554b3eca 2184#endif /* USE_THREADS */
3280af22 2185 PL_nextval[PL_nexttoke].ival = 0;
79072805 2186 force_next('$');
3280af22 2187 PL_nextval[PL_nexttoke].ival = 0;
79072805 2188 force_next('(');
3280af22 2189 PL_nextval[PL_nexttoke].ival = OP_JOIN; /* emulate join($", ...) */
79072805
LW
2190 force_next(FUNC);
2191 }
3280af22
NIS
2192 if (PL_lex_starts++) {
2193 s = PL_bufptr;
79072805
LW
2194 Aop(OP_CONCAT);
2195 }
cea2e8a9 2196 return yylex();
79072805
LW
2197
2198 case LEX_INTERPENDMAYBE:
3280af22
NIS
2199 if (intuit_more(PL_bufptr)) {
2200 PL_lex_state = LEX_INTERPNORMAL; /* false alarm, more expr */
79072805
LW
2201 break;
2202 }
2203 /* FALL THROUGH */
2204
2205 case LEX_INTERPEND:
3280af22
NIS
2206 if (PL_lex_dojoin) {
2207 PL_lex_dojoin = FALSE;
2208 PL_lex_state = LEX_INTERPCONCAT;
79072805
LW
2209 return ')';
2210 }
43a16006 2211 if (PL_lex_inwhat == OP_SUBST && PL_linestr == PL_lex_repl
25da4f38 2212 && SvEVALED(PL_lex_repl))
43a16006 2213 {
e9fa98b2 2214 if (PL_bufptr != PL_bufend)
cea2e8a9 2215 Perl_croak(aTHX_ "Bad evalled substitution pattern");
e9fa98b2
HS
2216 PL_lex_repl = Nullsv;
2217 }
79072805
LW
2218 /* FALLTHROUGH */
2219 case LEX_INTERPCONCAT:
2220#ifdef DEBUGGING
3280af22 2221 if (PL_lex_brackets)
cea2e8a9 2222 Perl_croak(aTHX_ "panic: INTERPCONCAT");
79072805 2223#endif
3280af22 2224 if (PL_bufptr == PL_bufend)
79072805
LW
2225 return sublex_done();
2226
3280af22
NIS
2227 if (SvIVX(PL_linestr) == '\'') {
2228 SV *sv = newSVsv(PL_linestr);
2229 if (!PL_lex_inpat)
76e3520e 2230 sv = tokeq(sv);
3280af22 2231 else if ( PL_hints & HINT_NEW_RE )
b3ac6de7 2232 sv = new_constant(NULL, 0, "qr", sv, sv, "q");
79072805 2233 yylval.opval = (OP*)newSVOP(OP_CONST, 0, sv);
3280af22 2234 s = PL_bufend;
79072805
LW
2235 }
2236 else {
3280af22 2237 s = scan_const(PL_bufptr);
79072805 2238 if (*s == '\\')
3280af22 2239 PL_lex_state = LEX_INTERPCASEMOD;
79072805 2240 else
3280af22 2241 PL_lex_state = LEX_INTERPSTART;
79072805
LW
2242 }
2243
3280af22
NIS
2244 if (s != PL_bufptr) {
2245 PL_nextval[PL_nexttoke] = yylval;
2246 PL_expect = XTERM;
79072805 2247 force_next(THING);
3280af22 2248 if (PL_lex_starts++)
79072805
LW
2249 Aop(OP_CONCAT);
2250 else {
3280af22 2251 PL_bufptr = s;
cea2e8a9 2252 return yylex();
79072805
LW
2253 }
2254 }
2255
cea2e8a9 2256 return yylex();
a0d0e21e 2257 case LEX_FORMLINE:
3280af22
NIS
2258 PL_lex_state = LEX_NORMAL;
2259 s = scan_formline(PL_bufptr);
2260 if (!PL_lex_formbrack)
a0d0e21e
LW
2261 goto rightbracket;
2262 OPERATOR(';');
79072805
LW
2263 }
2264
3280af22
NIS
2265 s = PL_bufptr;
2266 PL_oldoldbufptr = PL_oldbufptr;
2267 PL_oldbufptr = s;
79072805 2268 DEBUG_p( {
bf49b057
GS
2269 PerlIO_printf(Perl_debug_log, "### Tokener expecting %s at %s\n",
2270 exp_name[PL_expect], s);
79072805 2271 } )
463ee0b2
LW
2272
2273 retry:
378cc40b
LW
2274 switch (*s) {
2275 default:
834a4ddd
LW
2276 if (isIDFIRST_lazy(s))
2277 goto keylookup;
cea2e8a9 2278 Perl_croak(aTHX_ "Unrecognized character \\x%02X", *s & 255);
e929a76b
LW
2279 case 4:
2280 case 26:
2281 goto fake_eof; /* emulate EOF on ^D or ^Z */
378cc40b 2282 case 0:
3280af22
NIS
2283 if (!PL_rsfp) {
2284 PL_last_uni = 0;
2285 PL_last_lop = 0;
2286 if (PL_lex_brackets)
d98d5fff 2287 yyerror("Missing right curly or square bracket");
79072805 2288 TOKEN(0);
463ee0b2 2289 }
3280af22 2290 if (s++ < PL_bufend)
a687059c 2291 goto retry; /* ignore stray nulls */
3280af22
NIS
2292 PL_last_uni = 0;
2293 PL_last_lop = 0;
2294 if (!PL_in_eval && !PL_preambled) {
2295 PL_preambled = TRUE;
2296 sv_setpv(PL_linestr,incl_perldb());
2297 if (SvCUR(PL_linestr))
2298 sv_catpv(PL_linestr,";");
2299 if (PL_preambleav){
2300 while(AvFILLp(PL_preambleav) >= 0) {
2301 SV *tmpsv = av_shift(PL_preambleav);
2302 sv_catsv(PL_linestr, tmpsv);
2303 sv_catpv(PL_linestr, ";");
91b7def8 2304 sv_free(tmpsv);
2305 }
3280af22
NIS
2306 sv_free((SV*)PL_preambleav);
2307 PL_preambleav = NULL;
91b7def8 2308 }
3280af22
NIS
2309 if (PL_minus_n || PL_minus_p) {
2310 sv_catpv(PL_linestr, "LINE: while (<>) {");
2311 if (PL_minus_l)
2312 sv_catpv(PL_linestr,"chomp;");
2313 if (PL_minus_a) {
8fd239a7
CS
2314 GV* gv = gv_fetchpv("::F", TRUE, SVt_PVAV);
2315 if (gv)
2316 GvIMPORTED_AV_on(gv);
3280af22
NIS
2317 if (PL_minus_F) {
2318 if (strchr("/'\"", *PL_splitstr)
2319 && strchr(PL_splitstr + 1, *PL_splitstr))
cea2e8a9 2320 Perl_sv_catpvf(aTHX_ PL_linestr, "@F=split(%s);", PL_splitstr);
54310121 2321 else {
2322 char delim;
2323 s = "'~#\200\1'"; /* surely one char is unused...*/
3280af22 2324 while (s[1] && strchr(PL_splitstr, *s)) s++;
54310121 2325 delim = *s;
cea2e8a9 2326 Perl_sv_catpvf(aTHX_ PL_linestr, "@F=split(%s%c",
46fc3d4c 2327 "q" + (delim == '\''), delim);
3280af22 2328 for (s = PL_splitstr; *s; s++) {
54310121 2329 if (*s == '\\')
3280af22
NIS
2330 sv_catpvn(PL_linestr, "\\", 1);
2331 sv_catpvn(PL_linestr, s, 1);
54310121 2332 }
cea2e8a9 2333 Perl_sv_catpvf(aTHX_ PL_linestr, "%c);", delim);
54310121 2334 }
2304df62
AD
2335 }
2336 else
3280af22 2337 sv_catpv(PL_linestr,"@F=split(' ');");
2304df62 2338 }
79072805 2339 }
3280af22
NIS
2340 sv_catpv(PL_linestr, "\n");
2341 PL_oldoldbufptr = PL_oldbufptr = s = PL_linestart = SvPVX(PL_linestr);
2342 PL_bufend = SvPVX(PL_linestr) + SvCUR(PL_linestr);
2343 if (PERLDB_LINE && PL_curstash != PL_debstash) {
a0d0e21e
LW
2344 SV *sv = NEWSV(85,0);
2345
2346 sv_upgrade(sv, SVt_PVMG);
3280af22
NIS
2347 sv_setsv(sv,PL_linestr);
2348 av_store(GvAV(PL_curcop->cop_filegv),(I32)PL_curcop->cop_line,sv);
a0d0e21e 2349 }
79072805 2350 goto retry;
a687059c 2351 }
e929a76b 2352 do {
3280af22 2353 if ((s = filter_gets(PL_linestr, PL_rsfp, 0)) == Nullch) {
e929a76b 2354 fake_eof:
3280af22
NIS
2355 if (PL_rsfp) {
2356 if (PL_preprocess && !PL_in_eval)
2357 (void)PerlProc_pclose(PL_rsfp);
2358 else if ((PerlIO *)PL_rsfp == PerlIO_stdin())
2359 PerlIO_clearerr(PL_rsfp);
395c3793 2360 else
3280af22
NIS
2361 (void)PerlIO_close(PL_rsfp);
2362 PL_rsfp = Nullfp;
4a9ae47a 2363 PL_doextract = FALSE;
395c3793 2364 }
3280af22
NIS
2365 if (!PL_in_eval && (PL_minus_n || PL_minus_p)) {
2366 sv_setpv(PL_linestr,PL_minus_p ? ";}continue{print" : "");
2367 sv_catpv(PL_linestr,";}");
2368 PL_oldoldbufptr = PL_oldbufptr = s = PL_linestart = SvPVX(PL_linestr);
2369 PL_bufend = SvPVX(PL_linestr) + SvCUR(PL_linestr);
2370 PL_minus_n = PL_minus_p = 0;
e929a76b
LW
2371 goto retry;
2372 }
3280af22
NIS
2373 PL_oldoldbufptr = PL_oldbufptr = s = PL_linestart = SvPVX(PL_linestr);
2374 sv_setpv(PL_linestr,"");
79072805 2375 TOKEN(';'); /* not infinite loop because rsfp is NULL now */
378cc40b 2376 }
3280af22 2377 if (PL_doextract) {
a0d0e21e 2378 if (*s == '#' && s[1] == '!' && instr(s,"perl"))
3280af22 2379 PL_doextract = FALSE;
a0d0e21e
LW
2380
2381 /* Incest with pod. */
2382 if (*s == '=' && strnEQ(s, "=cut", 4)) {
3280af22
NIS
2383 sv_setpv(PL_linestr, "");
2384 PL_oldoldbufptr = PL_oldbufptr = s = PL_linestart = SvPVX(PL_linestr);
2385 PL_bufend = SvPVX(PL_linestr) + SvCUR(PL_linestr);
2386 PL_doextract = FALSE;
a0d0e21e
LW
2387 }
2388 }
463ee0b2 2389 incline(s);
3280af22
NIS
2390 } while (PL_doextract);
2391 PL_oldoldbufptr = PL_oldbufptr = PL_bufptr = PL_linestart = s;
2392 if (PERLDB_LINE && PL_curstash != PL_debstash) {
79072805 2393 SV *sv = NEWSV(85,0);
a687059c 2394
93a17b20 2395 sv_upgrade(sv, SVt_PVMG);
3280af22
NIS
2396 sv_setsv(sv,PL_linestr);
2397 av_store(GvAV(PL_curcop->cop_filegv),(I32)PL_curcop->cop_line,sv);
a687059c 2398 }
3280af22
NIS
2399 PL_bufend = SvPVX(PL_linestr) + SvCUR(PL_linestr);
2400 if (PL_curcop->cop_line == 1) {
2401 while (s < PL_bufend && isSPACE(*s))
79072805 2402 s++;
a0d0e21e 2403 if (*s == ':' && s[1] != ':') /* for csh execing sh scripts */
79072805 2404 s++;
44a8e56a 2405 d = Nullch;
3280af22 2406 if (!PL_in_eval) {
44a8e56a 2407 if (*s == '#' && *(s+1) == '!')
2408 d = s + 2;
2409#ifdef ALTERNATE_SHEBANG
2410 else {
2411 static char as[] = ALTERNATE_SHEBANG;
2412 if (*s == as[0] && strnEQ(s, as, sizeof(as) - 1))
2413 d = s + (sizeof(as) - 1);
2414 }
2415#endif /* ALTERNATE_SHEBANG */
2416 }
2417 if (d) {
b8378b72 2418 char *ipath;
774d564b 2419 char *ipathend;
b8378b72 2420
774d564b 2421 while (isSPACE(*d))
b8378b72
CS
2422 d++;
2423 ipath = d;
774d564b 2424 while (*d && !isSPACE(*d))
2425 d++;
2426 ipathend = d;
2427
2428#ifdef ARG_ZERO_IS_SCRIPT
2429 if (ipathend > ipath) {
2430 /*
2431 * HP-UX (at least) sets argv[0] to the script name,
2432 * which makes $^X incorrect. And Digital UNIX and Linux,
2433 * at least, set argv[0] to the basename of the Perl
2434 * interpreter. So, having found "#!", we'll set it right.
2435 */
2436 SV *x = GvSV(gv_fetchpv("\030", TRUE, SVt_PV));
2437 assert(SvPOK(x) || SvGMAGICAL(x));
6b88bc9c 2438 if (sv_eq(x, GvSV(PL_curcop->cop_filegv))) {
774d564b 2439 sv_setpvn(x, ipath, ipathend - ipath);
9607fc9c 2440 SvSETMAGIC(x);
2441 }
774d564b 2442 TAINT_NOT; /* $^X is always tainted, but that's OK */
8ebc5c01 2443 }
774d564b 2444#endif /* ARG_ZERO_IS_SCRIPT */
b8378b72
CS
2445
2446 /*
2447 * Look for options.
2448 */
748a9306 2449 d = instr(s,"perl -");
84e30d1a 2450 if (!d) {
748a9306 2451 d = instr(s,"perl");
84e30d1a
GS
2452#if defined(DOSISH)
2453 /* avoid getting into infinite loops when shebang
2454 * line contains "Perl" rather than "perl" */
2455 if (!d) {
2456 for (d = ipathend-4; d >= ipath; --d) {
2457 if ((*d == 'p' || *d == 'P')
2458 && !ibcmp(d, "perl", 4))
2459 {
2460 break;
2461 }
2462 }
2463 if (d < ipath)
2464 d = Nullch;
2465 }
2466#endif
2467 }
44a8e56a 2468#ifdef ALTERNATE_SHEBANG
2469 /*
2470 * If the ALTERNATE_SHEBANG on this system starts with a
2471 * character that can be part of a Perl expression, then if
2472 * we see it but not "perl", we're probably looking at the
2473 * start of Perl code, not a request to hand off to some
2474 * other interpreter. Similarly, if "perl" is there, but
2475 * not in the first 'word' of the line, we assume the line
2476 * contains the start of the Perl program.
44a8e56a 2477 */
2478 if (d && *s != '#') {
774d564b 2479 char *c = ipath;
44a8e56a 2480 while (*c && !strchr("; \t\r\n\f\v#", *c))
2481 c++;
2482 if (c < d)
2483 d = Nullch; /* "perl" not in first word; ignore */
2484 else
2485 *s = '#'; /* Don't try to parse shebang line */
2486 }
774d564b 2487#endif /* ALTERNATE_SHEBANG */
748a9306 2488 if (!d &&
44a8e56a 2489 *s == '#' &&
774d564b 2490 ipathend > ipath &&
3280af22 2491 !PL_minus_c &&
748a9306 2492 !instr(s,"indir") &&
3280af22 2493 instr(PL_origargv[0],"perl"))
748a9306 2494 {
9f68db38 2495 char **newargv;
9f68db38 2496
774d564b 2497 *ipathend = '\0';
2498 s = ipathend + 1;
3280af22 2499 while (s < PL_bufend && isSPACE(*s))
9f68db38 2500 s++;
3280af22
NIS
2501 if (s < PL_bufend) {
2502 Newz(899,newargv,PL_origargc+3,char*);
9f68db38 2503 newargv[1] = s;
3280af22 2504 while (s < PL_bufend && !isSPACE(*s))
9f68db38
LW
2505 s++;
2506 *s = '\0';
3280af22 2507 Copy(PL_origargv+1, newargv+2, PL_origargc+1, char*);
9f68db38
LW
2508 }
2509 else
3280af22 2510 newargv = PL_origargv;
774d564b 2511 newargv[0] = ipath;
80252599 2512 PerlProc_execv(ipath, newargv);
cea2e8a9 2513 Perl_croak(aTHX_ "Can't exec %s", ipath);
9f68db38 2514 }
748a9306 2515 if (d) {
3280af22
NIS
2516 U32 oldpdb = PL_perldb;
2517 bool oldn = PL_minus_n;
2518 bool oldp = PL_minus_p;
748a9306
LW
2519
2520 while (*d && !isSPACE(*d)) d++;
89bfa8cd 2521 while (*d == ' ' || *d == '\t') d++;
748a9306
LW
2522
2523 if (*d++ == '-') {
8cc95fdb 2524 do {
2525 if (*d == 'M' || *d == 'm') {
2526 char *m = d;
2527 while (*d && !isSPACE(*d)) d++;
cea2e8a9 2528 Perl_croak(aTHX_ "Too late for \"-%.*s\" option",
8cc95fdb 2529 (int)(d - m), m);
2530 }
2531 d = moreswitches(d);
2532 } while (d);
84902520 2533 if (PERLDB_LINE && !oldpdb ||
3280af22 2534 ( PL_minus_n || PL_minus_p ) && !(oldn || oldp) )
b084f20b 2535 /* if we have already added "LINE: while (<>) {",
2536 we must not do it again */
748a9306 2537 {
3280af22
NIS
2538 sv_setpv(PL_linestr, "");
2539 PL_oldoldbufptr = PL_oldbufptr = s = PL_linestart = SvPVX(PL_linestr);
2540 PL_bufend = SvPVX(PL_linestr) + SvCUR(PL_linestr);
2541 PL_preambled = FALSE;
84902520 2542 if (PERLDB_LINE)
3280af22 2543 (void)gv_fetchfile(PL_origfilename);
748a9306
LW
2544 goto retry;
2545 }
a0d0e21e 2546 }
79072805 2547 }
9f68db38 2548 }
79072805 2549 }
3280af22
NIS
2550 if (PL_lex_formbrack && PL_lex_brackets <= PL_lex_formbrack) {
2551 PL_bufptr = s;
2552 PL_lex_state = LEX_FORMLINE;
cea2e8a9 2553 return yylex();
ae986130 2554 }
378cc40b 2555 goto retry;
4fdae800 2556 case '\r':
6a27c188 2557#ifdef PERL_STRICT_CR
cea2e8a9
GS
2558 Perl_warn(aTHX_ "Illegal character \\%03o (carriage return)", '\r');
2559 Perl_croak(aTHX_
54310121 2560 "(Maybe you didn't strip carriage returns after a network transfer?)\n");
a868473f 2561#endif
4fdae800 2562 case ' ': case '\t': case '\f': case 013:
378cc40b
LW
2563 s++;
2564 goto retry;
378cc40b 2565 case '#':
e929a76b 2566 case '\n':
3280af22
NIS
2567 if (PL_lex_state != LEX_NORMAL || (PL_in_eval && !PL_rsfp)) {
2568 d = PL_bufend;
a687059c 2569 while (s < d && *s != '\n')
378cc40b 2570 s++;
0f85fab0 2571 if (s < d)
378cc40b 2572 s++;
463ee0b2 2573 incline(s);
3280af22
NIS
2574 if (PL_lex_formbrack && PL_lex_brackets <= PL_lex_formbrack) {
2575 PL_bufptr = s;
2576 PL_lex_state = LEX_FORMLINE;
cea2e8a9 2577 return yylex();
a687059c 2578 }
378cc40b 2579 }
a687059c 2580 else {
378cc40b 2581 *s = '\0';
3280af22 2582 PL_bufend = s;
a687059c 2583 }
378cc40b
LW
2584 goto retry;
2585 case '-':
79072805 2586 if (s[1] && isALPHA(s[1]) && !isALNUM(s[2])) {
378cc40b 2587 s++;
3280af22 2588 PL_bufptr = s;
748a9306
LW
2589 tmp = *s++;
2590
3280af22 2591 while (s < PL_bufend && (*s == ' ' || *s == '\t'))
748a9306
LW
2592 s++;
2593
2594 if (strnEQ(s,"=>",2)) {
3280af22 2595 s = force_word(PL_bufptr,WORD,FALSE,FALSE,FALSE);
748a9306
LW
2596 OPERATOR('-'); /* unary minus */
2597 }
3280af22
NIS
2598 PL_last_uni = PL_oldbufptr;
2599 PL_last_lop_op = OP_FTEREAD; /* good enough */
748a9306 2600 switch (tmp) {
79072805
LW
2601 case 'r': FTST(OP_FTEREAD);
2602 case 'w': FTST(OP_FTEWRITE);
2603 case 'x': FTST(OP_FTEEXEC);
2604 case 'o': FTST(OP_FTEOWNED);
2605 case 'R': FTST(OP_FTRREAD);
2606 case 'W': FTST(OP_FTRWRITE);
2607 case 'X': FTST(OP_FTREXEC);
2608 case 'O': FTST(OP_FTROWNED);
2609 case 'e': FTST(OP_FTIS);
2610 case 'z': FTST(OP_FTZERO);
2611 case 's': FTST(OP_FTSIZE);
2612 case 'f': FTST(OP_FTFILE);
2613 case 'd': FTST(OP_FTDIR);
2614 case 'l': FTST(OP_FTLINK);
2615 case 'p': FTST(OP_FTPIPE);
2616 case 'S': FTST(OP_FTSOCK);
2617 case 'u': FTST(OP_FTSUID);
2618 case 'g': FTST(OP_FTSGID);
2619 case 'k': FTST(OP_FTSVTX);
2620 case 'b': FTST(OP_FTBLK);
2621 case 'c': FTST(OP_FTCHR);
2622 case 't': FTST(OP_FTTTY);
2623 case 'T': FTST(OP_FTTEXT);
2624 case 'B': FTST(OP_FTBINARY);
85e6fe83
LW
2625 case 'M': gv_fetchpv("\024",TRUE, SVt_PV); FTST(OP_FTMTIME);
2626 case 'A': gv_fetchpv("\024",TRUE, SVt_PV); FTST(OP_FTATIME);
2627 case 'C': gv_fetchpv("\024",TRUE, SVt_PV); FTST(OP_FTCTIME);
378cc40b 2628 default:
cea2e8a9 2629 Perl_croak(aTHX_ "Unrecognized file test: -%c", (int)tmp);
378cc40b
LW
2630 break;
2631 }
2632 }
a687059c
LW
2633 tmp = *s++;
2634 if (*s == tmp) {
2635 s++;
3280af22 2636 if (PL_expect == XOPERATOR)
79072805
LW
2637 TERM(POSTDEC);
2638 else
2639 OPERATOR(PREDEC);
2640 }
2641 else if (*s == '>') {
2642 s++;
2643 s = skipspace(s);
834a4ddd 2644 if (isIDFIRST_lazy(s)) {
a0d0e21e 2645 s = force_word(s,METHOD,FALSE,TRUE,FALSE);
463ee0b2 2646 TOKEN(ARROW);
79072805 2647 }
748a9306
LW
2648 else if (*s == '$')
2649 OPERATOR(ARROW);
463ee0b2 2650 else
748a9306 2651 TERM(ARROW);
a687059c 2652 }
3280af22 2653 if (PL_expect == XOPERATOR)
79072805
LW
2654 Aop(OP_SUBTRACT);
2655 else {
3280af22 2656 if (isSPACE(*s) || !isSPACE(*PL_bufptr))
2f3197b3 2657 check_uni();
79072805 2658 OPERATOR('-'); /* unary minus */
2f3197b3 2659 }
79072805 2660
378cc40b 2661 case '+':
a687059c
LW
2662 tmp = *s++;
2663 if (*s == tmp) {
378cc40b 2664 s++;
3280af22 2665 if (PL_expect == XOPERATOR)
79072805
LW
2666 TERM(POSTINC);
2667 else
2668 OPERATOR(PREINC);
378cc40b 2669 }
3280af22 2670 if (PL_expect == XOPERATOR)
79072805
LW
2671 Aop(OP_ADD);
2672 else {
3280af22 2673 if (isSPACE(*s) || !isSPACE(*PL_bufptr))
2f3197b3 2674 check_uni();
a687059c 2675 OPERATOR('+');
2f3197b3 2676 }
a687059c 2677
378cc40b 2678 case '*':
3280af22
NIS
2679 if (PL_expect != XOPERATOR) {
2680 s = scan_ident(s, PL_bufend, PL_tokenbuf, sizeof PL_tokenbuf, TRUE);
2681 PL_expect = XOPERATOR;
2682 force_ident(PL_tokenbuf, '*');
2683 if (!*PL_tokenbuf)
a0d0e21e 2684 PREREF('*');
79072805 2685 TERM('*');
a687059c 2686 }
79072805
LW
2687 s++;
2688 if (*s == '*') {
a687059c 2689 s++;
79072805 2690 PWop(OP_POW);
a687059c 2691 }
79072805
LW
2692 Mop(OP_MULTIPLY);
2693
378cc40b 2694 case '%':
3280af22 2695 if (PL_expect == XOPERATOR) {
bbce6d69 2696 ++s;
2697 Mop(OP_MODULO);
a687059c 2698 }
3280af22
NIS
2699 PL_tokenbuf[0] = '%';
2700 s = scan_ident(s, PL_bufend, PL_tokenbuf + 1, sizeof PL_tokenbuf - 1, TRUE);
2701 if (!PL_tokenbuf[1]) {
2702 if (s == PL_bufend)
bbce6d69 2703 yyerror("Final % should be \\% or %name");
2704 PREREF('%');
a687059c 2705 }
3280af22 2706 PL_pending_ident = '%';
bbce6d69 2707 TERM('%');
a687059c 2708
378cc40b 2709 case '^':
79072805 2710 s++;
a0d0e21e 2711 BOop(OP_BIT_XOR);
79072805 2712 case '[':
3280af22 2713 PL_lex_brackets++;
79072805 2714 /* FALL THROUGH */
378cc40b 2715 case '~':
378cc40b 2716 case ',':
378cc40b
LW
2717 tmp = *s++;
2718 OPERATOR(tmp);
a0d0e21e
LW
2719 case ':':
2720 if (s[1] == ':') {
2721 len = 0;
2722 goto just_a_word;
2723 }
2724 s++;
09bef843
SB
2725 switch (PL_expect) {
2726 OP *attrs;
2727 case XOPERATOR:
2728 if (!PL_in_my || PL_lex_state != LEX_NORMAL)
2729 break;
2730 PL_bufptr = s; /* update in case we back off */
2731 goto grabattrs;
2732 case XATTRBLOCK:
2733 PL_expect = XBLOCK;
2734 goto grabattrs;
2735 case XATTRTERM:
2736 PL_expect = XTERMBLOCK;
2737 grabattrs:
2738 s = skipspace(s);
2739 attrs = Nullop;
2740 while (isIDFIRST_lazy(s)) {
2741 d = scan_word(s, PL_tokenbuf, sizeof PL_tokenbuf, FALSE, &len);
2742 if (*d == '(') {
2743 d = scan_str(d,TRUE,TRUE);
2744 if (!d) {
2745 if (PL_lex_stuff) {
2746 SvREFCNT_dec(PL_lex_stuff);
2747 PL_lex_stuff = Nullsv;
2748 }
2749 /* MUST advance bufptr here to avoid bogus
2750 "at end of line" context messages from yyerror().
2751 */
2752 PL_bufptr = s + len;
2753 yyerror("Unterminated attribute parameter in attribute list");
2754 if (attrs)
2755 op_free(attrs);
2756 return 0; /* EOF indicator */
2757 }
2758 }
2759 if (PL_lex_stuff) {
2760 SV *sv = newSVpvn(s, len);
2761 sv_catsv(sv, PL_lex_stuff);
2762 attrs = append_elem(OP_LIST, attrs,
2763 newSVOP(OP_CONST, 0, sv));
2764 SvREFCNT_dec(PL_lex_stuff);
2765 PL_lex_stuff = Nullsv;
2766 }
2767 else {
2768 attrs = append_elem(OP_LIST, attrs,
2769 newSVOP(OP_CONST, 0,
2770 newSVpvn(s, len)));
2771 }
2772 s = skipspace(d);
2773 while (*s == ',')
2774 s = skipspace(s+1);
2775 }
2776 tmp = (PL_expect == XOPERATOR ? '=' : '{'); /*'}' for vi */
2777 if (*s != ';' && *s != tmp) {
2778 char q = ((*s == '\'') ? '"' : '\'');
2779 /* If here for an expression, and parsed no attrs, back off. */
2780 if (tmp == '=' && !attrs) {
2781 s = PL_bufptr;
2782 break;
2783 }
2784 /* MUST advance bufptr here to avoid bogus "at end of line"
2785 context messages from yyerror().
2786 */
2787 PL_bufptr = s;
2788 if (!*s)
2789 yyerror("Unterminated attribute list");
2790 else
2791 yyerror(Perl_form(aTHX_ "Invalid separator character %c%c%c in attribute list",
2792 q, *s, q));
2793 if (attrs)
2794 op_free(attrs);
2795 OPERATOR(':');
2796 }
2797 if (attrs) {
2798 PL_nextval[PL_nexttoke].opval = attrs;
2799 force_next(THING);
2800 }
2801 TOKEN(COLONATTR);
2802 }
a0d0e21e 2803 OPERATOR(':');
8990e307
LW
2804 case '(':
2805 s++;
3280af22
NIS
2806 if (PL_last_lop == PL_oldoldbufptr || PL_last_uni == PL_oldoldbufptr)
2807 PL_oldbufptr = PL_oldoldbufptr; /* allow print(STDOUT 123) */
a0d0e21e 2808 else
3280af22 2809 PL_expect = XTERM;
a0d0e21e 2810 TOKEN('(');
378cc40b 2811 case ';':
3280af22
NIS
2812 if (PL_curcop->cop_line < PL_copline)
2813 PL_copline = PL_curcop->cop_line;
378cc40b
LW
2814 tmp = *s++;
2815 OPERATOR(tmp);
2816 case ')':
378cc40b 2817 tmp = *s++;
16d20bd9
AD
2818 s = skipspace(s);
2819 if (*s == '{')
2820 PREBLOCK(tmp);
378cc40b 2821 TERM(tmp);
79072805
LW
2822 case ']':
2823 s++;
3280af22 2824 if (PL_lex_brackets <= 0)
d98d5fff 2825 yyerror("Unmatched right square bracket");
463ee0b2 2826 else
3280af22
NIS
2827 --PL_lex_brackets;
2828 if (PL_lex_state == LEX_INTERPNORMAL) {
2829 if (PL_lex_brackets == 0) {
a0d0e21e 2830 if (*s != '[' && *s != '{' && (*s != '-' || s[1] != '>'))
3280af22 2831 PL_lex_state = LEX_INTERPEND;
79072805
LW
2832 }
2833 }
4633a7c4 2834 TERM(']');
79072805
LW
2835 case '{':
2836 leftbracket:
79072805 2837 s++;
3280af22
NIS
2838 if (PL_lex_brackets > 100) {
2839 char* newlb = Renew(PL_lex_brackstack, PL_lex_brackets + 1, char);
2840 if (newlb != PL_lex_brackstack) {
8990e307 2841 SAVEFREEPV(newlb);
3280af22 2842 PL_lex_brackstack = newlb;
8990e307
LW
2843 }
2844 }
3280af22 2845 switch (PL_expect) {
a0d0e21e 2846 case XTERM:
3280af22 2847 if (PL_lex_formbrack) {
a0d0e21e
LW
2848 s--;
2849 PRETERMBLOCK(DO);
2850 }
3280af22
NIS
2851 if (PL_oldoldbufptr == PL_last_lop)
2852 PL_lex_brackstack[PL_lex_brackets++] = XTERM;
a0d0e21e 2853 else
3280af22 2854 PL_lex_brackstack[PL_lex_brackets++] = XOPERATOR;
79072805 2855 OPERATOR(HASHBRACK);
a0d0e21e 2856 case XOPERATOR:
3280af22 2857 while (s < PL_bufend && (*s == ' ' || *s == '\t'))
748a9306 2858 s++;
44a8e56a 2859 d = s;
3280af22
NIS
2860 PL_tokenbuf[0] = '\0';
2861 if (d < PL_bufend && *d == '-') {
2862 PL_tokenbuf[0] = '-';
44a8e56a 2863 d++;
3280af22 2864 while (d < PL_bufend && (*d == ' ' || *d == '\t'))
44a8e56a 2865 d++;
2866 }
834a4ddd 2867 if (d < PL_bufend && isIDFIRST_lazy(d)) {
3280af22 2868 d = scan_word(d, PL_tokenbuf + 1, sizeof PL_tokenbuf - 1,
8903cb82 2869 FALSE, &len);
3280af22 2870 while (d < PL_bufend && (*d == ' ' || *d == '\t'))
748a9306
LW
2871 d++;
2872 if (*d == '}') {
3280af22 2873 char minus = (PL_tokenbuf[0] == '-');
44a8e56a 2874 s = force_word(s + minus, WORD, FALSE, TRUE, FALSE);
2875 if (minus)
2876 force_next('-');
748a9306
LW
2877 }
2878 }
2879 /* FALL THROUGH */
09bef843 2880 case XATTRBLOCK:
748a9306 2881 case XBLOCK:
3280af22
NIS
2882 PL_lex_brackstack[PL_lex_brackets++] = XSTATE;
2883 PL_expect = XSTATE;
a0d0e21e 2884 break;
09bef843 2885 case XATTRTERM:
a0d0e21e 2886 case XTERMBLOCK:
3280af22
NIS
2887 PL_lex_brackstack[PL_lex_brackets++] = XOPERATOR;
2888 PL_expect = XSTATE;
a0d0e21e
LW
2889 break;
2890 default: {
2891 char *t;
3280af22
NIS
2892 if (PL_oldoldbufptr == PL_last_lop)
2893 PL_lex_brackstack[PL_lex_brackets++] = XTERM;
a0d0e21e 2894 else
3280af22 2895 PL_lex_brackstack[PL_lex_brackets++] = XOPERATOR;
a0d0e21e 2896 s = skipspace(s);
09ecc4b6 2897 if (*s == '}')
a0d0e21e 2898 OPERATOR(HASHBRACK);
b8a4b1be
GS
2899 /* This hack serves to disambiguate a pair of curlies
2900 * as being a block or an anon hash. Normally, expectation
2901 * determines that, but in cases where we're not in a
2902 * position to expect anything in particular (like inside
2903 * eval"") we have to resolve the ambiguity. This code
2904 * covers the case where the first term in the curlies is a
2905 * quoted string. Most other cases need to be explicitly
2906 * disambiguated by prepending a `+' before the opening
2907 * curly in order to force resolution as an anon hash.
2908 *
2909 * XXX should probably propagate the outer expectation
2910 * into eval"" to rely less on this hack, but that could
2911 * potentially break current behavior of eval"".
2912 * GSAR 97-07-21
2913 */
2914 t = s;
2915 if (*s == '\'' || *s == '"' || *s == '`') {
2916 /* common case: get past first string, handling escapes */
3280af22 2917 for (t++; t < PL_bufend && *t != *s;)
b8a4b1be
GS
2918 if (*t++ == '\\' && (*t == '\\' || *t == *s))
2919 t++;
2920 t++;
a0d0e21e 2921 }
b8a4b1be 2922 else if (*s == 'q') {
3280af22 2923 if (++t < PL_bufend
b8a4b1be 2924 && (!isALNUM(*t)
3280af22 2925 || ((*t == 'q' || *t == 'x') && ++t < PL_bufend
b8a4b1be
GS
2926 && !isALNUM(*t)))) {
2927 char *tmps;
2928 char open, close, term;
2929 I32 brackets = 1;
2930
3280af22 2931 while (t < PL_bufend && isSPACE(*t))
b8a4b1be
GS
2932 t++;
2933 term = *t;
2934 open = term;
2935 if (term && (tmps = strchr("([{< )]}> )]}>",term)))
2936 term = tmps[5];
2937 close = term;
2938 if (open == close)
3280af22
NIS
2939 for (t++; t < PL_bufend; t++) {
2940 if (*t == '\\' && t+1 < PL_bufend && open != '\\')
b8a4b1be 2941 t++;
6d07e5e9 2942 else if (*t == open)
b8a4b1be
GS
2943 break;
2944 }
2945 else
3280af22
NIS
2946 for (t++; t < PL_bufend; t++) {
2947 if (*t == '\\' && t+1 < PL_bufend)
b8a4b1be 2948 t++;
6d07e5e9 2949 else if (*t == close && --brackets <= 0)
b8a4b1be
GS
2950 break;
2951 else if (*t == open)
2952 brackets++;
2953 }
2954 }
2955 t++;
a0d0e21e 2956 }
834a4ddd
LW
2957 else if (isIDFIRST_lazy(s)) {
2958 for (t++; t < PL_bufend && isALNUM_lazy(t); t++) ;
a0d0e21e 2959 }
3280af22 2960 while (t < PL_bufend && isSPACE(*t))
a0d0e21e 2961 t++;
b8a4b1be
GS
2962 /* if comma follows first term, call it an anon hash */
2963 /* XXX it could be a comma expression with loop modifiers */
3280af22 2964 if (t < PL_bufend && ((*t == ',' && (*s == 'q' || !isLOWER(*s)))
b8a4b1be 2965 || (*t == '=' && t[1] == '>')))
a0d0e21e 2966 OPERATOR(HASHBRACK);
3280af22 2967 if (PL_expect == XREF)
4e4e412b 2968 PL_expect = XTERM;
a0d0e21e 2969 else {
3280af22
NIS
2970 PL_lex_brackstack[PL_lex_brackets-1] = XSTATE;
2971 PL_expect = XSTATE;
a0d0e21e 2972 }
8990e307 2973 }
a0d0e21e 2974 break;
463ee0b2 2975 }
3280af22 2976 yylval.ival = PL_curcop->cop_line;
79072805 2977 if (isSPACE(*s) || *s == '#')
3280af22 2978 PL_copline = NOLINE; /* invalidate current command line number */
79072805 2979 TOKEN('{');
378cc40b 2980 case '}':
79072805
LW
2981 rightbracket:
2982 s++;
3280af22 2983 if (PL_lex_brackets <= 0)
d98d5fff 2984 yyerror("Unmatched right curly bracket");
463ee0b2 2985 else
3280af22
NIS
2986 PL_expect = (expectation)PL_lex_brackstack[--PL_lex_brackets];
2987 if (PL_lex_brackets < PL_lex_formbrack)
2988 PL_lex_formbrack = 0;
2989 if (PL_lex_state == LEX_INTERPNORMAL) {
2990 if (PL_lex_brackets == 0) {
2991 if (PL_lex_fakebrack) {
2992 PL_lex_state = LEX_INTERPEND;
2993 PL_bufptr = s;
cea2e8a9 2994 return yylex(); /* ignore fake brackets */
79072805 2995 }
fa83b5b6 2996 if (*s == '-' && s[1] == '>')
3280af22 2997 PL_lex_state = LEX_INTERPENDMAYBE;
fa83b5b6 2998 else if (*s != '[' && *s != '{')
3280af22 2999 PL_lex_state = LEX_INTERPEND;
79072805
LW
3000 }
3001 }
3280af22
NIS
3002 if (PL_lex_brackets < PL_lex_fakebrack) {
3003 PL_bufptr = s;
3004 PL_lex_fakebrack = 0;
cea2e8a9 3005 return yylex(); /* ignore fake brackets */
748a9306 3006 }
79072805
LW
3007 force_next('}');
3008 TOKEN(';');
378cc40b
LW
3009 case '&':
3010 s++;
3011 tmp = *s++;
3012 if (tmp == '&')
a0d0e21e 3013 AOPERATOR(ANDAND);
378cc40b 3014 s--;
3280af22 3015 if (PL_expect == XOPERATOR) {
834a4ddd 3016 if (ckWARN(WARN_SEMICOLON) && isIDFIRST_lazy(s) && PL_bufptr == PL_linestart) {
3280af22 3017 PL_curcop->cop_line--;
cea2e8a9 3018 Perl_warner(aTHX_ WARN_SEMICOLON, PL_warn_nosemi);
3280af22 3019 PL_curcop->cop_line++;
463ee0b2 3020 }
79072805 3021 BAop(OP_BIT_AND);
463ee0b2 3022 }
79072805 3023
3280af22
NIS
3024 s = scan_ident(s - 1, PL_bufend, PL_tokenbuf, sizeof PL_tokenbuf, TRUE);
3025 if (*PL_tokenbuf) {
3026 PL_expect = XOPERATOR;
3027 force_ident(PL_tokenbuf, '&');
463ee0b2 3028 }
79072805
LW
3029 else
3030 PREREF('&');
c07a80fd 3031 yylval.ival = (OPpENTERSUB_AMPER<<8);
79072805
LW
3032 TERM('&');
3033
378cc40b
LW
3034 case '|':
3035 s++;
3036 tmp = *s++;
3037 if (tmp == '|')
a0d0e21e 3038 AOPERATOR(OROR);
378cc40b 3039 s--;
79072805 3040 BOop(OP_BIT_OR);
378cc40b
LW
3041 case '=':
3042 s++;
3043 tmp = *s++;
3044 if (tmp == '=')
79072805
LW
3045 Eop(OP_EQ);
3046 if (tmp == '>')
3047 OPERATOR(',');
378cc40b 3048 if (tmp == '~')
79072805 3049 PMop(OP_MATCH);
599cee73 3050 if (ckWARN(WARN_SYNTAX) && tmp && isSPACE(*s) && strchr("+-*/%.^&|<",tmp))
cea2e8a9 3051 Perl_warner(aTHX_ WARN_SYNTAX, "Reversed %c= operator",(int)tmp);
378cc40b 3052 s--;
3280af22
NIS
3053 if (PL_expect == XSTATE && isALPHA(tmp) &&
3054 (s == PL_linestart+1 || s[-2] == '\n') )
748a9306 3055 {
3280af22
NIS
3056 if (PL_in_eval && !PL_rsfp) {
3057 d = PL_bufend;
a5f75d66
AD
3058 while (s < d) {
3059 if (*s++ == '\n') {
3060 incline(s);
3061 if (strnEQ(s,"=cut",4)) {
3062 s = strchr(s,'\n');
3063 if (s)
3064 s++;
3065 else
3066 s = d;
3067 incline(s);
3068 goto retry;
3069 }
3070 }
3071 }
3072 goto retry;
3073 }
3280af22
NIS
3074 s = PL_bufend;
3075 PL_doextract = TRUE;
a0d0e21e
LW
3076 goto retry;
3077 }
3280af22 3078 if (PL_lex_brackets < PL_lex_formbrack) {
a0d0e21e 3079 char *t;
51882d45 3080#ifdef PERL_STRICT_CR
a0d0e21e 3081 for (t = s; *t == ' ' || *t == '\t'; t++) ;
51882d45
GS
3082#else
3083 for (t = s; *t == ' ' || *t == '\t' || *t == '\r'; t++) ;
3084#endif
a0d0e21e
LW
3085 if (*t == '\n' || *t == '#') {
3086 s--;
3280af22 3087 PL_expect = XBLOCK;
a0d0e21e
LW
3088 goto leftbracket;
3089 }
79072805 3090 }
a0d0e21e
LW
3091 yylval.ival = 0;
3092 OPERATOR(ASSIGNOP);
378cc40b
LW
3093 case '!':
3094 s++;
3095 tmp = *s++;
3096 if (tmp == '=')
79072805 3097 Eop(OP_NE);
378cc40b 3098 if (tmp == '~')
79072805 3099 PMop(OP_NOT);
378cc40b
LW
3100 s--;
3101 OPERATOR('!');
3102 case '<':
3280af22 3103 if (PL_expect != XOPERATOR) {
93a17b20 3104 if (s[1] != '<' && !strchr(s,'>'))
2f3197b3 3105 check_uni();
79072805
LW
3106 if (s[1] == '<')
3107 s = scan_heredoc(s);
3108 else
3109 s = scan_inputsymbol(s);
3110 TERM(sublex_start());
378cc40b
LW
3111 }
3112 s++;
3113 tmp = *s++;
3114 if (tmp == '<')
79072805 3115 SHop(OP_LEFT_SHIFT);
395c3793
LW
3116 if (tmp == '=') {
3117 tmp = *s++;
3118 if (tmp == '>')
79072805 3119 Eop(OP_NCMP);
395c3793 3120 s--;
79072805 3121 Rop(OP_LE);
395c3793 3122 }
378cc40b 3123 s--;
79072805 3124 Rop(OP_LT);
378cc40b
LW
3125 case '>':
3126 s++;
3127 tmp = *s++;
3128 if (tmp == '>')
79072805 3129 SHop(OP_RIGHT_SHIFT);
378cc40b 3130 if (tmp == '=')
79072805 3131 Rop(OP_GE);
378cc40b 3132 s--;
79072805 3133 Rop(OP_GT);
378cc40b
LW
3134
3135 case '$':
bbce6d69 3136 CLINE;
3137
3280af22
NIS
3138 if (PL_expect == XOPERATOR) {
3139 if (PL_lex_formbrack && PL_lex_brackets == PL_lex_formbrack) {
3140 PL_expect = XTERM;
a0d0e21e 3141 depcom();
bbce6d69 3142 return ','; /* grandfather non-comma-format format */
a0d0e21e 3143 }
8990e307 3144 }
a0d0e21e 3145
834a4ddd 3146 if (s[1] == '#' && (isIDFIRST_lazy(s+2) || strchr("{$:+-", s[2]))) {
3280af22 3147 PL_tokenbuf[0] = '@';
376b8730
SM
3148 s = scan_ident(s + 1, PL_bufend, PL_tokenbuf + 1,
3149 sizeof PL_tokenbuf - 1, FALSE);
3150 if (PL_expect == XOPERATOR)
3151 no_op("Array length", s);
3280af22 3152 if (!PL_tokenbuf[1])
a0d0e21e 3153 PREREF(DOLSHARP);
3280af22
NIS
3154 PL_expect = XOPERATOR;
3155 PL_pending_ident = '#';
463ee0b2 3156 TOKEN(DOLSHARP);
79072805 3157 }
bbce6d69 3158
3280af22 3159 PL_tokenbuf[0] = '$';
376b8730
SM
3160 s = scan_ident(s, PL_bufend, PL_tokenbuf + 1,
3161 sizeof PL_tokenbuf - 1, FALSE);
3162 if (PL_expect == XOPERATOR)
3163 no_op("Scalar", s);
3280af22
NIS
3164 if (!PL_tokenbuf[1]) {
3165 if (s == PL_bufend)
bbce6d69 3166 yyerror("Final $ should be \\$ or $name");
3167 PREREF('$');
8990e307 3168 }
a0d0e21e 3169
bbce6d69 3170 /* This kludge not intended to be bulletproof. */
3280af22 3171 if (PL_tokenbuf[1] == '[' && !PL_tokenbuf[2]) {
bbce6d69 3172 yylval.opval = newSVOP(OP_CONST, 0,
3280af22 3173 newSViv((IV)PL_compiling.cop_arybase));
bbce6d69 3174 yylval.opval->op_private = OPpCONST_ARYBASE;
3175 TERM(THING);
3176 }
3177
ff68c719 3178 d = s;
69d2bceb 3179 tmp = (I32)*s;
3280af22 3180 if (PL_lex_state == LEX_NORMAL)
ff68c719 3181 s = skipspace(s);
3182
3280af22 3183 if ((PL_expect != XREF || PL_oldoldbufptr == PL_last_lop) && intuit_more(s)) {
bbce6d69 3184 char *t;
3185 if (*s == '[') {
3280af22 3186 PL_tokenbuf[0] = '@';
599cee73 3187 if (ckWARN(WARN_SYNTAX)) {
bbce6d69 3188 for(t = s + 1;
834a4ddd 3189 isSPACE(*t) || isALNUM_lazy(t) || *t == '$';
bbce6d69 3190 t++) ;
a0d0e21e 3191 if (*t++ == ',') {
3280af22
NIS
3192 PL_bufptr = skipspace(PL_bufptr);
3193 while (t < PL_bufend && *t != ']')
bbce6d69 3194 t++;
cea2e8a9 3195 Perl_warner(aTHX_ WARN_SYNTAX,
599cee73
PM
3196 "Multidimensional syntax %.*s not supported",
3197 (t - PL_bufptr) + 1, PL_bufptr);
a0d0e21e
LW
3198 }
3199 }
bbce6d69 3200 }
3201 else if (*s == '{') {
3280af22 3202 PL_tokenbuf[0] = '%';
599cee73 3203 if (ckWARN(WARN_SYNTAX) && strEQ(PL_tokenbuf+1, "SIG") &&
bbce6d69 3204 (t = strchr(s, '}')) && (t = strchr(t, '=')))
3205 {
3280af22 3206 char tmpbuf[sizeof PL_tokenbuf];
a0d0e21e
LW
3207 STRLEN len;
3208 for (t++; isSPACE(*t); t++) ;
834a4ddd 3209 if (isIDFIRST_lazy(t)) {
8903cb82 3210 t = scan_word(t, tmpbuf, sizeof tmpbuf, TRUE, &len);
59a6d928 3211 for (; isSPACE(*t); t++) ;
864dbfa3 3212 if (*t == ';' && get_cv(tmpbuf, FALSE))
cea2e8a9 3213 Perl_warner(aTHX_ WARN_SYNTAX,
599cee73 3214 "You need to quote \"%s\"", tmpbuf);
748a9306 3215 }
93a17b20
LW
3216 }
3217 }
2f3197b3 3218 }
bbce6d69 3219
3280af22 3220 PL_expect = XOPERATOR;
69d2bceb 3221 if (PL_lex_state == LEX_NORMAL && isSPACE((char)tmp)) {
3280af22
NIS
3222 bool islop = (PL_last_lop == PL_oldoldbufptr);
3223 if (!islop || PL_last_lop_op == OP_GREPSTART)
3224 PL_expect = XOPERATOR;
bbce6d69 3225 else if (strchr("$@\"'`q", *s))
3280af22 3226 PL_expect = XTERM; /* e.g. print $fh "foo" */
834a4ddd 3227 else if (strchr("&*<%", *s) && isIDFIRST_lazy(s+1))
3280af22 3228 PL_expect = XTERM; /* e.g. print $fh &sub */
834a4ddd 3229 else if (isIDFIRST_lazy(s)) {
3280af22 3230 char tmpbuf[sizeof PL_tokenbuf];
8903cb82 3231 scan_word(s, tmpbuf, sizeof tmpbuf, TRUE, &len);
84902520
TB
3232 if (tmp = keyword(tmpbuf, len)) {
3233 /* binary operators exclude handle interpretations */
3234 switch (tmp) {
3235 case -KEY_x:
3236 case -KEY_eq:
3237 case -KEY_ne:
3238 case -KEY_gt:
3239 case -KEY_lt:
3240 case -KEY_ge:
3241 case -KEY_le:
3242 case -KEY_cmp:
3243 break;
3244 default:
3280af22 3245 PL_expect = XTERM; /* e.g. print $fh length() */
84902520
TB
3246 break;
3247 }
3248 }
68dc0745 3249 else {
3250 GV *gv = gv_fetchpv(tmpbuf, FALSE, SVt_PVCV);
3251 if (gv && GvCVu(gv))
3280af22 3252 PL_expect = XTERM; /* e.g. print $fh subr() */
93a17b20 3253 }
93a17b20 3254 }
bbce6d69 3255 else if (isDIGIT(*s))
3280af22 3256 PL_expect = XTERM; /* e.g. print $fh 3 */
bbce6d69 3257 else if (*s == '.' && isDIGIT(s[1]))
3280af22 3258 PL_expect = XTERM; /* e.g. print $fh .3 */
e0587a03 3259 else if (strchr("/?-+", *s) && !isSPACE(s[1]) && s[1] != '=')
3280af22 3260 PL_expect = XTERM; /* e.g. print $fh -1 */
e0587a03 3261 else if (*s == '<' && s[1] == '<' && !isSPACE(s[2]) && s[2] != '=')
3280af22 3262 PL_expect = XTERM; /* print $fh <<"EOF" */
bbce6d69 3263 }
3280af22 3264 PL_pending_ident = '$';
79072805 3265 TOKEN('$');
378cc40b
LW
3266
3267 case '@':
3280af22 3268 if (PL_expect == XOPERATOR)
bbce6d69 3269 no_op("Array", s);
3280af22
NIS
3270 PL_tokenbuf[0] = '@';
3271 s = scan_ident(s, PL_bufend, PL_tokenbuf + 1, sizeof PL_tokenbuf - 1, FALSE);
3272 if (!PL_tokenbuf[1]) {
3273 if (s == PL_bufend)
bbce6d69 3274 yyerror("Final @ should be \\@ or @name");
3275 PREREF('@');
3276 }
3280af22 3277 if (PL_lex_state == LEX_NORMAL)
ff68c719 3278 s = skipspace(s);
3280af22 3279 if ((PL_expect != XREF || PL_oldoldbufptr == PL_last_lop) && intuit_more(s)) {
bbce6d69 3280 if (*s == '{')
3280af22 3281 PL_tokenbuf[0] = '%';
a0d0e21e
LW
3282
3283 /* Warn about @ where they meant $. */
599cee73 3284 if (ckWARN(WARN_SYNTAX)) {
a0d0e21e
LW
3285 if (*s == '[' || *s == '{') {
3286 char *t = s + 1;
834a4ddd 3287 while (*t && (isALNUM_lazy(t) || strchr(" \t$#+-'\"", *t)))
a0d0e21e
LW
3288 t++;
3289 if (*t == '}' || *t == ']') {
3290 t++;
3280af22 3291 PL_bufptr = skipspace(PL_bufptr);
cea2e8a9 3292 Perl_warner(aTHX_ WARN_SYNTAX,
599cee73 3293 "Scalar value %.*s better written as $%.*s",
3280af22 3294 t-PL_bufptr, PL_bufptr, t-PL_bufptr-1, PL_bufptr+1);
a0d0e21e 3295 }
93a17b20
LW
3296 }
3297 }
463ee0b2 3298 }
3280af22 3299 PL_pending_ident = '@';
79072805 3300 TERM('@');
378cc40b
LW
3301
3302 case '/': /* may either be division or pattern */
3303 case '?': /* may either be conditional or pattern */
3280af22 3304 if (PL_expect != XOPERATOR) {
c277df42 3305 /* Disable warning on "study /blah/" */
3280af22
NIS
3306 if (PL_oldoldbufptr == PL_last_uni
3307 && (*PL_last_uni != 's' || s - PL_last_uni < 5
834a4ddd 3308 || memNE(PL_last_uni, "study", 5) || isALNUM_lazy(PL_last_uni+5)))
c277df42 3309 check_uni();
8782bef2 3310 s = scan_pat(s,OP_MATCH);
79072805 3311 TERM(sublex_start());
378cc40b
LW
3312 }
3313 tmp = *s++;
a687059c 3314 if (tmp == '/')
79072805 3315 Mop(OP_DIVIDE);
378cc40b
LW
3316 OPERATOR(tmp);
3317
3318 case '.':
51882d45
GS
3319 if (PL_lex_formbrack && PL_lex_brackets == PL_lex_formbrack
3320#ifdef PERL_STRICT_CR
3321 && s[1] == '\n'
3322#else
3323 && (s[1] == '\n' || (s[1] == '\r' && s[2] == '\n'))
3324#endif
3325 && (s == PL_linestart || s[-1] == '\n') )
3326 {
3280af22
NIS
3327 PL_lex_formbrack = 0;
3328 PL_expect = XSTATE;
79072805
LW
3329 goto rightbracket;
3330 }
3280af22 3331 if (PL_expect == XOPERATOR || !isDIGIT(s[1])) {
378cc40b 3332 tmp = *s++;
a687059c
LW
3333 if (*s == tmp) {
3334 s++;
2f3197b3
LW
3335 if (*s == tmp) {
3336 s++;
79072805 3337 yylval.ival = OPf_SPECIAL;
2f3197b3
LW
3338 }
3339 else
79072805 3340 yylval.ival = 0;
378cc40b 3341 OPERATOR(DOTDOT);
a687059c 3342 }
3280af22 3343 if (PL_expect != XOPERATOR)
2f3197b3 3344 check_uni();
79072805 3345 Aop(OP_CONCAT);
378cc40b
LW
3346 }
3347 /* FALL THROUGH */
3348 case '0': case '1': case '2': case '3': case '4':
3349 case '5': case '6': case '7': case '8': case '9':
79072805 3350 s = scan_num(s);
3280af22 3351 if (PL_expect == XOPERATOR)
8990e307 3352 no_op("Number",s);
79072805
LW
3353 TERM(THING);
3354
3355 case '\'':
09bef843 3356 s = scan_str(s,FALSE,FALSE);
3280af22
NIS
3357 if (PL_expect == XOPERATOR) {
3358 if (PL_lex_formbrack && PL_lex_brackets == PL_lex_formbrack) {
3359 PL_expect = XTERM;
a0d0e21e
LW
3360 depcom();
3361 return ','; /* grandfather non-comma-format format */
3362 }
463ee0b2 3363 else
8990e307 3364 no_op("String",s);
463ee0b2 3365 }
79072805 3366 if (!s)
85e6fe83 3367 missingterm((char*)0);
79072805
LW
3368 yylval.ival = OP_CONST;
3369 TERM(sublex_start());
3370
3371 case '"':
09bef843 3372 s = scan_str(s,FALSE,FALSE);
3280af22
NIS
3373 if (PL_expect == XOPERATOR) {
3374 if (PL_lex_formbrack && PL_lex_brackets == PL_lex_formbrack) {
3375 PL_expect = XTERM;
a0d0e21e
LW
3376 depcom();
3377 return ','; /* grandfather non-comma-format format */
3378 }
463ee0b2 3379 else
8990e307 3380 no_op("String",s);
463ee0b2 3381 }
79072805 3382 if (!s)
85e6fe83 3383 missingterm((char*)0);
4633a7c4 3384 yylval.ival = OP_CONST;
3280af22 3385 for (d = SvPV(PL_lex_stuff, len); len; len--, d++) {
a0ed51b3 3386 if (*d == '$' || *d == '@' || *d == '\\' || *d & 0x80) {
4633a7c4
LW
3387 yylval.ival = OP_STRINGIFY;
3388 break;
3389 }
3390 }
79072805
LW
3391 TERM(sublex_start());
3392
3393 case '`':
09bef843 3394 s = scan_str(s,FALSE,FALSE);
3280af22 3395 if (PL_expect == XOPERATOR)
8990e307 3396 no_op("Backticks",s);
79072805 3397 if (!s)
85e6fe83 3398 missingterm((char*)0);
79072805
LW
3399 yylval.ival = OP_BACKTICK;
3400 set_csh();
3401 TERM(sublex_start());
3402
3403 case '\\':
3404 s++;
599cee73 3405 if (ckWARN(WARN_SYNTAX) && PL_lex_inwhat && isDIGIT(*s))
cea2e8a9 3406 Perl_warner(aTHX_ WARN_SYNTAX,"Can't use \\%c to mean $%c in expression",
599cee73 3407 *s, *s);
3280af22 3408 if (PL_expect == XOPERATOR)
8990e307 3409 no_op("Backslash",s);
79072805
LW
3410 OPERATOR(REFGEN);
3411
3412 case 'x':
3280af22 3413 if (isDIGIT(s[1]) && PL_expect == XOPERATOR) {
79072805
LW
3414 s++;
3415 Mop(OP_REPEAT);
2f3197b3 3416 }
79072805
LW
3417 goto keylookup;
3418
378cc40b 3419 case '_':
79072805
LW
3420 case 'a': case 'A':
3421 case 'b': case 'B':
3422 case 'c': case 'C':
3423 case 'd': case 'D':
3424 case 'e': case 'E':
3425 case 'f': case 'F':
3426 case 'g': case 'G':
3427 case 'h': case 'H':
3428 case 'i': case 'I':
3429 case 'j': case 'J':
3430 case 'k': case 'K':
3431 case 'l': case 'L':
3432 case 'm': case 'M':
3433 case 'n': case 'N':
3434 case 'o': case 'O':
3435 case 'p': case 'P':
3436 case 'q': case 'Q':
3437 case 'r': case 'R':
3438 case 's': case 'S':
3439 case 't': case 'T':
3440 case 'u': case 'U':
3441 case 'v': case 'V':
3442 case 'w': case 'W':
3443 case 'X':
3444 case 'y': case 'Y':
3445 case 'z': case 'Z':
3446
49dc05e3 3447 keylookup: {
2d8e6c8d 3448 STRLEN n_a;
161b471a
NIS
3449 gv = Nullgv;
3450 gvp = 0;
49dc05e3 3451
3280af22
NIS
3452 PL_bufptr = s;
3453 s = scan_word(s, PL_tokenbuf, sizeof PL_tokenbuf, FALSE, &len);
8ebc5c01 3454
3455 /* Some keywords can be followed by any delimiter, including ':' */
3280af22
NIS
3456 tmp = (len == 1 && strchr("msyq", PL_tokenbuf[0]) ||
3457 len == 2 && ((PL_tokenbuf[0] == 't' && PL_tokenbuf[1] == 'r') ||
3458 (PL_tokenbuf[0] == 'q' &&
3459 strchr("qwxr", PL_tokenbuf[1]))));
8ebc5c01 3460
3461 /* x::* is just a word, unless x is "CORE" */
3280af22 3462 if (!tmp && *s == ':' && s[1] == ':' && strNE(PL_tokenbuf, "CORE"))
4633a7c4
LW
3463 goto just_a_word;
3464
3643fb5f 3465 d = s;
3280af22 3466 while (d < PL_bufend && isSPACE(*d))
3643fb5f
CS
3467 d++; /* no comments skipped here, or s### is misparsed */
3468
3469 /* Is this a label? */
3280af22
NIS
3470 if (!tmp && PL_expect == XSTATE
3471 && d < PL_bufend && *d == ':' && *(d + 1) != ':') {
8ebc5c01 3472 s = d + 1;
3280af22 3473 yylval.pval = savepv(PL_tokenbuf);
8ebc5c01 3474 CLINE;
3475 TOKEN(LABEL);
3643fb5f
CS
3476 }
3477
3478 /* Check for keywords */
3280af22 3479 tmp = keyword(PL_tokenbuf, len);
748a9306
LW
3480
3481 /* Is this a word before a => operator? */
748a9306
LW
3482 if (strnEQ(d,"=>",2)) {
3483 CLINE;
3280af22 3484 yylval.opval = (OP*)newSVOP(OP_CONST, 0, newSVpv(PL_tokenbuf,0));
748a9306
LW
3485 yylval.opval->op_private = OPpCONST_BARE;
3486 TERM(WORD);
3487 }
3488
a0d0e21e 3489 if (tmp < 0) { /* second-class keyword? */
56f7f34b
CS
3490 GV *ogv = Nullgv; /* override (winner) */
3491 GV *hgv = Nullgv; /* hidden (loser) */
3280af22 3492 if (PL_expect != XOPERATOR && (*s != ':' || s[1] != ':')) {
56f7f34b 3493 CV *cv;
3280af22 3494 if ((gv = gv_fetchpv(PL_tokenbuf, FALSE, SVt_PVCV)) &&
56f7f34b
CS
3495 (cv = GvCVu(gv)))
3496 {
3497 if (GvIMPORTED_CV(gv))
3498 ogv = gv;
3499 else if (! CvMETHOD(cv))
3500 hgv = gv;
3501 }
3502 if (!ogv &&
3280af22
NIS
3503 (gvp = (GV**)hv_fetch(PL_globalstash,PL_tokenbuf,len,FALSE)) &&
3504 (gv = *gvp) != (GV*)&PL_sv_undef &&
56f7f34b
CS
3505 GvCVu(gv) && GvIMPORTED_CV(gv))
3506 {
3507 ogv = gv;
3508 }
3509 }
3510 if (ogv) {
3511 tmp = 0; /* overridden by import or by GLOBAL */
6e7b2336
GS
3512 }
3513 else if (gv && !gvp
3514 && -tmp==KEY_lock /* XXX generalizable kludge */
3280af22 3515 && !hv_fetch(GvHVn(PL_incgv), "Thread.pm", 9, FALSE))
6e7b2336
GS
3516 {
3517 tmp = 0; /* any sub overrides "weak" keyword */
a0d0e21e 3518 }
56f7f34b
CS
3519 else { /* no override */
3520 tmp = -tmp;
3521 gv = Nullgv;
3522 gvp = 0;
4944e2f7
GS
3523 if (ckWARN(WARN_AMBIGUOUS) && hgv
3524 && tmp != KEY_x && tmp != KEY_CORE) /* never ambiguous */
cea2e8a9 3525 Perl_warner(aTHX_ WARN_AMBIGUOUS,
599cee73 3526 "Ambiguous call resolved as CORE::%s(), %s",
2f3ca594 3527 GvENAME(hgv), "qualify as such or use &");
49dc05e3 3528 }
a0d0e21e
LW
3529 }
3530
3531 reserved_word:
3532 switch (tmp) {
79072805
LW
3533
3534 default: /* not a keyword */
93a17b20 3535 just_a_word: {
96e4d5b1 3536 SV *sv;
3280af22 3537 char lastchar = (PL_bufptr == PL_oldoldbufptr ? 0 : PL_bufptr[-1]);
8990e307
LW
3538
3539 /* Get the rest if it looks like a package qualifier */
3540
a0d0e21e 3541 if (*s == '\'' || *s == ':' && s[1] == ':') {
c3e0f903 3542 STRLEN morelen;
3280af22 3543 s = scan_word(s, PL_tokenbuf + len, sizeof PL_tokenbuf - len,
c3e0f903
GS
3544 TRUE, &morelen);
3545 if (!morelen)
cea2e8a9 3546 Perl_croak(aTHX_ "Bad name after %s%s", PL_tokenbuf,
ec2ab091 3547 *s == '\'' ? "'" : "::");
c3e0f903 3548 len += morelen;
a0d0e21e 3549 }
8990e307 3550
3280af22
NIS
3551 if (PL_expect == XOPERATOR) {
3552 if (PL_bufptr == PL_linestart) {
3553 PL_curcop->cop_line--;
cea2e8a9 3554 Perl_warner(aTHX_ WARN_SEMICOLON, PL_warn_nosemi);
3280af22 3555 PL_curcop->cop_line++;
463ee0b2
LW
3556 }
3557 else
54310121 3558 no_op("Bareword",s);
463ee0b2 3559 }
8990e307 3560
c3e0f903
GS
3561 /* Look for a subroutine with this name in current package,
3562 unless name is "Foo::", in which case Foo is a bareword
3563 (and a package name). */
3564
3565 if (len > 2 &&
3280af22 3566 PL_tokenbuf[len - 2] == ':' && PL_tokenbuf[len - 1] == ':')
c3e0f903 3567 {
599cee73 3568 if (ckWARN(WARN_UNSAFE) && ! gv_fetchpv(PL_tokenbuf, FALSE, SVt_PVHV))
cea2e8a9 3569 Perl_warner(aTHX_ WARN_UNSAFE,
599cee73 3570 "Bareword \"%s\" refers to nonexistent package",
3280af22 3571 PL_tokenbuf);
c3e0f903 3572 len -= 2;
3280af22 3573 PL_tokenbuf[len] = '\0';
c3e0f903
GS
3574 gv = Nullgv;
3575 gvp = 0;
3576 }
3577 else {
3578 len = 0;
3579 if (!gv)
3280af22 3580 gv = gv_fetchpv(PL_tokenbuf, FALSE, SVt_PVCV);
c3e0f903
GS
3581 }
3582
3583 /* if we saw a global override before, get the right name */
8990e307 3584
49dc05e3 3585 if (gvp) {
79cb57f6 3586 sv = newSVpvn("CORE::GLOBAL::",14);
3280af22 3587 sv_catpv(sv,PL_tokenbuf);
49dc05e3
GS
3588 }
3589 else
3280af22 3590 sv = newSVpv(PL_tokenbuf,0);
8990e307 3591
a0d0e21e
LW
3592 /* Presume this is going to be a bareword of some sort. */
3593
3594 CLINE;
49dc05e3 3595 yylval.opval = (OP*)newSVOP(OP_CONST, 0, sv);
a0d0e21e
LW
3596 yylval.opval->op_private = OPpCONST_BARE;
3597
c3e0f903
GS
3598 /* And if "Foo::", then that's what it certainly is. */
3599
3600 if (len)
3601 goto safe_bareword;
3602
8990e307
LW
3603 /* See if it's the indirect object for a list operator. */
3604
3280af22
NIS
3605 if (PL_oldoldbufptr &&
3606 PL_oldoldbufptr < PL_bufptr &&
65cec589
GS
3607 (PL_oldoldbufptr == PL_last_lop
3608 || PL_oldoldbufptr == PL_last_uni) &&
a0d0e21e 3609 /* NO SKIPSPACE BEFORE HERE! */
a9ef352a
GS
3610 (PL_expect == XREF ||
3611 ((PL_opargs[PL_last_lop_op] >> OASHIFT)& 7) == OA_FILEREF))
a0d0e21e 3612 {
748a9306
LW
3613 bool immediate_paren = *s == '(';
3614
a0d0e21e
LW
3615 /* (Now we can afford to cross potential line boundary.) */
3616 s = skipspace(s);
3617
3618 /* Two barewords in a row may indicate method call. */
3619
834a4ddd 3620 if ((isIDFIRST_lazy(s) || *s == '$') && (tmp=intuit_method(s,gv)))
a0d0e21e
LW
3621 return tmp;
3622
3623 /* If not a declared subroutine, it's an indirect object. */
3624 /* (But it's an indir obj regardless for sort.) */
3625
3280af22 3626 if ((PL_last_lop_op == OP_SORT ||
a9ef352a
GS
3627 (!immediate_paren && (!gv || !GvCVu(gv)))) &&
3628 (PL_last_lop_op != OP_MAPSTART &&
3629 PL_last_lop_op != OP_GREPSTART))
3630 {
3280af22 3631 PL_expect = (PL_last_lop == PL_oldoldbufptr) ? XTERM : XOPERATOR;
748a9306 3632 goto bareword;
93a17b20
LW
3633 }
3634 }
8990e307
LW
3635
3636 /* If followed by a paren, it's certainly a subroutine. */
3637
3280af22 3638 PL_expect = XOPERATOR;
8990e307 3639 s = skipspace(s);
93a17b20 3640 if (*s == '(') {
79072805 3641 CLINE;
96e4d5b1 3642 if (gv && GvCVu(gv)) {
3643 for (d = s + 1; *d == ' ' || *d == '\t'; d++) ;
7a52d87a 3644 if (*d == ')' && (sv = cv_const_sv(GvCV(gv)))) {
96e4d5b1 3645 s = d + 1;
3646 goto its_constant;
3647 }
3648 }
3280af22
NIS
3649 PL_nextval[PL_nexttoke].opval = yylval.opval;
3650 PL_expect = XOPERATOR;
93a17b20 3651 force_next(WORD);
c07a80fd 3652 yylval.ival = 0;
463ee0b2 3653 TOKEN('&');
79072805 3654 }
93a17b20 3655
a0d0e21e 3656 /* If followed by var or block, call it a method (unless sub) */
8990e307 3657
8ebc5c01 3658 if ((*s == '$' || *s == '{') && (!gv || !GvCVu(gv))) {
3280af22
NIS
3659 PL_last_lop = PL_oldbufptr;
3660 PL_last_lop_op = OP_METHOD;
93a17b20 3661 PREBLOCK(METHOD);
463ee0b2
LW
3662 }
3663
8990e307
LW
3664 /* If followed by a bareword, see if it looks like indir obj. */
3665
834a4ddd 3666 if ((isIDFIRST_lazy(s) || *s == '$') && (tmp = intuit_method(s,gv)))
a0d0e21e 3667 return tmp;
93a17b20 3668
8990e307
LW
3669 /* Not a method, so call it a subroutine (if defined) */
3670
8ebc5c01 3671 if (gv && GvCVu(gv)) {
46fc3d4c 3672 CV* cv;
0453d815
PM
3673 if (lastchar == '-' && ckWARN_d(WARN_AMBIGUOUS))
3674 Perl_warner(aTHX_ WARN_AMBIGUOUS,
3675 "Ambiguous use of -%s resolved as -&%s()",
3280af22 3676 PL_tokenbuf, PL_tokenbuf);
89bfa8cd 3677 /* Check for a constant sub */
46fc3d4c 3678 cv = GvCV(gv);
96e4d5b1 3679 if ((sv = cv_const_sv(cv))) {
3680 its_constant:
3681 SvREFCNT_dec(((SVOP*)yylval.opval)->op_sv);
3682 ((SVOP*)yylval.opval)->op_sv = SvREFCNT_inc(sv);
3683 yylval.opval->op_private = 0;
3684 TOKEN(WORD);
89bfa8cd 3685 }
3686
a5f75d66
AD
3687 /* Resolve to GV now. */
3688 op_free(yylval.opval);
3689 yylval.opval = newCVREF(0, newGVOP(OP_GV, 0, gv));
9675f7ac 3690 yylval.opval->op_private |= OPpENTERSUB_NOPAREN;
7a52d87a 3691 PL_last_lop = PL_oldbufptr;
bf848113 3692 PL_last_lop_op = OP_ENTERSUB;
4633a7c4
LW
3693 /* Is there a prototype? */
3694 if (SvPOK(cv)) {
3695 STRLEN len;
7a52d87a 3696 char *proto = SvPV((SV*)cv, len);
4633a7c4
LW
3697 if (!len)
3698 TERM(FUNC0SUB);
7a52d87a 3699 if (strEQ(proto, "$"))
4633a7c4 3700 OPERATOR(UNIOPSUB);
7a52d87a 3701 if (*proto == '&' && *s == '{') {
3280af22 3702 sv_setpv(PL_subname,"__ANON__");
4633a7c4
LW
3703 PREBLOCK(LSTOPSUB);
3704 }
a9ef352a 3705 }
3280af22
NIS
3706 PL_nextval[PL_nexttoke].opval = yylval.opval;
3707 PL_expect = XTERM;
8990e307
LW
3708 force_next(WORD);
3709 TOKEN(NOAMP);
3710 }
748a9306 3711
8990e307
LW
3712 /* Call it a bare word */
3713
5603f27d
GS
3714 if (PL_hints & HINT_STRICT_SUBS)
3715 yylval.opval->op_private |= OPpCONST_STRICT;
3716 else {
3717 bareword:
3718 if (ckWARN(WARN_RESERVED)) {
3719 if (lastchar != '-') {
3720 for (d = PL_tokenbuf; *d && isLOWER(*d); d++) ;
3721 if (!*d)
cea2e8a9 3722 Perl_warner(aTHX_ WARN_RESERVED, PL_warn_reserved,
5603f27d
GS
3723 PL_tokenbuf);
3724 }
748a9306
LW
3725 }
3726 }
c3e0f903
GS
3727
3728 safe_bareword:
f248d071 3729 if (lastchar && strchr("*%&", lastchar) && ckWARN_d(WARN_AMBIGUOUS)) {
0453d815
PM
3730 Perl_warner(aTHX_ WARN_AMBIGUOUS,
3731 "Operator or semicolon missing before %c%s",
3280af22 3732 lastchar, PL_tokenbuf);
0453d815
PM
3733 Perl_warner(aTHX_ WARN_AMBIGUOUS,
3734 "Ambiguous use of %c resolved as operator %c",
748a9306
LW
3735 lastchar, lastchar);
3736 }
93a17b20 3737 TOKEN(WORD);
79072805 3738 }
79072805 3739
68dc0745 3740 case KEY___FILE__:
46fc3d4c 3741 yylval.opval = (OP*)newSVOP(OP_CONST, 0,
3280af22 3742 newSVsv(GvSV(PL_curcop->cop_filegv)));
46fc3d4c 3743 TERM(THING);
3744
79072805 3745 case KEY___LINE__:
cf2093f6 3746 yylval.opval = (OP*)newSVOP(OP_CONST, 0,
57def98f 3747 Perl_newSVpvf(aTHX_ "%"IVdf, (IV)PL_curcop->cop_line));
79072805 3748 TERM(THING);
68dc0745 3749
3750 case KEY___PACKAGE__:
3751 yylval.opval = (OP*)newSVOP(OP_CONST, 0,
3280af22
NIS
3752 (PL_curstash
3753 ? newSVsv(PL_curstname)
3754 : &PL_sv_undef));
79072805 3755 TERM(THING);
79072805 3756
e50aee73 3757 case KEY___DATA__:
79072805
LW
3758 case KEY___END__: {
3759 GV *gv;
79072805
LW
3760
3761 /*SUPPRESS 560*/
3280af22 3762 if (PL_rsfp && (!PL_in_eval || PL_tokenbuf[2] == 'D')) {
e50aee73 3763 char *pname = "main";
3280af22
NIS
3764 if (PL_tokenbuf[2] == 'D')
3765 pname = HvNAME(PL_curstash ? PL_curstash : PL_defstash);
cea2e8a9 3766 gv = gv_fetchpv(Perl_form(aTHX_ "%s::DATA", pname), TRUE, SVt_PVIO);
a5f75d66 3767 GvMULTI_on(gv);
79072805 3768 if (!GvIO(gv))
a0d0e21e 3769 GvIOp(gv) = newIO();
3280af22 3770 IoIFP(GvIOp(gv)) = PL_rsfp;
a0d0e21e
LW
3771#if defined(HAS_FCNTL) && defined(F_SETFD)
3772 {
3280af22 3773 int fd = PerlIO_fileno(PL_rsfp);
a0d0e21e
LW
3774 fcntl(fd,F_SETFD,fd >= 3);
3775 }
79072805 3776#endif
fd049845 3777 /* Mark this internal pseudo-handle as clean */
3778 IoFLAGS(GvIOp(gv)) |= IOf_UNTAINT;
3280af22 3779 if (PL_preprocess)
a0d0e21e 3780 IoTYPE(GvIOp(gv)) = '|';
3280af22 3781 else if ((PerlIO*)PL_rsfp == PerlIO_stdin())
a0d0e21e 3782 IoTYPE(GvIOp(gv)) = '-';
79072805 3783 else
a0d0e21e 3784 IoTYPE(GvIOp(gv)) = '<';
3280af22 3785 PL_rsfp = Nullfp;
79072805
LW
3786 }
3787 goto fake_eof;
e929a76b 3788 }
de3bb511 3789
8990e307 3790 case KEY_AUTOLOAD:
ed6116ce 3791 case KEY_DESTROY:
79072805
LW
3792 case KEY_BEGIN:
3793 case KEY_END:
7d07dbc2 3794 case KEY_INIT:
3280af22
NIS
3795 if (PL_expect == XSTATE) {
3796 s = PL_bufptr;
93a17b20 3797 goto really_sub;
79072805
LW
3798 }
3799 goto just_a_word;
3800
a0d0e21e
LW
3801 case KEY_CORE:
3802 if (*s == ':' && s[1] == ':') {
3803 s += 2;
748a9306 3804 d = s;
3280af22
NIS
3805 s = scan_word(s, PL_tokenbuf, sizeof PL_tokenbuf, FALSE, &len);
3806 tmp = keyword(PL_tokenbuf, len);
a0d0e21e
LW
3807 if (tmp < 0)
3808 tmp = -tmp;
3809 goto reserved_word;
3810 }
3811 goto just_a_word;
3812
463ee0b2
LW
3813 case KEY_abs:
3814 UNI(OP_ABS);
3815
79072805
LW
3816 case KEY_alarm:
3817 UNI(OP_ALARM);
3818
3819 case KEY_accept:
a0d0e21e 3820 LOP(OP_ACCEPT,XTERM);
79072805 3821
463ee0b2
LW
3822 case KEY_and:
3823 OPERATOR(ANDOP);
3824
79072805 3825 case KEY_atan2:
a0d0e21e 3826 LOP(OP_ATAN2,XTERM);
85e6fe83 3827
79072805 3828 case KEY_bind:
a0d0e21e 3829 LOP(OP_BIND,XTERM);
79072805
LW
3830
3831 case KEY_binmode:
3832 UNI(OP_BINMODE);
3833
3834 case KEY_bless:
a0d0e21e 3835 LOP(OP_BLESS,XTERM);
79072805
LW
3836
3837 case KEY_chop:
3838 UNI(OP_CHOP);
3839
3840 case KEY_continue:
3841 PREBLOCK(CONTINUE);
3842
3843 case KEY_chdir:
85e6fe83 3844 (void)gv_fetchpv("ENV",TRUE, SVt_PVHV); /* may use HOME */
79072805
LW
3845 UNI(OP_CHDIR);
3846
3847 case KEY_close:
3848 UNI(OP_CLOSE);
3849
3850 case KEY_closedir:
3851 UNI(OP_CLOSEDIR);
3852
3853 case KEY_cmp:
3854 Eop(OP_SCMP);
3855
3856 case KEY_caller:
3857 UNI(OP_CALLER);
3858
3859 case KEY_crypt:
3860#ifdef FCRYPT
6b88bc9c 3861 if (!PL_cryptseen++)
de3bb511 3862 init_des();
a687059c 3863#endif
a0d0e21e 3864 LOP(OP_CRYPT,XTERM);
79072805
LW
3865
3866 case KEY_chmod:
599cee73 3867 if (ckWARN(WARN_OCTAL)) {
3280af22 3868 for (d = s; d < PL_bufend && (isSPACE(*d) || *d == '('); d++) ;
748a9306 3869 if (*d != '0' && isDIGIT(*d))
4438c4b7
JH
3870 Perl_warner(aTHX_ WARN_OCTAL,
3871 "chmod: mode argument is missing initial 0");
748a9306 3872 }
a0d0e21e 3873 LOP(OP_CHMOD,XTERM);
79072805
LW
3874
3875 case KEY_chown:
a0d0e21e 3876 LOP(OP_CHOWN,XTERM);
79072805
LW
3877
3878 case KEY_connect:
a0d0e21e 3879 LOP(OP_CONNECT,XTERM);
79072805 3880
463ee0b2
LW
3881 case KEY_chr:
3882 UNI(OP_CHR);
3883
79072805
LW
3884 case KEY_cos:
3885 UNI(OP_COS);
3886
3887 case KEY_chroot:
3888 UNI(OP_CHROOT);
3889
3890 case KEY_do:
3891 s = skipspace(s);
3892 if (*s == '{')
a0d0e21e 3893 PRETERMBLOCK(DO);
79072805 3894 if (*s != '\'')
a0d0e21e 3895 s = force_word(s,WORD,FALSE,TRUE,FALSE);
378cc40b 3896 OPERATOR(DO);
79072805
LW
3897
3898 case KEY_die:
3280af22 3899 PL_hints |= HINT_BLOCK_SCOPE;
a0d0e21e 3900 LOP(OP_DIE,XTERM);
79072805
LW
3901
3902 case KEY_defined:
3903 UNI(OP_DEFINED);
3904
3905 case KEY_delete:
a0d0e21e 3906 UNI(OP_DELETE);
79072805
LW
3907
3908 case KEY_dbmopen:
a0d0e21e
LW
3909 gv_fetchpv("AnyDBM_File::ISA", GV_ADDMULTI, SVt_PVAV);
3910 LOP(OP_DBMOPEN,XTERM);
79072805
LW
3911
3912 case KEY_dbmclose:
3913 UNI(OP_DBMCLOSE);
3914
3915 case KEY_dump:
a0d0e21e 3916 s = force_word(s,WORD,TRUE,FALSE,FALSE);
79072805
LW
3917 LOOPX(OP_DUMP);
3918
3919 case KEY_else:
3920 PREBLOCK(ELSE);
3921
3922 case KEY_elsif:
3280af22 3923 yylval.ival = PL_curcop->cop_line;
79072805
LW
3924 OPERATOR(ELSIF);
3925
3926 case KEY_eq:
3927 Eop(OP_SEQ);
3928
a0d0e21e
LW
3929 case KEY_exists:
3930 UNI(OP_EXISTS);
3931
79072805
LW
3932 case KEY_exit:
3933 UNI(OP_EXIT);
3934
3935 case KEY_eval:
79072805 3936 s = skipspace(s);
3280af22 3937 PL_expect = (*s == '{') ? XTERMBLOCK : XTERM;
463ee0b2 3938 UNIBRACK(OP_ENTEREVAL);
79072805
LW
3939
3940 case KEY_eof:
3941 UNI(OP_EOF);
3942
3943 case KEY_exp:
3944 UNI(OP_EXP);
3945
3946 case KEY_each:
3947 UNI(OP_EACH);
3948
3949 case KEY_exec:
3950 set_csh();
a0d0e21e 3951 LOP(OP_EXEC,XREF);
79072805
LW
3952
3953 case KEY_endhostent:
3954 FUN0(OP_EHOSTENT);
3955
3956 case KEY_endnetent:
3957 FUN0(OP_ENETENT);
3958
3959 case KEY_endservent:
3960 FUN0(OP_ESERVENT);
3961
3962 case KEY_endprotoent:
3963 FUN0(OP_EPROTOENT);
3964
3965 case KEY_endpwent:
3966 FUN0(OP_EPWENT);
3967
3968 case KEY_endgrent:
3969 FUN0(OP_EGRENT);
3970
3971 case KEY_for:
3972 case KEY_foreach:
3280af22 3973 yylval.ival = PL_curcop->cop_line;
55497cff 3974 s = skipspace(s);
834a4ddd 3975 if (PL_expect == XSTATE && isIDFIRST_lazy(s)) {
55497cff 3976 char *p = s;
3280af22 3977 if ((PL_bufend - p) >= 3 &&
55497cff 3978 strnEQ(p, "my", 2) && isSPACE(*(p + 2)))
3979 p += 2;
77ca0c92
LW
3980 else if ((PL_bufend - p) >= 4 &&
3981 strnEQ(p, "our", 3) && isSPACE(*(p + 3)))
3982 p += 3;
55497cff 3983 p = skipspace(p);
77ca0c92
LW
3984 if (isIDFIRST_lazy(p)) {
3985 p = scan_ident(p, PL_bufend,
3986 PL_tokenbuf, sizeof PL_tokenbuf, TRUE);
3987 p = skipspace(p);
3988 }
3989 if (*p != '$')
cea2e8a9 3990 Perl_croak(aTHX_ "Missing $ on loop variable");
55497cff 3991 }
79072805
LW
3992 OPERATOR(FOR);
3993
3994 case KEY_formline:
a0d0e21e 3995 LOP(OP_FORMLINE,XTERM);
79072805
LW
3996
3997 case KEY_fork:
3998 FUN0(OP_FORK);
3999
4000 case KEY_fcntl:
a0d0e21e 4001 LOP(OP_FCNTL,XTERM);
79072805
LW
4002
4003 case KEY_fileno:
4004 UNI(OP_FILENO);
4005
4006 case KEY_flock:
a0d0e21e 4007 LOP(OP_FLOCK,XTERM);
79072805
LW
4008
4009 case KEY_gt:
4010 Rop(OP_SGT);
4011
4012 case KEY_ge:
4013 Rop(OP_SGE);
4014
4015 case KEY_grep:
a0d0e21e 4016 LOP(OP_GREPSTART, *s == '(' ? XTERM : XREF);
79072805
LW
4017
4018 case KEY_goto:
a0d0e21e 4019 s = force_word(s,WORD,TRUE,FALSE,FALSE);
79072805
LW
4020 LOOPX(OP_GOTO);
4021
4022 case KEY_gmtime:
4023 UNI(OP_GMTIME);
4024
4025 case KEY_getc:
4026 UNI(OP_GETC);
4027
4028 case KEY_getppid:
4029 FUN0(OP_GETPPID);
4030
4031 case KEY_getpgrp:
4032 UNI(OP_GETPGRP);
4033
4034 case KEY_getpriority:
a0d0e21e 4035 LOP(OP_GETPRIORITY,XTERM);
79072805
LW
4036
4037 case KEY_getprotobyname:
4038 UNI(OP_GPBYNAME);
4039
4040 case KEY_getprotobynumber:
a0d0e21e 4041 LOP(OP_GPBYNUMBER,XTERM);
79072805
LW
4042
4043 case KEY_getprotoent:
4044 FUN0(OP_GPROTOENT);
4045
4046 case KEY_getpwent:
4047 FUN0(OP_GPWENT);
4048
4049 case KEY_getpwnam:
ff68c719 4050 UNI(OP_GPWNAM);
79072805
LW
4051
4052 case KEY_getpwuid:
ff68c719 4053 UNI(OP_GPWUID);
79072805
LW
4054
4055 case KEY_getpeername:
4056 UNI(OP_GETPEERNAME);
4057
4058 case KEY_gethostbyname:
4059 UNI(OP_GHBYNAME);
4060
4061 case KEY_gethostbyaddr:
a0d0e21e 4062 LOP(OP_GHBYADDR,XTERM);
79072805
LW
4063
4064 case KEY_gethostent:
4065 FUN0(OP_GHOSTENT);
4066
4067 case KEY_getnetbyname:
4068 UNI(OP_GNBYNAME);
4069
4070 case KEY_getnetbyaddr:
a0d0e21e 4071 LOP(OP_GNBYADDR,XTERM);
79072805
LW
4072
4073 case KEY_getnetent:
4074 FUN0(OP_GNETENT);
4075
4076 case KEY_getservbyname:
a0d0e21e 4077 LOP(OP_GSBYNAME,XTERM);
79072805
LW
4078
4079 case KEY_getservbyport:
a0d0e21e 4080 LOP(OP_GSBYPORT,XTERM);
79072805
LW
4081
4082 case KEY_getservent:
4083 FUN0(OP_GSERVENT);
4084
4085 case KEY_getsockname:
4086 UNI(OP_GETSOCKNAME);
4087
4088 case KEY_getsockopt:
a0d0e21e 4089 LOP(OP_GSOCKOPT,XTERM);
79072805
LW
4090
4091 case KEY_getgrent:
4092 FUN0(OP_GGRENT);
4093
4094 case KEY_getgrnam:
ff68c719 4095 UNI(OP_GGRNAM);
79072805
LW
4096
4097 case KEY_getgrgid:
ff68c719 4098 UNI(OP_GGRGID);
79072805
LW
4099
4100 case KEY_getlogin:
4101 FUN0(OP_GETLOGIN);
4102
93a17b20 4103 case KEY_glob:
a0d0e21e
LW
4104 set_csh();
4105 LOP(OP_GLOB,XTERM);
93a17b20 4106
79072805
LW
4107 case KEY_hex:
4108 UNI(OP_HEX);
4109
4110 case KEY_if:
3280af22 4111 yylval.ival = PL_curcop->cop_line;
79072805
LW
4112 OPERATOR(IF);
4113
4114 case KEY_index:
a0d0e21e 4115 LOP(OP_INDEX,XTERM);
79072805
LW
4116
4117 case KEY_int:
4118 UNI(OP_INT);
4119
4120 case KEY_ioctl:
a0d0e21e 4121 LOP(OP_IOCTL,XTERM);
79072805
LW
4122
4123 case KEY_join:
a0d0e21e 4124 LOP(OP_JOIN,XTERM);
79072805
LW
4125
4126 case KEY_keys:
4127 UNI(OP_KEYS);
4128
4129 case KEY_kill:
a0d0e21e 4130 LOP(OP_KILL,XTERM);
79072805
LW
4131
4132 case KEY_last:
a0d0e21e 4133 s = force_word(s,WORD,TRUE,FALSE,FALSE);
79072805 4134 LOOPX(OP_LAST);
a0d0e21e 4135
79072805
LW
4136 case KEY_lc:
4137 UNI(OP_LC);
4138
4139 case KEY_lcfirst:
4140 UNI(OP_LCFIRST);
4141
4142 case KEY_local:
09bef843 4143 yylval.ival = 0;
79072805
LW
4144 OPERATOR(LOCAL);
4145
4146 case KEY_length:
4147 UNI(OP_LENGTH);
4148
4149 case KEY_lt:
4150 Rop(OP_SLT);
4151
4152 case KEY_le:
4153 Rop(OP_SLE);
4154
4155 case KEY_localtime:
4156 UNI(OP_LOCALTIME);
4157
4158 case KEY_log:
4159 UNI(OP_LOG);
4160
4161 case KEY_link:
a0d0e21e 4162 LOP(OP_LINK,XTERM);
79072805
LW
4163
4164 case KEY_listen:
a0d0e21e 4165 LOP(OP_LISTEN,XTERM);
79072805 4166
c0329465
MB
4167 case KEY_lock:
4168 UNI(OP_LOCK);
4169
79072805
LW
4170 case KEY_lstat:
4171 UNI(OP_LSTAT);
4172
4173 case KEY_m:
8782bef2 4174 s = scan_pat(s,OP_MATCH);
79072805
LW
4175 TERM(sublex_start());
4176
a0d0e21e 4177 case KEY_map:
4e4e412b
GS
4178 LOP(OP_MAPSTART, *s == '(' ? XTERM : XREF);
4179
79072805 4180 case KEY_mkdir:
a0d0e21e 4181 LOP(OP_MKDIR,XTERM);
79072805
LW
4182
4183 case KEY_msgctl:
a0d0e21e 4184 LOP(OP_MSGCTL,XTERM);
79072805
LW
4185
4186 case KEY_msgget:
a0d0e21e 4187 LOP(OP_MSGGET,XTERM);
79072805
LW
4188
4189 case KEY_msgrcv:
a0d0e21e 4190 LOP(OP_MSGRCV,XTERM);
79072805
LW
4191
4192 case KEY_msgsnd:
a0d0e21e 4193 LOP(OP_MSGSND,XTERM);
79072805 4194
77ca0c92 4195 case KEY_our:
93a17b20 4196 case KEY_my:
77ca0c92 4197 PL_in_my = tmp;
c750a3ec 4198 s = skipspace(s);
834a4ddd 4199 if (isIDFIRST_lazy(s)) {
3280af22 4200 s = scan_word(s, PL_tokenbuf, sizeof PL_tokenbuf, TRUE, &len);
09bef843
SB
4201 if (len == 3 && strnEQ(PL_tokenbuf, "sub", 3))
4202 goto really_sub;
3280af22
NIS
4203 PL_in_my_stash = gv_stashpv(PL_tokenbuf, FALSE);
4204 if (!PL_in_my_stash) {
c750a3ec 4205 char tmpbuf[1024];
3280af22
NIS
4206 PL_bufptr = s;
4207 sprintf(tmpbuf, "No such class %.1000s", PL_tokenbuf);
c750a3ec
MB
4208 yyerror(tmpbuf);
4209 }
4210 }
09bef843 4211 yylval.ival = 1;
55497cff 4212 OPERATOR(MY);
93a17b20 4213
79072805 4214 case KEY_next:
a0d0e21e 4215 s = force_word(s,WORD,TRUE,FALSE,FALSE);
79072805
LW
4216 LOOPX(OP_NEXT);
4217
4218 case KEY_ne:
4219 Eop(OP_SNE);
4220
a0d0e21e 4221 case KEY_no:
3280af22 4222 if (PL_expect != XSTATE)
a0d0e21e
LW
4223 yyerror("\"no\" not allowed in expression");
4224 s = force_word(s,WORD,FALSE,TRUE,FALSE);
89bfa8cd 4225 s = force_version(s);
a0d0e21e
LW
4226 yylval.ival = 0;
4227 OPERATOR(USE);
4228
4229 case KEY_not:
2d2e263d
LW
4230 if (*s == '(' || (s = skipspace(s), *s == '('))
4231 FUN1(OP_NOT);
4232 else
4233 OPERATOR(NOTOP);
a0d0e21e 4234
79072805 4235 case KEY_open:
93a17b20 4236 s = skipspace(s);
834a4ddd 4237 if (isIDFIRST_lazy(s)) {
93a17b20 4238 char *t;
834a4ddd 4239 for (d = s; isALNUM_lazy(d); d++) ;
93a17b20 4240 t = skipspace(d);
0453d815
PM
4241 if (strchr("|&*+-=!?:.", *t) && ckWARN_d(WARN_AMBIGUOUS))
4242 Perl_warner(aTHX_ WARN_AMBIGUOUS,
4243 "Precedence problem: open %.*s should be open(%.*s)",
4244 d-s,s, d-s,s);
93a17b20 4245 }
a0d0e21e 4246 LOP(OP_OPEN,XTERM);
79072805 4247
463ee0b2 4248 case KEY_or:
a0d0e21e 4249 yylval.ival = OP_OR;
463ee0b2
LW
4250 OPERATOR(OROP);
4251
79072805
LW
4252 case KEY_ord:
4253 UNI(OP_ORD);
4254
4255 case KEY_oct:
4256 UNI(OP_OCT);
4257
4258 case KEY_opendir:
a0d0e21e 4259 LOP(OP_OPEN_DIR,XTERM);
79072805
LW
4260
4261 case KEY_print:
3280af22 4262 checkcomma(s,PL_tokenbuf,"filehandle");
a0d0e21e 4263 LOP(OP_PRINT,XREF);
79072805
LW
4264
4265 case KEY_printf:
3280af22 4266 checkcomma(s,PL_tokenbuf,"filehandle");
a0d0e21e 4267 LOP(OP_PRTF,XREF);
79072805 4268
c07a80fd 4269 case KEY_prototype:
4270 UNI(OP_PROTOTYPE);
4271
79072805 4272 case KEY_push:
a0d0e21e 4273 LOP(OP_PUSH,XTERM);
79072805
LW
4274
4275 case KEY_pop:
4276 UNI(OP_POP);
4277
a0d0e21e
LW
4278 case KEY_pos:
4279 UNI(OP_POS);
4280
79072805 4281 case KEY_pack:
a0d0e21e 4282 LOP(OP_PACK,XTERM);
79072805
LW
4283
4284 case KEY_package:
a0d0e21e 4285 s = force_word(s,WORD,FALSE,TRUE,FALSE);
79072805
LW
4286 OPERATOR(PACKAGE);
4287
4288 case KEY_pipe:
a0d0e21e 4289 LOP(OP_PIPE_OP,XTERM);
79072805
LW
4290
4291 case KEY_q:
09bef843 4292 s = scan_str(s,FALSE,FALSE);
79072805 4293 if (!s)
85e6fe83 4294 missingterm((char*)0);
79072805
LW
4295 yylval.ival = OP_CONST;
4296 TERM(sublex_start());
4297
a0d0e21e
LW
4298 case KEY_quotemeta:
4299 UNI(OP_QUOTEMETA);
4300
8990e307 4301 case KEY_qw:
09bef843 4302 s = scan_str(s,FALSE,FALSE);
8990e307 4303 if (!s)
85e6fe83 4304 missingterm((char*)0);
8127e0e3
GS
4305 force_next(')');
4306 if (SvCUR(PL_lex_stuff)) {
4307 OP *words = Nullop;
4308 int warned = 0;
3280af22 4309 d = SvPV_force(PL_lex_stuff, len);
8127e0e3
GS
4310 while (len) {
4311 for (; isSPACE(*d) && len; --len, ++d) ;
4312 if (len) {
4313 char *b = d;
4314 if (!warned && ckWARN(WARN_SYNTAX)) {
4315 for (; !isSPACE(*d) && len; --len, ++d) {
4316 if (*d == ',') {
cea2e8a9 4317 Perl_warner(aTHX_ WARN_SYNTAX,
8127e0e3
GS
4318 "Possible attempt to separate words with commas");
4319 ++warned;
4320 }
4321 else if (*d == '#') {
cea2e8a9 4322 Perl_warner(aTHX_ WARN_SYNTAX,
8127e0e3
GS
4323 "Possible attempt to put comments in qw() list");
4324 ++warned;
4325 }
4326 }
4327 }
4328 else {
4329 for (; !isSPACE(*d) && len; --len, ++d) ;
4330 }
4331 words = append_elem(OP_LIST, words,
4332 newSVOP(OP_CONST, 0, newSVpvn(b, d-b)));
55497cff 4333 }
4334 }
8127e0e3
GS
4335 if (words) {
4336 PL_nextval[PL_nexttoke].opval = words;
4337 force_next(THING);
4338 }
55497cff 4339 }
8127e0e3
GS
4340 if (PL_lex_stuff)
4341 SvREFCNT_dec(PL_lex_stuff);
3280af22 4342 PL_lex_stuff = Nullsv;
3280af22 4343 PL_expect = XTERM;
8127e0e3 4344 TOKEN('(');
8990e307 4345
79072805 4346 case KEY_qq:
09bef843 4347 s = scan_str(s,FALSE,FALSE);
79072805 4348 if (!s)
85e6fe83 4349 missingterm((char*)0);
a0d0e21e 4350 yylval.ival = OP_STRINGIFY;
3280af22
NIS
4351 if (SvIVX(PL_lex_stuff) == '\'')
4352 SvIVX(PL_lex_stuff) = 0; /* qq'$foo' should interpolate */
79072805
LW
4353 TERM(sublex_start());
4354
8782bef2
GB
4355 case KEY_qr:
4356 s = scan_pat(s,OP_QR);
4357 TERM(sublex_start());
4358
79072805 4359 case KEY_qx:
09bef843 4360 s = scan_str(s,FALSE,FALSE);
79072805 4361 if (!s)
85e6fe83 4362 missingterm((char*)0);
79072805
LW
4363 yylval.ival = OP_BACKTICK;
4364 set_csh();
4365 TERM(sublex_start());
4366
4367 case KEY_return:
4368 OLDLOP(OP_RETURN);
4369
4370 case KEY_require:
3280af22 4371 *PL_tokenbuf = '\0';
a0d0e21e 4372 s = force_word(s,WORD,TRUE,TRUE,FALSE);
834a4ddd 4373 if (isIDFIRST_lazy(PL_tokenbuf))
3280af22 4374 gv_stashpvn(PL_tokenbuf, strlen(PL_tokenbuf), TRUE);
748a9306 4375 else if (*s == '<')
a0d0e21e 4376 yyerror("<> should be quotes");
463ee0b2 4377 UNI(OP_REQUIRE);
79072805
LW
4378
4379 case KEY_reset:
4380 UNI(OP_RESET);
4381
4382 case KEY_redo:
a0d0e21e 4383 s = force_word(s,WORD,TRUE,FALSE,FALSE);
79072805
LW
4384 LOOPX(OP_REDO);
4385
4386 case KEY_rename:
a0d0e21e 4387 LOP(OP_RENAME,XTERM);
79072805
LW
4388
4389 case KEY_rand:
4390 UNI(OP_RAND);
4391
4392 case KEY_rmdir:
4393 UNI(OP_RMDIR);
4394
4395 case KEY_rindex:
a0d0e21e 4396 LOP(OP_RINDEX,XTERM);
79072805
LW
4397
4398 case KEY_read:
a0d0e21e 4399 LOP(OP_READ,XTERM);
79072805
LW
4400
4401 case KEY_readdir:
4402 UNI(OP_READDIR);
4403
93a17b20
LW
4404 case KEY_readline:
4405 set_csh();
4406 UNI(OP_READLINE);
4407
4408 case KEY_readpipe:
4409 set_csh();
4410 UNI(OP_BACKTICK);
4411
79072805
LW
4412 case KEY_rewinddir:
4413 UNI(OP_REWINDDIR);
4414
4415 case KEY_recv:
a0d0e21e 4416 LOP(OP_RECV,XTERM);
79072805
LW
4417
4418 case KEY_reverse:
a0d0e21e 4419 LOP(OP_REVERSE,XTERM);
79072805
LW
4420
4421 case KEY_readlink:
4422 UNI(OP_READLINK);
4423
4424 case KEY_ref:
4425 UNI(OP_REF);
4426
4427 case KEY_s:
4428 s = scan_subst(s);
4429 if (yylval.opval)
4430 TERM(sublex_start());
4431 else
4432 TOKEN(1); /* force error */
4433
a0d0e21e
LW
4434 case KEY_chomp:
4435 UNI(OP_CHOMP);
4436
79072805
LW
4437 case KEY_scalar:
4438 UNI(OP_SCALAR);
4439
4440 case KEY_select:
a0d0e21e 4441 LOP(OP_SELECT,XTERM);
79072805
LW
4442
4443 case KEY_seek:
a0d0e21e 4444 LOP(OP_SEEK,XTERM);
79072805
LW
4445
4446 case KEY_semctl:
a0d0e21e 4447 LOP(OP_SEMCTL,XTERM);
79072805
LW
4448
4449 case KEY_semget:
a0d0e21e 4450 LOP(OP_SEMGET,XTERM);
79072805
LW
4451
4452 case KEY_semop:
a0d0e21e 4453 LOP(OP_SEMOP,XTERM);
79072805
LW
4454
4455 case KEY_send:
a0d0e21e 4456 LOP(OP_SEND,XTERM);
79072805
LW
4457
4458 case KEY_setpgrp:
a0d0e21e 4459 LOP(OP_SETPGRP,XTERM);
79072805
LW
4460
4461 case KEY_setpriority:
a0d0e21e 4462 LOP(OP_SETPRIORITY,XTERM);
79072805
LW
4463
4464 case KEY_sethostent:
ff68c719 4465 UNI(OP_SHOSTENT);
79072805
LW
4466
4467 case KEY_setnetent:
ff68c719 4468 UNI(OP_SNETENT);
79072805
LW
4469
4470 case KEY_setservent:
ff68c719 4471 UNI(OP_SSERVENT);
79072805
LW
4472
4473 case KEY_setprotoent:
ff68c719 4474 UNI(OP_SPROTOENT);
79072805
LW
4475
4476 case KEY_setpwent:
4477 FUN0(OP_SPWENT);
4478
4479 case KEY_setgrent:
4480 FUN0(OP_SGRENT);
4481
4482 case KEY_seekdir:
a0d0e21e 4483 LOP(OP_SEEKDIR,XTERM);
79072805
LW
4484
4485 case KEY_setsockopt:
a0d0e21e 4486 LOP(OP_SSOCKOPT,XTERM);
79072805
LW
4487
4488 case KEY_shift:
4489 UNI(OP_SHIFT);
4490
4491 case KEY_shmctl:
a0d0e21e 4492 LOP(OP_SHMCTL,XTERM);
79072805
LW
4493
4494 case KEY_shmget:
a0d0e21e 4495 LOP(OP_SHMGET,XTERM);
79072805
LW
4496
4497 case KEY_shmread:
a0d0e21e 4498 LOP(OP_SHMREAD,XTERM);
79072805
LW
4499
4500 case KEY_shmwrite:
a0d0e21e 4501 LOP(OP_SHMWRITE,XTERM);
79072805
LW
4502
4503 case KEY_shutdown:
a0d0e21e 4504 LOP(OP_SHUTDOWN,XTERM);
79072805
LW
4505
4506 case KEY_sin:
4507 UNI(OP_SIN);
4508
4509 case KEY_sleep:
4510 UNI(OP_SLEEP);
4511
4512 case KEY_socket:
a0d0e21e 4513 LOP(OP_SOCKET,XTERM);
79072805
LW
4514
4515 case KEY_socketpair:
a0d0e21e 4516 LOP(OP_SOCKPAIR,XTERM);
79072805
LW
4517
4518 case KEY_sort:
3280af22 4519 checkcomma(s,PL_tokenbuf,"subroutine name");
79072805
LW
4520 s = skipspace(s);
4521 if (*s == ';' || *s == ')') /* probably a close */
cea2e8a9 4522 Perl_croak(aTHX_ "sort is now a reserved word");
3280af22 4523 PL_expect = XTERM;
15f0808c 4524 s = force_word(s,WORD,TRUE,TRUE,FALSE);
a0d0e21e 4525 LOP(OP_SORT,XREF);
79072805
LW
4526
4527 case KEY_split:
a0d0e21e 4528 LOP(OP_SPLIT,XTERM);
79072805
LW
4529
4530 case KEY_sprintf:
a0d0e21e 4531 LOP(OP_SPRINTF,XTERM);
79072805
LW
4532
4533 case KEY_splice:
a0d0e21e 4534 LOP(OP_SPLICE,XTERM);
79072805
LW
4535
4536 case KEY_sqrt:
4537 UNI(OP_SQRT);
4538
4539 case KEY_srand:
4540 UNI(OP_SRAND);
4541
4542 case KEY_stat:
4543 UNI(OP_STAT);
4544
4545 case KEY_study:
3280af22 4546 PL_sawstudy++;
79072805
LW
4547 UNI(OP_STUDY);
4548
4549 case KEY_substr:
a0d0e21e 4550 LOP(OP_SUBSTR,XTERM);
79072805
LW
4551
4552 case KEY_format:
4553 case KEY_sub:
93a17b20 4554 really_sub:
09bef843 4555 {
3280af22 4556 char tmpbuf[sizeof PL_tokenbuf];
b1b65b59 4557 SSize_t tboffset;
09bef843
SB
4558 expectation attrful;
4559 bool have_name, have_proto;
4560 int key = tmp;
4561
4562 s = skipspace(s);
4563
4564 if (isIDFIRST_lazy(s) || *s == '\'' ||
4565 (*s == ':' && s[1] == ':'))
4566 {
4567 PL_expect = XBLOCK;
4568 attrful = XATTRBLOCK;
b1b65b59
JH
4569 /* remember buffer pos'n for later force_word */
4570 tboffset = s - PL_oldbufptr;
09bef843
SB
4571 d = scan_word(s, tmpbuf, sizeof tmpbuf, TRUE, &len);
4572 if (strchr(tmpbuf, ':'))
4573 sv_setpv(PL_subname, tmpbuf);
4574 else {
4575 sv_setsv(PL_subname,PL_curstname);
4576 sv_catpvn(PL_subname,"::",2);
4577 sv_catpvn(PL_subname,tmpbuf,len);
4578 }
4579 s = skipspace(d);
4580 have_name = TRUE;
4581 }
463ee0b2 4582 else {
09bef843
SB
4583 if (key == KEY_my)
4584 Perl_croak(aTHX_ "Missing name in \"my sub\"");
4585 PL_expect = XTERMBLOCK;
4586 attrful = XATTRTERM;
4587 sv_setpv(PL_subname,"?");
4588 have_name = FALSE;
463ee0b2 4589 }
4633a7c4 4590
09bef843
SB
4591 if (key == KEY_format) {
4592 if (*s == '=')
4593 PL_lex_formbrack = PL_lex_brackets + 1;
4594 if (have_name)
b1b65b59
JH
4595 (void) force_word(PL_oldbufptr + tboffset, WORD,
4596 FALSE, TRUE, TRUE);
09bef843
SB
4597 OPERATOR(FORMAT);
4598 }
79072805 4599
09bef843
SB
4600 /* Look for a prototype */
4601 if (*s == '(') {
4602 char *p;
4603
4604 s = scan_str(s,FALSE,FALSE);
4605 if (!s) {
4606 if (PL_lex_stuff)
4607 SvREFCNT_dec(PL_lex_stuff);
4608 PL_lex_stuff = Nullsv;
4609 Perl_croak(aTHX_ "Prototype not terminated");
4610 }
4611 /* strip spaces */
4612 d = SvPVX(PL_lex_stuff);
4613 tmp = 0;
4614 for (p = d; *p; ++p) {
4615 if (!isSPACE(*p))
4616 d[tmp++] = *p;
4617 }
4618 d[tmp] = '\0';
4619 SvCUR(PL_lex_stuff) = tmp;
4620 have_proto = TRUE;
68dc0745 4621
09bef843 4622 s = skipspace(s);
4633a7c4 4623 }
09bef843
SB
4624 else
4625 have_proto = FALSE;
4626
4627 if (*s == ':' && s[1] != ':')
4628 PL_expect = attrful;
4629
4630 if (have_proto) {
b1b65b59
JH
4631 PL_nextval[PL_nexttoke].opval =
4632 (OP*)newSVOP(OP_CONST, 0, PL_lex_stuff);
09bef843
SB
4633 PL_lex_stuff = Nullsv;
4634 force_next(THING);
68dc0745 4635 }
09bef843
SB
4636 if (!have_name) {
4637 sv_setpv(PL_subname,"__ANON__");
4638 TOKEN(ANONSUB);
4633a7c4 4639 }
b1b65b59
JH
4640 (void) force_word(PL_oldbufptr + tboffset, WORD,
4641 FALSE, TRUE, TRUE);
09bef843
SB
4642 if (key == KEY_my)
4643 TOKEN(MYSUB);
4644 TOKEN(SUB);
4633a7c4 4645 }
79072805
LW
4646
4647 case KEY_system:
4648 set_csh();
a0d0e21e 4649 LOP(OP_SYSTEM,XREF);
79072805
LW
4650
4651 case KEY_symlink:
a0d0e21e 4652 LOP(OP_SYMLINK,XTERM);
79072805
LW
4653
4654 case KEY_syscall:
a0d0e21e 4655 LOP(OP_SYSCALL,XTERM);
79072805 4656
c07a80fd 4657 case KEY_sysopen:
4658 LOP(OP_SYSOPEN,XTERM);
4659
137443ea 4660 case KEY_sysseek:
4661 LOP(OP_SYSSEEK,XTERM);
4662
79072805 4663 case KEY_sysread:
a0d0e21e 4664 LOP(OP_SYSREAD,XTERM);
79072805
LW
4665
4666 case KEY_syswrite:
a0d0e21e 4667 LOP(OP_SYSWRITE,XTERM);
79072805
LW
4668
4669 case KEY_tr:
4670 s = scan_trans(s);
4671 TERM(sublex_start());
4672
4673 case KEY_tell:
4674 UNI(OP_TELL);
4675
4676 case KEY_telldir:
4677 UNI(OP_TELLDIR);
4678
463ee0b2 4679 case KEY_tie:
a0d0e21e 4680 LOP(OP_TIE,XTERM);
463ee0b2 4681
c07a80fd 4682 case KEY_tied:
4683 UNI(OP_TIED);
4684
79072805
LW
4685 case KEY_time:
4686 FUN0(OP_TIME);
4687
4688 case KEY_times:
4689 FUN0(OP_TMS);
4690
4691 case KEY_truncate:
a0d0e21e 4692 LOP(OP_TRUNCATE,XTERM);
79072805
LW
4693
4694 case KEY_uc:
4695 UNI(OP_UC);
4696
4697 case KEY_ucfirst:
4698 UNI(OP_UCFIRST);
4699
463ee0b2
LW
4700 case KEY_untie:
4701 UNI(OP_UNTIE);
4702
79072805 4703 case KEY_until:
3280af22 4704 yylval.ival = PL_curcop->cop_line;
79072805
LW
4705 OPERATOR(UNTIL);
4706
4707 case KEY_unless:
3280af22 4708 yylval.ival = PL_curcop->cop_line;
79072805
LW
4709 OPERATOR(UNLESS);
4710
4711 case KEY_unlink:
a0d0e21e 4712 LOP(OP_UNLINK,XTERM);
79072805
LW
4713
4714 case KEY_undef:
4715 UNI(OP_UNDEF);
4716
4717 case KEY_unpack:
a0d0e21e 4718 LOP(OP_UNPACK,XTERM);
79072805
LW
4719
4720 case KEY_utime:
a0d0e21e 4721 LOP(OP_UTIME,XTERM);
79072805
LW
4722
4723 case KEY_umask:
599cee73 4724 if (ckWARN(WARN_OCTAL)) {
3280af22 4725 for (d = s; d < PL_bufend && (isSPACE(*d) || *d == '('); d++) ;
4438c4b7
JH
4726 if (*d != '0' && isDIGIT(*d))
4727 Perl_warner(aTHX_ WARN_OCTAL,
4728 "umask: argument is missing initial 0");
748a9306 4729 }
79072805
LW
4730 UNI(OP_UMASK);
4731
4732 case KEY_unshift:
a0d0e21e
LW
4733 LOP(OP_UNSHIFT,XTERM);
4734
4735 case KEY_use:
3280af22 4736 if (PL_expect != XSTATE)
a0d0e21e 4737 yyerror("\"use\" not allowed in expression");
89bfa8cd 4738 s = skipspace(s);
4739 if(isDIGIT(*s)) {
4740 s = force_version(s);
4741 if(*s == ';' || (s = skipspace(s), *s == ';')) {
3280af22 4742 PL_nextval[PL_nexttoke].opval = Nullop;
89bfa8cd 4743 force_next(WORD);
4744 }
4745 }
4746 else {
4747 s = force_word(s,WORD,FALSE,TRUE,FALSE);
4748 s = force_version(s);
4749 }
a0d0e21e
LW
4750 yylval.ival = 1;
4751 OPERATOR(USE);
79072805
LW
4752
4753 case KEY_values:
4754 UNI(OP_VALUES);
4755
4756 case KEY_vec:
3280af22 4757 PL_sawvec = TRUE;
a0d0e21e 4758 LOP(OP_VEC,XTERM);
79072805
LW
4759
4760 case KEY_while:
3280af22 4761 yylval.ival = PL_curcop->cop_line;
79072805
LW
4762 OPERATOR(WHILE);
4763
4764 case KEY_warn:
3280af22 4765 PL_hints |= HINT_BLOCK_SCOPE;
a0d0e21e 4766 LOP(OP_WARN,XTERM);
79072805
LW
4767
4768 case KEY_wait:
4769 FUN0(OP_WAIT);
4770
4771 case KEY_waitpid:
a0d0e21e 4772 LOP(OP_WAITPID,XTERM);
79072805
LW
4773
4774 case KEY_wantarray:
4775 FUN0(OP_WANTARRAY);
4776
4777 case KEY_write:
9d116dd7
JH
4778#ifdef EBCDIC
4779 {
4780 static char ctl_l[2];
4781
4782 if (ctl_l[0] == '\0')
4783 ctl_l[0] = toCTRL('L');
4784 gv_fetchpv(ctl_l,TRUE, SVt_PV);
4785 }
4786#else
4787 gv_fetchpv("\f",TRUE, SVt_PV); /* Make sure $^L is defined */
4788#endif
79072805
LW
4789 UNI(OP_ENTERWRITE);
4790
4791 case KEY_x:
3280af22 4792 if (PL_expect == XOPERATOR)
79072805
LW
4793 Mop(OP_REPEAT);
4794 check_uni();
4795 goto just_a_word;
4796
a0d0e21e
LW
4797 case KEY_xor:
4798 yylval.ival = OP_XOR;
4799 OPERATOR(OROP);
4800
79072805
LW
4801 case KEY_y:
4802 s = scan_trans(s);
4803 TERM(sublex_start());
4804 }
49dc05e3 4805 }}
79072805
LW
4806}
4807
4808I32
864dbfa3 4809Perl_keyword(pTHX_ register char *d, I32 len)
79072805
LW
4810{
4811 switch (*d) {
4812 case '_':
4813 if (d[1] == '_') {
a0d0e21e 4814 if (strEQ(d,"__FILE__")) return -KEY___FILE__;
68dc0745 4815 if (strEQ(d,"__LINE__")) return -KEY___LINE__;
4816 if (strEQ(d,"__PACKAGE__")) return -KEY___PACKAGE__;
e50aee73 4817 if (strEQ(d,"__DATA__")) return KEY___DATA__;
79072805
LW
4818 if (strEQ(d,"__END__")) return KEY___END__;
4819 }
4820 break;
8990e307
LW
4821 case 'A':
4822 if (strEQ(d,"AUTOLOAD")) return KEY_AUTOLOAD;
4823 break;
79072805 4824 case 'a':
463ee0b2
LW
4825 switch (len) {
4826 case 3:
a0d0e21e
LW
4827 if (strEQ(d,"and")) return -KEY_and;
4828 if (strEQ(d,"abs")) return -KEY_abs;
85e6fe83 4829 break;
463ee0b2 4830 case 5:
a0d0e21e
LW
4831 if (strEQ(d,"alarm")) return -KEY_alarm;
4832 if (strEQ(d,"atan2")) return -KEY_atan2;
463ee0b2
LW
4833 break;
4834 case 6:
a0d0e21e 4835 if (strEQ(d,"accept")) return -KEY_accept;
463ee0b2
LW
4836 break;
4837 }
79072805
LW
4838 break;
4839 case 'B':
4840 if (strEQ(d,"BEGIN")) return KEY_BEGIN;
93a17b20 4841 break;
79072805 4842 case 'b':
a0d0e21e
LW
4843 if (strEQ(d,"bless")) return -KEY_bless;
4844 if (strEQ(d,"bind")) return -KEY_bind;
4845 if (strEQ(d,"binmode")) return -KEY_binmode;
4846 break;
4847 case 'C':
4848 if (strEQ(d,"CORE")) return -KEY_CORE;
79072805
LW
4849 break;
4850 case 'c':
4851 switch (len) {
4852 case 3:
a0d0e21e
LW
4853 if (strEQ(d,"cmp")) return -KEY_cmp;
4854 if (strEQ(d,"chr")) return -KEY_chr;
4855 if (strEQ(d,"cos")) return -KEY_cos;
79072805
LW
4856 break;
4857 case 4:
4858 if (strEQ(d,"chop")) return KEY_chop;
4859 break;
4860 case 5:
a0d0e21e
LW
4861 if (strEQ(d,"close")) return -KEY_close;
4862 if (strEQ(d,"chdir")) return -KEY_chdir;
4863 if (strEQ(d,"chomp")) return KEY_chomp;
4864 if (strEQ(d,"chmod")) return -KEY_chmod;
4865 if (strEQ(d,"chown")) return -KEY_chown;
4866 if (strEQ(d,"crypt")) return -KEY_crypt;
79072805
LW
4867 break;
4868 case 6:
a0d0e21e
LW
4869 if (strEQ(d,"chroot")) return -KEY_chroot;
4870 if (strEQ(d,"caller")) return -KEY_caller;
79072805
LW
4871 break;
4872 case 7:
a0d0e21e 4873 if (strEQ(d,"connect")) return -KEY_connect;
79072805
LW
4874 break;
4875 case 8:
a0d0e21e
LW
4876 if (strEQ(d,"closedir")) return -KEY_closedir;
4877 if (strEQ(d,"continue")) return -KEY_continue;
79072805
LW
4878 break;
4879 }
4880 break;
ed6116ce
LW
4881 case 'D':
4882 if (strEQ(d,"DESTROY")) return KEY_DESTROY;
4883 break;
79072805
LW
4884 case 'd':
4885 switch (len) {
4886 case 2:
4887 if (strEQ(d,"do")) return KEY_do;
4888 break;
4889 case 3:
a0d0e21e 4890 if (strEQ(d,"die")) return -KEY_die;
79072805
LW
4891 break;
4892 case 4:
a0d0e21e 4893 if (strEQ(d,"dump")) return -KEY_dump;
79072805
LW
4894 break;
4895 case 6:
4896 if (strEQ(d,"delete")) return KEY_delete;
4897 break;
4898 case 7:
4899 if (strEQ(d,"defined")) return KEY_defined;
a0d0e21e 4900 if (strEQ(d,"dbmopen")) return -KEY_dbmopen;
79072805
LW
4901 break;
4902 case 8:
a0d0e21e 4903 if (strEQ(d,"dbmclose")) return -KEY_dbmclose;
79072805
LW
4904 break;
4905 }
4906 break;
4907 case 'E':
a0d0e21e 4908 if (strEQ(d,"EQ")) { deprecate(d); return -KEY_eq;}
79072805
LW
4909 if (strEQ(d,"END")) return KEY_END;
4910 break;
4911 case 'e':
4912 switch (len) {
4913 case 2:
a0d0e21e 4914 if (strEQ(d,"eq")) return -KEY_eq;
79072805
LW
4915 break;
4916 case 3:
a0d0e21e
LW
4917 if (strEQ(d,"eof")) return -KEY_eof;
4918 if (strEQ(d,"exp")) return -KEY_exp;
79072805
LW
4919 break;
4920 case 4:
4921 if (strEQ(d,"else")) return KEY_else;
a0d0e21e 4922 if (strEQ(d,"exit")) return -KEY_exit;
79072805 4923 if (strEQ(d,"eval")) return KEY_eval;
a0d0e21e 4924 if (strEQ(d,"exec")) return -KEY_exec;
79072805
LW
4925 if (strEQ(d,"each")) return KEY_each;
4926 break;
4927 case 5:
4928 if (strEQ(d,"elsif")) return KEY_elsif;
4929 break;
a0d0e21e
LW
4930 case 6:
4931 if (strEQ(d,"exists")) return KEY_exists;
cea2e8a9 4932 if (strEQ(d,"elseif")) Perl_warn(aTHX_ "elseif should be elsif");
a0d0e21e 4933 break;
79072805 4934 case 8:
a0d0e21e
LW
4935 if (strEQ(d,"endgrent")) return -KEY_endgrent;
4936 if (strEQ(d,"endpwent")) return -KEY_endpwent;
79072805
LW
4937 break;
4938 case 9:
a0d0e21e 4939 if (strEQ(d,"endnetent")) return -KEY_endnetent;
79072805
LW
4940 break;
4941 case 10:
a0d0e21e
LW
4942 if (strEQ(d,"endhostent")) return -KEY_endhostent;
4943 if (strEQ(d,"endservent")) return -KEY_endservent;
79072805
LW
4944 break;
4945 case 11:
a0d0e21e 4946 if (strEQ(d,"endprotoent")) return -KEY_endprotoent;
79072805 4947 break;
a687059c 4948 }
a687059c 4949 break;
79072805
LW
4950 case 'f':
4951 switch (len) {
4952 case 3:
4953 if (strEQ(d,"for")) return KEY_for;
4954 break;
4955 case 4:
a0d0e21e 4956 if (strEQ(d,"fork")) return -KEY_fork;
79072805
LW
4957 break;
4958 case 5:
a0d0e21e
LW
4959 if (strEQ(d,"fcntl")) return -KEY_fcntl;
4960 if (strEQ(d,"flock")) return -KEY_flock;
79072805
LW
4961 break;
4962 case 6:
4963 if (strEQ(d,"format")) return KEY_format;
a0d0e21e 4964 if (strEQ(d,"fileno")) return -KEY_fileno;
79072805
LW
4965 break;
4966 case 7:
4967 if (strEQ(d,"foreach")) return KEY_foreach;
4968 break;
4969 case 8:
a0d0e21e 4970 if (strEQ(d,"formline")) return -KEY_formline;
79072805 4971 break;
378cc40b 4972 }
a687059c 4973 break;
79072805
LW
4974 case 'G':
4975 if (len == 2) {
a0d0e21e
LW
4976 if (strEQ(d,"GT")) { deprecate(d); return -KEY_gt;}
4977 if (strEQ(d,"GE")) { deprecate(d); return -KEY_ge;}
9f68db38 4978 }
a687059c 4979 break;
79072805 4980 case 'g':
a687059c
LW
4981 if (strnEQ(d,"get",3)) {
4982 d += 3;
4983 if (*d == 'p') {
79072805
LW
4984 switch (len) {
4985 case 7:
a0d0e21e
LW
4986 if (strEQ(d,"ppid")) return -KEY_getppid;
4987 if (strEQ(d,"pgrp")) return -KEY_getpgrp;
79072805
LW
4988 break;
4989 case 8:
a0d0e21e
LW
4990 if (strEQ(d,"pwent")) return -KEY_getpwent;
4991 if (strEQ(d,"pwnam")) return -KEY_getpwnam;
4992 if (strEQ(d,"pwuid")) return -KEY_getpwuid;
79072805
LW
4993 break;
4994 case 11:
a0d0e21e
LW
4995 if (strEQ(d,"peername")) return -KEY_getpeername;
4996 if (strEQ(d,"protoent")) return -KEY_getprotoent;
4997 if (strEQ(d,"priority")) return -KEY_getpriority;
79072805
LW
4998 break;
4999 case 14:
a0d0e21e 5000 if (strEQ(d,"protobyname")) return -KEY_getprotobyname;
79072805
LW
5001 break;
5002 case 16:
a0d0e21e 5003 if (strEQ(d,"protobynumber"))return -KEY_getprotobynumber;
79072805
LW
5004 break;
5005 }
a687059c
LW
5006 }
5007 else if (*d == 'h') {
a0d0e21e
LW
5008 if (strEQ(d,"hostbyname")) return -KEY_gethostbyname;
5009 if (strEQ(d,"hostbyaddr")) return -KEY_gethostbyaddr;
5010 if (strEQ(d,"hostent")) return -KEY_gethostent;
a687059c
LW
5011 }
5012 else if (*d == 'n') {
a0d0e21e
LW
5013 if (strEQ(d,"netbyname")) return -KEY_getnetbyname;
5014 if (strEQ(d,"netbyaddr")) return -KEY_getnetbyaddr;
5015 if (strEQ(d,"netent")) return -KEY_getnetent;
a687059c
LW
5016 }
5017 else if (*d == 's') {
a0d0e21e
LW
5018 if (strEQ(d,"servbyname")) return -KEY_getservbyname;
5019 if (strEQ(d,"servbyport")) return -KEY_getservbyport;
5020 if (strEQ(d,"servent")) return -KEY_getservent;
5021 if (strEQ(d,"sockname")) return -KEY_getsockname;
5022 if (strEQ(d,"sockopt")) return -KEY_getsockopt;
a687059c
LW
5023 }
5024 else if (*d == 'g') {
a0d0e21e
LW
5025 if (strEQ(d,"grent")) return -KEY_getgrent;
5026 if (strEQ(d,"grnam")) return -KEY_getgrnam;
5027 if (strEQ(d,"grgid")) return -KEY_getgrgid;
a687059c
LW
5028 }
5029 else if (*d == 'l') {
a0d0e21e 5030 if (strEQ(d,"login")) return -KEY_getlogin;
a687059c 5031 }
a0d0e21e 5032 else if (strEQ(d,"c")) return -KEY_getc;
79072805 5033 break;
a687059c 5034 }
79072805
LW
5035 switch (len) {
5036 case 2:
a0d0e21e
LW
5037 if (strEQ(d,"gt")) return -KEY_gt;
5038 if (strEQ(d,"ge")) return -KEY_ge;
79072805
LW
5039 break;
5040 case 4:
5041 if (strEQ(d,"grep")) return KEY_grep;
5042 if (strEQ(d,"goto")) return KEY_goto;
fb73857a 5043 if (strEQ(d,"glob")) return KEY_glob;
79072805
LW
5044 break;
5045 case 6:
a0d0e21e 5046 if (strEQ(d,"gmtime")) return -KEY_gmtime;
79072805 5047 break;
378cc40b 5048 }
a687059c 5049 break;
79072805 5050 case 'h':
a0d0e21e 5051 if (strEQ(d,"hex")) return -KEY_hex;
a687059c 5052 break;
7d07dbc2
MB
5053 case 'I':
5054 if (strEQ(d,"INIT")) return KEY_INIT;
5055 break;
79072805
LW
5056 case 'i':
5057 switch (len) {
5058 case 2:
5059 if (strEQ(d,"if")) return KEY_if;
5060 break;
5061 case 3:
a0d0e21e 5062 if (strEQ(d,"int")) return -KEY_int;
79072805
LW
5063 break;
5064 case 5:
a0d0e21e
LW
5065 if (strEQ(d,"index")) return -KEY_index;
5066 if (strEQ(d,"ioctl")) return -KEY_ioctl;
79072805
LW
5067 break;
5068 }
a687059c 5069 break;
79072805 5070 case 'j':
a0d0e21e 5071 if (strEQ(d,"join")) return -KEY_join;
a687059c 5072 break;
79072805
LW
5073 case 'k':
5074 if (len == 4) {
5075 if (strEQ(d,"keys")) return KEY_keys;
a0d0e21e 5076 if (strEQ(d,"kill")) return -KEY_kill;
663a0e37 5077 }
79072805
LW
5078 break;
5079 case 'L':
5080 if (len == 2) {
a0d0e21e
LW
5081 if (strEQ(d,"LT")) { deprecate(d); return -KEY_lt;}
5082 if (strEQ(d,"LE")) { deprecate(d); return -KEY_le;}
378cc40b 5083 }
79072805
LW
5084 break;
5085 case 'l':
5086 switch (len) {
5087 case 2:
a0d0e21e
LW
5088 if (strEQ(d,"lt")) return -KEY_lt;
5089 if (strEQ(d,"le")) return -KEY_le;
5090 if (strEQ(d,"lc")) return -KEY_lc;
79072805
LW
5091 break;
5092 case 3:
a0d0e21e 5093 if (strEQ(d,"log")) return -KEY_log;
79072805
LW
5094 break;
5095 case 4:
5096 if (strEQ(d,"last")) return KEY_last;
a0d0e21e 5097 if (strEQ(d,"link")) return -KEY_link;
c0329465 5098 if (strEQ(d,"lock")) return -KEY_lock;
395c3793 5099 break;
79072805
LW
5100 case 5:
5101 if (strEQ(d,"local")) return KEY_local;
a0d0e21e 5102 if (strEQ(d,"lstat")) return -KEY_lstat;
79072805
LW
5103 break;
5104 case 6:
a0d0e21e
LW
5105 if (strEQ(d,"length")) return -KEY_length;
5106 if (strEQ(d,"listen")) return -KEY_listen;
79072805
LW
5107 break;
5108 case 7:
a0d0e21e 5109 if (strEQ(d,"lcfirst")) return -KEY_lcfirst;
79072805
LW
5110 break;
5111 case 9:
a0d0e21e 5112 if (strEQ(d,"localtime")) return -KEY_localtime;
395c3793
LW
5113 break;
5114 }
a687059c 5115 break;
79072805
LW
5116 case 'm':
5117 switch (len) {
5118 case 1: return KEY_m;
93a17b20
LW
5119 case 2:
5120 if (strEQ(d,"my")) return KEY_my;
5121 break;
a0d0e21e
LW
5122 case 3:
5123 if (strEQ(d,"map")) return KEY_map;
5124 break;
79072805 5125 case 5:
a0d0e21e 5126 if (strEQ(d,"mkdir")) return -KEY_mkdir;
79072805
LW
5127 break;
5128 case 6:
a0d0e21e
LW
5129 if (strEQ(d,"msgctl")) return -KEY_msgctl;
5130 if (strEQ(d,"msgget")) return -KEY_msgget;
5131 if (strEQ(d,"msgrcv")) return -KEY_msgrcv;
5132 if (strEQ(d,"msgsnd")) return -KEY_msgsnd;
79072805
LW
5133 break;
5134 }
a687059c 5135 break;
79072805 5136 case 'N':
a0d0e21e 5137 if (strEQ(d,"NE")) { deprecate(d); return -KEY_ne;}
a687059c 5138 break;
79072805
LW
5139 case 'n':
5140 if (strEQ(d,"next")) return KEY_next;
a0d0e21e
LW
5141 if (strEQ(d,"ne")) return -KEY_ne;
5142 if (strEQ(d,"not")) return -KEY_not;
5143 if (strEQ(d,"no")) return KEY_no;
a687059c 5144 break;
79072805
LW
5145 case 'o':
5146 switch (len) {
463ee0b2 5147 case 2:
a0d0e21e 5148 if (strEQ(d,"or")) return -KEY_or;
463ee0b2 5149 break;
79072805 5150 case 3:
a0d0e21e
LW
5151 if (strEQ(d,"ord")) return -KEY_ord;
5152 if (strEQ(d,"oct")) return -KEY_oct;
77ca0c92 5153 if (strEQ(d,"our")) return KEY_our;
79072805
LW
5154 break;
5155 case 4:
a0d0e21e 5156 if (strEQ(d,"open")) return -KEY_open;
79072805
LW
5157 break;
5158 case 7:
a0d0e21e 5159 if (strEQ(d,"opendir")) return -KEY_opendir;
79072805 5160 break;
fe14fcc3 5161 }
a687059c 5162 break;
79072805
LW
5163 case 'p':
5164 switch (len) {
5165 case 3:
5166 if (strEQ(d,"pop")) return KEY_pop;
a0d0e21e 5167 if (strEQ(d,"pos")) return KEY_pos;
79072805
LW
5168 break;
5169 case 4:
5170 if (strEQ(d,"push")) return KEY_push;
a0d0e21e
LW
5171 if (strEQ(d,"pack")) return -KEY_pack;
5172 if (strEQ(d,"pipe")) return -KEY_pipe;
79072805
LW
5173 break;
5174 case 5:
5175 if (strEQ(d,"print")) return KEY_print;
5176 break;
5177 case 6:
5178 if (strEQ(d,"printf")) return KEY_printf;
5179 break;
5180 case 7:
5181 if (strEQ(d,"package")) return KEY_package;
5182 break;
c07a80fd 5183 case 9:
5184 if (strEQ(d,"prototype")) return KEY_prototype;
663a0e37 5185 }
79072805
LW
5186 break;
5187 case 'q':
5188 if (len <= 2) {
5189 if (strEQ(d,"q")) return KEY_q;
8782bef2 5190 if (strEQ(d,"qr")) return KEY_qr;
79072805 5191 if (strEQ(d,"qq")) return KEY_qq;
8990e307 5192 if (strEQ(d,"qw")) return KEY_qw;
79072805 5193 if (strEQ(d,"qx")) return KEY_qx;
663a0e37 5194 }
a0d0e21e 5195 else if (strEQ(d,"quotemeta")) return -KEY_quotemeta;
79072805
LW
5196 break;
5197 case 'r':
5198 switch (len) {
5199 case 3:
a0d0e21e 5200 if (strEQ(d,"ref")) return -KEY_ref;
79072805
LW
5201 break;
5202 case 4:
a0d0e21e
LW
5203 if (strEQ(d,"read")) return -KEY_read;
5204 if (strEQ(d,"rand")) return -KEY_rand;
5205 if (strEQ(d,"recv")) return -KEY_recv;
79072805
LW
5206 if (strEQ(d,"redo")) return KEY_redo;
5207 break;
5208 case 5:
a0d0e21e
LW
5209 if (strEQ(d,"rmdir")) return -KEY_rmdir;
5210 if (strEQ(d,"reset")) return -KEY_reset;
79072805
LW
5211 break;
5212 case 6:
5213 if (strEQ(d,"return")) return KEY_return;
a0d0e21e
LW
5214 if (strEQ(d,"rename")) return -KEY_rename;
5215 if (strEQ(d,"rindex")) return -KEY_rindex;
79072805
LW
5216 break;
5217 case 7:
a0d0e21e
LW
5218 if (strEQ(d,"require")) return -KEY_require;
5219 if (strEQ(d,"reverse")) return -KEY_reverse;
5220 if (strEQ(d,"readdir")) return -KEY_readdir;
79072805
LW
5221 break;
5222 case 8:
a0d0e21e
LW
5223 if (strEQ(d,"readlink")) return -KEY_readlink;
5224 if (strEQ(d,"readline")) return -KEY_readline;
5225 if (strEQ(d,"readpipe")) return -KEY_readpipe;
79072805
LW
5226 break;
5227 case 9:
a0d0e21e 5228 if (strEQ(d,"rewinddir")) return -KEY_rewinddir;
79072805 5229 break;
a687059c 5230 }
79072805
LW
5231 break;
5232 case 's':
a687059c 5233 switch (d[1]) {
79072805 5234 case 0: return KEY_s;
a687059c 5235 case 'c':
79072805 5236 if (strEQ(d,"scalar")) return KEY_scalar;
a687059c
LW
5237 break;
5238 case 'e':
79072805
LW
5239 switch (len) {
5240 case 4:
a0d0e21e
LW
5241 if (strEQ(d,"seek")) return -KEY_seek;
5242 if (strEQ(d,"send")) return -KEY_send;
79072805
LW
5243 break;
5244 case 5:
a0d0e21e 5245 if (strEQ(d,"semop")) return -KEY_semop;
79072805
LW
5246 break;
5247 case 6:
a0d0e21e
LW
5248 if (strEQ(d,"select")) return -KEY_select;
5249 if (strEQ(d,"semctl")) return -KEY_semctl;
5250 if (strEQ(d,"semget")) return -KEY_semget;
79072805
LW
5251 break;
5252 case 7:
a0d0e21e
LW
5253 if (strEQ(d,"setpgrp")) return -KEY_setpgrp;
5254 if (strEQ(d,"seekdir")) return -KEY_seekdir;
79072805
LW
5255 break;
5256 case 8:
a0d0e21e
LW
5257 if (strEQ(d,"setpwent")) return -KEY_setpwent;
5258 if (strEQ(d,"setgrent")) return -KEY_setgrent;
79072805
LW
5259 break;
5260 case 9:
a0d0e21e 5261 if (strEQ(d,"setnetent")) return -KEY_setnetent;
79072805
LW
5262 break;
5263 case 10:
a0d0e21e
LW
5264 if (strEQ(d,"setsockopt")) return -KEY_setsockopt;
5265 if (strEQ(d,"sethostent")) return -KEY_sethostent;
5266 if (strEQ(d,"setservent")) return -KEY_setservent;
79072805
LW
5267 break;
5268 case 11:
a0d0e21e
LW
5269 if (strEQ(d,"setpriority")) return -KEY_setpriority;
5270 if (strEQ(d,"setprotoent")) return -KEY_setprotoent;
79072805
LW
5271 break;
5272 }
a687059c
LW
5273 break;
5274 case 'h':
79072805
LW
5275 switch (len) {
5276 case 5:
5277 if (strEQ(d,"shift")) return KEY_shift;
5278 break;
5279 case 6:
a0d0e21e
LW
5280 if (strEQ(d,"shmctl")) return -KEY_shmctl;
5281 if (strEQ(d,"shmget")) return -KEY_shmget;
79072805
LW
5282 break;
5283 case 7:
a0d0e21e 5284 if (strEQ(d,"shmread")) return -KEY_shmread;
79072805
LW
5285 break;
5286 case 8:
a0d0e21e
LW
5287 if (strEQ(d,"shmwrite")) return -KEY_shmwrite;
5288 if (strEQ(d,"shutdown")) return -KEY_shutdown;
79072805
LW
5289 break;
5290 }
a687059c
LW
5291 break;
5292 case 'i':
a0d0e21e 5293 if (strEQ(d,"sin")) return -KEY_sin;
a687059c
LW
5294 break;
5295 case 'l':
a0d0e21e 5296 if (strEQ(d,"sleep")) return -KEY_sleep;
a687059c
LW
5297 break;
5298 case 'o':
79072805 5299 if (strEQ(d,"sort")) return KEY_sort;
a0d0e21e
LW
5300 if (strEQ(d,"socket")) return -KEY_socket;
5301 if (strEQ(d,"socketpair")) return -KEY_socketpair;
a687059c
LW
5302 break;
5303 case 'p':
79072805 5304 if (strEQ(d,"split")) return KEY_split;
a0d0e21e 5305 if (strEQ(d,"sprintf")) return -KEY_sprintf;
79072805 5306 if (strEQ(d,"splice")) return KEY_splice;
a687059c
LW
5307 break;
5308 case 'q':
a0d0e21e 5309 if (strEQ(d,"sqrt")) return -KEY_sqrt;
a687059c
LW
5310 break;
5311 case 'r':
a0d0e21e 5312 if (strEQ(d,"srand")) return -KEY_srand;
a687059c
LW
5313 break;
5314 case 't':
a0d0e21e 5315 if (strEQ(d,"stat")) return -KEY_stat;
79072805 5316 if (strEQ(d,"study")) return KEY_study;
a687059c
LW
5317 break;
5318 case 'u':
a0d0e21e 5319 if (strEQ(d,"substr")) return -KEY_substr;
79072805 5320 if (strEQ(d,"sub")) return KEY_sub;
a687059c
LW
5321 break;
5322 case 'y':
79072805
LW
5323 switch (len) {
5324 case 6:
a0d0e21e 5325 if (strEQ(d,"system")) return -KEY_system;
79072805
LW
5326 break;
5327 case 7:
a0d0e21e
LW
5328 if (strEQ(d,"symlink")) return -KEY_symlink;
5329 if (strEQ(d,"syscall")) return -KEY_syscall;
137443ea 5330 if (strEQ(d,"sysopen")) return -KEY_sysopen;
5331 if (strEQ(d,"sysread")) return -KEY_sysread;
5332 if (strEQ(d,"sysseek")) return -KEY_sysseek;
79072805
LW
5333 break;
5334 case 8:
a0d0e21e 5335 if (strEQ(d,"syswrite")) return -KEY_syswrite;
79072805 5336 break;
a687059c 5337 }
a687059c
LW
5338 break;
5339 }
5340 break;
79072805
LW
5341 case 't':
5342 switch (len) {
5343 case 2:
5344 if (strEQ(d,"tr")) return KEY_tr;
5345 break;
463ee0b2
LW
5346 case 3:
5347 if (strEQ(d,"tie")) return KEY_tie;
5348 break;
79072805 5349 case 4:
a0d0e21e 5350 if (strEQ(d,"tell")) return -KEY_tell;
c07a80fd 5351 if (strEQ(d,"tied")) return KEY_tied;
a0d0e21e 5352 if (strEQ(d,"time")) return -KEY_time;
79072805
LW
5353 break;
5354 case 5:
a0d0e21e 5355 if (strEQ(d,"times")) return -KEY_times;
79072805
LW
5356 break;
5357 case 7:
a0d0e21e 5358 if (strEQ(d,"telldir")) return -KEY_telldir;
79072805
LW
5359 break;
5360 case 8:
a0d0e21e 5361 if (strEQ(d,"truncate")) return -KEY_truncate;
79072805 5362 break;
378cc40b 5363 }
a687059c 5364 break;
79072805
LW
5365 case 'u':
5366 switch (len) {
5367 case 2:
a0d0e21e
LW
5368 if (strEQ(d,"uc")) return -KEY_uc;
5369 break;
5370 case 3:
5371 if (strEQ(d,"use")) return KEY_use;
79072805
LW
5372 break;
5373 case 5:
5374 if (strEQ(d,"undef")) return KEY_undef;
5375 if (strEQ(d,"until")) return KEY_until;
463ee0b2 5376 if (strEQ(d,"untie")) return KEY_untie;
a0d0e21e
LW
5377 if (strEQ(d,"utime")) return -KEY_utime;
5378 if (strEQ(d,"umask")) return -KEY_umask;
79072805
LW
5379 break;
5380 case 6:
5381 if (strEQ(d,"unless")) return KEY_unless;
a0d0e21e
LW
5382 if (strEQ(d,"unpack")) return -KEY_unpack;
5383 if (strEQ(d,"unlink")) return -KEY_unlink;
79072805
LW
5384 break;
5385 case 7:
5386 if (strEQ(d,"unshift")) return KEY_unshift;
a0d0e21e 5387 if (strEQ(d,"ucfirst")) return -KEY_ucfirst;
79072805 5388 break;
a687059c
LW
5389 }
5390 break;
79072805 5391 case 'v':
a0d0e21e
LW
5392 if (strEQ(d,"values")) return -KEY_values;
5393 if (strEQ(d,"vec")) return -KEY_vec;
a687059c 5394 break;
79072805
LW
5395 case 'w':
5396 switch (len) {
5397 case 4:
a0d0e21e
LW
5398 if (strEQ(d,"warn")) return -KEY_warn;
5399 if (strEQ(d,"wait")) return -KEY_wait;
79072805
LW
5400 break;
5401 case 5:
5402 if (strEQ(d,"while")) return KEY_while;
a0d0e21e 5403 if (strEQ(d,"write")) return -KEY_write;
79072805
LW
5404 break;
5405 case 7:
a0d0e21e 5406 if (strEQ(d,"waitpid")) return -KEY_waitpid;
79072805
LW
5407 break;
5408 case 9:
a0d0e21e 5409 if (strEQ(d,"wantarray")) return -KEY_wantarray;
79072805 5410 break;
2f3197b3 5411 }
a687059c 5412 break;
79072805 5413 case 'x':
a0d0e21e
LW
5414 if (len == 1) return -KEY_x;
5415 if (strEQ(d,"xor")) return -KEY_xor;
a687059c 5416 break;
79072805
LW
5417 case 'y':
5418 if (len == 1) return KEY_y;
5419 break;
5420 case 'z':
a687059c
LW
5421 break;
5422 }
79072805 5423 return 0;
a687059c
LW
5424}
5425
76e3520e 5426STATIC void
cea2e8a9 5427S_checkcomma(pTHX_ register char *s, char *name, char *what)
a687059c 5428{
2f3197b3
LW
5429 char *w;
5430
d008e5eb
GS
5431 if (*s == ' ' && s[1] == '(') { /* XXX gotta be a better way */
5432 dTHR; /* only for ckWARN */
5433 if (ckWARN(WARN_SYNTAX)) {
5434 int level = 1;
5435 for (w = s+2; *w && level; w++) {
5436 if (*w == '(')
5437 ++level;
5438 else if (*w == ')')
5439 --level;
5440 }
5441 if (*w)
5442 for (; *w && isSPACE(*w); w++) ;
5443 if (!*w || !strchr(";|})]oaiuw!=", *w)) /* an advisory hack only... */
65cec589
GS
5444 Perl_warner(aTHX_ WARN_SYNTAX,
5445 "%s (...) interpreted as function",name);
d008e5eb 5446 }
2f3197b3 5447 }
3280af22 5448 while (s < PL_bufend && isSPACE(*s))
2f3197b3 5449 s++;
a687059c
LW
5450 if (*s == '(')
5451 s++;
3280af22 5452 while (s < PL_bufend && isSPACE(*s))
a687059c 5453 s++;
834a4ddd 5454 if (isIDFIRST_lazy(s)) {
2f3197b3 5455 w = s++;
834a4ddd 5456 while (isALNUM_lazy(s))
a687059c 5457 s++;
3280af22 5458 while (s < PL_bufend && isSPACE(*s))
a687059c 5459 s++;
e929a76b 5460 if (*s == ',') {
463ee0b2 5461 int kw;
e929a76b 5462 *s = '\0';
864dbfa3 5463 kw = keyword(w, s - w) || get_cv(w, FALSE) != 0;
e929a76b 5464 *s = ',';
463ee0b2 5465 if (kw)
e929a76b 5466 return;
cea2e8a9 5467 Perl_croak(aTHX_ "No comma allowed after %s", what);
463ee0b2
LW
5468 }
5469 }
5470}
5471
423cee85
JH
5472/* Either returns sv, or mortalizes sv and returns a new SV*.
5473 Best used as sv=new_constant(..., sv, ...).
5474 If s, pv are NULL, calls subroutine with one argument,
5475 and type is used with error messages only. */
5476
b3ac6de7 5477STATIC SV *
cea2e8a9 5478S_new_constant(pTHX_ char *s, STRLEN len, char *key, SV *sv, SV *pv, char *type)
b3ac6de7 5479{
b3ac6de7 5480 dSP;
3280af22 5481 HV *table = GvHV(PL_hintgv); /* ^H */
b3ac6de7 5482 SV *res;
b3ac6de7
IZ
5483 SV **cvp;
5484 SV *cv, *typesv;
423cee85
JH
5485 char *why, *why1, *why2;
5486
5487 if (!(PL_hints & HINT_LOCALIZE_HH)) {
5488 SV *msg;
5489
5490 why = "%^H is not localized";
5491 report_short:
5492 why1 = why2 = "";
5493 report:
5494 msg = Perl_newSVpvf(aTHX_ "constant(%s): %s%s%s",
5495 (type ? type: "undef"), why1, why2, why);
5496 yyerror(SvPVX(msg));
5497 SvREFCNT_dec(msg);
5498 return sv;
5499 }
b3ac6de7 5500 if (!table) {
423cee85
JH
5501 why = "%^H is not defined";
5502 goto report_short;
b3ac6de7
IZ
5503 }
5504 cvp = hv_fetch(table, key, strlen(key), FALSE);
5505 if (!cvp || !SvOK(*cvp)) {
423cee85
JH
5506 why = "} is not defined";
5507 why1 = "$^H{";
5508 why2 = key;
5509 goto report;
b3ac6de7
IZ
5510 }
5511 sv_2mortal(sv); /* Parent created it permanently */
5512 cv = *cvp;
423cee85
JH
5513 if (!pv && s)
5514 pv = sv_2mortal(newSVpvn(s, len));
5515 if (type && pv)
5516 typesv = sv_2mortal(newSVpv(type, 0));
b3ac6de7 5517 else
423cee85
JH
5518 typesv = &PL_sv_undef;
5519
e788e7d3 5520 PUSHSTACKi(PERLSI_OVERLOAD);
423cee85
JH
5521 ENTER ;
5522 SAVETMPS;
5523
5524 PUSHMARK(SP) ;
25eaa213 5525 EXTEND(sp, 4);
423cee85
JH
5526 if (pv)
5527 PUSHs(pv);
b3ac6de7 5528 PUSHs(sv);
423cee85
JH
5529 if (pv)
5530 PUSHs(typesv);
b3ac6de7
IZ
5531 PUSHs(cv);
5532 PUTBACK;
423cee85
JH
5533 call_sv(cv, G_SCALAR | ( PL_in_eval ? 0 : G_EVAL));
5534
5535 SPAGAIN ;
5536
5537 /* Check the eval first */
5538 if (!PL_in_eval && SvTRUE(ERRSV))
5539 {
5540 STRLEN n_a;
5541 sv_catpv(ERRSV, "Propagated");
5542 yyerror(SvPV(ERRSV, n_a)); /* Duplicates the message inside eval */
5543 POPs ;
5544 res = SvREFCNT_inc(sv);
5545 }
5546 else {
5547 res = POPs;
5548 SvREFCNT_inc(res);
5549 }
5550
5551 PUTBACK ;
5552 FREETMPS ;
5553 LEAVE ;
b3ac6de7 5554 POPSTACK;
423cee85 5555
b3ac6de7 5556 if (!SvOK(res)) {
423cee85
JH
5557 why = "}} did not return a defined value";
5558 why1 = "Call to &{$^H{";
5559 why2 = key;
5560 sv = res;
5561 goto report;
5562 }
5563
5564 return res;
b3ac6de7 5565}
423cee85 5566
76e3520e 5567STATIC char *
cea2e8a9 5568S_scan_word(pTHX_ register char *s, char *dest, STRLEN destlen, int allow_package, STRLEN *slp)
463ee0b2
LW
5569{
5570 register char *d = dest;
8903cb82 5571 register char *e = d + destlen - 3; /* two-character token, ending NUL */
463ee0b2 5572 for (;;) {
8903cb82 5573 if (d >= e)
cea2e8a9 5574 Perl_croak(aTHX_ ident_too_long);
834a4ddd 5575 if (isALNUM(*s)) /* UTF handled below */
463ee0b2 5576 *d++ = *s++;
834a4ddd 5577 else if (*s == '\'' && allow_package && isIDFIRST_lazy(s+1)) {
463ee0b2
LW
5578 *d++ = ':';
5579 *d++ = ':';
5580 s++;
5581 }
c3e0f903 5582 else if (*s == ':' && s[1] == ':' && allow_package && s[2] != '$') {
463ee0b2
LW
5583 *d++ = *s++;
5584 *d++ = *s++;
5585 }
834a4ddd 5586 else if (UTF && *(U8*)s >= 0xc0 && isALNUM_utf8((U8*)s)) {
a0ed51b3 5587 char *t = s + UTF8SKIP(s);
dfe13c55 5588 while (*t & 0x80 && is_utf8_mark((U8*)t))
a0ed51b3
LW
5589 t += UTF8SKIP(t);
5590 if (d + (t - s) > e)
cea2e8a9 5591 Perl_croak(aTHX_ ident_too_long);
a0ed51b3
LW
5592 Copy(s, d, t - s, char);
5593 d += t - s;
5594 s = t;
5595 }
463ee0b2
LW
5596 else {
5597 *d = '\0';
5598 *slp = d - dest;
5599 return s;
e929a76b 5600 }
378cc40b
LW
5601 }
5602}
5603
76e3520e 5604STATIC char *
cea2e8a9 5605S_scan_ident(pTHX_ register char *s, register char *send, char *dest, STRLEN destlen, I32 ck_uni)
378cc40b
LW
5606{
5607 register char *d;
8903cb82 5608 register char *e;
79072805 5609 char *bracket = 0;
748a9306 5610 char funny = *s++;
378cc40b 5611
3280af22
NIS
5612 if (PL_lex_brackets == 0)
5613 PL_lex_fakebrack = 0;
a0d0e21e
LW
5614 if (isSPACE(*s))
5615 s = skipspace(s);
378cc40b 5616 d = dest;
8903cb82 5617 e = d + destlen - 3; /* two-character token, ending NUL */
de3bb511 5618 if (isDIGIT(*s)) {
8903cb82 5619 while (isDIGIT(*s)) {
5620 if (d >= e)
cea2e8a9 5621 Perl_croak(aTHX_ ident_too_long);
378cc40b 5622 *d++ = *s++;
8903cb82 5623 }
378cc40b
LW
5624 }
5625 else {
463ee0b2 5626 for (;;) {
8903cb82 5627 if (d >= e)
cea2e8a9 5628 Perl_croak(aTHX_ ident_too_long);
834a4ddd 5629 if (isALNUM(*s)) /* UTF handled below */
463ee0b2 5630 *d++ = *s++;
834a4ddd 5631 else if (*s == '\'' && isIDFIRST_lazy(s+1)) {
463ee0b2
LW
5632 *d++ = ':';
5633 *d++ = ':';
5634 s++;
5635 }
a0d0e21e 5636 else if (*s == ':' && s[1] == ':') {
463ee0b2
LW
5637 *d++ = *s++;
5638 *d++ = *s++;
5639 }
834a4ddd 5640 else if (UTF && *(U8*)s >= 0xc0 && isALNUM_utf8((U8*)s)) {
a0ed51b3 5641 char *t = s + UTF8SKIP(s);
dfe13c55 5642 while (*t & 0x80 && is_utf8_mark((U8*)t))
a0ed51b3
LW
5643 t += UTF8SKIP(t);
5644 if (d + (t - s) > e)
cea2e8a9 5645 Perl_croak(aTHX_ ident_too_long);
a0ed51b3
LW
5646 Copy(s, d, t - s, char);
5647 d += t - s;
5648 s = t;
5649 }
463ee0b2
LW
5650 else
5651 break;
5652 }
378cc40b
LW
5653 }
5654 *d = '\0';
5655 d = dest;
79072805 5656 if (*d) {
3280af22
NIS
5657 if (PL_lex_state != LEX_NORMAL)
5658 PL_lex_state = LEX_INTERPENDMAYBE;
79072805 5659 return s;
378cc40b 5660 }
748a9306 5661 if (*s == '$' && s[1] &&
834a4ddd 5662 (isALNUM_lazy(s+1) || strchr("${", s[1]) || strnEQ(s+1,"::",2)) )
5cd24f17 5663 {
4810e5ec 5664 return s;
5cd24f17 5665 }
79072805
LW
5666 if (*s == '{') {
5667 bracket = s;
5668 s++;
5669 }
5670 else if (ck_uni)
5671 check_uni();
93a17b20 5672 if (s < send)
79072805
LW
5673 *d = *s++;
5674 d[1] = '\0';
2b92dfce 5675 if (*d == '^' && *s && isCONTROLVAR(*s)) {
bbce6d69 5676 *d = toCTRL(*s);
5677 s++;
de3bb511 5678 }
79072805 5679 if (bracket) {
748a9306 5680 if (isSPACE(s[-1])) {
fa83b5b6 5681 while (s < send) {
5682 char ch = *s++;
5683 if (ch != ' ' && ch != '\t') {
5684 *d = ch;
5685 break;
5686 }
5687 }
748a9306 5688 }
834a4ddd 5689 if (isIDFIRST_lazy(d)) {
79072805 5690 d++;
a0ed51b3
LW
5691 if (UTF) {
5692 e = s;
834a4ddd 5693 while (e < send && isALNUM_lazy(e) || *e == ':') {
a0ed51b3 5694 e += UTF8SKIP(e);
dfe13c55 5695 while (e < send && *e & 0x80 && is_utf8_mark((U8*)e))
a0ed51b3
LW
5696 e += UTF8SKIP(e);
5697 }
5698 Copy(s, d, e - s, char);
5699 d += e - s;
5700 s = e;
5701 }
5702 else {
2b92dfce 5703 while ((isALNUM(*s) || *s == ':') && d < e)
a0ed51b3 5704 *d++ = *s++;
2b92dfce 5705 if (d >= e)
cea2e8a9 5706 Perl_croak(aTHX_ ident_too_long);
a0ed51b3 5707 }
79072805 5708 *d = '\0';
748a9306 5709 while (s < send && (*s == ' ' || *s == '\t')) s++;
ff68c719 5710 if ((*s == '[' || (*s == '{' && strNE(dest, "sub")))) {
d008e5eb 5711 dTHR; /* only for ckWARN */
599cee73 5712 if (ckWARN(WARN_AMBIGUOUS) && keyword(dest, d - dest)) {
748a9306 5713 char *brack = *s == '[' ? "[...]" : "{...}";
cea2e8a9 5714 Perl_warner(aTHX_ WARN_AMBIGUOUS,
599cee73 5715 "Ambiguous use of %c{%s%s} resolved to %c%s%s",
748a9306
LW
5716 funny, dest, brack, funny, dest, brack);
5717 }
3280af22 5718 PL_lex_fakebrack = PL_lex_brackets+1;
79072805 5719 bracket++;
3280af22 5720 PL_lex_brackstack[PL_lex_brackets++] = XOPERATOR;
79072805
LW
5721 return s;
5722 }
2b92dfce
GS
5723 }
5724 /* Handle extended ${^Foo} variables
5725 * 1999-02-27 mjd-perl-patch@plover.com */
5726 else if (!isALNUM(*d) && !isPRINT(*d) /* isCTRL(d) */
5727 && isALNUM(*s))
5728 {
5729 d++;
5730 while (isALNUM(*s) && d < e) {
5731 *d++ = *s++;
5732 }
5733 if (d >= e)
cea2e8a9 5734 Perl_croak(aTHX_ ident_too_long);
2b92dfce 5735 *d = '\0';
79072805
LW
5736 }
5737 if (*s == '}') {
5738 s++;
3280af22
NIS
5739 if (PL_lex_state == LEX_INTERPNORMAL && !PL_lex_brackets)
5740 PL_lex_state = LEX_INTERPEND;
748a9306
LW
5741 if (funny == '#')
5742 funny = '@';
d008e5eb
GS
5743 if (PL_lex_state == LEX_NORMAL) {
5744 dTHR; /* only for ckWARN */
5745 if (ckWARN(WARN_AMBIGUOUS) &&
864dbfa3 5746 (keyword(dest, d - dest) || get_cv(dest, FALSE)))
d008e5eb 5747 {
cea2e8a9 5748 Perl_warner(aTHX_ WARN_AMBIGUOUS,
d008e5eb
GS
5749 "Ambiguous use of %c{%s} resolved to %c%s",
5750 funny, dest, funny, dest);
5751 }
5752 }
79072805
LW
5753 }
5754 else {
5755 s = bracket; /* let the parser handle it */
93a17b20 5756 *dest = '\0';
79072805
LW
5757 }
5758 }
3280af22
NIS
5759 else if (PL_lex_state == LEX_INTERPNORMAL && !PL_lex_brackets && !intuit_more(s))
5760 PL_lex_state = LEX_INTERPEND;
378cc40b
LW
5761 return s;
5762}
5763
cea2e8a9
GS
5764void
5765Perl_pmflag(pTHX_ U16 *pmfl, int ch)
a0d0e21e 5766{
bbce6d69 5767 if (ch == 'i')
a0d0e21e 5768 *pmfl |= PMf_FOLD;
a0d0e21e
LW
5769 else if (ch == 'g')
5770 *pmfl |= PMf_GLOBAL;
c90c0ff4 5771 else if (ch == 'c')
5772 *pmfl |= PMf_CONTINUE;
a0d0e21e
LW
5773 else if (ch == 'o')
5774 *pmfl |= PMf_KEEP;
5775 else if (ch == 'm')
5776 *pmfl |= PMf_MULTILINE;
5777 else if (ch == 's')
5778 *pmfl |= PMf_SINGLELINE;
5779 else if (ch == 'x')
5780 *pmfl |= PMf_EXTENDED;
5781}
378cc40b 5782
76e3520e 5783STATIC char *
cea2e8a9 5784S_scan_pat(pTHX_ char *start, I32 type)
378cc40b 5785{
79072805
LW
5786 PMOP *pm;
5787 char *s;
378cc40b 5788
09bef843 5789 s = scan_str(start,FALSE,FALSE);
79072805 5790 if (!s) {
3280af22
NIS
5791 if (PL_lex_stuff)
5792 SvREFCNT_dec(PL_lex_stuff);
5793 PL_lex_stuff = Nullsv;
cea2e8a9 5794 Perl_croak(aTHX_ "Search pattern not terminated");
378cc40b 5795 }
bbce6d69 5796
8782bef2 5797 pm = (PMOP*)newPMOP(type, 0);
3280af22 5798 if (PL_multi_open == '?')
79072805 5799 pm->op_pmflags |= PMf_ONCE;
8782bef2
GB
5800 if(type == OP_QR) {
5801 while (*s && strchr("iomsx", *s))
5802 pmflag(&pm->op_pmflags,*s++);
5803 }
5804 else {
5805 while (*s && strchr("iogcmsx", *s))
5806 pmflag(&pm->op_pmflags,*s++);
5807 }
4633a7c4 5808 pm->op_pmpermflags = pm->op_pmflags;
bbce6d69 5809
3280af22 5810 PL_lex_op = (OP*)pm;
79072805 5811 yylval.ival = OP_MATCH;
378cc40b
LW
5812 return s;
5813}
5814
76e3520e 5815STATIC char *
cea2e8a9 5816S_scan_subst(pTHX_ char *start)
79072805 5817{
a0d0e21e 5818 register char *s;
79072805 5819 register PMOP *pm;
4fdae800 5820 I32 first_start;
79072805
LW
5821 I32 es = 0;
5822
79072805
LW
5823 yylval.ival = OP_NULL;
5824
09bef843 5825 s = scan_str(start,FALSE,FALSE);
79072805
LW
5826
5827 if (!s) {
3280af22
NIS
5828 if (PL_lex_stuff)
5829 SvREFCNT_dec(PL_lex_stuff);
5830 PL_lex_stuff = Nullsv;
cea2e8a9 5831 Perl_croak(aTHX_ "Substitution pattern not terminated");
a687059c 5832 }
79072805 5833
3280af22 5834 if (s[-1] == PL_multi_open)
79072805
LW
5835 s--;
5836
3280af22 5837 first_start = PL_multi_start;
09bef843 5838 s = scan_str(s,FALSE,FALSE);
79072805 5839 if (!s) {
3280af22
NIS
5840 if (PL_lex_stuff)
5841 SvREFCNT_dec(PL_lex_stuff);
5842 PL_lex_stuff = Nullsv;
5843 if (PL_lex_repl)
5844 SvREFCNT_dec(PL_lex_repl);
5845 PL_lex_repl = Nullsv;
cea2e8a9 5846 Perl_croak(aTHX_ "Substitution replacement not terminated");
a687059c 5847 }
3280af22 5848 PL_multi_start = first_start; /* so whole substitution is taken together */
2f3197b3 5849
79072805 5850 pm = (PMOP*)newPMOP(OP_SUBST, 0);
48c036b1 5851 while (*s) {
a687059c
LW
5852 if (*s == 'e') {
5853 s++;
2f3197b3 5854 es++;
a687059c 5855 }
b3eb6a9b 5856 else if (strchr("iogcmsx", *s))
a0d0e21e 5857 pmflag(&pm->op_pmflags,*s++);
48c036b1
GS
5858 else
5859 break;
378cc40b 5860 }
79072805
LW
5861
5862 if (es) {
5863 SV *repl;
0244c3a4
GS
5864 PL_sublex_info.super_bufptr = s;
5865 PL_sublex_info.super_bufend = PL_bufend;
5866 PL_multi_end = 0;
79072805 5867 pm->op_pmflags |= PMf_EVAL;
79cb57f6 5868 repl = newSVpvn("",0);
463ee0b2 5869 while (es-- > 0)
a0d0e21e 5870 sv_catpv(repl, es ? "eval " : "do ");
79072805 5871 sv_catpvn(repl, "{ ", 2);
3280af22 5872 sv_catsv(repl, PL_lex_repl);
79072805 5873 sv_catpvn(repl, " };", 2);
25da4f38 5874 SvEVALED_on(repl);
3280af22
NIS
5875 SvREFCNT_dec(PL_lex_repl);
5876 PL_lex_repl = repl;
378cc40b 5877 }
79072805 5878
4633a7c4 5879 pm->op_pmpermflags = pm->op_pmflags;
3280af22 5880 PL_lex_op = (OP*)pm;
79072805 5881 yylval.ival = OP_SUBST;
378cc40b
LW
5882 return s;
5883}
5884
76e3520e 5885STATIC char *
cea2e8a9 5886S_scan_trans(pTHX_ char *start)
378cc40b 5887{
a0d0e21e 5888 register char* s;
11343788 5889 OP *o;
79072805
LW
5890 short *tbl;
5891 I32 squash;
a0ed51b3 5892 I32 del;
79072805 5893 I32 complement;
a0ed51b3
LW
5894 I32 utf8;
5895 I32 count = 0;
79072805
LW
5896
5897 yylval.ival = OP_NULL;
5898
09bef843 5899 s = scan_str(start,FALSE,FALSE);
79072805 5900 if (!s) {
3280af22
NIS
5901 if (PL_lex_stuff)
5902 SvREFCNT_dec(PL_lex_stuff);
5903 PL_lex_stuff = Nullsv;
cea2e8a9 5904 Perl_croak(aTHX_ "Transliteration pattern not terminated");
a687059c 5905 }
3280af22 5906 if (s[-1] == PL_multi_open)
2f3197b3
LW
5907 s--;
5908
09bef843 5909 s = scan_str(s,FALSE,FALSE);
79072805 5910 if (!s) {
3280af22
NIS
5911 if (PL_lex_stuff)
5912 SvREFCNT_dec(PL_lex_stuff);
5913 PL_lex_stuff = Nullsv;
5914 if (PL_lex_repl)
5915 SvREFCNT_dec(PL_lex_repl);
5916 PL_lex_repl = Nullsv;
cea2e8a9 5917 Perl_croak(aTHX_ "Transliteration replacement not terminated");
a687059c 5918 }
79072805 5919
a0ed51b3
LW
5920 if (UTF) {
5921 o = newSVOP(OP_TRANS, 0, 0);
5922 utf8 = OPpTRANS_FROM_UTF|OPpTRANS_TO_UTF;
5923 }
5924 else {
5925 New(803,tbl,256,short);
5926 o = newPVOP(OP_TRANS, 0, (char*)tbl);
5927 utf8 = 0;
5928 }
2f3197b3 5929
a0ed51b3
LW
5930 complement = del = squash = 0;
5931 while (strchr("cdsCU", *s)) {
395c3793 5932 if (*s == 'c')
79072805 5933 complement = OPpTRANS_COMPLEMENT;
395c3793 5934 else if (*s == 'd')
a0ed51b3
LW
5935 del = OPpTRANS_DELETE;
5936 else if (*s == 's')
79072805 5937 squash = OPpTRANS_SQUASH;
a0ed51b3
LW
5938 else {
5939 switch (count++) {
5940 case 0:
5941 if (*s == 'C')
5942 utf8 &= ~OPpTRANS_FROM_UTF;
5943 else
5944 utf8 |= OPpTRANS_FROM_UTF;
5945 break;
5946 case 1:
5947 if (*s == 'C')
5948 utf8 &= ~OPpTRANS_TO_UTF;
5949 else
5950 utf8 |= OPpTRANS_TO_UTF;
5951 break;
5952 default:
cea2e8a9 5953 Perl_croak(aTHX_ "Too many /C and /U options");
a0ed51b3
LW
5954 }
5955 }
395c3793
LW
5956 s++;
5957 }
a0ed51b3 5958 o->op_private = del|squash|complement|utf8;
79072805 5959
3280af22 5960 PL_lex_op = o;
79072805
LW
5961 yylval.ival = OP_TRANS;
5962 return s;
5963}
5964
/*
 * S_scan_heredoc
 *
 * Scans a here-document whose "<<" introducer is at s.
 *
 * The terminator is built in PL_tokenbuf as "TERM\n" (with a leading
 * "\n" when not reading "outer", i.e. when there is no PL_rsfp or
 * PL_lex_inwhat is OP_SCALAR), and its length is kept in len.  The body
 * text is accumulated in tmpstr, which ends up in PL_lex_stuff;
 * yylval.ival receives the op type selected by the quoting style
 * (OP_SCALAR by default, OP_CONST for '...', OP_BACKTICK for `...`).
 * herewas holds the text that followed the introducer so it can be put
 * back in front of the lexer after the body has been consumed.
 *
 * Croaks if the delimiter does not fit in PL_tokenbuf; calls
 * missingterm() if the terminator is never found.
 * Returns the position at which lexing should resume.
 */
76e3520e 5965STATIC char *
cea2e8a9 5966S_scan_heredoc(pTHX_ register char *s)
79072805 5967{
11343788 5968 dTHR;
79072805
LW
5969 SV *herewas;
5970 I32 op_type = OP_SCALAR;
5971 I32 len;
5972 SV *tmpstr;
5973 char term;
5974 register char *d;
fc36a67e 5975 register char *e;
4633a7c4 5976 char *peek;
3280af22 5977 int outer = (PL_rsfp && !(PL_lex_inwhat == OP_SCALAR));
79072805
LW
5978
/* step over the two-character "<<" */
5979 s += 2;
3280af22
NIS
5980 d = PL_tokenbuf;
5981 e = PL_tokenbuf + sizeof PL_tokenbuf - 1;
fd2d0953 5982 if (!outer)
79072805 5983 *d++ = '\n';
/* a quoted delimiter may be preceded by blanks; a bare one may not */
4633a7c4
LW
5984 for (peek = s; *peek == ' ' || *peek == '\t'; peek++) ;
5985 if (*peek && strchr("`'\"",*peek)) {
5986 s = peek;
79072805 5987 term = *s++;
3280af22 5988 s = delimcpy(d, e, s, PL_bufend, term, &len);
fc36a67e 5989 d += len;
3280af22 5990 if (s < PL_bufend)
79072805 5991 s++;
79072805
LW
5992 }
5993 else {
/* unquoted: a leading backslash selects single-quote behaviour */
5994 if (*s == '\\')
5995 s++, term = '\'';
5996 else
5997 term = '"';
834a4ddd 5998 if (!isALNUM_lazy(s))
4633a7c4 5999 deprecate("bare << to mean <<\"\"");
834a4ddd 6000 for (; isALNUM_lazy(s); s++) {
fc36a67e 6001 if (d < e)
6002 *d++ = *s;
6003 }
6004 }
3280af22 6005 if (d >= PL_tokenbuf + sizeof PL_tokenbuf - 1)
cea2e8a9 6006 Perl_croak(aTHX_ "Delimiter for here document is too long");
79072805
LW
6007 *d++ = '\n';
6008 *d = '\0';
3280af22 6009 len = d - PL_tokenbuf;
6a27c188 6010#ifndef PERL_STRICT_CR
/* rewrite the rest of the buffer in place so that "\r\n", "\n\r" and a
   lone "\r" each become a single "\n"; PL_bufend and the length of
   PL_linestr are adjusted to the shortened text */
f63a84b2
LW
6011 d = strchr(s, '\r');
6012 if (d) {
6013 char *olds = s;
6014 s = d;
3280af22 6015 while (s < PL_bufend) {
f63a84b2
LW
6016 if (*s == '\r') {
6017 *d++ = '\n';
6018 if (*++s == '\n')
6019 s++;
6020 }
6021 else if (*s == '\n' && s[1] == '\r') { /* \015\013 on a mac? */
6022 *d++ = *s++;
6023 s++;
6024 }
6025 else
6026 *d++ = *s++;
6027 }
6028 *d = '\0';
3280af22
NIS
6029 PL_bufend = d;
6030 SvCUR_set(PL_linestr, PL_bufend - SvPVX(PL_linestr));
f63a84b2
LW
6031 s = olds;
6032 }
6033#endif
/* save what follows the introducer: the whole remaining buffer when
   reading "outer" or when no newline is found, otherwise the text up to
   (not including) the next newline, starting one character before s */
79072805 6034 d = "\n";
3280af22 6035 if (outer || !(d=ninstr(s,PL_bufend,d,d+1)))
79cb57f6 6036 herewas = newSVpvn(s,PL_bufend-s);
79072805 6037 else
79cb57f6 6038 s--, herewas = newSVpvn(s,d-s);
79072805 6039 s += SvCUR(herewas);
748a9306 6040
/* tmpstr collects the body; its IV slot is set to -1 for '...' and to
   '\\' for `...` and is left untouched for "..." */
8d6dde3e 6041 tmpstr = NEWSV(87,79);
748a9306
LW
6042 sv_upgrade(tmpstr, SVt_PVIV);
6043 if (term == '\'') {
79072805 6044 op_type = OP_CONST;
748a9306
LW
6045 SvIVX(tmpstr) = -1;
6046 }
6047 else if (term == '`') {
79072805 6048 op_type = OP_BACKTICK;
748a9306
LW
6049 SvIVX(tmpstr) = '\\';
6050 }
79072805
LW
6051
6052 CLINE;
3280af22
NIS
6053 PL_multi_start = PL_curcop->cop_line;
6054 PL_multi_open = PL_multi_close = '<';
/* from here on term is the first byte of the terminator in PL_tokenbuf,
   used as a cheap pre-test before the full memNE/memEQ comparison */
6055 term = *PL_tokenbuf;
/* case 1: inside a substitution in an eval with no file handle: look
   for the body in the buffer recorded in PL_sublex_info (set up by
   scan_subst for s///e), starting at its first newline */
0244c3a4
GS
6056 if (PL_lex_inwhat == OP_SUBST && PL_in_eval && !PL_rsfp) {
6057 char *bufptr = PL_sublex_info.super_bufptr;
6058 char *bufend = PL_sublex_info.super_bufend;
6059 char *olds = s - SvCUR(herewas);
6060 s = strchr(bufptr, '\n');
6061 if (!s)
6062 s = bufend;
6063 d = s;
6064 while (s < bufend &&
6065 (*s != term || memNE(s,PL_tokenbuf,len)) ) {
6066 if (*s++ == '\n')
6067 PL_curcop->cop_line++;
6068 }
6069 if (s >= bufend) {
6070 PL_curcop->cop_line = PL_multi_start;
6071 missingterm(PL_tokenbuf);
6072 }
/* herewas is reused here: it becomes the super buffer with the body and
   terminator cut out, and is copied back over that buffer */
6073 sv_setpvn(herewas,bufptr,d-bufptr+1);
6074 sv_setpvn(tmpstr,d+1,s-d);
6075 s += len - 1;
6076 sv_catpvn(herewas,s,bufend-s);
6077 (void)strcpy(bufptr,SvPVX(herewas));
6078
6079 s = olds;
6080 goto retval;
6081 }
/* case 2: not "outer": the body must already be in the current buffer */
6082 else if (!outer) {
79072805 6083 d = s;
3280af22
NIS
6084 while (s < PL_bufend &&
6085 (*s != term || memNE(s,PL_tokenbuf,len)) ) {
79072805 6086 if (*s++ == '\n')
3280af22 6087 PL_curcop->cop_line++;
79072805 6088 }
3280af22
NIS
6089 if (s >= PL_bufend) {
6090 PL_curcop->cop_line = PL_multi_start;
6091 missingterm(PL_tokenbuf);
79072805
LW
6092 }
6093 sv_setpvn(tmpstr,d+1,s-d);
6094 s += len - 1;
3280af22 6095 PL_curcop->cop_line++; /* the preceding stmt passes a newline */
49d8d3a1 6096
/* PL_linestr becomes: saved remainder of the introducer line followed by
   whatever came after the terminator; all buffer pointers restart there */
3280af22
NIS
6097 sv_catpvn(herewas,s,PL_bufend-s);
6098 sv_setsv(PL_linestr,herewas);
6099 PL_oldoldbufptr = PL_oldbufptr = PL_bufptr = s = PL_linestart = SvPVX(PL_linestr);
6100 PL_bufend = SvPVX(PL_linestr) + SvCUR(PL_linestr);
79072805
LW
6101 }
6102 else
6103 sv_setpvn(tmpstr,"",0); /* avoid "uninitialized" warning */
/* case 3 ("outer"): pull further lines with filter_gets() until one
   starts with the terminator; in the two cases above s is already below
   PL_bufend (or control has jumped to retval), so this loop is skipped */
3280af22 6104 while (s >= PL_bufend) { /* multiple line string? */
fd2d0953 6105 if (!outer ||
3280af22
NIS
6106 !(PL_oldoldbufptr = PL_oldbufptr = s = PL_linestart = filter_gets(PL_linestr, PL_rsfp, 0))) {
6107 PL_curcop->cop_line = PL_multi_start;
6108 missingterm(PL_tokenbuf);
79072805 6109 }
3280af22
NIS
6110 PL_curcop->cop_line++;
6111 PL_bufend = SvPVX(PL_linestr) + SvCUR(PL_linestr);
6a27c188 6112#ifndef PERL_STRICT_CR
/* normalize the line ending of the line just read to a single "\n" */
3280af22 6113 if (PL_bufend - PL_linestart >= 2) {
a1529941
NIS
6114 if ((PL_bufend[-2] == '\r' && PL_bufend[-1] == '\n') ||
6115 (PL_bufend[-2] == '\n' && PL_bufend[-1] == '\r'))
c6f14548 6116 {
3280af22
NIS
6117 PL_bufend[-2] = '\n';
6118 PL_bufend--;
6119 SvCUR_set(PL_linestr, PL_bufend - SvPVX(PL_linestr));
f63a84b2 6120 }
3280af22
NIS
6121 else if (PL_bufend[-1] == '\r')
6122 PL_bufend[-1] = '\n';
f63a84b2 6123 }
3280af22
NIS
6124 else if (PL_bufend - PL_linestart == 1 && PL_bufend[-1] == '\r')
6125 PL_bufend[-1] = '\n';
f63a84b2 6126#endif
/* when PERLDB_LINE is on, store a copy of the line in the file's line
   array at the current line number */
3280af22 6127 if (PERLDB_LINE && PL_curstash != PL_debstash) {
79072805
LW
6128 SV *sv = NEWSV(88,0);
6129
93a17b20 6130 sv_upgrade(sv, SVt_PVMG);
3280af22
NIS
6131 sv_setsv(sv,PL_linestr);
6132 av_store(GvAV(PL_curcop->cop_filegv),
6133 (I32)PL_curcop->cop_line,sv);
79072805 6134 }
/* terminator line: blank out its last byte and append the saved
   remainder of the introducer line, which makes s < PL_bufend and ends
   the loop; any other line is appended to the body */
3280af22
NIS
6135 if (*s == term && memEQ(s,PL_tokenbuf,len)) {
6136 s = PL_bufend - 1;
79072805 6137 *s = ' ';
3280af22
NIS
6138 sv_catsv(PL_linestr,herewas);
6139 PL_bufend = SvPVX(PL_linestr) + SvCUR(PL_linestr);
79072805
LW
6140 }
6141 else {
3280af22
NIS
6142 s = PL_bufend;
6143 sv_catsv(tmpstr,PL_linestr);
395c3793
LW
6144 }
6145 }
79072805 6146 s++;
0244c3a4
GS
6147retval:
6148 PL_multi_end = PL_curcop->cop_line;
/* give back unused buffer space when more than 5 bytes are spare */
79072805
LW
6149 if (SvCUR(tmpstr) + 5 < SvLEN(tmpstr)) {
6150 SvLEN_set(tmpstr, SvCUR(tmpstr) + 1);
463ee0b2 6151 Renew(SvPVX(tmpstr), SvLEN(tmpstr), char);
79072805 6152 }
8990e307 6153 SvREFCNT_dec(herewas);
3280af22 6154 PL_lex_stuff = tmpstr;
79072805
LW
6155 yylval.ival = op_type;
6156 return s;
6157}
6158
02aa26ce
NT
6159/* scan_inputsymbol
6160 takes: current position in input buffer
6161 returns: new position in input buffer
6162 side-effects: yylval and lex_op are set.
6163
6164 This code handles:
6165
6166 <> read from ARGV
6167 <FH> read from filehandle
6168 <pkg::FH> read from package qualified filehandle
6169 <pkg'FH> read from package qualified filehandle
6170 <$fh> read from filehandle in $fh
6171 <*.h> filename glob
6172
6173*/
6174
76e3520e 6175STATIC char *
cea2e8a9 6176S_scan_inputsymbol(pTHX_ char *start)
79072805 6177{
02aa26ce 6178 register char *s = start; /* current position in buffer */
79072805 6179 register char *d;
fc36a67e 6180 register char *e;
1b420867 6181 char *end;
79072805
LW
6182 I32 len;
6183
3280af22
NIS
6184 d = PL_tokenbuf; /* start of temp holding space */
6185 e = PL_tokenbuf + sizeof PL_tokenbuf; /* end of temp holding space */
1b420867
GS
6186 end = strchr(s, '\n');
6187 if (!end)
6188 end = PL_bufend;
6189 s = delimcpy(d, e, s + 1, end, '>', &len); /* extract until > */
02aa26ce
NT
6190
6191 /* die if we didn't have space for the contents of the <>,
1b420867 6192 or if it didn't end, or if we see a newline
02aa26ce
NT
6193 */
6194
3280af22 6195 if (len >= sizeof PL_tokenbuf)
cea2e8a9 6196 Perl_croak(aTHX_ "Excessively long <> operator");
1b420867 6197 if (s >= end)
cea2e8a9 6198 Perl_croak(aTHX_ "Unterminated <> operator");
02aa26ce 6199
fc36a67e 6200 s++;
02aa26ce
NT
6201
6202 /* check for <$fh>
6203 Remember, only scalar variables are interpreted as filehandles by
6204 this code. Anything more complex (e.g., <$fh{$num}>) will be
6205 treated as a glob() call.
6206 This code makes use of the fact that except for the $ at the front,
6207 a scalar variable and a filehandle look the same.
6208 */
4633a7c4 6209 if (*d == '$' && d[1]) d++;
02aa26ce
NT
6210
6211 /* allow <Pkg'VALUE> or <Pkg::VALUE> */
834a4ddd 6212 while (*d && (isALNUM_lazy(d) || *d == '\'' || *d == ':'))
79072805 6213 d++;
02aa26ce
NT
6214
6215 /* If we've tried to read what we allow filehandles to look like, and
6216 there's still text left, then it must be a glob() and not a getline.
6217 Use scan_str to pull out the stuff between the <> and treat it
6218 as nothing more than a string.
6219 */
6220
3280af22 6221 if (d - PL_tokenbuf != len) {
79072805
LW
6222 yylval.ival = OP_GLOB;
6223 set_csh();
09bef843 6224 s = scan_str(start,FALSE,FALSE);
79072805 6225 if (!s)
cea2e8a9 6226 Perl_croak(aTHX_ "Glob not terminated");
79072805
LW
6227 return s;
6228 }
395c3793 6229 else {
02aa26ce 6230 /* we're in a filehandle read situation */
3280af22 6231 d = PL_tokenbuf;
02aa26ce
NT
6232
6233 /* turn <> into <ARGV> */
79072805
LW
6234 if (!len)
6235 (void)strcpy(d,"ARGV");
02aa26ce
NT
6236
6237 /* if <$fh>, create the ops to turn the variable into a
6238 filehandle
6239 */
79072805 6240 if (*d == '$') {
a0d0e21e 6241 I32 tmp;
02aa26ce
NT
6242
6243 /* try to find it in the pad for this block, otherwise find
6244 add symbol table ops
6245 */
11343788
MB
6246 if ((tmp = pad_findmy(d)) != NOT_IN_PAD) {
6247 OP *o = newOP(OP_PADSV, 0);
6248 o->op_targ = tmp;
f5284f61 6249 PL_lex_op = (OP*)newUNOP(OP_READLINE, 0, o);
a0d0e21e
LW
6250 }
6251 else {
6252 GV *gv = gv_fetchpv(d+1,TRUE, SVt_PV);
3280af22 6253 PL_lex_op = (OP*)newUNOP(OP_READLINE, 0,
a0d0e21e 6254 newUNOP(OP_RV2SV, 0,
f5284f61 6255 newGVOP(OP_GV, 0, gv)));
a0d0e21e 6256 }
f5284f61
IZ
6257 PL_lex_op->op_flags |= OPf_SPECIAL;
6258 /* we created the ops in PL_lex_op, so make yylval.ival a null op */
79072805
LW
6259 yylval.ival = OP_NULL;
6260 }
02aa26ce
NT
6261
6262 /* If it's none of the above, it must be a literal filehandle
6263 (<Foo::BAR> or <FOO>) so build a simple readline OP */
79072805 6264 else {
85e6fe83 6265 GV *gv = gv_fetchpv(d,TRUE, SVt_PVIO);
3280af22 6266 PL_lex_op = (OP*)newUNOP(OP_READLINE, 0, newGVOP(OP_GV, 0, gv));
79072805
LW
6267 yylval.ival = OP_NULL;
6268 }
6269 }
02aa26ce 6270
79072805
LW
6271 return s;
6272}
6273
02aa26ce
NT
6274
6275/* scan_str
6276 takes: start position in buffer
09bef843
SB
6277 keep_quoted preserve \ on the embedded delimiter(s)
6278 keep_delims preserve the delimiters around the string
02aa26ce
NT
6279 returns: position to continue reading from buffer
6280 side-effects: multi_start, multi_close, lex_repl or lex_stuff, and
6281 updates the read buffer.
6282
6283 This subroutine pulls a string out of the input. It is called for:
6284 q single quotes q(literal text)
6285 ' single quotes 'literal text'
6286 qq double quotes qq(interpolate $here please)
6287 " double quotes "interpolate $here please"
6288 qx backticks qx(/bin/ls -l)
6289 ` backticks `/bin/ls -l`
6290 qw quote words @EXPORT_OK = qw( func() $spam )
6291 m// regexp match m/this/
6292 s/// regexp substitute s/this/that/
6293 tr/// string transliterate tr/this/that/
6294 y/// string transliterate y/this/that/
6295 ($*@) sub prototypes sub foo ($)
09bef843 6296 (stuff) sub attr parameters sub foo : attr(stuff)
02aa26ce
NT
6297 <> readline or globs <FOO>, <>, <$fh>, or <*.c>
6298
6299 In most of these cases (all but <>, patterns and transliterate)
6300 yylex() calls scan_str(). m// makes yylex() call scan_pat() which
6301 calls scan_str(). s/// makes yylex() call scan_subst() which calls
6302 scan_str(). tr/// and y/// make yylex() call scan_trans() which
6303 calls scan_str().
6304
6305 It skips whitespace before the string starts, and treats the first
6306 character as the delimiter. If the delimiter is one of ([{< then
6307 the corresponding "close" character )]}> is used as the closing
6308 delimiter. It allows quoting of delimiters, and if the string has
6309 balanced delimiters ([{<>}]) it allows nesting.
6310
6311 The lexer always reads these strings into lex_stuff, except in the
6312 case of the operators which take *two* arguments (s/// and tr///)
6313 when it checks to see if lex_stuff is full (presumably with the 1st
6314 arg to s or tr) and if so puts the string into lex_repl.
6315
6316*/
6317
76e3520e 6318STATIC char *
09bef843 6319S_scan_str(pTHX_ char *start, int keep_quoted, int keep_delims)
79072805 6320{
11343788 6321 dTHR;
02aa26ce
NT
6322 SV *sv; /* scalar value: string */
6323 char *tmps; /* temp string, used for delimiter matching */
6324 register char *s = start; /* current position in the buffer */
6325 register char term; /* terminating character */
6326 register char *to; /* current position in the sv's data */
6327 I32 brackets = 1; /* bracket nesting level */
6328
6329 /* skip space before the delimiter */
fb73857a 6330 if (isSPACE(*s))
6331 s = skipspace(s);
02aa26ce
NT
6332
6333 /* mark where we are, in case we need to report errors */
79072805 6334 CLINE;
02aa26ce
NT
6335
6336 /* after skipping whitespace, the next character is the terminator */
a0d0e21e 6337 term = *s;
02aa26ce 6338 /* mark where we are */
3280af22
NIS
6339 PL_multi_start = PL_curcop->cop_line;
6340 PL_multi_open = term;
02aa26ce
NT
6341
6342 /* find corresponding closing delimiter */
93a17b20 6343 if (term && (tmps = strchr("([{< )]}> )]}>",term)))
79072805 6344 term = tmps[5];
3280af22 6345 PL_multi_close = term;
79072805 6346
02aa26ce 6347 /* create a new SV to hold the contents. 87 is leak category, I'm
8d6dde3e
IZ
6348 assuming. 79 is the SV's initial length. What a random number. */
6349 sv = NEWSV(87,79);
ed6116ce
LW
6350 sv_upgrade(sv, SVt_PVIV);
6351 SvIVX(sv) = term;
a0d0e21e 6352 (void)SvPOK_only(sv); /* validate pointer */
02aa26ce
NT
6353
6354 /* move past delimiter and try to read a complete string */
09bef843
SB
6355 if (keep_delims)
6356 sv_catpvn(sv, s, 1);
93a17b20
LW
6357 s++;
6358 for (;;) {
02aa26ce 6359 /* extend sv if need be */
3280af22 6360 SvGROW(sv, SvCUR(sv) + (PL_bufend - s) + 1);
02aa26ce 6361 /* set 'to' to the next character in the sv's string */
463ee0b2 6362 to = SvPVX(sv)+SvCUR(sv);
09bef843 6363
02aa26ce 6364 /* if open delimiter is the close delimiter read unbridle */
3280af22
NIS
6365 if (PL_multi_open == PL_multi_close) {
6366 for (; s < PL_bufend; s++,to++) {
02aa26ce 6367 /* embedded newlines increment the current line number */
3280af22
NIS
6368 if (*s == '\n' && !PL_rsfp)
6369 PL_curcop->cop_line++;
02aa26ce 6370 /* handle quoted delimiters */
3280af22 6371 if (*s == '\\' && s+1 < PL_bufend && term != '\\') {
09bef843 6372 if (!keep_quoted && s[1] == term)
a0d0e21e 6373 s++;
02aa26ce 6374 /* any other quotes are simply copied straight through */
a0d0e21e
LW
6375 else
6376 *to++ = *s++;
6377 }
02aa26ce
NT
6378 /* terminate when run out of buffer (the for() condition), or
6379 have found the terminator */
93a17b20
LW
6380 else if (*s == term)
6381 break;
6382 *to = *s;
6383 }
6384 }
02aa26ce
NT
6385
6386 /* if the terminator isn't the same as the start character (e.g.,
6387 matched brackets), we have to allow more in the quoting, and
6388 be prepared for nested brackets.
6389 */
93a17b20 6390 else {
02aa26ce 6391 /* read until we run out of string, or we find the terminator */
3280af22 6392 for (; s < PL_bufend; s++,to++) {
02aa26ce 6393 /* embedded newlines increment the line count */
3280af22
NIS
6394 if (*s == '\n' && !PL_rsfp)
6395 PL_curcop->cop_line++;
02aa26ce 6396 /* backslashes can escape the open or closing characters */
3280af22 6397 if (*s == '\\' && s+1 < PL_bufend) {
09bef843
SB
6398 if (!keep_quoted &&
6399 ((s[1] == PL_multi_open) || (s[1] == PL_multi_close)))
a0d0e21e
LW
6400 s++;
6401 else
6402 *to++ = *s++;
6403 }
02aa26ce 6404 /* allow nested opens and closes */
3280af22 6405 else if (*s == PL_multi_close && --brackets <= 0)
93a17b20 6406 break;
3280af22 6407 else if (*s == PL_multi_open)
93a17b20
LW
6408 brackets++;
6409 *to = *s;
6410 }
6411 }
02aa26ce 6412 /* terminate the copied string and update the sv's end-of-string */
93a17b20 6413 *to = '\0';
463ee0b2 6414 SvCUR_set(sv, to - SvPVX(sv));
93a17b20 6415
02aa26ce
NT
6416 /*
6417 * this next chunk reads more into the buffer if we're not done yet
6418 */
6419
3280af22 6420 if (s < PL_bufend) break; /* handle case where we are done yet :-) */
79072805 6421
6a27c188 6422#ifndef PERL_STRICT_CR
f63a84b2 6423 if (to - SvPVX(sv) >= 2) {
c6f14548
GS
6424 if ((to[-2] == '\r' && to[-1] == '\n') ||
6425 (to[-2] == '\n' && to[-1] == '\r'))
6426 {
f63a84b2
LW
6427 to[-2] = '\n';
6428 to--;
6429 SvCUR_set(sv, to - SvPVX(sv));
6430 }
6431 else if (to[-1] == '\r')
6432 to[-1] = '\n';
6433 }
6434 else if (to - SvPVX(sv) == 1 && to[-1] == '\r')
6435 to[-1] = '\n';
6436#endif
6437
02aa26ce
NT
6438 /* if we're out of file, or a read fails, bail and reset the current
6439 line marker so we can report where the unterminated string began
6440 */
3280af22
NIS
6441 if (!PL_rsfp ||
6442 !(PL_oldoldbufptr = PL_oldbufptr = s = PL_linestart = filter_gets(PL_linestr, PL_rsfp, 0))) {
c07a80fd 6443 sv_free(sv);
3280af22 6444 PL_curcop->cop_line = PL_multi_start;
79072805
LW
6445 return Nullch;
6446 }
02aa26ce 6447 /* we read a line, so increment our line counter */
3280af22 6448 PL_curcop->cop_line++;
a0ed51b3 6449
02aa26ce 6450 /* update debugger info */
3280af22 6451 if (PERLDB_LINE && PL_curstash != PL_debstash) {
79072805
LW
6452 SV *sv = NEWSV(88,0);
6453
93a17b20 6454 sv_upgrade(sv, SVt_PVMG);
3280af22
NIS
6455 sv_setsv(sv,PL_linestr);
6456 av_store(GvAV(PL_curcop->cop_filegv),
6457 (I32)PL_curcop->cop_line, sv);
395c3793 6458 }
a0ed51b3 6459
3280af22
NIS
6460 /* having changed the buffer, we must update PL_bufend */
6461 PL_bufend = SvPVX(PL_linestr) + SvCUR(PL_linestr);
378cc40b 6462 }
02aa26ce
NT
6463
6464 /* at this point, we have successfully read the delimited string */
6465
09bef843
SB
6466 if (keep_delims)
6467 sv_catpvn(sv, s, 1);
3280af22 6468 PL_multi_end = PL_curcop->cop_line;
79072805 6469 s++;
02aa26ce
NT
6470
6471 /* if we allocated too much space, give some back */
93a17b20
LW
6472 if (SvCUR(sv) + 5 < SvLEN(sv)) {
6473 SvLEN_set(sv, SvCUR(sv) + 1);
463ee0b2 6474 Renew(SvPVX(sv), SvLEN(sv), char);
79072805 6475 }
02aa26ce
NT
6476
6477 /* decide whether this is the first or second quoted string we've read
6478 for this op
6479 */
6480
3280af22
NIS
6481 if (PL_lex_stuff)
6482 PL_lex_repl = sv;
79072805 6483 else
3280af22 6484 PL_lex_stuff = sv;
378cc40b
LW
6485 return s;
6486}
6487
02aa26ce
NT
6488/*
6489 scan_num
6490 takes: pointer to position in buffer
6491 returns: pointer to new position in buffer
6492 side-effects: builds ops for the constant in yylval.op
6493
6494 Read a number in any of the formats that Perl accepts:
6495
4f19785b 6496 0(x[0-9A-Fa-f]+)|([0-7]+)|(b[01]+)
02aa26ce
NT
6497 [\d_]+(\.[\d_]*)?[Ee](\d+)
6498
6499 Underbars (_) are allowed in decimal numbers. If -w is on,
6500 underbars before a decimal point must be at three digit intervals.
6501
3280af22 6502 Like most scan_ routines, it uses the PL_tokenbuf buffer to hold the
02aa26ce
NT
6503 thing it reads.
6504
6505 If it reads a number without a decimal point or an exponent, it will
6506 try converting the number to an integer and see if it can do so
6507 without loss of precision.
6508*/
6509
378cc40b 6510char *
864dbfa3 6511Perl_scan_num(pTHX_ char *start)
378cc40b 6512{
02aa26ce
NT
6513 register char *s = start; /* current position in buffer */
6514 register char *d; /* destination in temp buffer */
6515 register char *e; /* end of temp buffer */
b8403495 6516 IV tryiv; /* used to see if it can be an IV */
65202027 6517 NV value; /* number read, as a double */
02aa26ce 6518 SV *sv; /* place to put the converted number */
b8403495 6519 bool floatit; /* boolean: int or float? */
02aa26ce 6520 char *lastub = 0; /* position of last underbar */
fc36a67e 6521 static char number_too_long[] = "Number too long";
378cc40b 6522
02aa26ce
NT
6523 /* We use the first character to decide what type of number this is */
6524
378cc40b 6525 switch (*s) {
79072805 6526 default:
cea2e8a9 6527 Perl_croak(aTHX_ "panic: scan_num");
02aa26ce
NT
6528
6529 /* if it starts with a 0, it could be an octal number, a decimal in
4f19785b 6530 0.13 disguise, or a hexadecimal number, or a binary number.
02aa26ce 6531 */
378cc40b
LW
6532 case '0':
6533 {
02aa26ce
NT
6534 /* variables:
6535 u holds the "number so far"
4f19785b
WSI
6536 shift the power of 2 of the base
6537 (hex == 4, octal == 3, binary == 1)
02aa26ce
NT
6538 overflowed was the number more than we can hold?
6539
6540 Shift is used when we add a digit. It also serves as an "are
4f19785b
WSI
6541 we in octal/hex/binary?" indicator to disallow hex characters
6542 when in octal mode.
02aa26ce 6543 */
f248d071 6544 dTHR;
9e24b6e2
JH
6545 NV n = 0.0;
6546 UV u = 0;
79072805 6547 I32 shift;
9e24b6e2
JH
6548 bool overflowed = FALSE;
6549 static NV nvshift[5] = { 1.0, 2.0, 4.0, 8.0, 16.0 };
6550 static char* bases[5] = { "", "binary", "", "octal",
6551 "hexadecimal" };
6552 static char* Bases[5] = { "", "Binary", "", "Octal",
6553 "Hexadecimal" };
6554 static char *maxima[5] = { "",
6555 "0b11111111111111111111111111111111",
6556 "",
893fe2c2 6557 "037777777777",
9e24b6e2
JH
6558 "0xffffffff" };
6559 char *base, *Base, *max;
378cc40b 6560
02aa26ce 6561 /* check for hex */
378cc40b
LW
6562 if (s[1] == 'x') {
6563 shift = 4;
6564 s += 2;
4f19785b
WSI
6565 } else if (s[1] == 'b') {
6566 shift = 1;
6567 s += 2;
378cc40b 6568 }
02aa26ce 6569 /* check for a decimal in disguise */
b78218b7 6570 else if (s[1] == '.' || s[1] == 'e' || s[1] == 'E')
378cc40b 6571 goto decimal;
02aa26ce 6572 /* so it must be octal */
378cc40b
LW
6573 else
6574 shift = 3;
9e24b6e2
JH
6575
6576 base = bases[shift];
6577 Base = Bases[shift];
6578 max = maxima[shift];
02aa26ce 6579
4f19785b 6580 /* read the rest of the number */
378cc40b 6581 for (;;) {
9e24b6e2 6582 /* x is used in the overflow test,
893fe2c2 6583 b is the digit we're adding on. */
9e24b6e2 6584 UV x, b;
55497cff 6585
378cc40b 6586 switch (*s) {
02aa26ce
NT
6587
6588 /* if we don't mention it, we're done */
378cc40b
LW
6589 default:
6590 goto out;
02aa26ce
NT
6591
6592 /* _ are ignored */
de3bb511
LW
6593 case '_':
6594 s++;
6595 break;
02aa26ce
NT
6596
6597 /* 8 and 9 are not octal */
378cc40b 6598 case '8': case '9':
4f19785b 6599 if (shift == 3)
cea2e8a9 6600 yyerror(Perl_form(aTHX_ "Illegal octal digit '%c'", *s));
378cc40b 6601 /* FALL THROUGH */
02aa26ce
NT
6602
6603 /* octal digits */
4f19785b 6604 case '2': case '3': case '4':
378cc40b 6605 case '5': case '6': case '7':
4f19785b 6606 if (shift == 1)
cea2e8a9 6607 yyerror(Perl_form(aTHX_ "Illegal binary digit '%c'", *s));
4f19785b
WSI
6608 /* FALL THROUGH */
6609
6610 case '0': case '1':
02aa26ce 6611 b = *s++ & 15; /* ASCII digit -> value of digit */
55497cff 6612 goto digit;
02aa26ce
NT
6613
6614 /* hex digits */
378cc40b
LW
6615 case 'a': case 'b': case 'c': case 'd': case 'e': case 'f':
6616 case 'A': case 'B': case 'C': case 'D': case 'E': case 'F':
02aa26ce 6617 /* make sure they said 0x */
378cc40b
LW
6618 if (shift != 4)
6619 goto out;
55497cff 6620 b = (*s++ & 7) + 9;
02aa26ce
NT
6621
6622 /* Prepare to put the digit we have onto the end
6623 of the number so far. We check for overflows.
6624 */
6625
55497cff 6626 digit:
9e24b6e2
JH
6627 if (!overflowed) {
6628 x = u << shift; /* make room for the digit */
6629
6630 if ((x >> shift) != u
6631 && !(PL_hints & HINT_NEW_BINARY)) {
6632 dTHR;
6633 overflowed = TRUE;
6634 n = (NV) u;
767a6a26
PM
6635 if (ckWARN_d(WARN_OVERFLOW))
6636 Perl_warner(aTHX_ WARN_OVERFLOW,
9e24b6e2
JH
6637 "Integer overflow in %s number",
6638 base);
6639 } else
6640 u = x | b; /* add the digit to the end */
6641 }
6642 if (overflowed) {
6643 n *= nvshift[shift];
6644 /* If an NV has not enough bits in its
6645 * mantissa to represent an UV this summing of
6646 * small low-order numbers is a waste of time
6647 * (because the NV cannot preserve the
6648 * low-order bits anyway): we could just
6649 * remember when did we overflow and in the
6650 * end just multiply n by the right
6651 * amount. */
6652 n += (NV) b;
55497cff 6653 }
378cc40b
LW
6654 break;
6655 }
6656 }
02aa26ce
NT
6657
6658 /* if we get here, we had success: make a scalar value from
6659 the number.
6660 */
378cc40b 6661 out:
79072805 6662 sv = NEWSV(92,0);
9e24b6e2
JH
6663 if (overflowed) {
6664 dTHR;
767a6a26
PM
6665 if (ckWARN(WARN_PORTABLE) && n > 4294967295.0)
6666 Perl_warner(aTHX_ WARN_PORTABLE,
9e24b6e2
JH
6667 "%s number > %s non-portable",
6668 Base, max);
6669 sv_setnv(sv, n);
6670 }
6671 else {
15041a67 6672#if UVSIZE > 4
9e24b6e2 6673 dTHR;
767a6a26
PM
6674 if (ckWARN(WARN_PORTABLE) && u > 0xffffffff)
6675 Perl_warner(aTHX_ WARN_PORTABLE,
9e24b6e2
JH
6676 "%s number > %s non-portable",
6677 Base, max);
2cc4c2dc 6678#endif
9e24b6e2
JH
6679 sv_setuv(sv, u);
6680 }
2cc4c2dc 6681 if (PL_hints & HINT_NEW_BINARY)
b3ac6de7 6682 sv = new_constant(start, s - start, "binary", sv, Nullsv, NULL);
378cc40b
LW
6683 }
6684 break;
02aa26ce
NT
6685
6686 /*
6687 handle decimal numbers.
6688 we're also sent here when we read a 0 as the first digit
6689 */
378cc40b
LW
6690 case '1': case '2': case '3': case '4': case '5':
6691 case '6': case '7': case '8': case '9': case '.':
6692 decimal:
3280af22
NIS
6693 d = PL_tokenbuf;
6694 e = PL_tokenbuf + sizeof PL_tokenbuf - 6; /* room for various punctuation */
79072805 6695 floatit = FALSE;
02aa26ce
NT
6696
6697 /* read next group of digits and _ and copy into d */
de3bb511 6698 while (isDIGIT(*s) || *s == '_') {
02aa26ce
NT
6699 /* skip underscores, checking for misplaced ones
6700 if -w is on
6701 */
93a17b20 6702 if (*s == '_') {
d008e5eb 6703 dTHR; /* only for ckWARN */
599cee73 6704 if (ckWARN(WARN_SYNTAX) && lastub && s - lastub != 3)
cea2e8a9 6705 Perl_warner(aTHX_ WARN_SYNTAX, "Misplaced _ in number");
93a17b20
LW
6706 lastub = ++s;
6707 }
fc36a67e 6708 else {
02aa26ce 6709 /* check for end of fixed-length buffer */
fc36a67e 6710 if (d >= e)
cea2e8a9 6711 Perl_croak(aTHX_ number_too_long);
02aa26ce 6712 /* if we're ok, copy the character */
378cc40b 6713 *d++ = *s++;
fc36a67e 6714 }
378cc40b 6715 }
02aa26ce
NT
6716
6717 /* final misplaced underbar check */
d008e5eb
GS
6718 if (lastub && s - lastub != 3) {
6719 dTHR;
6720 if (ckWARN(WARN_SYNTAX))
cea2e8a9 6721 Perl_warner(aTHX_ WARN_SYNTAX, "Misplaced _ in number");
d008e5eb 6722 }
02aa26ce
NT
6723
6724 /* read a decimal portion if there is one. avoid
6725 3..5 being interpreted as the number 3. followed
6726 by .5
6727 */
2f3197b3 6728 if (*s == '.' && s[1] != '.') {
79072805 6729 floatit = TRUE;
378cc40b 6730 *d++ = *s++;
02aa26ce
NT
6731
6732 /* copy, ignoring underbars, until we run out of
6733 digits. Note: no misplaced underbar checks!
6734 */
fc36a67e 6735 for (; isDIGIT(*s) || *s == '_'; s++) {
02aa26ce 6736 /* fixed length buffer check */
fc36a67e 6737 if (d >= e)
cea2e8a9 6738 Perl_croak(aTHX_ number_too_long);
fc36a67e 6739 if (*s != '_')
6740 *d++ = *s;
378cc40b
LW
6741 }
6742 }
02aa26ce
NT
6743
6744 /* read exponent part, if present */
93a17b20 6745 if (*s && strchr("eE",*s) && strchr("+-0123456789",s[1])) {
79072805
LW
6746 floatit = TRUE;
6747 s++;
02aa26ce
NT
6748
6749 /* regardless of whether user said 3E5 or 3e5, use lower 'e' */
79072805 6750 *d++ = 'e'; /* At least some Mach atof()s don't grok 'E' */
02aa26ce
NT
6751
6752 /* allow positive or negative exponent */
378cc40b
LW
6753 if (*s == '+' || *s == '-')
6754 *d++ = *s++;
02aa26ce
NT
6755
6756 /* read digits of exponent (no underbars :-) */
fc36a67e 6757 while (isDIGIT(*s)) {
6758 if (d >= e)
cea2e8a9 6759 Perl_croak(aTHX_ number_too_long);
378cc40b 6760 *d++ = *s++;
fc36a67e 6761 }
378cc40b 6762 }
02aa26ce
NT
6763
6764 /* terminate the string */
378cc40b 6765 *d = '\0';
02aa26ce
NT
6766
6767 /* make an sv from the string */
79072805 6768 sv = NEWSV(92,0);
097ee67d
JH
6769
6770 value = Atof(PL_tokenbuf);
02aa26ce
NT
6771
6772 /*
6773 See if we can make do with an integer value without loss of
6774 precision. We use I_V to cast to an int, because some
6775 compilers have issues. Then we try casting it back and see
6776 if it was the same. We only do this if we know we
6777 specifically read an integer.
6778
6779 Note: if floatit is true, then we don't need to do the
6780 conversion at all.
6781 */
1e422769 6782 tryiv = I_V(value);
65202027 6783 if (!floatit && (NV)tryiv == value)
1e422769 6784 sv_setiv(sv, tryiv);
2f3197b3 6785 else
1e422769 6786 sv_setnv(sv, value);
b8403495
JH
6787 if ( floatit ? (PL_hints & HINT_NEW_FLOAT) :
6788 (PL_hints & HINT_NEW_INTEGER) )
3280af22 6789 sv = new_constant(PL_tokenbuf, d - PL_tokenbuf,
b8403495
JH
6790 (floatit ? "float" : "integer"),
6791 sv, Nullsv, NULL);
378cc40b 6792 break;
79072805 6793 }
a687059c 6794
02aa26ce
NT
6795 /* make the op for the constant and return */
6796
79072805 6797 yylval.opval = newSVOP(OP_CONST, 0, sv);
a687059c 6798
378cc40b
LW
6799 return s;
6800}
6801
76e3520e 6802STATIC char *
cea2e8a9 6803S_scan_formline(pTHX_ register char *s)
378cc40b 6804{
11343788 6805 dTHR;
79072805 6806 register char *eol;
378cc40b 6807 register char *t;
79cb57f6 6808 SV *stuff = newSVpvn("",0);
79072805 6809 bool needargs = FALSE;
378cc40b 6810
79072805 6811 while (!needargs) {
85e6fe83 6812 if (*s == '.' || *s == '}') {
79072805 6813 /*SUPPRESS 530*/
51882d45
GS
6814#ifdef PERL_STRICT_CR
6815 for (t = s+1;*t == ' ' || *t == '\t'; t++) ;
6816#else
6817 for (t = s+1;*t == ' ' || *t == '\t' || *t == '\r'; t++) ;
6818#endif
6a65c6a0 6819 if (*t == '\n' || t == PL_bufend)
79072805
LW
6820 break;
6821 }
3280af22 6822 if (PL_in_eval && !PL_rsfp) {
93a17b20 6823 eol = strchr(s,'\n');
0f85fab0 6824 if (!eol++)
3280af22 6825 eol = PL_bufend;
0f85fab0
LW
6826 }
6827 else
3280af22 6828 eol = PL_bufend = SvPVX(PL_linestr) + SvCUR(PL_linestr);
79072805 6829 if (*s != '#') {
a0d0e21e
LW
6830 for (t = s; t < eol; t++) {
6831 if (*t == '~' && t[1] == '~' && SvCUR(stuff)) {
6832 needargs = FALSE;
6833 goto enough; /* ~~ must be first line in formline */
378cc40b 6834 }
a0d0e21e
LW
6835 if (*t == '@' || *t == '^')
6836 needargs = TRUE;
378cc40b 6837 }
a0d0e21e 6838 sv_catpvn(stuff, s, eol-s);
79072805
LW
6839 }
6840 s = eol;
3280af22
NIS
6841 if (PL_rsfp) {
6842 s = filter_gets(PL_linestr, PL_rsfp, 0);
6843 PL_oldoldbufptr = PL_oldbufptr = PL_bufptr = PL_linestart = SvPVX(PL_linestr);
6844 PL_bufend = PL_bufptr + SvCUR(PL_linestr);
79072805 6845 if (!s) {
3280af22 6846 s = PL_bufptr;
79072805 6847 yyerror("Format not terminated");
378cc40b
LW
6848 break;
6849 }
378cc40b 6850 }
463ee0b2 6851 incline(s);
79072805 6852 }
a0d0e21e
LW
6853 enough:
6854 if (SvCUR(stuff)) {
3280af22 6855 PL_expect = XTERM;
79072805 6856 if (needargs) {
3280af22
NIS
6857 PL_lex_state = LEX_NORMAL;
6858 PL_nextval[PL_nexttoke].ival = 0;
79072805
LW
6859 force_next(',');
6860 }
a0d0e21e 6861 else
3280af22
NIS
6862 PL_lex_state = LEX_FORMLINE;
6863 PL_nextval[PL_nexttoke].opval = (OP*)newSVOP(OP_CONST, 0, stuff);
79072805 6864 force_next(THING);
3280af22 6865 PL_nextval[PL_nexttoke].ival = OP_FORMLINE;
79072805 6866 force_next(LSTOP);
378cc40b 6867 }
79072805 6868 else {
8990e307 6869 SvREFCNT_dec(stuff);
3280af22
NIS
6870 PL_lex_formbrack = 0;
6871 PL_bufptr = s;
79072805
LW
6872 }
6873 return s;
378cc40b 6874}
a687059c 6875
76e3520e 6876STATIC void
cea2e8a9 6877S_set_csh(pTHX)
a687059c 6878{
ae986130 6879#ifdef CSH
3280af22
NIS
6880 if (!PL_cshlen)
6881 PL_cshlen = strlen(PL_cshname);
ae986130 6882#endif
a687059c 6883}
463ee0b2 6884
ba6d6ac9 6885I32
864dbfa3 6886Perl_start_subparse(pTHX_ I32 is_format, U32 flags)
8990e307 6887{
11343788 6888 dTHR;
3280af22
NIS
6889 I32 oldsavestack_ix = PL_savestack_ix;
6890 CV* outsidecv = PL_compcv;
748a9306 6891 AV* comppadlist;
8990e307 6892
3280af22
NIS
6893 if (PL_compcv) {
6894 assert(SvTYPE(PL_compcv) == SVt_PVCV);
e9a444f0 6895 }
3280af22
NIS
6896 save_I32(&PL_subline);
6897 save_item(PL_subname);
6898 SAVEI32(PL_padix);
6899 SAVESPTR(PL_curpad);
6900 SAVESPTR(PL_comppad);
6901 SAVESPTR(PL_comppad_name);
6902 SAVESPTR(PL_compcv);
6903 SAVEI32(PL_comppad_name_fill);
6904 SAVEI32(PL_min_intro_pending);
6905 SAVEI32(PL_max_intro_pending);
6906 SAVEI32(PL_pad_reset_pending);
6907
6908 PL_compcv = (CV*)NEWSV(1104,0);
6909 sv_upgrade((SV *)PL_compcv, is_format ? SVt_PVFM : SVt_PVCV);
6910 CvFLAGS(PL_compcv) |= flags;
6911
6912 PL_comppad = newAV();
6913 av_push(PL_comppad, Nullsv);
6914 PL_curpad = AvARRAY(PL_comppad);
6915 PL_comppad_name = newAV();
6916 PL_comppad_name_fill = 0;
6917 PL_min_intro_pending = 0;
6918 PL_padix = 0;
6919 PL_subline = PL_curcop->cop_line;
6d4ff0d2 6920#ifdef USE_THREADS
79cb57f6 6921 av_store(PL_comppad_name, 0, newSVpvn("@_", 2));
533c011a
NIS
6922 PL_curpad[0] = (SV*)newAV();
6923 SvPADMY_on(PL_curpad[0]); /* XXX Needed? */
6d4ff0d2 6924#endif /* USE_THREADS */
748a9306
LW
6925
6926 comppadlist = newAV();
6927 AvREAL_off(comppadlist);
3280af22
NIS
6928 av_store(comppadlist, 0, (SV*)PL_comppad_name);
6929 av_store(comppadlist, 1, (SV*)PL_comppad);
748a9306 6930
3280af22
NIS
6931 CvPADLIST(PL_compcv) = comppadlist;
6932 CvOUTSIDE(PL_compcv) = (CV*)SvREFCNT_inc(outsidecv);
11343788 6933#ifdef USE_THREADS
533c011a
NIS
6934 CvOWNER(PL_compcv) = 0;
6935 New(666, CvMUTEXP(PL_compcv), 1, perl_mutex);
6936 MUTEX_INIT(CvMUTEXP(PL_compcv));
11343788 6937#endif /* USE_THREADS */
748a9306 6938
8990e307
LW
6939 return oldsavestack_ix;
6940}
6941
6942int
864dbfa3 6943Perl_yywarn(pTHX_ char *s)
8990e307 6944{
11343788 6945 dTHR;
faef0170 6946 PL_in_eval |= EVAL_WARNONLY;
748a9306 6947 yyerror(s);
faef0170 6948 PL_in_eval &= ~EVAL_WARNONLY;
748a9306 6949 return 0;
8990e307
LW
6950}
6951
6952int
864dbfa3 6953Perl_yyerror(pTHX_ char *s)
463ee0b2 6954{
11343788 6955 dTHR;
68dc0745 6956 char *where = NULL;
6957 char *context = NULL;
6958 int contlen = -1;
46fc3d4c 6959 SV *msg;
463ee0b2 6960
3280af22 6961 if (!yychar || (yychar == ';' && !PL_rsfp))
54310121 6962 where = "at EOF";
3280af22
NIS
6963 else if (PL_bufptr > PL_oldoldbufptr && PL_bufptr - PL_oldoldbufptr < 200 &&
6964 PL_oldoldbufptr != PL_oldbufptr && PL_oldbufptr != PL_bufptr) {
6965 while (isSPACE(*PL_oldoldbufptr))
6966 PL_oldoldbufptr++;
6967 context = PL_oldoldbufptr;
6968 contlen = PL_bufptr - PL_oldoldbufptr;
463ee0b2 6969 }
3280af22
NIS
6970 else if (PL_bufptr > PL_oldbufptr && PL_bufptr - PL_oldbufptr < 200 &&
6971 PL_oldbufptr != PL_bufptr) {
6972 while (isSPACE(*PL_oldbufptr))
6973 PL_oldbufptr++;
6974 context = PL_oldbufptr;
6975 contlen = PL_bufptr - PL_oldbufptr;
463ee0b2
LW
6976 }
6977 else if (yychar > 255)
68dc0745 6978 where = "next token ???";
463ee0b2 6979 else if ((yychar & 127) == 127) {
3280af22
NIS
6980 if (PL_lex_state == LEX_NORMAL ||
6981 (PL_lex_state == LEX_KNOWNEXT && PL_lex_defer == LEX_NORMAL))
68dc0745 6982 where = "at end of line";
3280af22 6983 else if (PL_lex_inpat)
68dc0745 6984 where = "within pattern";
463ee0b2 6985 else
68dc0745 6986 where = "within string";
463ee0b2 6987 }
46fc3d4c 6988 else {
79cb57f6 6989 SV *where_sv = sv_2mortal(newSVpvn("next char ", 10));
46fc3d4c 6990 if (yychar < 32)
cea2e8a9 6991 Perl_sv_catpvf(aTHX_ where_sv, "^%c", toCTRL(yychar));
46fc3d4c 6992 else if (isPRINT_LC(yychar))
cea2e8a9 6993 Perl_sv_catpvf(aTHX_ where_sv, "%c", yychar);
463ee0b2 6994 else
cea2e8a9 6995 Perl_sv_catpvf(aTHX_ where_sv, "\\%03o", yychar & 255);
46fc3d4c 6996 where = SvPVX(where_sv);
463ee0b2 6997 }
46fc3d4c 6998 msg = sv_2mortal(newSVpv(s, 0));
57def98f 6999 Perl_sv_catpvf(aTHX_ msg, " at %_ line %"IVdf", ",
cf2093f6 7000 GvSV(PL_curcop->cop_filegv), (IV)PL_curcop->cop_line);
68dc0745 7001 if (context)
cea2e8a9 7002 Perl_sv_catpvf(aTHX_ msg, "near \"%.*s\"\n", contlen, context);
463ee0b2 7003 else
cea2e8a9 7004 Perl_sv_catpvf(aTHX_ msg, "%s\n", where);
3280af22 7005 if (PL_multi_start < PL_multi_end && (U32)(PL_curcop->cop_line - PL_multi_end) <= 1) {
cf2093f6 7006 Perl_sv_catpvf(aTHX_ msg,
57def98f 7007 " (Might be a runaway multi-line %c%c string starting on line %"IVdf")\n",
cf2093f6 7008 (int)PL_multi_open,(int)PL_multi_close,(IV)PL_multi_start);
3280af22 7009 PL_multi_end = 0;
a0d0e21e 7010 }
faef0170 7011 if (PL_in_eval & EVAL_WARNONLY)
cea2e8a9 7012 Perl_warn(aTHX_ "%_", msg);
463ee0b2 7013 else
5a844595
GS
7014 qerror(msg);
7015 if (PL_error_count >= 10)
cea2e8a9 7016 Perl_croak(aTHX_ "%_ has too many errors.\n", GvSV(PL_curcop->cop_filegv));
3280af22
NIS
7017 PL_in_my = 0;
7018 PL_in_my_stash = Nullhv;
463ee0b2
LW
7019 return 0;
7020}
4e35701f 7021
161b471a 7022
51371543
GS
7023#ifdef PERL_OBJECT
7024#define NO_XSLOCKS
7025#include "XSUB.h"
7026#endif
7027
ffb4593c
NT
7028/*
7029 * restore_rsfp
7030 * Restore a source filter.
7031 */
7032
51371543
GS
7033static void
7034restore_rsfp(pTHXo_ void *f)
7035{
7036 PerlIO *fp = (PerlIO*)f;
7037
7038 if (PL_rsfp == PerlIO_stdin())
7039 PerlIO_clearerr(PL_rsfp);
7040 else if (PL_rsfp && (PL_rsfp != fp))
7041 PerlIO_close(PL_rsfp);
7042 PL_rsfp = fp;
7043}
7044
ffb4593c
NT
7045/*
7046 * restore_expect
7047 * Restores the state of PL_expect when the lexing that begun with a
7048 * start_lex() call has ended.
7049 */
7050
51371543
GS
7051static void
7052restore_expect(pTHXo_ void *e)
7053{
7054 /* a safe way to store a small integer in a pointer */
7055 PL_expect = (expectation)((char *)e - PL_tokenbuf);
7056}
7057
ffb4593c
NT
7058/*
7059 * restore_lex_expect
7060 * Restores the state of PL_lex_expect when the lexing that begun with a
7061 * start_lex() call has ended.
7062 */
7063
51371543
GS
7064static void
7065restore_lex_expect(pTHXo_ void *e)
7066{
7067 /* a safe way to store a small integer in a pointer */
7068 PL_lex_expect = (expectation)((char *)e - PL_tokenbuf);
7069}