This is a live mirror of the Perl 5 development currently hosted at https://github.com/perl/perl5
[inseparable differences up to perl 5.004_02]
[perl5.git] / toke.c
CommitLineData
a0d0e21e 1/* toke.c
a687059c 2 *
9607fc9c 3 * Copyright (c) 1991-1997, Larry Wall
a687059c 4 *
d48672a2
LW
5 * You may distribute under the terms of either the GNU General Public
6 * License or the Artistic License, as specified in the README file.
378cc40b 7 *
a0d0e21e
LW
8 */
9
10/*
11 * "It all comes from here, the stench and the peril." --Frodo
378cc40b
LW
12 */
13
14#include "EXTERN.h"
15#include "perl.h"
378cc40b 16
a0d0e21e
LW
17static void check_uni _((void));
18static void force_next _((I32 type));
89bfa8cd 19static char *force_version _((char *start));
a0d0e21e
LW
20static char *force_word _((char *start, int token, int check_keyword, int allow_pack, int allow_tick));
21static SV *q _((SV *sv));
22static char *scan_const _((char *start));
23static char *scan_formline _((char *s));
24static char *scan_heredoc _((char *s));
8903cb82 25static char *scan_ident _((char *s, char *send, char *dest, STRLEN destlen,
26 I32 ck_uni));
a0d0e21e
LW
27static char *scan_inputsymbol _((char *start));
28static char *scan_pat _((char *start));
29static char *scan_str _((char *start));
30static char *scan_subst _((char *start));
31static char *scan_trans _((char *start));
8903cb82 32static char *scan_word _((char *s, char *dest, STRLEN destlen,
33 int allow_package, STRLEN *slp));
a0d0e21e
LW
34static char *skipspace _((char *s));
35static void checkcomma _((char *s, char *name, char *what));
36static void force_ident _((char *s, int kind));
37static void incline _((char *s));
38static int intuit_method _((char *s, GV *gv));
39static int intuit_more _((char *s));
40static I32 lop _((I32 f, expectation x, char *s));
41static void missingterm _((char *s));
42static void no_op _((char *what, char *s));
43static void set_csh _((void));
44static I32 sublex_done _((void));
55497cff 45static I32 sublex_push _((void));
a0d0e21e
LW
46static I32 sublex_start _((void));
47#ifdef CRIPPLED_CC
48static int uni _((I32 f, char *s));
49#endif
fd049845 50static char * filter_gets _((SV *sv, PerlIO *fp, STRLEN append));
6d5fb7e3 51static void restore_rsfp _((void *f));
2f3197b3 52
fc36a67e 53static char ident_too_long[] = "Identifier too long";
8903cb82 54
fd049845 55static char *linestart; /* beg. of most recently read line */
56
bbce6d69 57static char pending_ident; /* pending identifier lookup */
58
55497cff 59static struct {
60 I32 super_state; /* lexer state to save */
61 I32 sub_inwhat; /* "lex_inwhat" to use */
62 OP *sub_op; /* "lex_op" to use */
63} sublex_info;
64
79072805
LW
65/* The following are arranged oddly so that the guard on the switch statement
66 * can get by with a single comparison (if the compiler is smart enough).
67 */
68
/* Lexer states (values of lex_state), listed in ascending order. */
#define LEX_KNOWNEXT        0
#define LEX_FORMLINE        1
#define LEX_INTERPCONST     2
#define LEX_INTERPCONCAT    3
#define LEX_INTERPENDMAYBE  4
#define LEX_INTERPEND       5
#define LEX_INTERPSTART     6
#define LEX_INTERPPUSH      7
#define LEX_INTERPCASEMOD   8
#define LEX_INTERPNORMAL    9
#define LEX_NORMAL         10
79072805 80
395c3793
LW
81#ifdef I_FCNTL
82#include <fcntl.h>
83#endif
fe14fcc3
LW
84#ifdef I_SYS_FILE
85#include <sys/file.h>
86#endif
395c3793 87
a790bc05 88/* XXX If this causes problems, set i_unistd=undef in the hint file. */
89#ifdef I_UNISTD
90# include <unistd.h> /* Needed for execv() */
91#endif
92
93
79072805
LW
94#ifdef ff_next
95#undef ff_next
d48672a2
LW
96#endif
97
79072805 98#include "keywords.h"
fe14fcc3 99
ae986130
LW
#ifdef CLINE
#undef CLINE
#endif
/* Lower copline to the current cop's line number if that is smaller. */
#define CLINE (copline = (curcop->cop_line < copline ? curcop->cop_line : copline))

/*
 * Token-return helpers.  Each expands to a `return` statement that stores
 * the scan position `s` into bufptr, optionally sets `expect` and
 * yylval.ival, and yields the token type.  They rely on a local named `s`
 * being in scope at the point of use.
 */

/* Plain tokens: only `expect` differs. */
#define TOKEN(retval)        return (bufptr = s,(int)retval)
#define OPERATOR(retval)     return (expect = XTERM,bufptr = s,(int)retval)
#define AOPERATOR(retval)    return ao((expect = XTERM,bufptr = s,(int)retval))
#define PREBLOCK(retval)     return (expect = XBLOCK,bufptr = s,(int)retval)
#define PRETERMBLOCK(retval) return (expect = XTERMBLOCK,bufptr = s,(int)retval)
#define PREREF(retval)       return (expect = XREF,bufptr = s,(int)retval)
#define TERM(retval)         return (CLINE, expect = XOPERATOR,bufptr = s,(int)retval)

/* Tokens that carry an opcode in yylval.ival. */
#define LOOPX(f) return(yylval.ival=f,expect = XTERM,bufptr = s,(int)LOOPEX)
#define FTST(f)  return(yylval.ival=f,expect = XTERM,bufptr = s,(int)UNIOP)
#define FUN0(f)  return(yylval.ival = f,expect = XOPERATOR,bufptr = s,(int)FUNC0)
#define FUN1(f)  return(yylval.ival = f,expect = XOPERATOR,bufptr = s,(int)FUNC1)

/* Operators routed through ao(), which checks for a trailing '='. */
#define BOop(f) return ao((yylval.ival=f,expect = XTERM,bufptr = s,(int)BITOROP))
#define BAop(f) return ao((yylval.ival=f,expect = XTERM,bufptr = s,(int)BITANDOP))
#define SHop(f) return ao((yylval.ival=f,expect = XTERM,bufptr = s,(int)SHIFTOP))
#define PWop(f) return ao((yylval.ival=f,expect = XTERM,bufptr = s,(int)POWOP))
#define Aop(f)  return ao((yylval.ival=f,expect = XTERM,bufptr = s,(int)ADDOP))
#define Mop(f)  return ao((yylval.ival=f,expect = XTERM,bufptr = s,(int)MULOP))

/* Operators returned directly, without going through ao(). */
#define PMop(f) return(yylval.ival=f,expect = XTERM,bufptr = s,(int)MATCHOP)
#define Eop(f)  return(yylval.ival=f,expect = XTERM,bufptr = s,(int)EQOP)
#define Rop(f)  return(yylval.ival=f,expect = XTERM,bufptr = s,(int)RELOP)

/* This bit of chicanery makes a unary function followed by
 * a parenthesis into a function with one argument, highest precedence.
 */
#define UNI(f) return(yylval.ival = f, \
        expect = XTERM, \
        bufptr = s, \
        last_uni = oldbufptr, \
        last_lop_op = f, \
        (*s == '(' || (s = skipspace(s), *s == '(') ? (int)FUNC1 : (int)UNIOP) )

/* Like UNI, but leaves `expect` and last_lop_op untouched. */
#define UNIBRACK(f) return(yylval.ival = f, \
        bufptr = s, \
        last_uni = oldbufptr, \
        (*s == '(' || (s = skipspace(s), *s == '(') ? (int)FUNC1 : (int)UNIOP) )

/* grandfather return to old style */
#define OLDLOP(f) return(yylval.ival=f,expect = XTERM,bufptr = s,(int)LSTOP)
143
a0d0e21e
LW
144static int
145ao(toketype)
146int toketype;
147{
148 if (*bufptr == '=') {
149 bufptr++;
150 if (toketype == ANDAND)
151 yylval.ival = OP_ANDASSIGN;
152 else if (toketype == OROR)
153 yylval.ival = OP_ORASSIGN;
154 toketype = ASSIGNOP;
155 }
156 return toketype;
157}
158
8990e307
LW
159static void
160no_op(what, s)
463ee0b2 161char *what;
8990e307 162char *s;
463ee0b2 163{
748a9306 164 char *oldbp = bufptr;
fd049845 165 bool is_first = (oldbufptr == linestart);
68dc0745 166
8990e307 167 bufptr = s;
46fc3d4c 168 yywarn(form("%s found where operator expected", what));
748a9306 169 if (is_first)
a0d0e21e 170 warn("\t(Missing semicolon on previous line?)\n");
748a9306
LW
171 else if (oldoldbufptr && isIDFIRST(*oldoldbufptr)) {
172 char *t;
173 for (t = oldoldbufptr; *t && (isALNUM(*t) || *t == ':'); t++) ;
174 if (t < bufptr && isSPACE(*t))
175 warn("\t(Do you need to predeclare %.*s?)\n",
176 t - oldoldbufptr, oldoldbufptr);
177
178 }
179 else
180 warn("\t(Missing operator before %.*s?)\n", s - oldbp, oldbp);
181 bufptr = oldbp;
8990e307
LW
182}
183
184static void
185missingterm(s)
186char *s;
187{
188 char tmpbuf[3];
189 char q;
190 if (s) {
191 char *nl = strrchr(s,'\n');
192 if (nl)
193 *nl = '\0';
194 }
195 else if (multi_close < 32 || multi_close == 127) {
196 *tmpbuf = '^';
bbce6d69 197 tmpbuf[1] = toCTRL(multi_close);
8990e307
LW
198 s = "\\n";
199 tmpbuf[2] = '\0';
200 s = tmpbuf;
201 }
202 else {
203 *tmpbuf = multi_close;
204 tmpbuf[1] = '\0';
205 s = tmpbuf;
206 }
207 q = strchr(s,'"') ? '\'' : '"';
208 croak("Can't find string terminator %c%s%c anywhere before EOF",q,s,q);
463ee0b2 209}
79072805
LW
210
211void
a0d0e21e
LW
212deprecate(s)
213char *s;
214{
215 if (dowarn)
216 warn("Use of %s is deprecated", s);
217}
218
/* depcom - deprecation notice for variable lists written without commas. */
static void
depcom()
{
    char *construct = "comma-less variable list";

    deprecate(construct);
}
224
225void
8990e307
LW
226lex_start(line)
227SV *line;
79072805 228{
8990e307
LW
229 char *s;
230 STRLEN len;
231
55497cff 232 SAVEI32(lex_dojoin);
233 SAVEI32(lex_brackets);
234 SAVEI32(lex_fakebrack);
235 SAVEI32(lex_casemods);
236 SAVEI32(lex_starts);
237 SAVEI32(lex_state);
a0d0e21e 238 SAVESPTR(lex_inpat);
55497cff 239 SAVEI32(lex_inwhat);
240 SAVEI16(curcop->cop_line);
85e6fe83
LW
241 SAVEPPTR(bufptr);
242 SAVEPPTR(bufend);
243 SAVEPPTR(oldbufptr);
244 SAVEPPTR(oldoldbufptr);
fd049845 245 SAVEPPTR(linestart);
463ee0b2 246 SAVESPTR(linestr);
85e6fe83 247 SAVEPPTR(lex_brackstack);
a0d0e21e 248 SAVEPPTR(lex_casestack);
6d5fb7e3 249 SAVEDESTRUCTOR(restore_rsfp, rsfp);
463ee0b2 250
79072805
LW
251 lex_state = LEX_NORMAL;
252 lex_defer = 0;
8990e307 253 expect = XSTATE;
79072805
LW
254 lex_brackets = 0;
255 lex_fakebrack = 0;
8990e307 256 New(899, lex_brackstack, 120, char);
a0d0e21e 257 New(899, lex_casestack, 12, char);
8990e307 258 SAVEFREEPV(lex_brackstack);
a0d0e21e 259 SAVEFREEPV(lex_casestack);
79072805 260 lex_casemods = 0;
a0d0e21e 261 *lex_casestack = '\0';
79072805
LW
262 lex_dojoin = 0;
263 lex_starts = 0;
264 if (lex_stuff)
8990e307 265 SvREFCNT_dec(lex_stuff);
79072805
LW
266 lex_stuff = Nullsv;
267 if (lex_repl)
8990e307 268 SvREFCNT_dec(lex_repl);
79072805
LW
269 lex_repl = Nullsv;
270 lex_inpat = 0;
271 lex_inwhat = 0;
8990e307
LW
272 linestr = line;
273 if (SvREADONLY(linestr))
274 linestr = sv_2mortal(newSVsv(linestr));
275 s = SvPV(linestr, len);
276 if (len && s[len-1] != ';') {
a0d0e21e 277 if (!(SvFLAGS(linestr) & SVs_TEMP))
8990e307
LW
278 linestr = sv_2mortal(newSVsv(linestr));
279 sv_catpvn(linestr, "\n;", 2);
280 }
281 SvTEMP_off(linestr);
fd049845 282 oldoldbufptr = oldbufptr = bufptr = linestart = SvPVX(linestr);
79072805 283 bufend = bufptr + SvCUR(linestr);
c07a80fd 284 SvREFCNT_dec(rs);
285 rs = newSVpv("\n", 1);
8990e307 286 rsfp = 0;
79072805 287}
a687059c 288
463ee0b2
LW
289void
290lex_end()
291{
6ca21dd3 292 doextract = FALSE;
463ee0b2
LW
293}
294
295static void
6d5fb7e3
CS
296restore_rsfp(f)
297void *f;
298{
760ac839 299 PerlIO *fp = (PerlIO*)f;
6d5fb7e3 300
760ac839
LW
301 if (rsfp == PerlIO_stdin())
302 PerlIO_clearerr(rsfp);
a5f75d66 303 else if (rsfp && (rsfp != fp))
760ac839 304 PerlIO_close(rsfp);
6d5fb7e3
CS
305 rsfp = fp;
306}
307
308static void
463ee0b2
LW
309incline(s)
310char *s;
311{
312 char *t;
313 char *n;
314 char ch;
315 int sawline = 0;
316
317 curcop->cop_line++;
318 if (*s++ != '#')
319 return;
320 while (*s == ' ' || *s == '\t') s++;
321 if (strnEQ(s, "line ", 5)) {
322 s += 5;
323 sawline = 1;
324 }
325 if (!isDIGIT(*s))
326 return;
327 n = s;
328 while (isDIGIT(*s))
329 s++;
330 while (*s == ' ' || *s == '\t')
331 s++;
332 if (*s == '"' && (t = strchr(s+1, '"')))
333 s++;
334 else {
335 if (!sawline)
336 return; /* false alarm */
337 for (t = s; !isSPACE(*t); t++) ;
338 }
339 ch = *t;
340 *t = '\0';
341 if (t - s > 0)
342 curcop->cop_filegv = gv_fetchfile(s);
343 else
344 curcop->cop_filegv = gv_fetchfile(origfilename);
345 *t = ch;
346 curcop->cop_line = atoi(n)-1;
347}
348
8990e307 349static char *
a687059c
LW
350skipspace(s)
351register char *s;
352{
85e6fe83 353 if (lex_formbrack && lex_brackets <= lex_formbrack) {
463ee0b2
LW
354 while (s < bufend && (*s == ' ' || *s == '\t'))
355 s++;
356 return s;
357 }
358 for (;;) {
fd049845 359 STRLEN prevlen;
463ee0b2
LW
360 while (s < bufend && isSPACE(*s))
361 s++;
362 if (s < bufend && *s == '#') {
363 while (s < bufend && *s != '\n')
364 s++;
365 if (s < bufend)
366 s++;
367 }
a0d0e21e 368 if (s < bufend || !rsfp || lex_state != LEX_NORMAL)
463ee0b2 369 return s;
fd049845 370 if ((s = filter_gets(linestr, rsfp, (prevlen = SvCUR(linestr)))) == Nullch) {
a0d0e21e 371 if (minus_n || minus_p) {
08e9d68e
DD
372 sv_setpv(linestr,minus_p ?
373 ";}continue{print or die qq(-p destination: $!\\n)" :
374 "");
a0d0e21e
LW
375 sv_catpv(linestr,";}");
376 minus_n = minus_p = 0;
377 }
378 else
379 sv_setpv(linestr,";");
fd049845 380 oldoldbufptr = oldbufptr = bufptr = s = linestart = SvPVX(linestr);
a0d0e21e
LW
381 bufend = SvPVX(linestr) + SvCUR(linestr);
382 if (preprocess && !in_eval)
8990e307 383 (void)my_pclose(rsfp);
760ac839
LW
384 else if ((PerlIO*)rsfp == PerlIO_stdin())
385 PerlIO_clearerr(rsfp);
8990e307 386 else
760ac839 387 (void)PerlIO_close(rsfp);
8990e307 388 rsfp = Nullfp;
463ee0b2
LW
389 return s;
390 }
fd049845 391 linestart = bufptr = s + prevlen;
392 bufend = s + SvCUR(linestr);
393 s = bufptr;
a0d0e21e 394 incline(s);
84902520 395 if (PERLDB_LINE && curstash != debstash) {
8990e307
LW
396 SV *sv = NEWSV(85,0);
397
398 sv_upgrade(sv, SVt_PVMG);
fd049845 399 sv_setpvn(sv,bufptr,bufend-bufptr);
8990e307
LW
400 av_store(GvAV(curcop->cop_filegv),(I32)curcop->cop_line,sv);
401 }
463ee0b2 402 }
a687059c 403}
378cc40b 404
8990e307 405static void
2f3197b3
LW
406check_uni() {
407 char *s;
408 char ch;
a0d0e21e 409 char *t;
2f3197b3
LW
410
411 if (oldoldbufptr != last_uni)
412 return;
413 while (isSPACE(*last_uni))
414 last_uni++;
e334a159 415 for (s = last_uni; isALNUM(*s) || *s == '-'; s++) ;
a0d0e21e
LW
416 if ((t = strchr(s, '(')) && t < bufptr)
417 return;
2f3197b3
LW
418 ch = *s;
419 *s = '\0';
420 warn("Warning: Use of \"%s\" without parens is ambiguous", last_uni);
421 *s = ch;
422}
423
ffed7fef
LW
#ifdef CRIPPLED_CC

/* Function form of the UNI macro, used when CRIPPLED_CC is defined. */
#undef UNI
#define UNI(f) return uni(f,s)

/*
 * uni - record a unary operator and classify it.
 *
 * f: opcode, stored in yylval.ival and last_lop_op.
 * s: scan position, stored in bufptr.
 * Returns FUNC1 when the next non-space character is '(', else UNIOP.
 */
static int
uni(f,s)
I32 f;
char *s;
{
    yylval.ival = f;
    expect = XTERM;
    bufptr = s;
    last_uni = oldbufptr;
    last_lop_op = f;

    if (*s != '(')
        s = skipspace(s);
    return (*s == '(') ? FUNC1 : UNIOP;
}

#endif /* CRIPPLED_CC */
449
450#define LOP(f,x) return lop(f,x,s)
451
8990e307 452static I32
f86702cc 453lop
454#ifdef CAN_PROTOTYPE
455 (I32 f, expectation x, char *s)
456#else
457 (f,x,s)
79072805 458I32 f;
a0d0e21e 459expectation x;
ffed7fef 460char *s;
f86702cc 461#endif /* CAN_PROTOTYPE */
ffed7fef 462{
79072805 463 yylval.ival = f;
35c8bce7 464 CLINE;
a0d0e21e 465 expect = x;
79072805 466 bufptr = s;
8990e307
LW
467 last_lop = oldbufptr;
468 last_lop_op = f;
a0d0e21e
LW
469 if (nexttoke)
470 return LSTOP;
79072805
LW
471 if (*s == '(')
472 return FUNC;
473 s = skipspace(s);
474 if (*s == '(')
475 return FUNC;
476 else
477 return LSTOP;
478}
479
8990e307 480static void
79072805
LW
481force_next(type)
482I32 type;
483{
484 nexttype[nexttoke] = type;
485 nexttoke++;
486 if (lex_state != LEX_KNOWNEXT) {
487 lex_defer = lex_state;
463ee0b2 488 lex_expect = expect;
79072805
LW
489 lex_state = LEX_KNOWNEXT;
490 }
491}
492
8990e307 493static char *
a0d0e21e 494force_word(start,token,check_keyword,allow_pack,allow_tick)
463ee0b2 495register char *start;
79072805 496int token;
463ee0b2 497int check_keyword;
a0d0e21e 498int allow_pack;
463ee0b2 499int allow_tick;
79072805 500{
463ee0b2
LW
501 register char *s;
502 STRLEN len;
503
504 start = skipspace(start);
505 s = start;
a0d0e21e
LW
506 if (isIDFIRST(*s) ||
507 (allow_pack && *s == ':') ||
508 (allow_tick && *s == '\'') )
509 {
8903cb82 510 s = scan_word(s, tokenbuf, sizeof tokenbuf, allow_pack, &len);
463ee0b2
LW
511 if (check_keyword && keyword(tokenbuf, len))
512 return start;
513 if (token == METHOD) {
514 s = skipspace(s);
515 if (*s == '(')
516 expect = XTERM;
517 else {
518 expect = XOPERATOR;
519 force_next(')');
520 force_next('(');
521 }
79072805 522 }
463ee0b2 523 nextval[nexttoke].opval = (OP*)newSVOP(OP_CONST,0, newSVpv(tokenbuf,0));
8990e307 524 nextval[nexttoke].opval->op_private |= OPpCONST_BARE;
79072805
LW
525 force_next(token);
526 }
527 return s;
528}
529
8990e307 530static void
a0d0e21e 531force_ident(s, kind)
79072805 532register char *s;
a0d0e21e 533int kind;
79072805
LW
534{
535 if (s && *s) {
748a9306
LW
536 OP* op = (OP*)newSVOP(OP_CONST, 0, newSVpv(s,0));
537 nextval[nexttoke].opval = op;
79072805 538 force_next(WORD);
748a9306
LW
539 if (kind) {
540 op->op_private = OPpCONST_ENTERED;
55497cff 541 /* XXX see note in pp_entereval() for why we forgo typo
542 warnings if the symbol must be introduced in an eval.
543 GSAR 96-10-12 */
544 gv_fetchpv(s, in_eval ? GV_ADDMULTI : TRUE,
a0d0e21e
LW
545 kind == '$' ? SVt_PV :
546 kind == '@' ? SVt_PVAV :
547 kind == '%' ? SVt_PVHV :
548 SVt_PVGV
549 );
748a9306 550 }
79072805
LW
551 }
552}
553
89bfa8cd 554static char *
555force_version(s)
556char *s;
557{
558 OP *version = Nullop;
559
560 s = skipspace(s);
561
562 /* default VERSION number -- GBARR */
563
564 if(isDIGIT(*s)) {
565 char *d;
566 int c;
55497cff 567 for( d=s, c = 1; isDIGIT(*d) || *d == '_' || (*d == '.' && c--); d++);
89bfa8cd 568 if((*d == ';' || isSPACE(*d)) && *(skipspace(d)) != ',') {
569 s = scan_num(s);
570 /* real VERSION number -- GBARR */
571 version = yylval.opval;
572 }
573 }
574
575 /* NOTE: The parser sees the package name and the VERSION swapped */
576 nextval[nexttoke].opval = version;
577 force_next(WORD);
578
579 return (s);
580}
581
8990e307 582static SV *
79072805
LW
583q(sv)
584SV *sv;
585{
586 register char *s;
587 register char *send;
588 register char *d;
463ee0b2 589 STRLEN len;
79072805
LW
590
591 if (!SvLEN(sv))
592 return sv;
593
a0d0e21e 594 s = SvPV_force(sv, len);
748a9306
LW
595 if (SvIVX(sv) == -1)
596 return sv;
463ee0b2 597 send = s + len;
79072805
LW
598 while (s < send && *s != '\\')
599 s++;
600 if (s == send)
601 return sv;
602 d = s;
79072805
LW
603 while (s < send) {
604 if (*s == '\\') {
a0d0e21e 605 if (s + 1 < send && (s[1] == '\\'))
79072805
LW
606 s++; /* all that, just for this */
607 }
608 *d++ = *s++;
609 }
610 *d = '\0';
463ee0b2 611 SvCUR_set(sv, d - SvPVX(sv));
79072805
LW
612
613 return sv;
614}
615
8990e307 616static I32
79072805
LW
617sublex_start()
618{
619 register I32 op_type = yylval.ival;
79072805
LW
620
621 if (op_type == OP_NULL) {
622 yylval.opval = lex_op;
623 lex_op = Nullop;
624 return THING;
625 }
626 if (op_type == OP_CONST || op_type == OP_READLINE) {
1c9c84df
CS
627 SV *sv = q(lex_stuff);
628 STRLEN len;
629 char *p = SvPV(sv, len);
630 yylval.opval = (OP*)newSVOP(op_type, 0, newSVpv(p, len));
631 SvREFCNT_dec(sv);
79072805
LW
632 lex_stuff = Nullsv;
633 return THING;
634 }
635
55497cff 636 sublex_info.super_state = lex_state;
637 sublex_info.sub_inwhat = op_type;
638 sublex_info.sub_op = lex_op;
639 lex_state = LEX_INTERPPUSH;
640
641 expect = XTERM;
642 if (lex_op) {
643 yylval.opval = lex_op;
644 lex_op = Nullop;
645 return PMFUNC;
646 }
647 else
648 return FUNC;
649}
650
651static I32
652sublex_push()
653{
79072805 654 push_scope();
55497cff 655
656 lex_state = sublex_info.super_state;
657 SAVEI32(lex_dojoin);
658 SAVEI32(lex_brackets);
659 SAVEI32(lex_fakebrack);
660 SAVEI32(lex_casemods);
661 SAVEI32(lex_starts);
662 SAVEI32(lex_state);
a0d0e21e 663 SAVESPTR(lex_inpat);
55497cff 664 SAVEI32(lex_inwhat);
665 SAVEI16(curcop->cop_line);
85e6fe83
LW
666 SAVEPPTR(bufptr);
667 SAVEPPTR(oldbufptr);
668 SAVEPPTR(oldoldbufptr);
fd049845 669 SAVEPPTR(linestart);
79072805 670 SAVESPTR(linestr);
85e6fe83 671 SAVEPPTR(lex_brackstack);
a0d0e21e 672 SAVEPPTR(lex_casestack);
79072805
LW
673
674 linestr = lex_stuff;
675 lex_stuff = Nullsv;
676
fd049845 677 bufend = bufptr = oldbufptr = oldoldbufptr = linestart = SvPVX(linestr);
79072805 678 bufend += SvCUR(linestr);
8990e307 679 SAVEFREESV(linestr);
79072805
LW
680
681 lex_dojoin = FALSE;
682 lex_brackets = 0;
683 lex_fakebrack = 0;
8990e307 684 New(899, lex_brackstack, 120, char);
a0d0e21e 685 New(899, lex_casestack, 12, char);
8990e307 686 SAVEFREEPV(lex_brackstack);
a0d0e21e 687 SAVEFREEPV(lex_casestack);
79072805 688 lex_casemods = 0;
a0d0e21e 689 *lex_casestack = '\0';
79072805
LW
690 lex_starts = 0;
691 lex_state = LEX_INTERPCONCAT;
692 curcop->cop_line = multi_start;
693
55497cff 694 lex_inwhat = sublex_info.sub_inwhat;
695 if (lex_inwhat == OP_MATCH || lex_inwhat == OP_SUBST)
696 lex_inpat = sublex_info.sub_op;
79072805 697 else
55497cff 698 lex_inpat = Nullop;
79072805 699
55497cff 700 return '(';
79072805
LW
701}
702
8990e307 703static I32
79072805
LW
704sublex_done()
705{
706 if (!lex_starts++) {
707 expect = XOPERATOR;
93a17b20 708 yylval.opval = (OP*)newSVOP(OP_CONST, 0, newSVpv("",0));
79072805
LW
709 return THING;
710 }
711
712 if (lex_casemods) { /* oops, we've got some unbalanced parens */
713 lex_state = LEX_INTERPCASEMOD;
714 return yylex();
715 }
716
79072805
LW
717 /* Is there a right-hand side to take care of? */
718 if (lex_repl && (lex_inwhat == OP_SUBST || lex_inwhat == OP_TRANS)) {
719 linestr = lex_repl;
720 lex_inpat = 0;
fd049845 721 bufend = bufptr = oldbufptr = oldoldbufptr = linestart = SvPVX(linestr);
79072805 722 bufend += SvCUR(linestr);
8990e307 723 SAVEFREESV(linestr);
79072805
LW
724 lex_dojoin = FALSE;
725 lex_brackets = 0;
726 lex_fakebrack = 0;
727 lex_casemods = 0;
a0d0e21e 728 *lex_casestack = '\0';
79072805
LW
729 lex_starts = 0;
730 if (SvCOMPILED(lex_repl)) {
731 lex_state = LEX_INTERPNORMAL;
732 lex_starts++;
733 }
734 else
735 lex_state = LEX_INTERPCONCAT;
736 lex_repl = Nullsv;
737 return ',';
ffed7fef
LW
738 }
739 else {
79072805 740 pop_scope();
463ee0b2 741 bufend = SvPVX(linestr);
79072805
LW
742 bufend += SvCUR(linestr);
743 expect = XOPERATOR;
744 return ')';
ffed7fef
LW
745 }
746}
747
8990e307 748static char *
79072805
LW
749scan_const(start)
750char *start;
751{
752 register char *send = bufend;
753 SV *sv = NEWSV(93, send - start);
754 register char *s = start;
463ee0b2 755 register char *d = SvPVX(sv);
79072805
LW
756 bool dorange = FALSE;
757 I32 len;
758 char *leave =
759 lex_inpat
748a9306 760 ? "\\.^$@AGZdDwWsSbB+*?|()-nrtfeaxc0123456789[{]} \t\n\r\f\v#"
79072805
LW
761 : (lex_inwhat & OP_TRANS)
762 ? ""
763 : "";
764
765 while (s < send || dorange) {
766 if (lex_inwhat == OP_TRANS) {
767 if (dorange) {
768 I32 i;
769 I32 max;
463ee0b2 770 i = d - SvPVX(sv);
79072805 771 SvGROW(sv, SvLEN(sv) + 256);
463ee0b2 772 d = SvPVX(sv) + i;
79072805 773 d -= 2;
91b7def8 774 max = (U8)d[1];
775 for (i = (U8)*d; i <= max; i++)
79072805
LW
776 *d++ = i;
777 dorange = FALSE;
778 continue;
779 }
780 else if (*s == '-' && s+1 < send && s != start) {
781 dorange = TRUE;
782 s++;
783 }
784 }
748a9306
LW
785 else if (*s == '(' && lex_inpat && s[1] == '?' && s[2] == '#') {
786 while (s < send && *s != ')')
787 *d++ = *s++;
788 }
789 else if (*s == '#' && lex_inpat &&
790 ((PMOP*)lex_inpat)->op_pmflags & PMf_EXTENDED) {
791 while (s+1 < send && *s != '\n')
792 *d++ = *s++;
793 }
a0d0e21e 794 else if (*s == '@' && s[1] && (isALNUM(s[1]) || strchr(":'{$", s[1])))
79072805
LW
795 break;
796 else if (*s == '$') {
797 if (!lex_inpat) /* not a regexp, so $ must be var */
798 break;
a0d0e21e 799 if (s + 1 < send && !strchr(")| \n\t", s[1]))
79072805
LW
800 break; /* in regexp, $ might be tail anchor */
801 }
802 if (*s == '\\' && s+1 < send) {
803 s++;
93a17b20 804 if (*s && strchr(leave, *s)) {
79072805
LW
805 *d++ = '\\';
806 *d++ = *s++;
807 continue;
808 }
809 if (lex_inwhat == OP_SUBST && !lex_inpat &&
a0d0e21e 810 isDIGIT(*s) && *s != '0' && !isDIGIT(s[1]))
79072805 811 {
a0d0e21e
LW
812 if (dowarn)
813 warn("\\%c better written as $%c", *s, *s);
79072805
LW
814 *--s = '$';
815 break;
816 }
a0d0e21e 817 if (lex_inwhat != OP_TRANS && *s && strchr("lLuUEQ", *s)) {
79072805
LW
818 --s;
819 break;
820 }
821 switch (*s) {
822 case '-':
823 if (lex_inwhat == OP_TRANS) {
824 *d++ = *s++;
825 continue;
826 }
827 /* FALL THROUGH */
828 default:
829 *d++ = *s++;
830 continue;
831 case '0': case '1': case '2': case '3':
832 case '4': case '5': case '6': case '7':
833 *d++ = scan_oct(s, 3, &len);
834 s += len;
835 continue;
836 case 'x':
837 *d++ = scan_hex(++s, 2, &len);
838 s += len;
839 continue;
840 case 'c':
841 s++;
bbce6d69 842 len = *s++;
843 *d++ = toCTRL(len);
79072805
LW
844 continue;
845 case 'b':
846 *d++ = '\b';
847 break;
848 case 'n':
849 *d++ = '\n';
850 break;
851 case 'r':
852 *d++ = '\r';
853 break;
854 case 'f':
855 *d++ = '\f';
856 break;
857 case 't':
858 *d++ = '\t';
859 break;
860 case 'e':
861 *d++ = '\033';
862 break;
863 case 'a':
864 *d++ = '\007';
865 break;
866 }
867 s++;
868 continue;
869 }
870 *d++ = *s++;
871 }
872 *d = '\0';
463ee0b2 873 SvCUR_set(sv, d - SvPVX(sv));
79072805
LW
874 SvPOK_on(sv);
875
876 if (SvCUR(sv) + 5 < SvLEN(sv)) {
877 SvLEN_set(sv, SvCUR(sv) + 1);
463ee0b2 878 Renew(SvPVX(sv), SvLEN(sv), char);
79072805
LW
879 }
880 if (s > bufptr)
881 yylval.opval = (OP*)newSVOP(OP_CONST, 0, sv);
882 else
8990e307 883 SvREFCNT_dec(sv);
79072805
LW
884 return s;
885}
886
887/* This is the one truly awful dwimmer necessary to conflate C and sed. */
8990e307 888static int
79072805
LW
889intuit_more(s)
890register char *s;
891{
892 if (lex_brackets)
893 return TRUE;
894 if (*s == '-' && s[1] == '>' && (s[2] == '[' || s[2] == '{'))
895 return TRUE;
896 if (*s != '{' && *s != '[')
897 return FALSE;
898 if (!lex_inpat)
899 return TRUE;
900
901 /* In a pattern, so maybe we have {n,m}. */
902 if (*s == '{') {
903 s++;
904 if (!isDIGIT(*s))
905 return TRUE;
906 while (isDIGIT(*s))
907 s++;
908 if (*s == ',')
909 s++;
910 while (isDIGIT(*s))
911 s++;
912 if (*s == '}')
913 return FALSE;
914 return TRUE;
915
916 }
917
918 /* On the other hand, maybe we have a character class */
919
920 s++;
921 if (*s == ']' || *s == '^')
922 return FALSE;
923 else {
924 int weight = 2; /* let's weigh the evidence */
925 char seen[256];
926 unsigned char un_char = 0, last_un_char;
93a17b20 927 char *send = strchr(s,']');
8903cb82 928 char tmpbuf[sizeof tokenbuf * 4];
79072805
LW
929
930 if (!send) /* has to be an expression */
931 return TRUE;
932
933 Zero(seen,256,char);
934 if (*s == '$')
935 weight -= 3;
936 else if (isDIGIT(*s)) {
937 if (s[1] != ']') {
938 if (isDIGIT(s[1]) && s[2] == ']')
939 weight -= 10;
940 }
941 else
942 weight -= 100;
943 }
944 for (; s < send; s++) {
945 last_un_char = un_char;
946 un_char = (unsigned char)*s;
947 switch (*s) {
948 case '@':
949 case '&':
950 case '$':
951 weight -= seen[un_char] * 10;
952 if (isALNUM(s[1])) {
8903cb82 953 scan_ident(s, send, tmpbuf, sizeof tmpbuf, FALSE);
a0d0e21e 954 if ((int)strlen(tmpbuf) > 1 && gv_fetchpv(tmpbuf,FALSE, SVt_PV))
79072805
LW
955 weight -= 100;
956 else
957 weight -= 10;
958 }
959 else if (*s == '$' && s[1] &&
93a17b20
LW
960 strchr("[#!%*<>()-=",s[1])) {
961 if (/*{*/ strchr("])} =",s[2]))
79072805
LW
962 weight -= 10;
963 else
964 weight -= 1;
965 }
966 break;
967 case '\\':
968 un_char = 254;
969 if (s[1]) {
93a17b20 970 if (strchr("wds]",s[1]))
79072805
LW
971 weight += 100;
972 else if (seen['\''] || seen['"'])
973 weight += 1;
93a17b20 974 else if (strchr("rnftbxcav",s[1]))
79072805
LW
975 weight += 40;
976 else if (isDIGIT(s[1])) {
977 weight += 40;
978 while (s[1] && isDIGIT(s[1]))
979 s++;
980 }
981 }
982 else
983 weight += 100;
984 break;
985 case '-':
986 if (s[1] == '\\')
987 weight += 50;
93a17b20 988 if (strchr("aA01! ",last_un_char))
79072805 989 weight += 30;
93a17b20 990 if (strchr("zZ79~",s[1]))
79072805
LW
991 weight += 30;
992 break;
993 default:
93a17b20 994 if (!isALNUM(last_un_char) && !strchr("$@&",last_un_char) &&
79072805
LW
995 isALPHA(*s) && s[1] && isALPHA(s[1])) {
996 char *d = tmpbuf;
997 while (isALPHA(*s))
998 *d++ = *s++;
999 *d = '\0';
1000 if (keyword(tmpbuf, d - tmpbuf))
1001 weight -= 150;
1002 }
1003 if (un_char == last_un_char + 1)
1004 weight += 5;
1005 weight -= seen[un_char];
1006 break;
1007 }
1008 seen[un_char]++;
1009 }
1010 if (weight >= 0) /* probably a character class */
1011 return FALSE;
1012 }
1013
1014 return TRUE;
1015}
ffed7fef 1016
a0d0e21e
LW
1017static int
1018intuit_method(start,gv)
1019char *start;
1020GV *gv;
1021{
1022 char *s = start + (*start == '$');
8903cb82 1023 char tmpbuf[sizeof tokenbuf];
a0d0e21e
LW
1024 STRLEN len;
1025 GV* indirgv;
1026
1027 if (gv) {
1028 if (GvIO(gv))
1029 return 0;
8ebc5c01 1030 if (!GvCVu(gv))
a0d0e21e
LW
1031 gv = 0;
1032 }
8903cb82 1033 s = scan_word(s, tmpbuf, sizeof tmpbuf, TRUE, &len);
a0d0e21e
LW
1034 if (*start == '$') {
1035 if (gv || last_lop_op == OP_PRINT || isUPPER(*tokenbuf))
1036 return 0;
1037 s = skipspace(s);
1038 bufptr = start;
1039 expect = XREF;
1040 return *s == '(' ? FUNCMETH : METHOD;
1041 }
1042 if (!keyword(tmpbuf, len)) {
1043 indirgv = gv_fetchpv(tmpbuf,FALSE, SVt_PVCV);
8ebc5c01 1044 if (indirgv && GvCVu(indirgv))
a0d0e21e
LW
1045 return 0;
1046 /* filehandle or package name makes it a method */
89bfa8cd 1047 if (!gv || GvIO(indirgv) || gv_stashpvn(tmpbuf, len, FALSE)) {
a0d0e21e 1048 s = skipspace(s);
55497cff 1049 if ((bufend - s) >= 2 && *s == '=' && *(s+1) == '>')
1050 return 0; /* no assumptions -- "=>" quotes bearword */
a0d0e21e
LW
1051 nextval[nexttoke].opval =
1052 (OP*)newSVOP(OP_CONST, 0,
1053 newSVpv(tmpbuf,0));
1054 nextval[nexttoke].opval->op_private =
1055 OPpCONST_BARE;
1056 expect = XTERM;
1057 force_next(WORD);
1058 bufptr = s;
1059 return *s == '(' ? FUNCMETH : METHOD;
1060 }
1061 }
1062 return 0;
1063}
1064
1065static char*
1066incl_perldb()
1067{
1068 if (perldb) {
1069 char *pdb = getenv("PERL5DB");
1070
1071 if (pdb)
1072 return pdb;
1073 return "BEGIN { require 'perl5db.pl' }";
1074 }
1075 return "";
1076}
1077
1078
16d20bd9
AD
1079/* Encoded script support. filter_add() effectively inserts a
1080 * 'pre-processing' function into the current source input stream.
1081 * Note that the filter function only applies to the current source file
1082 * (e.g., it will not affect files 'require'd or 'use'd by this one).
1083 *
1084 * The datasv parameter (which may be NULL) can be used to pass
1085 * private data to this instance of the filter. The filter function
1086 * can recover the SV using the FILTER_DATA macro and use it to
1087 * store private buffers and state information.
1088 *
1089 * The supplied datasv parameter is upgraded to a PVIO type
1090 * and the IoDIRP field is used to store the function pointer.
1091 * Note that IoTOP_NAME, IoFMT_NAME, IoBOTTOM_NAME, if set for
1092 * private use must be set using malloc'd pointers.
1093 */
1094static int filter_debug = 0;
1095
1096SV *
1097filter_add(funcp, datasv)
1098 filter_t funcp;
1099 SV *datasv;
1100{
1101 if (!funcp){ /* temporary handy debugging hack to be deleted */
1102 filter_debug = atoi((char*)datasv);
1103 return NULL;
1104 }
1105 if (!rsfp_filters)
1106 rsfp_filters = newAV();
1107 if (!datasv)
1108 datasv = newSV(0);
1109 if (!SvUPGRADE(datasv, SVt_PVIO))
1110 die("Can't upgrade filter_add data to SVt_PVIO");
1111 IoDIRP(datasv) = (DIR*)funcp; /* stash funcp into spare field */
1112 if (filter_debug)
ff0cee69 1113 warn("filter_add func %p (%s)", funcp, SvPV(datasv,na));
e50aee73
AD
1114 av_unshift(rsfp_filters, 1);
1115 av_store(rsfp_filters, 0, datasv) ;
16d20bd9
AD
1116 return(datasv);
1117}
1118
1119
1120/* Delete most recently added instance of this filter function. */
a0d0e21e 1121void
16d20bd9
AD
1122filter_del(funcp)
1123 filter_t funcp;
1124{
1125 if (filter_debug)
ff0cee69 1126 warn("filter_del func %p", funcp);
16d20bd9
AD
1127 if (!rsfp_filters || AvFILL(rsfp_filters)<0)
1128 return;
1129 /* if filter is on top of stack (usual case) just pop it off */
e50aee73
AD
1130 if (IoDIRP(FILTER_DATA(0)) == (void*)funcp){
1131 /* sv_free(av_pop(rsfp_filters)); */
1132 sv_free(av_shift(rsfp_filters));
1133
16d20bd9
AD
1134 return;
1135 }
1136 /* we need to search for the correct entry and clear it */
1137 die("filter_del can only delete in reverse order (currently)");
1138}
1139
1140
1141/* Invoke the n'th filter function for the current rsfp. */
1142I32
1143filter_read(idx, buf_sv, maxlen)
1144 int idx;
1145 SV *buf_sv;
1146 int maxlen; /* 0 = read one text line */
a0d0e21e 1147{
16d20bd9
AD
1148 filter_t funcp;
1149 SV *datasv = NULL;
e50aee73 1150
16d20bd9
AD
1151 if (!rsfp_filters)
1152 return -1;
1153 if (idx > AvFILL(rsfp_filters)){ /* Any more filters? */
1154 /* Provide a default input filter to make life easy. */
1155 /* Note that we append to the line. This is handy. */
16d20bd9
AD
1156 if (filter_debug)
1157 warn("filter_read %d: from rsfp\n", idx);
1158 if (maxlen) {
1159 /* Want a block */
1160 int len ;
1161 int old_len = SvCUR(buf_sv) ;
1162
1163 /* ensure buf_sv is large enough */
1164 SvGROW(buf_sv, old_len + maxlen) ;
760ac839
LW
1165 if ((len = PerlIO_read(rsfp, SvPVX(buf_sv) + old_len, maxlen)) <= 0){
1166 if (PerlIO_error(rsfp))
37120919
AD
1167 return -1; /* error */
1168 else
1169 return 0 ; /* end of file */
1170 }
16d20bd9
AD
1171 SvCUR_set(buf_sv, old_len + len) ;
1172 } else {
1173 /* Want a line */
37120919 1174 if (sv_gets(buf_sv, rsfp, SvCUR(buf_sv)) == NULL) {
760ac839 1175 if (PerlIO_error(rsfp))
37120919
AD
1176 return -1; /* error */
1177 else
1178 return 0 ; /* end of file */
1179 }
16d20bd9
AD
1180 }
1181 return SvCUR(buf_sv);
1182 }
1183 /* Skip this filter slot if filter has been deleted */
1184 if ( (datasv = FILTER_DATA(idx)) == &sv_undef){
1185 if (filter_debug)
1186 warn("filter_read %d: skipped (filter deleted)\n", idx);
1187 return FILTER_READ(idx+1, buf_sv, maxlen); /* recurse */
1188 }
1189 /* Get function pointer hidden within datasv */
1190 funcp = (filter_t)IoDIRP(datasv);
1191 if (filter_debug)
ff0cee69 1192 warn("filter_read %d: via function %p (%s)\n",
16d20bd9
AD
1193 idx, funcp, SvPV(datasv,na));
1194 /* Call function. The function is expected to */
1195 /* call "FILTER_READ(idx+1, buf_sv)" first. */
37120919 1196 /* Return: <0:error, =0:eof, >0:not eof */
16d20bd9
AD
1197 return (*funcp)(idx, buf_sv, maxlen);
1198}
1199
1200static char *
fd049845 1201filter_gets(sv,fp, append)
16d20bd9 1202register SV *sv;
760ac839 1203register PerlIO *fp;
fd049845 1204STRLEN append;
16d20bd9
AD
1205{
1206 if (rsfp_filters) {
1207
55497cff 1208 if (!append)
1209 SvCUR_set(sv, 0); /* start with empty line */
16d20bd9
AD
1210 if (FILTER_READ(0, sv, 0) > 0)
1211 return ( SvPVX(sv) ) ;
1212 else
1213 return Nullch ;
1214 }
1215 else
fd049845 1216 return (sv_gets(sv, fp, append));
16d20bd9 1217
a0d0e21e
LW
1218}
1219
1220
748a9306
LW
1221#ifdef DEBUGGING
1222 static char* exp_name[] =
a0d0e21e 1223 { "OPERATOR", "TERM", "REF", "STATE", "BLOCK", "TERMBLOCK" };
748a9306 1224#endif
463ee0b2 1225
71be2cbc 1226EXT int yychar; /* last token */
463ee0b2 1227
2f3197b3 1228int
378cc40b
LW
1229yylex()
1230{
79072805 1231 register char *s;
378cc40b 1232 register char *d;
79072805 1233 register I32 tmp;
463ee0b2 1234 STRLEN len;
a687059c 1235
bbce6d69 1236 if (pending_ident) {
1237 char pit = pending_ident;
1238 pending_ident = 0;
1239
1240 if (in_my) {
1241 if (strchr(tokenbuf,':'))
1242 croak(no_myglob,tokenbuf);
1243 yylval.opval = newOP(OP_PADANY, 0);
1244 yylval.opval->op_targ = pad_allocmy(tokenbuf);
1245 return PRIVATEREF;
1246 }
1247
1248 if (!strchr(tokenbuf,':') && (tmp = pad_findmy(tokenbuf))) {
1249 if (last_lop_op == OP_SORT &&
1250 tokenbuf[0] == '$' &&
1251 (tokenbuf[1] == 'a' || tokenbuf[1] == 'b')
1252 && !tokenbuf[2])
1253 {
1254 for (d = in_eval ? oldoldbufptr : linestart;
1255 d < bufend && *d != '\n';
1256 d++)
1257 {
1258 if (strnEQ(d,"<=>",3) || strnEQ(d,"cmp",3)) {
1259 croak("Can't use \"my %s\" in sort comparison",
1260 tokenbuf);
1261 }
1262 }
1263 }
1264
1265 yylval.opval = newOP(OP_PADANY, 0);
1266 yylval.opval->op_targ = tmp;
1267 return PRIVATEREF;
1268 }
1269
1270 /* Force them to make up their mind on "@foo". */
1271 if (pit == '@' && lex_state != LEX_NORMAL && !lex_brackets) {
1272 GV *gv = gv_fetchpv(tokenbuf+1, FALSE, SVt_PVAV);
46fc3d4c 1273 if (!gv || ((tokenbuf[0] == '@') ? !GvAV(gv) : !GvHV(gv)))
1274 yyerror(form("In string, %s now must be written as \\%s",
1275 tokenbuf, tokenbuf));
bbce6d69 1276 }
1277
1278 yylval.opval = (OP*)newSVOP(OP_CONST, 0, newSVpv(tokenbuf+1, 0));
1279 yylval.opval->op_private = OPpCONST_ENTERED;
1280 gv_fetchpv(tokenbuf+1, in_eval ? GV_ADDMULTI : TRUE,
1281 ((tokenbuf[0] == '$') ? SVt_PV
1282 : (tokenbuf[0] == '@') ? SVt_PVAV
1283 : SVt_PVHV));
1284 return WORD;
1285 }
1286
79072805
LW
1287 switch (lex_state) {
1288#ifdef COMMENTARY
1289 case LEX_NORMAL: /* Some compilers will produce faster */
1290 case LEX_INTERPNORMAL: /* code if we comment these out. */
1291 break;
1292#endif
1293
1294 case LEX_KNOWNEXT:
1295 nexttoke--;
1296 yylval = nextval[nexttoke];
463ee0b2 1297 if (!nexttoke) {
79072805 1298 lex_state = lex_defer;
463ee0b2 1299 expect = lex_expect;
a0d0e21e 1300 lex_defer = LEX_NORMAL;
463ee0b2 1301 }
79072805
LW
1302 return(nexttype[nexttoke]);
1303
1304 case LEX_INTERPCASEMOD:
1305#ifdef DEBUGGING
1306 if (bufptr != bufend && *bufptr != '\\')
463ee0b2 1307 croak("panic: INTERPCASEMOD");
79072805
LW
1308#endif
1309 if (bufptr == bufend || bufptr[1] == 'E') {
a0d0e21e 1310 char oldmod;
79072805 1311 if (lex_casemods) {
a0d0e21e
LW
1312 oldmod = lex_casestack[--lex_casemods];
1313 lex_casestack[lex_casemods] = '\0';
1314 if (bufptr != bufend && strchr("LUQ", oldmod)) {
1315 bufptr += 2;
1316 lex_state = LEX_INTERPCONCAT;
1317 }
79072805
LW
1318 return ')';
1319 }
a0d0e21e
LW
1320 if (bufptr != bufend)
1321 bufptr += 2;
1322 lex_state = LEX_INTERPCONCAT;
79072805
LW
1323 return yylex();
1324 }
1325 else {
1326 s = bufptr + 1;
1327 if (strnEQ(s, "L\\u", 3) || strnEQ(s, "U\\l", 3))
1328 tmp = *s, *s = s[2], s[2] = tmp; /* misordered... */
a0d0e21e
LW
1329 if (strchr("LU", *s) &&
1330 (strchr(lex_casestack, 'L') || strchr(lex_casestack, 'U')))
1331 {
1332 lex_casestack[--lex_casemods] = '\0';
1333 return ')';
1334 }
1335 if (lex_casemods > 10) {
89bfa8cd 1336 char* newlb = Renew(lex_casestack, lex_casemods + 2, char);
a0d0e21e
LW
1337 if (newlb != lex_casestack) {
1338 SAVEFREEPV(newlb);
1339 lex_casestack = newlb;
1340 }
1341 }
1342 lex_casestack[lex_casemods++] = *s;
1343 lex_casestack[lex_casemods] = '\0';
79072805
LW
1344 lex_state = LEX_INTERPCONCAT;
1345 nextval[nexttoke].ival = 0;
1346 force_next('(');
1347 if (*s == 'l')
1348 nextval[nexttoke].ival = OP_LCFIRST;
1349 else if (*s == 'u')
1350 nextval[nexttoke].ival = OP_UCFIRST;
1351 else if (*s == 'L')
1352 nextval[nexttoke].ival = OP_LC;
1353 else if (*s == 'U')
1354 nextval[nexttoke].ival = OP_UC;
a0d0e21e
LW
1355 else if (*s == 'Q')
1356 nextval[nexttoke].ival = OP_QUOTEMETA;
79072805 1357 else
463ee0b2 1358 croak("panic: yylex");
79072805
LW
1359 bufptr = s + 1;
1360 force_next(FUNC);
1361 if (lex_starts) {
1362 s = bufptr;
463ee0b2 1363 lex_starts = 0;
79072805
LW
1364 Aop(OP_CONCAT);
1365 }
1366 else
1367 return yylex();
1368 }
1369
55497cff 1370 case LEX_INTERPPUSH:
1371 return sublex_push();
1372
79072805
LW
1373 case LEX_INTERPSTART:
1374 if (bufptr == bufend)
1375 return sublex_done();
1376 expect = XTERM;
1377 lex_dojoin = (*bufptr == '@');
1378 lex_state = LEX_INTERPNORMAL;
1379 if (lex_dojoin) {
1380 nextval[nexttoke].ival = 0;
1381 force_next(',');
a0d0e21e 1382 force_ident("\"", '$');
79072805
LW
1383 nextval[nexttoke].ival = 0;
1384 force_next('$');
1385 nextval[nexttoke].ival = 0;
1386 force_next('(');
1387 nextval[nexttoke].ival = OP_JOIN; /* emulate join($", ...) */
1388 force_next(FUNC);
1389 }
1390 if (lex_starts++) {
1391 s = bufptr;
1392 Aop(OP_CONCAT);
1393 }
68dc0745 1394 return yylex();
79072805
LW
1395
1396 case LEX_INTERPENDMAYBE:
1397 if (intuit_more(bufptr)) {
1398 lex_state = LEX_INTERPNORMAL; /* false alarm, more expr */
1399 break;
1400 }
1401 /* FALL THROUGH */
1402
1403 case LEX_INTERPEND:
1404 if (lex_dojoin) {
1405 lex_dojoin = FALSE;
1406 lex_state = LEX_INTERPCONCAT;
1407 return ')';
1408 }
1409 /* FALLTHROUGH */
1410 case LEX_INTERPCONCAT:
1411#ifdef DEBUGGING
1412 if (lex_brackets)
463ee0b2 1413 croak("panic: INTERPCONCAT");
79072805
LW
1414#endif
1415 if (bufptr == bufend)
1416 return sublex_done();
1417
ed6116ce 1418 if (SvIVX(linestr) == '\'') {
79072805
LW
1419 SV *sv = newSVsv(linestr);
1420 if (!lex_inpat)
1421 sv = q(sv);
1422 yylval.opval = (OP*)newSVOP(OP_CONST, 0, sv);
1423 s = bufend;
1424 }
1425 else {
1426 s = scan_const(bufptr);
1427 if (*s == '\\')
1428 lex_state = LEX_INTERPCASEMOD;
1429 else
1430 lex_state = LEX_INTERPSTART;
1431 }
1432
1433 if (s != bufptr) {
1434 nextval[nexttoke] = yylval;
463ee0b2 1435 expect = XTERM;
79072805
LW
1436 force_next(THING);
1437 if (lex_starts++)
1438 Aop(OP_CONCAT);
1439 else {
1440 bufptr = s;
1441 return yylex();
1442 }
1443 }
1444
1445 return yylex();
a0d0e21e
LW
1446 case LEX_FORMLINE:
1447 lex_state = LEX_NORMAL;
1448 s = scan_formline(bufptr);
1449 if (!lex_formbrack)
1450 goto rightbracket;
1451 OPERATOR(';');
79072805
LW
1452 }
1453
1454 s = bufptr;
a687059c
LW
1455 oldoldbufptr = oldbufptr;
1456 oldbufptr = s;
79072805 1457 DEBUG_p( {
760ac839 1458 PerlIO_printf(PerlIO_stderr(), "### Tokener expecting %s at %s\n", exp_name[expect], s);
79072805 1459 } )
463ee0b2
LW
1460
1461 retry:
378cc40b
LW
1462 switch (*s) {
1463 default:
54310121 1464 croak("Unrecognized character \\%03o", *s & 255);
e929a76b
LW
1465 case 4:
1466 case 26:
1467 goto fake_eof; /* emulate EOF on ^D or ^Z */
378cc40b 1468 case 0:
463ee0b2 1469 if (!rsfp) {
55497cff 1470 last_uni = 0;
1471 last_lop = 0;
463ee0b2
LW
1472 if (lex_brackets)
1473 yyerror("Missing right bracket");
79072805 1474 TOKEN(0);
463ee0b2 1475 }
a687059c
LW
1476 if (s++ < bufend)
1477 goto retry; /* ignore stray nulls */
2f3197b3 1478 last_uni = 0;
79072805 1479 last_lop = 0;
a0d0e21e 1480 if (!in_eval && !preambled) {
79072805 1481 preambled = TRUE;
a0d0e21e 1482 sv_setpv(linestr,incl_perldb());
91b7def8 1483 if (SvCUR(linestr))
1484 sv_catpv(linestr,";");
1485 if (preambleav){
1486 while(AvFILL(preambleav) >= 0) {
1487 SV *tmpsv = av_shift(preambleav);
1488 sv_catsv(linestr, tmpsv);
1489 sv_catpv(linestr, ";");
1490 sv_free(tmpsv);
1491 }
1492 sv_free((SV*)preambleav);
1493 preambleav = NULL;
1494 }
79072805
LW
1495 if (minus_n || minus_p) {
1496 sv_catpv(linestr, "LINE: while (<>) {");
1497 if (minus_l)
a0d0e21e 1498 sv_catpv(linestr,"chomp;");
8fd239a7
CS
1499 if (minus_a) {
1500 GV* gv = gv_fetchpv("::F", TRUE, SVt_PVAV);
1501 if (gv)
1502 GvIMPORTED_AV_on(gv);
1503 if (minus_F) {
54310121 1504 if (strchr("/'\"", *splitstr)
1505 && strchr(splitstr + 1, *splitstr))
46fc3d4c 1506 sv_catpvf(linestr, "@F=split(%s);", splitstr);
54310121 1507 else {
1508 char delim;
1509 s = "'~#\200\1'"; /* surely one char is unused...*/
1510 while (s[1] && strchr(splitstr, *s)) s++;
1511 delim = *s;
46fc3d4c 1512 sv_catpvf(linestr, "@F=split(%s%c",
1513 "q" + (delim == '\''), delim);
1514 for (s = splitstr; *s; s++) {
54310121 1515 if (*s == '\\')
46fc3d4c 1516 sv_catpvn(linestr, "\\", 1);
1517 sv_catpvn(linestr, s, 1);
54310121 1518 }
46fc3d4c 1519 sv_catpvf(linestr, "%c);", delim);
54310121 1520 }
2304df62
AD
1521 }
1522 else
1523 sv_catpv(linestr,"@F=split(' ');");
1524 }
79072805 1525 }
a0d0e21e 1526 sv_catpv(linestr, "\n");
fd049845 1527 oldoldbufptr = oldbufptr = s = linestart = SvPVX(linestr);
463ee0b2 1528 bufend = SvPVX(linestr) + SvCUR(linestr);
84902520 1529 if (PERLDB_LINE && curstash != debstash) {
a0d0e21e
LW
1530 SV *sv = NEWSV(85,0);
1531
1532 sv_upgrade(sv, SVt_PVMG);
1533 sv_setsv(sv,linestr);
1534 av_store(GvAV(curcop->cop_filegv),(I32)curcop->cop_line,sv);
1535 }
79072805 1536 goto retry;
a687059c 1537 }
e929a76b 1538 do {
fd049845 1539 if ((s = filter_gets(linestr, rsfp, 0)) == Nullch) {
e929a76b 1540 fake_eof:
395c3793 1541 if (rsfp) {
a0d0e21e 1542 if (preprocess && !in_eval)
79072805 1543 (void)my_pclose(rsfp);
760ac839
LW
1544 else if ((PerlIO *)rsfp == PerlIO_stdin())
1545 PerlIO_clearerr(rsfp);
395c3793 1546 else
760ac839 1547 (void)PerlIO_close(rsfp);
395c3793
LW
1548 rsfp = Nullfp;
1549 }
a0d0e21e 1550 if (!in_eval && (minus_n || minus_p)) {
79072805
LW
1551 sv_setpv(linestr,minus_p ? ";}continue{print" : "");
1552 sv_catpv(linestr,";}");
fd049845 1553 oldoldbufptr = oldbufptr = s = linestart = SvPVX(linestr);
463ee0b2 1554 bufend = SvPVX(linestr) + SvCUR(linestr);
e929a76b
LW
1555 minus_n = minus_p = 0;
1556 goto retry;
1557 }
fd049845 1558 oldoldbufptr = oldbufptr = s = linestart = SvPVX(linestr);
79072805
LW
1559 sv_setpv(linestr,"");
1560 TOKEN(';'); /* not infinite loop because rsfp is NULL now */
378cc40b 1561 }
a0d0e21e
LW
1562 if (doextract) {
1563 if (*s == '#' && s[1] == '!' && instr(s,"perl"))
1564 doextract = FALSE;
1565
1566 /* Incest with pod. */
1567 if (*s == '=' && strnEQ(s, "=cut", 4)) {
1568 sv_setpv(linestr, "");
fd049845 1569 oldoldbufptr = oldbufptr = s = linestart = SvPVX(linestr);
a0d0e21e
LW
1570 bufend = SvPVX(linestr) + SvCUR(linestr);
1571 doextract = FALSE;
1572 }
1573 }
463ee0b2 1574 incline(s);
e929a76b 1575 } while (doextract);
fd049845 1576 oldoldbufptr = oldbufptr = bufptr = linestart = s;
84902520 1577 if (PERLDB_LINE && curstash != debstash) {
79072805 1578 SV *sv = NEWSV(85,0);
a687059c 1579
93a17b20 1580 sv_upgrade(sv, SVt_PVMG);
79072805
LW
1581 sv_setsv(sv,linestr);
1582 av_store(GvAV(curcop->cop_filegv),(I32)curcop->cop_line,sv);
a687059c 1583 }
463ee0b2 1584 bufend = SvPVX(linestr) + SvCUR(linestr);
79072805
LW
1585 if (curcop->cop_line == 1) {
1586 while (s < bufend && isSPACE(*s))
1587 s++;
a0d0e21e 1588 if (*s == ':' && s[1] != ':') /* for csh execing sh scripts */
79072805 1589 s++;
44a8e56a 1590 d = Nullch;
1591 if (!in_eval) {
1592 if (*s == '#' && *(s+1) == '!')
1593 d = s + 2;
1594#ifdef ALTERNATE_SHEBANG
1595 else {
1596 static char as[] = ALTERNATE_SHEBANG;
1597 if (*s == as[0] && strnEQ(s, as, sizeof(as) - 1))
1598 d = s + (sizeof(as) - 1);
1599 }
1600#endif /* ALTERNATE_SHEBANG */
1601 }
1602 if (d) {
b8378b72 1603 char *ipath;
774d564b 1604 char *ipathend;
b8378b72 1605
774d564b 1606 while (isSPACE(*d))
b8378b72
CS
1607 d++;
1608 ipath = d;
774d564b 1609 while (*d && !isSPACE(*d))
1610 d++;
1611 ipathend = d;
1612
1613#ifdef ARG_ZERO_IS_SCRIPT
1614 if (ipathend > ipath) {
1615 /*
1616 * HP-UX (at least) sets argv[0] to the script name,
1617 * which makes $^X incorrect. And Digital UNIX and Linux,
1618 * at least, set argv[0] to the basename of the Perl
1619 * interpreter. So, having found "#!", we'll set it right.
1620 */
1621 SV *x = GvSV(gv_fetchpv("\030", TRUE, SVt_PV));
1622 assert(SvPOK(x) || SvGMAGICAL(x));
9607fc9c 1623 if (sv_eq(x, GvSV(curcop->cop_filegv))) {
774d564b 1624 sv_setpvn(x, ipath, ipathend - ipath);
9607fc9c 1625 SvSETMAGIC(x);
1626 }
774d564b 1627 TAINT_NOT; /* $^X is always tainted, but that's OK */
8ebc5c01 1628 }
774d564b 1629#endif /* ARG_ZERO_IS_SCRIPT */
b8378b72
CS
1630
1631 /*
1632 * Look for options.
1633 */
748a9306
LW
1634 d = instr(s,"perl -");
1635 if (!d)
1636 d = instr(s,"perl");
44a8e56a 1637#ifdef ALTERNATE_SHEBANG
1638 /*
1639 * If the ALTERNATE_SHEBANG on this system starts with a
1640 * character that can be part of a Perl expression, then if
1641 * we see it but not "perl", we're probably looking at the
1642 * start of Perl code, not a request to hand off to some
1643 * other interpreter. Similarly, if "perl" is there, but
1644 * not in the first 'word' of the line, we assume the line
1645 * contains the start of the Perl program.
44a8e56a 1646 */
1647 if (d && *s != '#') {
774d564b 1648 char *c = ipath;
44a8e56a 1649 while (*c && !strchr("; \t\r\n\f\v#", *c))
1650 c++;
1651 if (c < d)
1652 d = Nullch; /* "perl" not in first word; ignore */
1653 else
1654 *s = '#'; /* Don't try to parse shebang line */
1655 }
774d564b 1656#endif /* ALTERNATE_SHEBANG */
748a9306 1657 if (!d &&
44a8e56a 1658 *s == '#' &&
774d564b 1659 ipathend > ipath &&
748a9306
LW
1660 !minus_c &&
1661 !instr(s,"indir") &&
1662 instr(origargv[0],"perl"))
1663 {
9f68db38 1664 char **newargv;
9f68db38 1665
774d564b 1666 *ipathend = '\0';
1667 s = ipathend + 1;
de3bb511 1668 while (s < bufend && isSPACE(*s))
9f68db38
LW
1669 s++;
1670 if (s < bufend) {
1671 Newz(899,newargv,origargc+3,char*);
1672 newargv[1] = s;
de3bb511 1673 while (s < bufend && !isSPACE(*s))
9f68db38
LW
1674 s++;
1675 *s = '\0';
1676 Copy(origargv+1, newargv+2, origargc+1, char*);
1677 }
1678 else
1679 newargv = origargv;
774d564b 1680 newargv[0] = ipath;
1681 execv(ipath, newargv);
1682 croak("Can't exec %s", ipath);
9f68db38 1683 }
748a9306 1684 if (d) {
ba6d6ac9
CS
1685 U32 oldpdb = perldb;
1686 bool oldn = minus_n;
1687 bool oldp = minus_p;
748a9306
LW
1688
1689 while (*d && !isSPACE(*d)) d++;
89bfa8cd 1690 while (*d == ' ' || *d == '\t') d++;
748a9306
LW
1691
1692 if (*d++ == '-') {
8cc95fdb 1693 do {
1694 if (*d == 'M' || *d == 'm') {
1695 char *m = d;
1696 while (*d && !isSPACE(*d)) d++;
1697 croak("Too late for \"-%.*s\" option",
1698 (int)(d - m), m);
1699 }
1700 d = moreswitches(d);
1701 } while (d);
84902520 1702 if (PERLDB_LINE && !oldpdb ||
b084f20b 1703 ( minus_n || minus_p ) && !(oldn || oldp) )
1704 /* if we have already added "LINE: while (<>) {",
1705 we must not do it again */
748a9306
LW
1706 {
1707 sv_setpv(linestr, "");
fd049845 1708 oldoldbufptr = oldbufptr = s = linestart = SvPVX(linestr);
748a9306
LW
1709 bufend = SvPVX(linestr) + SvCUR(linestr);
1710 preambled = FALSE;
84902520 1711 if (PERLDB_LINE)
748a9306
LW
1712 (void)gv_fetchfile(origfilename);
1713 goto retry;
1714 }
a0d0e21e 1715 }
79072805 1716 }
9f68db38 1717 }
79072805 1718 }
85e6fe83 1719 if (lex_formbrack && lex_brackets <= lex_formbrack) {
a0d0e21e
LW
1720 bufptr = s;
1721 lex_state = LEX_FORMLINE;
1722 return yylex();
ae986130 1723 }
378cc40b 1724 goto retry;
4fdae800 1725 case '\r':
54310121 1726 warn("Illegal character \\%03o (carriage return)", '\r');
1727 croak(
1728 "(Maybe you didn't strip carriage returns after a network transfer?)\n");
4fdae800 1729 case ' ': case '\t': case '\f': case 013:
378cc40b
LW
1730 s++;
1731 goto retry;
378cc40b 1732 case '#':
e929a76b 1733 case '\n':
79072805 1734 if (lex_state != LEX_NORMAL || (in_eval && !rsfp)) {
a687059c
LW
1735 d = bufend;
1736 while (s < d && *s != '\n')
378cc40b 1737 s++;
0f85fab0 1738 if (s < d)
378cc40b 1739 s++;
463ee0b2 1740 incline(s);
85e6fe83 1741 if (lex_formbrack && lex_brackets <= lex_formbrack) {
a0d0e21e
LW
1742 bufptr = s;
1743 lex_state = LEX_FORMLINE;
1744 return yylex();
a687059c 1745 }
378cc40b 1746 }
a687059c 1747 else {
378cc40b 1748 *s = '\0';
a687059c
LW
1749 bufend = s;
1750 }
378cc40b
LW
1751 goto retry;
1752 case '-':
79072805 1753 if (s[1] && isALPHA(s[1]) && !isALNUM(s[2])) {
378cc40b 1754 s++;
748a9306
LW
1755 bufptr = s;
1756 tmp = *s++;
1757
1758 while (s < bufend && (*s == ' ' || *s == '\t'))
1759 s++;
1760
1761 if (strnEQ(s,"=>",2)) {
1762 if (dowarn)
1763 warn("Ambiguous use of -%c => resolved to \"-%c\" =>",
ff0cee69 1764 (int)tmp, (int)tmp);
748a9306
LW
1765 s = force_word(bufptr,WORD,FALSE,FALSE,FALSE);
1766 OPERATOR('-'); /* unary minus */
1767 }
e334a159 1768 last_uni = oldbufptr;
a0d0e21e 1769 last_lop_op = OP_FTEREAD; /* good enough */
748a9306 1770 switch (tmp) {
79072805
LW
1771 case 'r': FTST(OP_FTEREAD);
1772 case 'w': FTST(OP_FTEWRITE);
1773 case 'x': FTST(OP_FTEEXEC);
1774 case 'o': FTST(OP_FTEOWNED);
1775 case 'R': FTST(OP_FTRREAD);
1776 case 'W': FTST(OP_FTRWRITE);
1777 case 'X': FTST(OP_FTREXEC);
1778 case 'O': FTST(OP_FTROWNED);
1779 case 'e': FTST(OP_FTIS);
1780 case 'z': FTST(OP_FTZERO);
1781 case 's': FTST(OP_FTSIZE);
1782 case 'f': FTST(OP_FTFILE);
1783 case 'd': FTST(OP_FTDIR);
1784 case 'l': FTST(OP_FTLINK);
1785 case 'p': FTST(OP_FTPIPE);
1786 case 'S': FTST(OP_FTSOCK);
1787 case 'u': FTST(OP_FTSUID);
1788 case 'g': FTST(OP_FTSGID);
1789 case 'k': FTST(OP_FTSVTX);
1790 case 'b': FTST(OP_FTBLK);
1791 case 'c': FTST(OP_FTCHR);
1792 case 't': FTST(OP_FTTTY);
1793 case 'T': FTST(OP_FTTEXT);
1794 case 'B': FTST(OP_FTBINARY);
85e6fe83
LW
1795 case 'M': gv_fetchpv("\024",TRUE, SVt_PV); FTST(OP_FTMTIME);
1796 case 'A': gv_fetchpv("\024",TRUE, SVt_PV); FTST(OP_FTATIME);
1797 case 'C': gv_fetchpv("\024",TRUE, SVt_PV); FTST(OP_FTCTIME);
378cc40b 1798 default:
ff0cee69 1799 croak("Unrecognized file test: -%c", (int)tmp);
378cc40b
LW
1800 break;
1801 }
1802 }
a687059c
LW
1803 tmp = *s++;
1804 if (*s == tmp) {
1805 s++;
79072805
LW
1806 if (expect == XOPERATOR)
1807 TERM(POSTDEC);
1808 else
1809 OPERATOR(PREDEC);
1810 }
1811 else if (*s == '>') {
1812 s++;
1813 s = skipspace(s);
1814 if (isIDFIRST(*s)) {
a0d0e21e 1815 s = force_word(s,METHOD,FALSE,TRUE,FALSE);
463ee0b2 1816 TOKEN(ARROW);
79072805 1817 }
748a9306
LW
1818 else if (*s == '$')
1819 OPERATOR(ARROW);
463ee0b2 1820 else
748a9306 1821 TERM(ARROW);
a687059c 1822 }
79072805
LW
1823 if (expect == XOPERATOR)
1824 Aop(OP_SUBTRACT);
1825 else {
2f3197b3
LW
1826 if (isSPACE(*s) || !isSPACE(*bufptr))
1827 check_uni();
79072805 1828 OPERATOR('-'); /* unary minus */
2f3197b3 1829 }
79072805 1830
378cc40b 1831 case '+':
a687059c
LW
1832 tmp = *s++;
1833 if (*s == tmp) {
378cc40b 1834 s++;
79072805
LW
1835 if (expect == XOPERATOR)
1836 TERM(POSTINC);
1837 else
1838 OPERATOR(PREINC);
378cc40b 1839 }
79072805
LW
1840 if (expect == XOPERATOR)
1841 Aop(OP_ADD);
1842 else {
2f3197b3
LW
1843 if (isSPACE(*s) || !isSPACE(*bufptr))
1844 check_uni();
a687059c 1845 OPERATOR('+');
2f3197b3 1846 }
a687059c 1847
378cc40b 1848 case '*':
79072805 1849 if (expect != XOPERATOR) {
8903cb82 1850 s = scan_ident(s, bufend, tokenbuf, sizeof tokenbuf, TRUE);
463ee0b2 1851 expect = XOPERATOR;
a0d0e21e
LW
1852 force_ident(tokenbuf, '*');
1853 if (!*tokenbuf)
1854 PREREF('*');
79072805 1855 TERM('*');
a687059c 1856 }
79072805
LW
1857 s++;
1858 if (*s == '*') {
a687059c 1859 s++;
79072805 1860 PWop(OP_POW);
a687059c 1861 }
79072805
LW
1862 Mop(OP_MULTIPLY);
1863
378cc40b 1864 case '%':
bbce6d69 1865 if (expect == XOPERATOR) {
1866 ++s;
1867 Mop(OP_MODULO);
a687059c 1868 }
bbce6d69 1869 tokenbuf[0] = '%';
8903cb82 1870 s = scan_ident(s, bufend, tokenbuf + 1, sizeof tokenbuf - 1, TRUE);
bbce6d69 1871 if (!tokenbuf[1]) {
1872 if (s == bufend)
1873 yyerror("Final % should be \\% or %name");
1874 PREREF('%');
1875 }
1876 pending_ident = '%';
1877 TERM('%');
a687059c 1878
378cc40b 1879 case '^':
79072805 1880 s++;
a0d0e21e 1881 BOop(OP_BIT_XOR);
79072805
LW
1882 case '[':
1883 lex_brackets++;
1884 /* FALL THROUGH */
378cc40b 1885 case '~':
378cc40b 1886 case ',':
378cc40b
LW
1887 tmp = *s++;
1888 OPERATOR(tmp);
a0d0e21e
LW
1889 case ':':
1890 if (s[1] == ':') {
1891 len = 0;
1892 goto just_a_word;
1893 }
1894 s++;
1895 OPERATOR(':');
8990e307
LW
1896 case '(':
1897 s++;
a0d0e21e 1898 if (last_lop == oldoldbufptr || last_uni == oldoldbufptr)
8990e307 1899 oldbufptr = oldoldbufptr; /* allow print(STDOUT 123) */
a0d0e21e
LW
1900 else
1901 expect = XTERM;
1902 TOKEN('(');
378cc40b 1903 case ';':
79072805
LW
1904 if (curcop->cop_line < copline)
1905 copline = curcop->cop_line;
378cc40b
LW
1906 tmp = *s++;
1907 OPERATOR(tmp);
1908 case ')':
378cc40b 1909 tmp = *s++;
16d20bd9
AD
1910 s = skipspace(s);
1911 if (*s == '{')
1912 PREBLOCK(tmp);
378cc40b 1913 TERM(tmp);
79072805
LW
1914 case ']':
1915 s++;
463ee0b2
LW
1916 if (lex_brackets <= 0)
1917 yyerror("Unmatched right bracket");
1918 else
1919 --lex_brackets;
79072805 1920 if (lex_state == LEX_INTERPNORMAL) {
463ee0b2 1921 if (lex_brackets == 0) {
a0d0e21e 1922 if (*s != '[' && *s != '{' && (*s != '-' || s[1] != '>'))
79072805
LW
1923 lex_state = LEX_INTERPEND;
1924 }
1925 }
4633a7c4 1926 TERM(']');
79072805
LW
1927 case '{':
1928 leftbracket:
79072805 1929 s++;
8990e307 1930 if (lex_brackets > 100) {
89bfa8cd 1931 char* newlb = Renew(lex_brackstack, lex_brackets + 1, char);
8990e307
LW
1932 if (newlb != lex_brackstack) {
1933 SAVEFREEPV(newlb);
1934 lex_brackstack = newlb;
1935 }
1936 }
a0d0e21e
LW
1937 switch (expect) {
1938 case XTERM:
1939 if (lex_formbrack) {
1940 s--;
1941 PRETERMBLOCK(DO);
1942 }
1943 if (oldoldbufptr == last_lop)
1944 lex_brackstack[lex_brackets++] = XTERM;
1945 else
1946 lex_brackstack[lex_brackets++] = XOPERATOR;
79072805 1947 OPERATOR(HASHBRACK);
a0d0e21e 1948 case XOPERATOR:
748a9306
LW
1949 while (s < bufend && (*s == ' ' || *s == '\t'))
1950 s++;
44a8e56a 1951 d = s;
1952 tokenbuf[0] = '\0';
1953 if (d < bufend && *d == '-') {
1954 tokenbuf[0] = '-';
1955 d++;
1956 while (d < bufend && (*d == ' ' || *d == '\t'))
1957 d++;
1958 }
1959 if (d < bufend && isIDFIRST(*d)) {
8903cb82 1960 d = scan_word(d, tokenbuf + 1, sizeof tokenbuf - 1,
1961 FALSE, &len);
748a9306
LW
1962 while (d < bufend && (*d == ' ' || *d == '\t'))
1963 d++;
1964 if (*d == '}') {
44a8e56a 1965 char minus = (tokenbuf[0] == '-');
748a9306 1966 if (dowarn &&
44a8e56a 1967 (keyword(tokenbuf + 1, len) ||
1968 (minus && len == 1 && isALPHA(tokenbuf[1])) ||
1969 perl_get_cv(tokenbuf + 1, FALSE) ))
748a9306 1970 warn("Ambiguous use of {%s} resolved to {\"%s\"}",
44a8e56a 1971 tokenbuf + !minus, tokenbuf + !minus);
1972 s = force_word(s + minus, WORD, FALSE, TRUE, FALSE);
1973 if (minus)
1974 force_next('-');
748a9306
LW
1975 }
1976 }
1977 /* FALL THROUGH */
1978 case XBLOCK:
a0d0e21e 1979 lex_brackstack[lex_brackets++] = XSTATE;
2304df62 1980 expect = XSTATE;
a0d0e21e
LW
1981 break;
1982 case XTERMBLOCK:
1983 lex_brackstack[lex_brackets++] = XOPERATOR;
1984 expect = XSTATE;
1985 break;
1986 default: {
1987 char *t;
1988 if (oldoldbufptr == last_lop)
1989 lex_brackstack[lex_brackets++] = XTERM;
1990 else
1991 lex_brackstack[lex_brackets++] = XOPERATOR;
1992 s = skipspace(s);
1993 if (*s == '}')
1994 OPERATOR(HASHBRACK);
b8a4b1be
GS
1995 /* This hack serves to disambiguate a pair of curlies
1996 * as being a block or an anon hash. Normally, expectation
1997 * determines that, but in cases where we're not in a
1998 * position to expect anything in particular (like inside
1999 * eval"") we have to resolve the ambiguity. This code
2000 * covers the case where the first term in the curlies is a
2001 * quoted string. Most other cases need to be explicitly
2002 * disambiguated by prepending a `+' before the opening
2003 * curly in order to force resolution as an anon hash.
2004 *
2005 * XXX should probably propagate the outer expectation
2006 * into eval"" to rely less on this hack, but that could
2007 * potentially break current behavior of eval"".
2008 * GSAR 97-07-21
2009 */
2010 t = s;
2011 if (*s == '\'' || *s == '"' || *s == '`') {
2012 /* common case: get past first string, handling escapes */
2013 for (t++; t < bufend && *t != *s;)
2014 if (*t++ == '\\' && (*t == '\\' || *t == *s))
2015 t++;
2016 t++;
2017 }
2018 else if (*s == 'q') {
2019 if (++t < bufend
2020 && (!isALNUM(*t)
2021 || ((*t == 'q' || *t == 'x') && ++t < bufend
2022 && !isALNUM(*t)))) {
2023 char *tmps;
2024 char open, close, term;
2025 I32 brackets = 1;
2026
2027 while (t < bufend && isSPACE(*t))
2028 t++;
2029 term = *t;
2030 open = term;
2031 if (term && (tmps = strchr("([{< )]}> )]}>",term)))
2032 term = tmps[5];
2033 close = term;
2034 if (open == close)
2035 for (t++; t < bufend; t++) {
6d07e5e9 2036 if (*t == '\\' && t+1 < bufend && open != '\\')
b8a4b1be 2037 t++;
6d07e5e9 2038 else if (*t == open)
b8a4b1be
GS
2039 break;
2040 }
2041 else
2042 for (t++; t < bufend; t++) {
6d07e5e9 2043 if (*t == '\\' && t+1 < bufend)
b8a4b1be 2044 t++;
6d07e5e9 2045 else if (*t == close && --brackets <= 0)
b8a4b1be
GS
2046 break;
2047 else if (*t == open)
2048 brackets++;
2049 }
2050 }
2051 t++;
a0d0e21e 2052 }
b8a4b1be
GS
2053 else if (isALPHA(*s)) {
2054 for (t++; t < bufend && isALNUM(*t); t++) ;
a0d0e21e 2055 }
a0d0e21e
LW
2056 while (t < bufend && isSPACE(*t))
2057 t++;
b8a4b1be
GS
2058 /* if comma follows first term, call it an anon hash */
2059 /* XXX it could be a comma expression with loop modifiers */
2060 if (t < bufend && ((*t == ',' && (*s == 'q' || !isLOWER(*s)))
2061 || (*t == '=' && t[1] == '>')))
a0d0e21e
LW
2062 OPERATOR(HASHBRACK);
2063 if (expect == XREF)
2064 expect = XTERM;
2065 else {
2066 lex_brackstack[lex_brackets-1] = XSTATE;
2067 expect = XSTATE;
2068 }
8990e307 2069 }
a0d0e21e 2070 break;
463ee0b2 2071 }
79072805
LW
2072 yylval.ival = curcop->cop_line;
2073 if (isSPACE(*s) || *s == '#')
2074 copline = NOLINE; /* invalidate current command line number */
79072805 2075 TOKEN('{');
378cc40b 2076 case '}':
79072805
LW
2077 rightbracket:
2078 s++;
463ee0b2
LW
2079 if (lex_brackets <= 0)
2080 yyerror("Unmatched right bracket");
2081 else
2082 expect = (expectation)lex_brackstack[--lex_brackets];
85e6fe83
LW
2083 if (lex_brackets < lex_formbrack)
2084 lex_formbrack = 0;
79072805 2085 if (lex_state == LEX_INTERPNORMAL) {
463ee0b2 2086 if (lex_brackets == 0) {
79072805
LW
2087 if (lex_fakebrack) {
2088 lex_state = LEX_INTERPEND;
2089 bufptr = s;
2090 return yylex(); /* ignore fake brackets */
2091 }
fa83b5b6 2092 if (*s == '-' && s[1] == '>')
2093 lex_state = LEX_INTERPENDMAYBE;
2094 else if (*s != '[' && *s != '{')
79072805
LW
2095 lex_state = LEX_INTERPEND;
2096 }
2097 }
748a9306
LW
2098 if (lex_brackets < lex_fakebrack) {
2099 bufptr = s;
2100 lex_fakebrack = 0;
2101 return yylex(); /* ignore fake brackets */
2102 }
79072805
LW
2103 force_next('}');
2104 TOKEN(';');
378cc40b
LW
2105 case '&':
2106 s++;
2107 tmp = *s++;
2108 if (tmp == '&')
a0d0e21e 2109 AOPERATOR(ANDAND);
378cc40b 2110 s--;
463ee0b2 2111 if (expect == XOPERATOR) {
fd049845 2112 if (dowarn && isALPHA(*s) && bufptr == linestart) {
463ee0b2
LW
2113 curcop->cop_line--;
2114 warn(warn_nosemi);
2115 curcop->cop_line++;
2116 }
79072805 2117 BAop(OP_BIT_AND);
463ee0b2 2118 }
79072805 2119
8903cb82 2120 s = scan_ident(s - 1, bufend, tokenbuf, sizeof tokenbuf, TRUE);
463ee0b2
LW
2121 if (*tokenbuf) {
2122 expect = XOPERATOR;
a0d0e21e 2123 force_ident(tokenbuf, '&');
463ee0b2 2124 }
79072805
LW
2125 else
2126 PREREF('&');
c07a80fd 2127 yylval.ival = (OPpENTERSUB_AMPER<<8);
79072805
LW
2128 TERM('&');
2129
378cc40b
LW
2130 case '|':
2131 s++;
2132 tmp = *s++;
2133 if (tmp == '|')
a0d0e21e 2134 AOPERATOR(OROR);
378cc40b 2135 s--;
79072805 2136 BOop(OP_BIT_OR);
378cc40b
LW
2137 case '=':
2138 s++;
2139 tmp = *s++;
2140 if (tmp == '=')
79072805
LW
2141 Eop(OP_EQ);
2142 if (tmp == '>')
2143 OPERATOR(',');
378cc40b 2144 if (tmp == '~')
79072805 2145 PMop(OP_MATCH);
463ee0b2 2146 if (dowarn && tmp && isSPACE(*s) && strchr("+-*/%.^&|<",tmp))
ff0cee69 2147 warn("Reversed %c= operator",(int)tmp);
378cc40b 2148 s--;
748a9306 2149 if (expect == XSTATE && isALPHA(tmp) &&
fd049845 2150 (s == linestart+1 || s[-2] == '\n') )
748a9306 2151 {
a5f75d66
AD
2152 if (in_eval && !rsfp) {
2153 d = bufend;
2154 while (s < d) {
2155 if (*s++ == '\n') {
2156 incline(s);
2157 if (strnEQ(s,"=cut",4)) {
2158 s = strchr(s,'\n');
2159 if (s)
2160 s++;
2161 else
2162 s = d;
2163 incline(s);
2164 goto retry;
2165 }
2166 }
2167 }
2168 goto retry;
2169 }
a0d0e21e
LW
2170 s = bufend;
2171 doextract = TRUE;
2172 goto retry;
2173 }
2174 if (lex_brackets < lex_formbrack) {
2175 char *t;
2176 for (t = s; *t == ' ' || *t == '\t'; t++) ;
2177 if (*t == '\n' || *t == '#') {
2178 s--;
2179 expect = XBLOCK;
2180 goto leftbracket;
2181 }
79072805 2182 }
a0d0e21e
LW
2183 yylval.ival = 0;
2184 OPERATOR(ASSIGNOP);
378cc40b
LW
2185 case '!':
2186 s++;
2187 tmp = *s++;
2188 if (tmp == '=')
79072805 2189 Eop(OP_NE);
378cc40b 2190 if (tmp == '~')
79072805 2191 PMop(OP_NOT);
378cc40b
LW
2192 s--;
2193 OPERATOR('!');
2194 case '<':
79072805 2195 if (expect != XOPERATOR) {
93a17b20 2196 if (s[1] != '<' && !strchr(s,'>'))
2f3197b3 2197 check_uni();
79072805
LW
2198 if (s[1] == '<')
2199 s = scan_heredoc(s);
2200 else
2201 s = scan_inputsymbol(s);
2202 TERM(sublex_start());
378cc40b
LW
2203 }
2204 s++;
2205 tmp = *s++;
2206 if (tmp == '<')
79072805 2207 SHop(OP_LEFT_SHIFT);
395c3793
LW
2208 if (tmp == '=') {
2209 tmp = *s++;
2210 if (tmp == '>')
79072805 2211 Eop(OP_NCMP);
395c3793 2212 s--;
79072805 2213 Rop(OP_LE);
395c3793 2214 }
378cc40b 2215 s--;
79072805 2216 Rop(OP_LT);
378cc40b
LW
2217 case '>':
2218 s++;
2219 tmp = *s++;
2220 if (tmp == '>')
79072805 2221 SHop(OP_RIGHT_SHIFT);
378cc40b 2222 if (tmp == '=')
79072805 2223 Rop(OP_GE);
378cc40b 2224 s--;
79072805 2225 Rop(OP_GT);
378cc40b
LW
2226
2227 case '$':
bbce6d69 2228 CLINE;
2229
2230 if (expect == XOPERATOR) {
2231 if (lex_formbrack && lex_brackets == lex_formbrack) {
2232 expect = XTERM;
2233 depcom();
2234 return ','; /* grandfather non-comma-format format */
8990e307 2235 }
bbce6d69 2236 }
2237
2238 if (s[1] == '#' && (isALPHA(s[2]) || strchr("_{$:", s[2]))) {
2239 if (expect == XOPERATOR)
2240 no_op("Array length", bufptr);
2241 tokenbuf[0] = '@';
8903cb82 2242 s = scan_ident(s + 1, bufend, tokenbuf + 1, sizeof tokenbuf - 1,
2243 FALSE);
bbce6d69 2244 if (!tokenbuf[1])
a0d0e21e 2245 PREREF(DOLSHARP);
463ee0b2 2246 expect = XOPERATOR;
bbce6d69 2247 pending_ident = '#';
463ee0b2 2248 TOKEN(DOLSHARP);
79072805 2249 }
bbce6d69 2250
2251 if (expect == XOPERATOR)
2252 no_op("Scalar", bufptr);
2253 tokenbuf[0] = '$';
8903cb82 2254 s = scan_ident(s, bufend, tokenbuf + 1, sizeof tokenbuf - 1, FALSE);
bbce6d69 2255 if (!tokenbuf[1]) {
2256 if (s == bufend)
2257 yyerror("Final $ should be \\$ or $name");
2258 PREREF('$');
8990e307 2259 }
a0d0e21e 2260
bbce6d69 2261 /* This kludge not intended to be bulletproof. */
2262 if (tokenbuf[1] == '[' && !tokenbuf[2]) {
2263 yylval.opval = newSVOP(OP_CONST, 0,
2264 newSViv((IV)compiling.cop_arybase));
2265 yylval.opval->op_private = OPpCONST_ARYBASE;
2266 TERM(THING);
2267 }
2268
ff68c719 2269 d = s;
2270 if (lex_state == LEX_NORMAL)
2271 s = skipspace(s);
2272
bbce6d69 2273 if ((expect != XREF || oldoldbufptr == last_lop) && intuit_more(s)) {
2274 char *t;
2275 if (*s == '[') {
2276 tokenbuf[0] = '@';
2277 if (dowarn) {
2278 for(t = s + 1;
2279 isSPACE(*t) || isALNUM(*t) || *t == '$';
2280 t++) ;
a0d0e21e
LW
2281 if (*t++ == ',') {
2282 bufptr = skipspace(bufptr);
bbce6d69 2283 while (t < bufend && *t != ']')
2284 t++;
a0d0e21e 2285 warn("Multidimensional syntax %.*s not supported",
bbce6d69 2286 (t - bufptr) + 1, bufptr);
a0d0e21e
LW
2287 }
2288 }
bbce6d69 2289 }
2290 else if (*s == '{') {
2291 tokenbuf[0] = '%';
2292 if (dowarn && strEQ(tokenbuf+1, "SIG") &&
2293 (t = strchr(s, '}')) && (t = strchr(t, '=')))
2294 {
8903cb82 2295 char tmpbuf[sizeof tokenbuf];
a0d0e21e
LW
2296 STRLEN len;
2297 for (t++; isSPACE(*t); t++) ;
748a9306 2298 if (isIDFIRST(*t)) {
8903cb82 2299 t = scan_word(t, tmpbuf, sizeof tmpbuf, TRUE, &len);
748a9306
LW
2300 if (*t != '(' && perl_get_cv(tmpbuf, FALSE))
2301 warn("You need to quote \"%s\"", tmpbuf);
2302 }
93a17b20
LW
2303 }
2304 }
2f3197b3 2305 }
bbce6d69 2306
2307 expect = XOPERATOR;
ff68c719 2308 if (lex_state == LEX_NORMAL && isSPACE(*d)) {
bbce6d69 2309 bool islop = (last_lop == oldoldbufptr);
bbce6d69 2310 if (!islop || last_lop_op == OP_GREPSTART)
2311 expect = XOPERATOR;
2312 else if (strchr("$@\"'`q", *s))
2313 expect = XTERM; /* e.g. print $fh "foo" */
2314 else if (strchr("&*<%", *s) && isIDFIRST(s[1]))
2315 expect = XTERM; /* e.g. print $fh &sub */
68dc0745 2316 else if (isIDFIRST(*s)) {
8903cb82 2317 char tmpbuf[sizeof tokenbuf];
2318 scan_word(s, tmpbuf, sizeof tmpbuf, TRUE, &len);
84902520
TB
2319 if (tmp = keyword(tmpbuf, len)) {
2320 /* binary operators exclude handle interpretations */
2321 switch (tmp) {
2322 case -KEY_x:
2323 case -KEY_eq:
2324 case -KEY_ne:
2325 case -KEY_gt:
2326 case -KEY_lt:
2327 case -KEY_ge:
2328 case -KEY_le:
2329 case -KEY_cmp:
2330 break;
2331 default:
2332 expect = XTERM; /* e.g. print $fh length() */
2333 break;
2334 }
2335 }
68dc0745 2336 else {
2337 GV *gv = gv_fetchpv(tmpbuf, FALSE, SVt_PVCV);
2338 if (gv && GvCVu(gv))
2339 expect = XTERM; /* e.g. print $fh subr() */
2340 }
2341 }
bbce6d69 2342 else if (isDIGIT(*s))
2343 expect = XTERM; /* e.g. print $fh 3 */
2344 else if (*s == '.' && isDIGIT(s[1]))
2345 expect = XTERM; /* e.g. print $fh .3 */
2346 else if (strchr("/?-+", *s) && !isSPACE(s[1]))
2347 expect = XTERM; /* e.g. print $fh -1 */
2348 else if (*s == '<' && s[1] == '<' && !isSPACE(s[2]))
2349 expect = XTERM; /* print $fh <<"EOF" */
2350 }
2351 pending_ident = '$';
79072805 2352 TOKEN('$');
378cc40b
LW
2353
2354 case '@':
8990e307 2355 if (expect == XOPERATOR)
bbce6d69 2356 no_op("Array", s);
2357 tokenbuf[0] = '@';
8903cb82 2358 s = scan_ident(s, bufend, tokenbuf + 1, sizeof tokenbuf - 1, FALSE);
bbce6d69 2359 if (!tokenbuf[1]) {
2360 if (s == bufend)
2361 yyerror("Final @ should be \\@ or @name");
2362 PREREF('@');
2363 }
ff68c719 2364 if (lex_state == LEX_NORMAL)
2365 s = skipspace(s);
bbce6d69 2366 if ((expect != XREF || oldoldbufptr == last_lop) && intuit_more(s)) {
2367 if (*s == '{')
2368 tokenbuf[0] = '%';
a0d0e21e
LW
2369
2370 /* Warn about @ where they meant $. */
2371 if (dowarn) {
2372 if (*s == '[' || *s == '{') {
2373 char *t = s + 1;
2374 while (*t && (isALNUM(*t) || strchr(" \t$#+-'\"", *t)))
2375 t++;
2376 if (*t == '}' || *t == ']') {
2377 t++;
2378 bufptr = skipspace(bufptr);
2379 warn("Scalar value %.*s better written as $%.*s",
2380 t-bufptr, bufptr, t-bufptr-1, bufptr+1);
2381 }
93a17b20
LW
2382 }
2383 }
463ee0b2 2384 }
bbce6d69 2385 pending_ident = '@';
79072805 2386 TERM('@');
378cc40b
LW
2387
2388 case '/': /* may either be division or pattern */
2389 case '?': /* may either be conditional or pattern */
79072805 2390 if (expect != XOPERATOR) {
2f3197b3 2391 check_uni();
79072805
LW
2392 s = scan_pat(s);
2393 TERM(sublex_start());
378cc40b
LW
2394 }
2395 tmp = *s++;
a687059c 2396 if (tmp == '/')
79072805 2397 Mop(OP_DIVIDE);
378cc40b
LW
2398 OPERATOR(tmp);
2399
2400 case '.':
748a9306 2401 if (lex_formbrack && lex_brackets == lex_formbrack && s[1] == '\n' &&
fd049845 2402 (s == linestart || s[-1] == '\n') ) {
85e6fe83 2403 lex_formbrack = 0;
8990e307 2404 expect = XSTATE;
79072805
LW
2405 goto rightbracket;
2406 }
2407 if (expect == XOPERATOR || !isDIGIT(s[1])) {
378cc40b 2408 tmp = *s++;
a687059c
LW
2409 if (*s == tmp) {
2410 s++;
2f3197b3
LW
2411 if (*s == tmp) {
2412 s++;
79072805 2413 yylval.ival = OPf_SPECIAL;
2f3197b3
LW
2414 }
2415 else
79072805 2416 yylval.ival = 0;
378cc40b 2417 OPERATOR(DOTDOT);
a687059c 2418 }
79072805 2419 if (expect != XOPERATOR)
2f3197b3 2420 check_uni();
79072805 2421 Aop(OP_CONCAT);
378cc40b
LW
2422 }
2423 /* FALL THROUGH */
2424 case '0': case '1': case '2': case '3': case '4':
2425 case '5': case '6': case '7': case '8': case '9':
79072805 2426 s = scan_num(s);
8990e307
LW
2427 if (expect == XOPERATOR)
2428 no_op("Number",s);
79072805
LW
2429 TERM(THING);
2430
2431 case '\'':
8990e307 2432 s = scan_str(s);
463ee0b2 2433 if (expect == XOPERATOR) {
a0d0e21e
LW
2434 if (lex_formbrack && lex_brackets == lex_formbrack) {
2435 expect = XTERM;
2436 depcom();
2437 return ','; /* grandfather non-comma-format format */
2438 }
463ee0b2 2439 else
8990e307 2440 no_op("String",s);
463ee0b2 2441 }
79072805 2442 if (!s)
85e6fe83 2443 missingterm((char*)0);
79072805
LW
2444 yylval.ival = OP_CONST;
2445 TERM(sublex_start());
2446
2447 case '"':
8990e307 2448 s = scan_str(s);
463ee0b2 2449 if (expect == XOPERATOR) {
a0d0e21e
LW
2450 if (lex_formbrack && lex_brackets == lex_formbrack) {
2451 expect = XTERM;
2452 depcom();
2453 return ','; /* grandfather non-comma-format format */
2454 }
463ee0b2 2455 else
8990e307 2456 no_op("String",s);
463ee0b2 2457 }
79072805 2458 if (!s)
85e6fe83 2459 missingterm((char*)0);
4633a7c4
LW
2460 yylval.ival = OP_CONST;
2461 for (d = SvPV(lex_stuff, len); len; len--, d++) {
2462 if (*d == '$' || *d == '@' || *d == '\\') {
2463 yylval.ival = OP_STRINGIFY;
2464 break;
2465 }
2466 }
79072805
LW
2467 TERM(sublex_start());
2468
2469 case '`':
2470 s = scan_str(s);
8990e307
LW
2471 if (expect == XOPERATOR)
2472 no_op("Backticks",s);
79072805 2473 if (!s)
85e6fe83 2474 missingterm((char*)0);
79072805
LW
2475 yylval.ival = OP_BACKTICK;
2476 set_csh();
2477 TERM(sublex_start());
2478
2479 case '\\':
2480 s++;
748a9306
LW
2481 if (dowarn && lex_inwhat && isDIGIT(*s))
2482 warn("Can't use \\%c to mean $%c in expression", *s, *s);
8990e307
LW
2483 if (expect == XOPERATOR)
2484 no_op("Backslash",s);
79072805
LW
2485 OPERATOR(REFGEN);
2486
2487 case 'x':
2488 if (isDIGIT(s[1]) && expect == XOPERATOR) {
2489 s++;
2490 Mop(OP_REPEAT);
2f3197b3 2491 }
79072805
LW
2492 goto keylookup;
2493
378cc40b 2494 case '_':
79072805
LW
2495 case 'a': case 'A':
2496 case 'b': case 'B':
2497 case 'c': case 'C':
2498 case 'd': case 'D':
2499 case 'e': case 'E':
2500 case 'f': case 'F':
2501 case 'g': case 'G':
2502 case 'h': case 'H':
2503 case 'i': case 'I':
2504 case 'j': case 'J':
2505 case 'k': case 'K':
2506 case 'l': case 'L':
2507 case 'm': case 'M':
2508 case 'n': case 'N':
2509 case 'o': case 'O':
2510 case 'p': case 'P':
2511 case 'q': case 'Q':
2512 case 'r': case 'R':
2513 case 's': case 'S':
2514 case 't': case 'T':
2515 case 'u': case 'U':
2516 case 'v': case 'V':
2517 case 'w': case 'W':
2518 case 'X':
2519 case 'y': case 'Y':
2520 case 'z': case 'Z':
2521
2522 keylookup:
748a9306 2523 bufptr = s;
8903cb82 2524 s = scan_word(s, tokenbuf, sizeof tokenbuf, FALSE, &len);
8ebc5c01 2525
2526 /* Some keywords can be followed by any delimiter, including ':' */
2527 tmp = (len == 1 && strchr("msyq", tokenbuf[0]) ||
2528 len == 2 && ((tokenbuf[0] == 't' && tokenbuf[1] == 'r') ||
2529 (tokenbuf[0] == 'q' &&
2530 strchr("qwx", tokenbuf[1]))));
2531
2532 /* x::* is just a word, unless x is "CORE" */
2533 if (!tmp && *s == ':' && s[1] == ':' && strNE(tokenbuf, "CORE"))
4633a7c4
LW
2534 goto just_a_word;
2535
3643fb5f
CS
2536 d = s;
2537 while (d < bufend && isSPACE(*d))
2538 d++; /* no comments skipped here, or s### is misparsed */
2539
2540 /* Is this a label? */
8ebc5c01 2541 if (!tmp && expect == XSTATE
2542 && d < bufend && *d == ':' && *(d + 1) != ':') {
2543 s = d + 1;
2544 yylval.pval = savepv(tokenbuf);
2545 CLINE;
2546 TOKEN(LABEL);
3643fb5f
CS
2547 }
2548
2549 /* Check for keywords */
a0d0e21e 2550 tmp = keyword(tokenbuf, len);
748a9306
LW
2551
2552 /* Is this a word before a => operator? */
748a9306
LW
2553 if (strnEQ(d,"=>",2)) {
2554 CLINE;
2555 if (dowarn && (tmp || perl_get_cv(tokenbuf, FALSE)))
2556 warn("Ambiguous use of %s => resolved to \"%s\" =>",
2557 tokenbuf, tokenbuf);
2558 yylval.opval = (OP*)newSVOP(OP_CONST, 0, newSVpv(tokenbuf,0));
2559 yylval.opval->op_private = OPpCONST_BARE;
2560 TERM(WORD);
2561 }
2562
a0d0e21e
LW
2563 if (tmp < 0) { /* second-class keyword? */
2564 GV* gv;
2565 if (expect != XOPERATOR &&
a5f75d66
AD
2566 (*s != ':' || s[1] != ':') &&
2567 (gv = gv_fetchpv(tokenbuf, FALSE, SVt_PVCV)) &&
2568 GvIMPORTED_CV(gv))
a0d0e21e
LW
2569 {
2570 tmp = 0;
2571 }
2572 else
2573 tmp = -tmp;
2574 }
2575
2576 reserved_word:
2577 switch (tmp) {
79072805
LW
2578
2579 default: /* not a keyword */
93a17b20
LW
2580 just_a_word: {
2581 GV *gv;
96e4d5b1 2582 SV *sv;
748a9306 2583 char lastchar = (bufptr == oldoldbufptr ? 0 : bufptr[-1]);
8990e307
LW
2584
2585 /* Get the rest if it looks like a package qualifier */
2586
a0d0e21e 2587 if (*s == '\'' || *s == ':' && s[1] == ':') {
8903cb82 2588 s = scan_word(s, tokenbuf + len, sizeof tokenbuf - len,
2589 TRUE, &len);
a0d0e21e
LW
2590 if (!len)
2591 croak("Bad name after %s::", tokenbuf);
2592 }
8990e307 2593
3643fb5f 2594 if (expect == XOPERATOR) {
fd049845 2595 if (bufptr == linestart) {
463ee0b2
LW
2596 curcop->cop_line--;
2597 warn(warn_nosemi);
2598 curcop->cop_line++;
2599 }
2600 else
54310121 2601 no_op("Bareword",s);
463ee0b2 2602 }
8990e307
LW
2603
2604 /* Look for a subroutine with this name in current package. */
2605
85e6fe83 2606 gv = gv_fetchpv(tokenbuf,FALSE, SVt_PVCV);
8990e307 2607
a0d0e21e
LW
2608 /* Presume this is going to be a bareword of some sort. */
2609
2610 CLINE;
2611 yylval.opval = (OP*)newSVOP(OP_CONST, 0, newSVpv(tokenbuf,0));
2612 yylval.opval->op_private = OPpCONST_BARE;
2613
8990e307
LW
2614 /* See if it's the indirect object for a list operator. */
2615
a0d0e21e
LW
2616 if (oldoldbufptr &&
2617 oldoldbufptr < bufptr &&
2618 (oldoldbufptr == last_lop || oldoldbufptr == last_uni) &&
2619 /* NO SKIPSPACE BEFORE HERE! */
2620 (expect == XREF ||
2621 (opargs[last_lop_op] >> OASHIFT & 7) == OA_FILEREF) )
2622 {
748a9306
LW
2623 bool immediate_paren = *s == '(';
2624
a0d0e21e
LW
2625 /* (Now we can afford to cross potential line boundary.) */
2626 s = skipspace(s);
2627
2628 /* Two barewords in a row may indicate method call. */
2629
2630 if ((isALPHA(*s) || *s == '$') && (tmp=intuit_method(s,gv)))
2631 return tmp;
2632
2633 /* If not a declared subroutine, it's an indirect object. */
2634 /* (But it's an indir obj regardless for sort.) */
2635
8e07c86e 2636 if ((last_lop_op == OP_SORT ||
8ebc5c01 2637 (!immediate_paren && (!gv || !GvCVu(gv))) ) &&
8e07c86e 2638 (last_lop_op != OP_MAPSTART && last_lop_op != OP_GREPSTART)){
748a9306
LW
2639 expect = (last_lop == oldoldbufptr) ? XTERM : XOPERATOR;
2640 goto bareword;
93a17b20
LW
2641 }
2642 }
8990e307
LW
2643
2644 /* If followed by a paren, it's certainly a subroutine. */
2645
2646 expect = XOPERATOR;
2647 s = skipspace(s);
93a17b20 2648 if (*s == '(') {
79072805 2649 CLINE;
96e4d5b1 2650 if (gv && GvCVu(gv)) {
2651 for (d = s + 1; *d == ' ' || *d == '\t'; d++) ;
2652 if (*d == ')' && (sv = cv_const_sv(GvCV(gv)))) {
2653 s = d + 1;
2654 goto its_constant;
2655 }
2656 }
a0d0e21e 2657 nextval[nexttoke].opval = yylval.opval;
463ee0b2 2658 expect = XOPERATOR;
93a17b20 2659 force_next(WORD);
c07a80fd 2660 yylval.ival = 0;
463ee0b2 2661 TOKEN('&');
79072805 2662 }
93a17b20 2663
a0d0e21e 2664 /* If followed by var or block, call it a method (unless sub) */
8990e307 2665
8ebc5c01 2666 if ((*s == '$' || *s == '{') && (!gv || !GvCVu(gv))) {
463ee0b2 2667 last_lop = oldbufptr;
8990e307 2668 last_lop_op = OP_METHOD;
93a17b20 2669 PREBLOCK(METHOD);
463ee0b2
LW
2670 }
2671
8990e307
LW
2672 /* If followed by a bareword, see if it looks like indir obj. */
2673
a0d0e21e
LW
2674 if ((isALPHA(*s) || *s == '$') && (tmp = intuit_method(s,gv)))
2675 return tmp;
93a17b20 2676
8990e307
LW
2677 /* Not a method, so call it a subroutine (if defined) */
2678
8ebc5c01 2679 if (gv && GvCVu(gv)) {
46fc3d4c 2680 CV* cv;
748a9306 2681 if (lastchar == '-')
c2960299 2682 warn("Ambiguous use of -%s resolved as -&%s()",
748a9306 2683 tokenbuf, tokenbuf);
8990e307 2684 last_lop = oldbufptr;
a0d0e21e 2685 last_lop_op = OP_ENTERSUB;
89bfa8cd 2686 /* Check for a constant sub */
46fc3d4c 2687 cv = GvCV(gv);
96e4d5b1 2688 if ((sv = cv_const_sv(cv))) {
2689 its_constant:
2690 SvREFCNT_dec(((SVOP*)yylval.opval)->op_sv);
2691 ((SVOP*)yylval.opval)->op_sv = SvREFCNT_inc(sv);
2692 yylval.opval->op_private = 0;
2693 TOKEN(WORD);
89bfa8cd 2694 }
2695
a5f75d66
AD
2696 /* Resolve to GV now. */
2697 op_free(yylval.opval);
2698 yylval.opval = newCVREF(0, newGVOP(OP_GV, 0, gv));
4633a7c4
LW
2699 /* Is there a prototype? */
2700 if (SvPOK(cv)) {
2701 STRLEN len;
2702 char *proto = SvPV((SV*)cv, len);
2703 if (!len)
2704 TERM(FUNC0SUB);
2705 if (strEQ(proto, "$"))
2706 OPERATOR(UNIOPSUB);
2707 if (*proto == '&' && *s == '{') {
2708 sv_setpv(subname,"__ANON__");
2709 PREBLOCK(LSTOPSUB);
2710 }
2711 }
a5f75d66 2712 nextval[nexttoke].opval = yylval.opval;
8990e307
LW
2713 expect = XTERM;
2714 force_next(WORD);
2715 TOKEN(NOAMP);
2716 }
748a9306
LW
2717
2718 if (hints & HINT_STRICT_SUBS &&
2719 lastchar != '-' &&
a0d0e21e 2720 strnNE(s,"->",2) &&
9b01e405 2721 last_lop_op != OP_TRUNCATE && /* S/F prototype in opcode.pl */
a0d0e21e
LW
2722 last_lop_op != OP_ACCEPT &&
2723 last_lop_op != OP_PIPE_OP &&
2724 last_lop_op != OP_SOCKPAIR)
2725 {
2726 warn(
2727 "Bareword \"%s\" not allowed while \"strict subs\" in use",
85e6fe83
LW
2728 tokenbuf);
2729 ++error_count;
2730 }
8990e307
LW
2731
2732 /* Call it a bare word */
2733
748a9306
LW
2734 bareword:
2735 if (dowarn) {
2736 if (lastchar != '-') {
2737 for (d = tokenbuf; *d && isLOWER(*d); d++) ;
2738 if (!*d)
2739 warn(warn_reserved, tokenbuf);
2740 }
2741 }
2742 if (lastchar && strchr("*%&", lastchar)) {
2743 warn("Operator or semicolon missing before %c%s",
2744 lastchar, tokenbuf);
c2960299 2745 warn("Ambiguous use of %c resolved as operator %c",
748a9306
LW
2746 lastchar, lastchar);
2747 }
93a17b20 2748 TOKEN(WORD);
79072805 2749 }
79072805 2750
68dc0745 2751 case KEY___FILE__:
46fc3d4c 2752 yylval.opval = (OP*)newSVOP(OP_CONST, 0,
2753 newSVsv(GvSV(curcop->cop_filegv)));
2754 TERM(THING);
2755
79072805 2756 case KEY___LINE__:
46fc3d4c 2757 yylval.opval = (OP*)newSVOP(OP_CONST, 0,
2758 newSVpvf("%ld", (long)curcop->cop_line));
79072805 2759 TERM(THING);
68dc0745 2760
2761 case KEY___PACKAGE__:
2762 yylval.opval = (OP*)newSVOP(OP_CONST, 0,
2763 (curstash
2764 ? newSVsv(curstname)
2765 : &sv_undef));
2766 TERM(THING);
79072805 2767
e50aee73 2768 case KEY___DATA__:
79072805
LW
2769 case KEY___END__: {
2770 GV *gv;
79072805
LW
2771
2772 /*SUPPRESS 560*/
a5f75d66 2773 if (rsfp && (!in_eval || tokenbuf[2] == 'D')) {
e50aee73
AD
2774 char *pname = "main";
2775 if (tokenbuf[2] == 'D')
2776 pname = HvNAME(curstash ? curstash : defstash);
46fc3d4c 2777 gv = gv_fetchpv(form("%s::DATA", pname), TRUE, SVt_PVIO);
a5f75d66 2778 GvMULTI_on(gv);
79072805 2779 if (!GvIO(gv))
a0d0e21e
LW
2780 GvIOp(gv) = newIO();
2781 IoIFP(GvIOp(gv)) = rsfp;
2782#if defined(HAS_FCNTL) && defined(F_SETFD)
2783 {
760ac839 2784 int fd = PerlIO_fileno(rsfp);
a0d0e21e
LW
2785 fcntl(fd,F_SETFD,fd >= 3);
2786 }
79072805 2787#endif
fd049845 2788 /* Mark this internal pseudo-handle as clean */
2789 IoFLAGS(GvIOp(gv)) |= IOf_UNTAINT;
79072805 2790 if (preprocess)
a0d0e21e 2791 IoTYPE(GvIOp(gv)) = '|';
760ac839 2792 else if ((PerlIO*)rsfp == PerlIO_stdin())
a0d0e21e 2793 IoTYPE(GvIOp(gv)) = '-';
79072805 2794 else
a0d0e21e 2795 IoTYPE(GvIOp(gv)) = '<';
79072805
LW
2796 rsfp = Nullfp;
2797 }
2798 goto fake_eof;
e929a76b 2799 }
de3bb511 2800
8990e307 2801 case KEY_AUTOLOAD:
ed6116ce 2802 case KEY_DESTROY:
79072805
LW
2803 case KEY_BEGIN:
2804 case KEY_END:
a0d0e21e 2805 if (expect == XSTATE) {
93a17b20
LW
2806 s = bufptr;
2807 goto really_sub;
79072805
LW
2808 }
2809 goto just_a_word;
2810
a0d0e21e
LW
2811 case KEY_CORE:
2812 if (*s == ':' && s[1] == ':') {
2813 s += 2;
748a9306 2814 d = s;
8903cb82 2815 s = scan_word(s, tokenbuf, sizeof tokenbuf, FALSE, &len);
a0d0e21e
LW
2816 tmp = keyword(tokenbuf, len);
2817 if (tmp < 0)
2818 tmp = -tmp;
2819 goto reserved_word;
2820 }
2821 goto just_a_word;
2822
463ee0b2
LW
2823 case KEY_abs:
2824 UNI(OP_ABS);
2825
79072805
LW
2826 case KEY_alarm:
2827 UNI(OP_ALARM);
2828
2829 case KEY_accept:
a0d0e21e 2830 LOP(OP_ACCEPT,XTERM);
79072805 2831
463ee0b2
LW
2832 case KEY_and:
2833 OPERATOR(ANDOP);
2834
79072805 2835 case KEY_atan2:
a0d0e21e 2836 LOP(OP_ATAN2,XTERM);
85e6fe83 2837
79072805 2838 case KEY_bind:
a0d0e21e 2839 LOP(OP_BIND,XTERM);
79072805
LW
2840
2841 case KEY_binmode:
2842 UNI(OP_BINMODE);
2843
2844 case KEY_bless:
a0d0e21e 2845 LOP(OP_BLESS,XTERM);
79072805
LW
2846
2847 case KEY_chop:
2848 UNI(OP_CHOP);
2849
2850 case KEY_continue:
2851 PREBLOCK(CONTINUE);
2852
2853 case KEY_chdir:
85e6fe83 2854 (void)gv_fetchpv("ENV",TRUE, SVt_PVHV); /* may use HOME */
79072805
LW
2855 UNI(OP_CHDIR);
2856
2857 case KEY_close:
2858 UNI(OP_CLOSE);
2859
2860 case KEY_closedir:
2861 UNI(OP_CLOSEDIR);
2862
2863 case KEY_cmp:
2864 Eop(OP_SCMP);
2865
2866 case KEY_caller:
2867 UNI(OP_CALLER);
2868
2869 case KEY_crypt:
2870#ifdef FCRYPT
de3bb511
LW
2871 if (!cryptseen++)
2872 init_des();
a687059c 2873#endif
a0d0e21e 2874 LOP(OP_CRYPT,XTERM);
79072805
LW
2875
2876 case KEY_chmod:
748a9306
LW
2877 if (dowarn) {
2878 for (d = s; d < bufend && (isSPACE(*d) || *d == '('); d++) ;
2879 if (*d != '0' && isDIGIT(*d))
2880 yywarn("chmod: mode argument is missing initial 0");
2881 }
a0d0e21e 2882 LOP(OP_CHMOD,XTERM);
79072805
LW
2883
2884 case KEY_chown:
a0d0e21e 2885 LOP(OP_CHOWN,XTERM);
79072805
LW
2886
2887 case KEY_connect:
a0d0e21e 2888 LOP(OP_CONNECT,XTERM);
79072805 2889
463ee0b2
LW
2890 case KEY_chr:
2891 UNI(OP_CHR);
2892
79072805
LW
2893 case KEY_cos:
2894 UNI(OP_COS);
2895
2896 case KEY_chroot:
2897 UNI(OP_CHROOT);
2898
2899 case KEY_do:
2900 s = skipspace(s);
2901 if (*s == '{')
a0d0e21e 2902 PRETERMBLOCK(DO);
79072805 2903 if (*s != '\'')
a0d0e21e 2904 s = force_word(s,WORD,FALSE,TRUE,FALSE);
378cc40b 2905 OPERATOR(DO);
79072805
LW
2906
2907 case KEY_die:
a0d0e21e
LW
2908 hints |= HINT_BLOCK_SCOPE;
2909 LOP(OP_DIE,XTERM);
79072805
LW
2910
2911 case KEY_defined:
2912 UNI(OP_DEFINED);
2913
2914 case KEY_delete:
a0d0e21e 2915 UNI(OP_DELETE);
79072805
LW
2916
2917 case KEY_dbmopen:
a0d0e21e
LW
2918 gv_fetchpv("AnyDBM_File::ISA", GV_ADDMULTI, SVt_PVAV);
2919 LOP(OP_DBMOPEN,XTERM);
79072805
LW
2920
2921 case KEY_dbmclose:
2922 UNI(OP_DBMCLOSE);
2923
2924 case KEY_dump:
a0d0e21e 2925 s = force_word(s,WORD,TRUE,FALSE,FALSE);
79072805
LW
2926 LOOPX(OP_DUMP);
2927
2928 case KEY_else:
2929 PREBLOCK(ELSE);
2930
2931 case KEY_elsif:
2932 yylval.ival = curcop->cop_line;
2933 OPERATOR(ELSIF);
2934
2935 case KEY_eq:
2936 Eop(OP_SEQ);
2937
a0d0e21e
LW
2938 case KEY_exists:
2939 UNI(OP_EXISTS);
2940
79072805
LW
2941 case KEY_exit:
2942 UNI(OP_EXIT);
2943
2944 case KEY_eval:
79072805 2945 s = skipspace(s);
a0d0e21e 2946 expect = (*s == '{') ? XTERMBLOCK : XTERM;
463ee0b2 2947 UNIBRACK(OP_ENTEREVAL);
79072805
LW
2948
2949 case KEY_eof:
2950 UNI(OP_EOF);
2951
2952 case KEY_exp:
2953 UNI(OP_EXP);
2954
2955 case KEY_each:
2956 UNI(OP_EACH);
2957
2958 case KEY_exec:
2959 set_csh();
a0d0e21e 2960 LOP(OP_EXEC,XREF);
79072805
LW
2961
2962 case KEY_endhostent:
2963 FUN0(OP_EHOSTENT);
2964
2965 case KEY_endnetent:
2966 FUN0(OP_ENETENT);
2967
2968 case KEY_endservent:
2969 FUN0(OP_ESERVENT);
2970
2971 case KEY_endprotoent:
2972 FUN0(OP_EPROTOENT);
2973
2974 case KEY_endpwent:
2975 FUN0(OP_EPWENT);
2976
2977 case KEY_endgrent:
2978 FUN0(OP_EGRENT);
2979
2980 case KEY_for:
2981 case KEY_foreach:
2982 yylval.ival = curcop->cop_line;
55497cff 2983 s = skipspace(s);
2984 if (isIDFIRST(*s)) {
2985 char *p = s;
2986 if ((bufend - p) >= 3 &&
2987 strnEQ(p, "my", 2) && isSPACE(*(p + 2)))
2988 p += 2;
2989 p = skipspace(p);
2990 if (isIDFIRST(*p))
2991 croak("Missing $ on loop variable");
2992 }
79072805
LW
2993 OPERATOR(FOR);
2994
2995 case KEY_formline:
a0d0e21e 2996 LOP(OP_FORMLINE,XTERM);
79072805
LW
2997
2998 case KEY_fork:
2999 FUN0(OP_FORK);
3000
3001 case KEY_fcntl:
a0d0e21e 3002 LOP(OP_FCNTL,XTERM);
79072805
LW
3003
3004 case KEY_fileno:
3005 UNI(OP_FILENO);
3006
3007 case KEY_flock:
a0d0e21e 3008 LOP(OP_FLOCK,XTERM);
79072805
LW
3009
3010 case KEY_gt:
3011 Rop(OP_SGT);
3012
3013 case KEY_ge:
3014 Rop(OP_SGE);
3015
3016 case KEY_grep:
a0d0e21e 3017 LOP(OP_GREPSTART, *s == '(' ? XTERM : XREF);
79072805
LW
3018
3019 case KEY_goto:
a0d0e21e 3020 s = force_word(s,WORD,TRUE,FALSE,FALSE);
79072805
LW
3021 LOOPX(OP_GOTO);
3022
3023 case KEY_gmtime:
3024 UNI(OP_GMTIME);
3025
3026 case KEY_getc:
3027 UNI(OP_GETC);
3028
3029 case KEY_getppid:
3030 FUN0(OP_GETPPID);
3031
3032 case KEY_getpgrp:
3033 UNI(OP_GETPGRP);
3034
3035 case KEY_getpriority:
a0d0e21e 3036 LOP(OP_GETPRIORITY,XTERM);
79072805
LW
3037
3038 case KEY_getprotobyname:
3039 UNI(OP_GPBYNAME);
3040
3041 case KEY_getprotobynumber:
a0d0e21e 3042 LOP(OP_GPBYNUMBER,XTERM);
79072805
LW
3043
3044 case KEY_getprotoent:
3045 FUN0(OP_GPROTOENT);
3046
3047 case KEY_getpwent:
3048 FUN0(OP_GPWENT);
3049
3050 case KEY_getpwnam:
ff68c719 3051 UNI(OP_GPWNAM);
79072805
LW
3052
3053 case KEY_getpwuid:
ff68c719 3054 UNI(OP_GPWUID);
79072805
LW
3055
3056 case KEY_getpeername:
3057 UNI(OP_GETPEERNAME);
3058
3059 case KEY_gethostbyname:
3060 UNI(OP_GHBYNAME);
3061
3062 case KEY_gethostbyaddr:
a0d0e21e 3063 LOP(OP_GHBYADDR,XTERM);
79072805
LW
3064
3065 case KEY_gethostent:
3066 FUN0(OP_GHOSTENT);
3067
3068 case KEY_getnetbyname:
3069 UNI(OP_GNBYNAME);
3070
3071 case KEY_getnetbyaddr:
a0d0e21e 3072 LOP(OP_GNBYADDR,XTERM);
79072805
LW
3073
3074 case KEY_getnetent:
3075 FUN0(OP_GNETENT);
3076
3077 case KEY_getservbyname:
a0d0e21e 3078 LOP(OP_GSBYNAME,XTERM);
79072805
LW
3079
3080 case KEY_getservbyport:
a0d0e21e 3081 LOP(OP_GSBYPORT,XTERM);
79072805
LW
3082
3083 case KEY_getservent:
3084 FUN0(OP_GSERVENT);
3085
3086 case KEY_getsockname:
3087 UNI(OP_GETSOCKNAME);
3088
3089 case KEY_getsockopt:
a0d0e21e 3090 LOP(OP_GSOCKOPT,XTERM);
79072805
LW
3091
3092 case KEY_getgrent:
3093 FUN0(OP_GGRENT);
3094
3095 case KEY_getgrnam:
ff68c719 3096 UNI(OP_GGRNAM);
79072805
LW
3097
3098 case KEY_getgrgid:
ff68c719 3099 UNI(OP_GGRGID);
79072805
LW
3100
3101 case KEY_getlogin:
3102 FUN0(OP_GETLOGIN);
3103
93a17b20 3104 case KEY_glob:
a0d0e21e
LW
3105 set_csh();
3106 LOP(OP_GLOB,XTERM);
93a17b20 3107
79072805
LW
3108 case KEY_hex:
3109 UNI(OP_HEX);
3110
3111 case KEY_if:
3112 yylval.ival = curcop->cop_line;
71be2cbc 3113 OPERATOR(IF);
79072805
LW
3114
3115 case KEY_index:
a0d0e21e 3116 LOP(OP_INDEX,XTERM);
79072805
LW
3117
3118 case KEY_int:
3119 UNI(OP_INT);
3120
3121 case KEY_ioctl:
a0d0e21e 3122 LOP(OP_IOCTL,XTERM);
79072805
LW
3123
3124 case KEY_join:
a0d0e21e 3125 LOP(OP_JOIN,XTERM);
79072805
LW
3126
3127 case KEY_keys:
3128 UNI(OP_KEYS);
3129
3130 case KEY_kill:
a0d0e21e 3131 LOP(OP_KILL,XTERM);
79072805
LW
3132
3133 case KEY_last:
a0d0e21e 3134 s = force_word(s,WORD,TRUE,FALSE,FALSE);
79072805 3135 LOOPX(OP_LAST);
a0d0e21e 3136
79072805
LW
3137 case KEY_lc:
3138 UNI(OP_LC);
3139
3140 case KEY_lcfirst:
3141 UNI(OP_LCFIRST);
3142
3143 case KEY_local:
3144 OPERATOR(LOCAL);
3145
3146 case KEY_length:
3147 UNI(OP_LENGTH);
3148
3149 case KEY_lt:
3150 Rop(OP_SLT);
3151
3152 case KEY_le:
3153 Rop(OP_SLE);
3154
3155 case KEY_localtime:
3156 UNI(OP_LOCALTIME);
3157
3158 case KEY_log:
3159 UNI(OP_LOG);
3160
3161 case KEY_link:
a0d0e21e 3162 LOP(OP_LINK,XTERM);
79072805
LW
3163
3164 case KEY_listen:
a0d0e21e 3165 LOP(OP_LISTEN,XTERM);
79072805
LW
3166
3167 case KEY_lstat:
3168 UNI(OP_LSTAT);
3169
3170 case KEY_m:
3171 s = scan_pat(s);
3172 TERM(sublex_start());
3173
a0d0e21e
LW
3174 case KEY_map:
3175 LOP(OP_MAPSTART,XREF);
3176
79072805 3177 case KEY_mkdir:
a0d0e21e 3178 LOP(OP_MKDIR,XTERM);
79072805
LW
3179
3180 case KEY_msgctl:
a0d0e21e 3181 LOP(OP_MSGCTL,XTERM);
79072805
LW
3182
3183 case KEY_msgget:
a0d0e21e 3184 LOP(OP_MSGGET,XTERM);
79072805
LW
3185
3186 case KEY_msgrcv:
a0d0e21e 3187 LOP(OP_MSGRCV,XTERM);
79072805
LW
3188
3189 case KEY_msgsnd:
a0d0e21e 3190 LOP(OP_MSGSND,XTERM);
79072805 3191
93a17b20
LW
3192 case KEY_my:
3193 in_my = TRUE;
55497cff 3194 OPERATOR(MY);
93a17b20 3195
79072805 3196 case KEY_next:
a0d0e21e 3197 s = force_word(s,WORD,TRUE,FALSE,FALSE);
79072805
LW
3198 LOOPX(OP_NEXT);
3199
3200 case KEY_ne:
3201 Eop(OP_SNE);
3202
a0d0e21e
LW
3203 case KEY_no:
3204 if (expect != XSTATE)
3205 yyerror("\"no\" not allowed in expression");
3206 s = force_word(s,WORD,FALSE,TRUE,FALSE);
89bfa8cd 3207 s = force_version(s);
a0d0e21e
LW
3208 yylval.ival = 0;
3209 OPERATOR(USE);
3210
3211 case KEY_not:
3212 OPERATOR(NOTOP);
3213
79072805 3214 case KEY_open:
93a17b20
LW
3215 s = skipspace(s);
3216 if (isIDFIRST(*s)) {
3217 char *t;
3218 for (d = s; isALNUM(*d); d++) ;
3219 t = skipspace(d);
3220 if (strchr("|&*+-=!?:.", *t))
3221 warn("Precedence problem: open %.*s should be open(%.*s)",
3222 d-s,s, d-s,s);
3223 }
a0d0e21e 3224 LOP(OP_OPEN,XTERM);
79072805 3225
463ee0b2 3226 case KEY_or:
a0d0e21e 3227 yylval.ival = OP_OR;
463ee0b2
LW
3228 OPERATOR(OROP);
3229
79072805
LW
3230 case KEY_ord:
3231 UNI(OP_ORD);
3232
3233 case KEY_oct:
3234 UNI(OP_OCT);
3235
3236 case KEY_opendir:
a0d0e21e 3237 LOP(OP_OPEN_DIR,XTERM);
79072805
LW
3238
3239 case KEY_print:
3240 checkcomma(s,tokenbuf,"filehandle");
a0d0e21e 3241 LOP(OP_PRINT,XREF);
79072805
LW
3242
3243 case KEY_printf:
3244 checkcomma(s,tokenbuf,"filehandle");
a0d0e21e 3245 LOP(OP_PRTF,XREF);
79072805 3246
c07a80fd 3247 case KEY_prototype:
3248 UNI(OP_PROTOTYPE);
3249
79072805 3250 case KEY_push:
a0d0e21e 3251 LOP(OP_PUSH,XTERM);
79072805
LW
3252
3253 case KEY_pop:
3254 UNI(OP_POP);
3255
a0d0e21e
LW
3256 case KEY_pos:
3257 UNI(OP_POS);
3258
79072805 3259 case KEY_pack:
a0d0e21e 3260 LOP(OP_PACK,XTERM);
79072805
LW
3261
3262 case KEY_package:
a0d0e21e 3263 s = force_word(s,WORD,FALSE,TRUE,FALSE);
79072805
LW
3264 OPERATOR(PACKAGE);
3265
3266 case KEY_pipe:
a0d0e21e 3267 LOP(OP_PIPE_OP,XTERM);
79072805
LW
3268
3269 case KEY_q:
3270 s = scan_str(s);
3271 if (!s)
85e6fe83 3272 missingterm((char*)0);
79072805
LW
3273 yylval.ival = OP_CONST;
3274 TERM(sublex_start());
3275
a0d0e21e
LW
3276 case KEY_quotemeta:
3277 UNI(OP_QUOTEMETA);
3278
8990e307
LW
3279 case KEY_qw:
3280 s = scan_str(s);
3281 if (!s)
85e6fe83 3282 missingterm((char*)0);
55497cff 3283 if (dowarn && SvLEN(lex_stuff)) {
3284 d = SvPV_force(lex_stuff, len);
3285 for (; len; --len, ++d) {
3286 if (*d == ',') {
3287 warn("Possible attempt to separate words with commas");
3288 break;
3289 }
3290 if (*d == '#') {
3291 warn("Possible attempt to put comments in qw() list");
3292 break;
3293 }
3294 }
3295 }
8990e307
LW
3296 force_next(')');
3297 nextval[nexttoke].opval = (OP*)newSVOP(OP_CONST, 0, q(lex_stuff));
3298 lex_stuff = Nullsv;
3299 force_next(THING);
3300 force_next(',');
3301 nextval[nexttoke].opval = (OP*)newSVOP(OP_CONST, 0, newSVpv(" ",1));
3302 force_next(THING);
3303 force_next('(');
a0d0e21e
LW
3304 yylval.ival = OP_SPLIT;
3305 CLINE;
3306 expect = XTERM;
3307 bufptr = s;
3308 last_lop = oldbufptr;
3309 last_lop_op = OP_SPLIT;
3310 return FUNC;
8990e307 3311
79072805
LW
3312 case KEY_qq:
3313 s = scan_str(s);
3314 if (!s)
85e6fe83 3315 missingterm((char*)0);
a0d0e21e 3316 yylval.ival = OP_STRINGIFY;
ed6116ce
LW
3317 if (SvIVX(lex_stuff) == '\'')
3318 SvIVX(lex_stuff) = 0; /* qq'$foo' should interpolate */
79072805
LW
3319 TERM(sublex_start());
3320
3321 case KEY_qx:
3322 s = scan_str(s);
3323 if (!s)
85e6fe83 3324 missingterm((char*)0);
79072805
LW
3325 yylval.ival = OP_BACKTICK;
3326 set_csh();
3327 TERM(sublex_start());
3328
3329 case KEY_return:
3330 OLDLOP(OP_RETURN);
3331
3332 case KEY_require:
748a9306 3333 *tokenbuf = '\0';
a0d0e21e 3334 s = force_word(s,WORD,TRUE,TRUE,FALSE);
748a9306 3335 if (isIDFIRST(*tokenbuf))
89bfa8cd 3336 gv_stashpvn(tokenbuf, strlen(tokenbuf), TRUE);
748a9306 3337 else if (*s == '<')
a0d0e21e 3338 yyerror("<> should be quotes");
463ee0b2 3339 UNI(OP_REQUIRE);
79072805
LW
3340
3341 case KEY_reset:
3342 UNI(OP_RESET);
3343
3344 case KEY_redo:
a0d0e21e 3345 s = force_word(s,WORD,TRUE,FALSE,FALSE);
79072805
LW
3346 LOOPX(OP_REDO);
3347
3348 case KEY_rename:
a0d0e21e 3349 LOP(OP_RENAME,XTERM);
79072805
LW
3350
3351 case KEY_rand:
3352 UNI(OP_RAND);
3353
3354 case KEY_rmdir:
3355 UNI(OP_RMDIR);
3356
3357 case KEY_rindex:
a0d0e21e 3358 LOP(OP_RINDEX,XTERM);
79072805
LW
3359
3360 case KEY_read:
a0d0e21e 3361 LOP(OP_READ,XTERM);
79072805
LW
3362
3363 case KEY_readdir:
3364 UNI(OP_READDIR);
3365
93a17b20
LW
3366 case KEY_readline:
3367 set_csh();
3368 UNI(OP_READLINE);
3369
3370 case KEY_readpipe:
3371 set_csh();
3372 UNI(OP_BACKTICK);
3373
79072805
LW
3374 case KEY_rewinddir:
3375 UNI(OP_REWINDDIR);
3376
3377 case KEY_recv:
a0d0e21e 3378 LOP(OP_RECV,XTERM);
79072805
LW
3379
3380 case KEY_reverse:
a0d0e21e 3381 LOP(OP_REVERSE,XTERM);
79072805
LW
3382
3383 case KEY_readlink:
3384 UNI(OP_READLINK);
3385
3386 case KEY_ref:
3387 UNI(OP_REF);
3388
3389 case KEY_s:
3390 s = scan_subst(s);
3391 if (yylval.opval)
3392 TERM(sublex_start());
3393 else
3394 TOKEN(1); /* force error */
3395
a0d0e21e
LW
3396 case KEY_chomp:
3397 UNI(OP_CHOMP);
3398
79072805
LW
3399 case KEY_scalar:
3400 UNI(OP_SCALAR);
3401
3402 case KEY_select:
a0d0e21e 3403 LOP(OP_SELECT,XTERM);
79072805
LW
3404
3405 case KEY_seek:
a0d0e21e 3406 LOP(OP_SEEK,XTERM);
79072805
LW
3407
3408 case KEY_semctl:
a0d0e21e 3409 LOP(OP_SEMCTL,XTERM);
79072805
LW
3410
3411 case KEY_semget:
a0d0e21e 3412 LOP(OP_SEMGET,XTERM);
79072805
LW
3413
3414 case KEY_semop:
a0d0e21e 3415 LOP(OP_SEMOP,XTERM);
79072805
LW
3416
3417 case KEY_send:
a0d0e21e 3418 LOP(OP_SEND,XTERM);
79072805
LW
3419
3420 case KEY_setpgrp:
a0d0e21e 3421 LOP(OP_SETPGRP,XTERM);
79072805
LW
3422
3423 case KEY_setpriority:
a0d0e21e 3424 LOP(OP_SETPRIORITY,XTERM);
79072805
LW
3425
3426 case KEY_sethostent:
ff68c719 3427 UNI(OP_SHOSTENT);
79072805
LW
3428
3429 case KEY_setnetent:
ff68c719 3430 UNI(OP_SNETENT);
79072805
LW
3431
3432 case KEY_setservent:
ff68c719 3433 UNI(OP_SSERVENT);
79072805
LW
3434
3435 case KEY_setprotoent:
ff68c719 3436 UNI(OP_SPROTOENT);
79072805
LW
3437
3438 case KEY_setpwent:
3439 FUN0(OP_SPWENT);
3440
3441 case KEY_setgrent:
3442 FUN0(OP_SGRENT);
3443
3444 case KEY_seekdir:
a0d0e21e 3445 LOP(OP_SEEKDIR,XTERM);
79072805
LW
3446
3447 case KEY_setsockopt:
a0d0e21e 3448 LOP(OP_SSOCKOPT,XTERM);
79072805
LW
3449
3450 case KEY_shift:
3451 UNI(OP_SHIFT);
3452
3453 case KEY_shmctl:
a0d0e21e 3454 LOP(OP_SHMCTL,XTERM);
79072805
LW
3455
3456 case KEY_shmget:
a0d0e21e 3457 LOP(OP_SHMGET,XTERM);
79072805
LW
3458
3459 case KEY_shmread:
a0d0e21e 3460 LOP(OP_SHMREAD,XTERM);
79072805
LW
3461
3462 case KEY_shmwrite:
a0d0e21e 3463 LOP(OP_SHMWRITE,XTERM);
79072805
LW
3464
3465 case KEY_shutdown:
a0d0e21e 3466 LOP(OP_SHUTDOWN,XTERM);
79072805
LW
3467
3468 case KEY_sin:
3469 UNI(OP_SIN);
3470
3471 case KEY_sleep:
3472 UNI(OP_SLEEP);
3473
3474 case KEY_socket:
a0d0e21e 3475 LOP(OP_SOCKET,XTERM);
79072805
LW
3476
3477 case KEY_socketpair:
a0d0e21e 3478 LOP(OP_SOCKPAIR,XTERM);
79072805
LW
3479
3480 case KEY_sort:
3481 checkcomma(s,tokenbuf,"subroutine name");
3482 s = skipspace(s);
3483 if (*s == ';' || *s == ')') /* probably a close */
463ee0b2
LW
3484 croak("sort is now a reserved word");
3485 expect = XTERM;
a0d0e21e
LW
3486 s = force_word(s,WORD,TRUE,TRUE,TRUE);
3487 LOP(OP_SORT,XREF);
79072805
LW
3488
3489 case KEY_split:
a0d0e21e 3490 LOP(OP_SPLIT,XTERM);
79072805
LW
3491
3492 case KEY_sprintf:
a0d0e21e 3493 LOP(OP_SPRINTF,XTERM);
79072805
LW
3494
3495 case KEY_splice:
a0d0e21e 3496 LOP(OP_SPLICE,XTERM);
79072805
LW
3497
3498 case KEY_sqrt:
3499 UNI(OP_SQRT);
3500
3501 case KEY_srand:
3502 UNI(OP_SRAND);
3503
3504 case KEY_stat:
3505 UNI(OP_STAT);
3506
3507 case KEY_study:
3508 sawstudy++;
3509 UNI(OP_STUDY);
3510
3511 case KEY_substr:
a0d0e21e 3512 LOP(OP_SUBSTR,XTERM);
79072805
LW
3513
3514 case KEY_format:
3515 case KEY_sub:
93a17b20 3516 really_sub:
79072805 3517 s = skipspace(s);
4633a7c4 3518
463ee0b2 3519 if (isIDFIRST(*s) || *s == '\'' || *s == ':') {
8903cb82 3520 char tmpbuf[sizeof tokenbuf];
4633a7c4 3521 expect = XBLOCK;
8903cb82 3522 d = scan_word(s, tmpbuf, sizeof tmpbuf, TRUE, &len);
463ee0b2
LW
3523 if (strchr(tmpbuf, ':'))
3524 sv_setpv(subname, tmpbuf);
3525 else {
3526 sv_setsv(subname,curstname);
8990e307 3527 sv_catpvn(subname,"::",2);
463ee0b2
LW
3528 sv_catpvn(subname,tmpbuf,len);
3529 }
a0d0e21e 3530 s = force_word(s,WORD,FALSE,TRUE,TRUE);
4633a7c4 3531 s = skipspace(s);
79072805 3532 }
4633a7c4
LW
3533 else {
3534 expect = XTERMBLOCK;
79072805 3535 sv_setpv(subname,"?");
4633a7c4
LW
3536 }
3537
3538 if (tmp == KEY_format) {
3539 s = skipspace(s);
3540 if (*s == '=')
3541 lex_formbrack = lex_brackets + 1;
3542 OPERATOR(FORMAT);
3543 }
79072805 3544
4633a7c4
LW
3545 /* Look for a prototype */
3546 if (*s == '(') {
68dc0745 3547 char *p;
3548
4633a7c4
LW
3549 s = scan_str(s);
3550 if (!s) {
3551 if (lex_stuff)
3552 SvREFCNT_dec(lex_stuff);
3553 lex_stuff = Nullsv;
3554 croak("Prototype not terminated");
3555 }
68dc0745 3556 /* strip spaces */
3557 d = SvPVX(lex_stuff);
3558 tmp = 0;
3559 for (p = d; *p; ++p) {
3560 if (!isSPACE(*p))
3561 d[tmp++] = *p;
3562 }
3563 d[tmp] = '\0';
3564 SvCUR(lex_stuff) = tmp;
3565
4633a7c4
LW
3566 nexttoke++;
3567 nextval[1] = nextval[0];
3568 nexttype[1] = nexttype[0];
3569 nextval[0].opval = (OP*)newSVOP(OP_CONST, 0, lex_stuff);
3570 nexttype[0] = THING;
3571 if (nexttoke == 1) {
3572 lex_defer = lex_state;
3573 lex_expect = expect;
3574 lex_state = LEX_KNOWNEXT;
3575 }
3576 lex_stuff = Nullsv;
3577 }
79072805 3578
4633a7c4
LW
3579 if (*SvPV(subname,na) == '?') {
3580 sv_setpv(subname,"__ANON__");
3581 TOKEN(ANONSUB);
3582 }
3583 PREBLOCK(SUB);
79072805
LW
3584
3585 case KEY_system:
3586 set_csh();
a0d0e21e 3587 LOP(OP_SYSTEM,XREF);
79072805
LW
3588
3589 case KEY_symlink:
a0d0e21e 3590 LOP(OP_SYMLINK,XTERM);
79072805
LW
3591
3592 case KEY_syscall:
a0d0e21e 3593 LOP(OP_SYSCALL,XTERM);
79072805 3594
c07a80fd 3595 case KEY_sysopen:
3596 LOP(OP_SYSOPEN,XTERM);
3597
137443ea 3598 case KEY_sysseek:
3599 LOP(OP_SYSSEEK,XTERM);
3600
96e4d5b1 3601 case KEY_sysread:
3602 LOP(OP_SYSREAD,XTERM);
3603
79072805 3604 case KEY_syswrite:
a0d0e21e 3605 LOP(OP_SYSWRITE,XTERM);
79072805
LW
3606
3607 case KEY_tr:
3608 s = scan_trans(s);
3609 TERM(sublex_start());
3610
3611 case KEY_tell:
3612 UNI(OP_TELL);
3613
3614 case KEY_telldir:
3615 UNI(OP_TELLDIR);
3616
463ee0b2 3617 case KEY_tie:
a0d0e21e 3618 LOP(OP_TIE,XTERM);
463ee0b2 3619
c07a80fd 3620 case KEY_tied:
3621 UNI(OP_TIED);
3622
79072805
LW
3623 case KEY_time:
3624 FUN0(OP_TIME);
3625
3626 case KEY_times:
3627 FUN0(OP_TMS);
3628
3629 case KEY_truncate:
a0d0e21e 3630 LOP(OP_TRUNCATE,XTERM);
79072805
LW
3631
3632 case KEY_uc:
3633 UNI(OP_UC);
3634
3635 case KEY_ucfirst:
3636 UNI(OP_UCFIRST);
3637
463ee0b2
LW
3638 case KEY_untie:
3639 UNI(OP_UNTIE);
3640
79072805
LW
3641 case KEY_until:
3642 yylval.ival = curcop->cop_line;
71be2cbc 3643 OPERATOR(UNTIL);
79072805
LW
3644
3645 case KEY_unless:
3646 yylval.ival = curcop->cop_line;
71be2cbc 3647 OPERATOR(UNLESS);
79072805
LW
3648
3649 case KEY_unlink:
a0d0e21e 3650 LOP(OP_UNLINK,XTERM);
79072805
LW
3651
3652 case KEY_undef:
3653 UNI(OP_UNDEF);
3654
3655 case KEY_unpack:
a0d0e21e 3656 LOP(OP_UNPACK,XTERM);
79072805
LW
3657
3658 case KEY_utime:
a0d0e21e 3659 LOP(OP_UTIME,XTERM);
79072805
LW
3660
3661 case KEY_umask:
748a9306
LW
3662 if (dowarn) {
3663 for (d = s; d < bufend && (isSPACE(*d) || *d == '('); d++) ;
3664 if (*d != '0' && isDIGIT(*d))
3665 yywarn("umask: argument is missing initial 0");
3666 }
79072805
LW
3667 UNI(OP_UMASK);
3668
3669 case KEY_unshift:
a0d0e21e
LW
3670 LOP(OP_UNSHIFT,XTERM);
3671
3672 case KEY_use:
3673 if (expect != XSTATE)
3674 yyerror("\"use\" not allowed in expression");
89bfa8cd 3675 s = skipspace(s);
3676 if(isDIGIT(*s)) {
3677 s = force_version(s);
3678 if(*s == ';' || (s = skipspace(s), *s == ';')) {
3679 nextval[nexttoke].opval = Nullop;
3680 force_next(WORD);
3681 }
3682 }
3683 else {
3684 s = force_word(s,WORD,FALSE,TRUE,FALSE);
3685 s = force_version(s);
3686 }
a0d0e21e
LW
3687 yylval.ival = 1;
3688 OPERATOR(USE);
79072805
LW
3689
3690 case KEY_values:
3691 UNI(OP_VALUES);
3692
3693 case KEY_vec:
3694 sawvec = TRUE;
a0d0e21e 3695 LOP(OP_VEC,XTERM);
79072805
LW
3696
3697 case KEY_while:
3698 yylval.ival = curcop->cop_line;
71be2cbc 3699 OPERATOR(WHILE);
79072805
LW
3700
3701 case KEY_warn:
a0d0e21e
LW
3702 hints |= HINT_BLOCK_SCOPE;
3703 LOP(OP_WARN,XTERM);
79072805
LW
3704
3705 case KEY_wait:
3706 FUN0(OP_WAIT);
3707
3708 case KEY_waitpid:
a0d0e21e 3709 LOP(OP_WAITPID,XTERM);
79072805
LW
3710
3711 case KEY_wantarray:
3712 FUN0(OP_WANTARRAY);
3713
3714 case KEY_write:
85e6fe83 3715 gv_fetchpv("\f",TRUE, SVt_PV); /* Make sure $^L is defined */
79072805
LW
3716 UNI(OP_ENTERWRITE);
3717
3718 case KEY_x:
3719 if (expect == XOPERATOR)
3720 Mop(OP_REPEAT);
3721 check_uni();
3722 goto just_a_word;
3723
a0d0e21e
LW
3724 case KEY_xor:
3725 yylval.ival = OP_XOR;
3726 OPERATOR(OROP);
3727
79072805
LW
3728 case KEY_y:
3729 s = scan_trans(s);
3730 TERM(sublex_start());
3731 }
3732 }
3733}
3734
/*
 * keyword(d, len)
 *
 * Look up the NUL-terminated word d, whose length the caller passes in
 * len, among the Perl reserved words and built-in function names.
 *
 * Returns the matching KEY_xxx code, or 0 when the word is not recognised.
 * Many entries return the negated code (-KEY_xxx).  NOTE(review): the
 * meaning of the sign is decided by the caller -- presumably it marks
 * built-ins that may be overridden; confirm against the code that calls
 * keyword().
 *
 * The search dispatches on the first character, then usually on len (for
 * 's' on the second character first), and finally confirms with strEQ().
 *
 * Side effects: the upper-case comparison operators EQ, GT, GE, LT, LE and
 * NE call deprecate(d) before returning the same code as their lower-case
 * forms, and "elseif" triggers warn() and then yields 0.
 */
3735I32
3736keyword(d, len)
3737register char *d;
3738I32 len;
3739{
3740 switch (*d) {
3741 case '_':
3742 if (d[1] == '_') {
a0d0e21e 3743 if (strEQ(d,"__FILE__")) return -KEY___FILE__;
68dc0745 3744 if (strEQ(d,"__LINE__")) return -KEY___LINE__;
3745 if (strEQ(d,"__PACKAGE__")) return -KEY___PACKAGE__;
e50aee73 3746 if (strEQ(d,"__DATA__")) return KEY___DATA__;
79072805
LW
3747 if (strEQ(d,"__END__")) return KEY___END__;
3748 }
3749 break;
8990e307
LW
3750 case 'A':
3751 if (strEQ(d,"AUTOLOAD")) return KEY_AUTOLOAD;
3752 break;
79072805 3753 case 'a':
463ee0b2
LW
3754 switch (len) {
3755 case 3:
a0d0e21e
LW
3756 if (strEQ(d,"and")) return -KEY_and;
3757 if (strEQ(d,"abs")) return -KEY_abs;
85e6fe83 3758 break;
463ee0b2 3759 case 5:
a0d0e21e
LW
3760 if (strEQ(d,"alarm")) return -KEY_alarm;
3761 if (strEQ(d,"atan2")) return -KEY_atan2;
463ee0b2
LW
3762 break;
3763 case 6:
a0d0e21e 3764 if (strEQ(d,"accept")) return -KEY_accept;
463ee0b2
LW
3765 break;
3766 }
79072805
LW
3767 break;
3768 case 'B':
3769 if (strEQ(d,"BEGIN")) return KEY_BEGIN;
93a17b20 3770 break;
79072805 3771 case 'b':
a0d0e21e
LW
3772 if (strEQ(d,"bless")) return -KEY_bless;
3773 if (strEQ(d,"bind")) return -KEY_bind;
3774 if (strEQ(d,"binmode")) return -KEY_binmode;
3775 break;
3776 case 'C':
3777 if (strEQ(d,"CORE")) return -KEY_CORE;
79072805
LW
3778 break;
3779 case 'c':
3780 switch (len) {
3781 case 3:
a0d0e21e
LW
3782 if (strEQ(d,"cmp")) return -KEY_cmp;
3783 if (strEQ(d,"chr")) return -KEY_chr;
3784 if (strEQ(d,"cos")) return -KEY_cos;
79072805
LW
3785 break;
3786 case 4:
3787 if (strEQ(d,"chop")) return KEY_chop;
3788 break;
3789 case 5:
a0d0e21e
LW
3790 if (strEQ(d,"close")) return -KEY_close;
3791 if (strEQ(d,"chdir")) return -KEY_chdir;
3792 if (strEQ(d,"chomp")) return KEY_chomp;
3793 if (strEQ(d,"chmod")) return -KEY_chmod;
3794 if (strEQ(d,"chown")) return -KEY_chown;
3795 if (strEQ(d,"crypt")) return -KEY_crypt;
79072805
LW
3796 break;
3797 case 6:
a0d0e21e
LW
3798 if (strEQ(d,"chroot")) return -KEY_chroot;
3799 if (strEQ(d,"caller")) return -KEY_caller;
79072805
LW
3800 break;
3801 case 7:
a0d0e21e 3802 if (strEQ(d,"connect")) return -KEY_connect;
79072805
LW
3803 break;
3804 case 8:
a0d0e21e
LW
3805 if (strEQ(d,"closedir")) return -KEY_closedir;
3806 if (strEQ(d,"continue")) return -KEY_continue;
79072805
LW
3807 break;
3808 }
3809 break;
ed6116ce
LW
3810 case 'D':
3811 if (strEQ(d,"DESTROY")) return KEY_DESTROY;
3812 break;
79072805
LW
3813 case 'd':
3814 switch (len) {
3815 case 2:
3816 if (strEQ(d,"do")) return KEY_do;
3817 break;
3818 case 3:
a0d0e21e 3819 if (strEQ(d,"die")) return -KEY_die;
79072805
LW
3820 break;
3821 case 4:
a0d0e21e 3822 if (strEQ(d,"dump")) return -KEY_dump;
79072805
LW
3823 break;
3824 case 6:
3825 if (strEQ(d,"delete")) return KEY_delete;
3826 break;
3827 case 7:
3828 if (strEQ(d,"defined")) return KEY_defined;
a0d0e21e 3829 if (strEQ(d,"dbmopen")) return -KEY_dbmopen;
79072805
LW
3830 break;
3831 case 8:
a0d0e21e 3832 if (strEQ(d,"dbmclose")) return -KEY_dbmclose;
79072805
LW
3833 break;
3834 }
3835 break;
3836 case 'E':
a0d0e21e 3837 if (strEQ(d,"EQ")) { deprecate(d); return -KEY_eq;}
79072805
LW
3838 if (strEQ(d,"END")) return KEY_END;
3839 break;
3840 case 'e':
3841 switch (len) {
3842 case 2:
a0d0e21e 3843 if (strEQ(d,"eq")) return -KEY_eq;
79072805
LW
3844 break;
3845 case 3:
a0d0e21e
LW
3846 if (strEQ(d,"eof")) return -KEY_eof;
3847 if (strEQ(d,"exp")) return -KEY_exp;
79072805
LW
3848 break;
3849 case 4:
3850 if (strEQ(d,"else")) return KEY_else;
a0d0e21e 3851 if (strEQ(d,"exit")) return -KEY_exit;
79072805 3852 if (strEQ(d,"eval")) return KEY_eval;
a0d0e21e 3853 if (strEQ(d,"exec")) return -KEY_exec;
79072805
LW
3854 if (strEQ(d,"each")) return KEY_each;
3855 break;
3856 case 5:
3857 if (strEQ(d,"elsif")) return KEY_elsif;
3858 break;
a0d0e21e
LW
3859 case 6:
3860 if (strEQ(d,"exists")) return KEY_exists;
/* Common misspelling of "elsif": warn only, then fall out and return 0. */
4633a7c4 3861 if (strEQ(d,"elseif")) warn("elseif should be elsif");
a0d0e21e 3862 break;
79072805 3863 case 8:
a0d0e21e
LW
3864 if (strEQ(d,"endgrent")) return -KEY_endgrent;
3865 if (strEQ(d,"endpwent")) return -KEY_endpwent;
79072805
LW
3866 break;
3867 case 9:
a0d0e21e 3868 if (strEQ(d,"endnetent")) return -KEY_endnetent;
79072805
LW
3869 break;
3870 case 10:
a0d0e21e
LW
3871 if (strEQ(d,"endhostent")) return -KEY_endhostent;
3872 if (strEQ(d,"endservent")) return -KEY_endservent;
79072805
LW
3873 break;
3874 case 11:
a0d0e21e 3875 if (strEQ(d,"endprotoent")) return -KEY_endprotoent;
79072805 3876 break;
a687059c 3877 }
a687059c 3878 break;
79072805
LW
3879 case 'f':
3880 switch (len) {
3881 case 3:
3882 if (strEQ(d,"for")) return KEY_for;
3883 break;
3884 case 4:
a0d0e21e 3885 if (strEQ(d,"fork")) return -KEY_fork;
79072805
LW
3886 break;
3887 case 5:
a0d0e21e
LW
3888 if (strEQ(d,"fcntl")) return -KEY_fcntl;
3889 if (strEQ(d,"flock")) return -KEY_flock;
79072805
LW
3890 break;
3891 case 6:
3892 if (strEQ(d,"format")) return KEY_format;
a0d0e21e 3893 if (strEQ(d,"fileno")) return -KEY_fileno;
79072805
LW
3894 break;
3895 case 7:
3896 if (strEQ(d,"foreach")) return KEY_foreach;
3897 break;
3898 case 8:
a0d0e21e 3899 if (strEQ(d,"formline")) return -KEY_formline;
79072805 3900 break;
378cc40b 3901 }
a687059c 3902 break;
79072805
LW
3903 case 'G':
3904 if (len == 2) {
a0d0e21e
LW
3905 if (strEQ(d,"GT")) { deprecate(d); return -KEY_gt;}
3906 if (strEQ(d,"GE")) { deprecate(d); return -KEY_ge;}
9f68db38 3907 }
a687059c 3908 break;
79072805 3909 case 'g':
a687059c
LW
/*
 * For "get..." names d is advanced past the "get" prefix, but len still
 * counts the whole word, so the case labels below are full-word lengths
 * while the strEQ() literals are suffixes.
 */
3910 if (strnEQ(d,"get",3)) {
3911 d += 3;
3912 if (*d == 'p') {
79072805
LW
3913 switch (len) {
3914 case 7:
a0d0e21e
LW
3915 if (strEQ(d,"ppid")) return -KEY_getppid;
3916 if (strEQ(d,"pgrp")) return -KEY_getpgrp;
79072805
LW
3917 break;
3918 case 8:
a0d0e21e
LW
3919 if (strEQ(d,"pwent")) return -KEY_getpwent;
3920 if (strEQ(d,"pwnam")) return -KEY_getpwnam;
3921 if (strEQ(d,"pwuid")) return -KEY_getpwuid;
79072805
LW
3922 break;
3923 case 11:
a0d0e21e
LW
3924 if (strEQ(d,"peername")) return -KEY_getpeername;
3925 if (strEQ(d,"protoent")) return -KEY_getprotoent;
3926 if (strEQ(d,"priority")) return -KEY_getpriority;
79072805
LW
3927 break;
3928 case 14:
a0d0e21e 3929 if (strEQ(d,"protobyname")) return -KEY_getprotobyname;
79072805
LW
3930 break;
3931 case 16:
a0d0e21e 3932 if (strEQ(d,"protobynumber"))return -KEY_getprotobynumber;
79072805
LW
3933 break;
3934 }
a687059c
LW
3935 }
3936 else if (*d == 'h') {
a0d0e21e
LW
3937 if (strEQ(d,"hostbyname")) return -KEY_gethostbyname;
3938 if (strEQ(d,"hostbyaddr")) return -KEY_gethostbyaddr;
3939 if (strEQ(d,"hostent")) return -KEY_gethostent;
a687059c
LW
3940 }
3941 else if (*d == 'n') {
a0d0e21e
LW
3942 if (strEQ(d,"netbyname")) return -KEY_getnetbyname;
3943 if (strEQ(d,"netbyaddr")) return -KEY_getnetbyaddr;
3944 if (strEQ(d,"netent")) return -KEY_getnetent;
a687059c
LW
3945 }
3946 else if (*d == 's') {
a0d0e21e
LW
3947 if (strEQ(d,"servbyname")) return -KEY_getservbyname;
3948 if (strEQ(d,"servbyport")) return -KEY_getservbyport;
3949 if (strEQ(d,"servent")) return -KEY_getservent;
3950 if (strEQ(d,"sockname")) return -KEY_getsockname;
3951 if (strEQ(d,"sockopt")) return -KEY_getsockopt;
a687059c
LW
3952 }
3953 else if (*d == 'g') {
a0d0e21e
LW
3954 if (strEQ(d,"grent")) return -KEY_getgrent;
3955 if (strEQ(d,"grnam")) return -KEY_getgrnam;
3956 if (strEQ(d,"grgid")) return -KEY_getgrgid;
a687059c
LW
3957 }
3958 else if (*d == 'l') {
a0d0e21e 3959 if (strEQ(d,"login")) return -KEY_getlogin;
a687059c 3960 }
a0d0e21e 3961 else if (strEQ(d,"c")) return -KEY_getc;
79072805 3962 break;
a687059c 3963 }
79072805
LW
3964 switch (len) {
3965 case 2:
a0d0e21e
LW
3966 if (strEQ(d,"gt")) return -KEY_gt;
3967 if (strEQ(d,"ge")) return -KEY_ge;
79072805
LW
3968 break;
3969 case 4:
3970 if (strEQ(d,"grep")) return KEY_grep;
3971 if (strEQ(d,"goto")) return KEY_goto;
a0d0e21e 3972 if (strEQ(d,"glob")) return -KEY_glob;
79072805
LW
3973 break;
3974 case 6:
a0d0e21e 3975 if (strEQ(d,"gmtime")) return -KEY_gmtime;
79072805 3976 break;
378cc40b 3977 }
a687059c 3978 break;
79072805 3979 case 'h':
a0d0e21e 3980 if (strEQ(d,"hex")) return -KEY_hex;
a687059c 3981 break;
79072805
LW
3982 case 'i':
3983 switch (len) {
3984 case 2:
3985 if (strEQ(d,"if")) return KEY_if;
3986 break;
3987 case 3:
a0d0e21e 3988 if (strEQ(d,"int")) return -KEY_int;
79072805
LW
3989 break;
3990 case 5:
a0d0e21e
LW
3991 if (strEQ(d,"index")) return -KEY_index;
3992 if (strEQ(d,"ioctl")) return -KEY_ioctl;
79072805
LW
3993 break;
3994 }
a687059c 3995 break;
79072805 3996 case 'j':
a0d0e21e 3997 if (strEQ(d,"join")) return -KEY_join;
a687059c 3998 break;
79072805
LW
3999 case 'k':
4000 if (len == 4) {
4001 if (strEQ(d,"keys")) return KEY_keys;
a0d0e21e 4002 if (strEQ(d,"kill")) return -KEY_kill;
663a0e37 4003 }
79072805
LW
4004 break;
4005 case 'L':
4006 if (len == 2) {
a0d0e21e
LW
4007 if (strEQ(d,"LT")) { deprecate(d); return -KEY_lt;}
4008 if (strEQ(d,"LE")) { deprecate(d); return -KEY_le;}
378cc40b 4009 }
79072805
LW
4010 break;
4011 case 'l':
4012 switch (len) {
4013 case 2:
a0d0e21e
LW
4014 if (strEQ(d,"lt")) return -KEY_lt;
4015 if (strEQ(d,"le")) return -KEY_le;
4016 if (strEQ(d,"lc")) return -KEY_lc;
79072805
LW
4017 break;
4018 case 3:
a0d0e21e 4019 if (strEQ(d,"log")) return -KEY_log;
79072805
LW
4020 break;
4021 case 4:
4022 if (strEQ(d,"last")) return KEY_last;
a0d0e21e 4023 if (strEQ(d,"link")) return -KEY_link;
395c3793 4024 break;
79072805
LW
4025 case 5:
4026 if (strEQ(d,"local")) return KEY_local;
a0d0e21e 4027 if (strEQ(d,"lstat")) return -KEY_lstat;
79072805
LW
4028 break;
4029 case 6:
a0d0e21e
LW
4030 if (strEQ(d,"length")) return -KEY_length;
4031 if (strEQ(d,"listen")) return -KEY_listen;
79072805
LW
4032 break;
4033 case 7:
a0d0e21e 4034 if (strEQ(d,"lcfirst")) return -KEY_lcfirst;
79072805
LW
4035 break;
4036 case 9:
a0d0e21e 4037 if (strEQ(d,"localtime")) return -KEY_localtime;
395c3793
LW
4038 break;
4039 }
a687059c 4040 break;
79072805
LW
4041 case 'm':
4042 switch (len) {
4043 case 1: return KEY_m;
93a17b20
LW
4044 case 2:
4045 if (strEQ(d,"my")) return KEY_my;
4046 break;
a0d0e21e
LW
4047 case 3:
4048 if (strEQ(d,"map")) return KEY_map;
4049 break;
79072805 4050 case 5:
a0d0e21e 4051 if (strEQ(d,"mkdir")) return -KEY_mkdir;
79072805
LW
4052 break;
4053 case 6:
a0d0e21e
LW
4054 if (strEQ(d,"msgctl")) return -KEY_msgctl;
4055 if (strEQ(d,"msgget")) return -KEY_msgget;
4056 if (strEQ(d,"msgrcv")) return -KEY_msgrcv;
4057 if (strEQ(d,"msgsnd")) return -KEY_msgsnd;
79072805
LW
4058 break;
4059 }
a687059c 4060 break;
79072805 4061 case 'N':
a0d0e21e 4062 if (strEQ(d,"NE")) { deprecate(d); return -KEY_ne;}
a687059c 4063 break;
79072805
LW
4064 case 'n':
4065 if (strEQ(d,"next")) return KEY_next;
a0d0e21e
LW
4066 if (strEQ(d,"ne")) return -KEY_ne;
4067 if (strEQ(d,"not")) return -KEY_not;
4068 if (strEQ(d,"no")) return KEY_no;
a687059c 4069 break;
79072805
LW
4070 case 'o':
4071 switch (len) {
463ee0b2 4072 case 2:
a0d0e21e 4073 if (strEQ(d,"or")) return -KEY_or;
463ee0b2 4074 break;
79072805 4075 case 3:
a0d0e21e
LW
4076 if (strEQ(d,"ord")) return -KEY_ord;
4077 if (strEQ(d,"oct")) return -KEY_oct;
79072805
LW
4078 break;
4079 case 4:
a0d0e21e 4080 if (strEQ(d,"open")) return -KEY_open;
79072805
LW
4081 break;
4082 case 7:
a0d0e21e 4083 if (strEQ(d,"opendir")) return -KEY_opendir;
79072805 4084 break;
fe14fcc3 4085 }
a687059c 4086 break;
79072805
LW
4087 case 'p':
4088 switch (len) {
4089 case 3:
4090 if (strEQ(d,"pop")) return KEY_pop;
a0d0e21e 4091 if (strEQ(d,"pos")) return KEY_pos;
79072805
LW
4092 break;
4093 case 4:
4094 if (strEQ(d,"push")) return KEY_push;
a0d0e21e
LW
4095 if (strEQ(d,"pack")) return -KEY_pack;
4096 if (strEQ(d,"pipe")) return -KEY_pipe;
79072805
LW
4097 break;
4098 case 5:
4099 if (strEQ(d,"print")) return KEY_print;
4100 break;
4101 case 6:
4102 if (strEQ(d,"printf")) return KEY_printf;
4103 break;
4104 case 7:
4105 if (strEQ(d,"package")) return KEY_package;
4106 break;
c07a80fd 4107 case 9:
4108 if (strEQ(d,"prototype")) return KEY_prototype;
/* No break here: this is the last case, so control leaves the switch anyway. */
663a0e37 4109 }
79072805
LW
4110 break;
4111 case 'q':
4112 if (len <= 2) {
4113 if (strEQ(d,"q")) return KEY_q;
4114 if (strEQ(d,"qq")) return KEY_qq;
8990e307 4115 if (strEQ(d,"qw")) return KEY_qw;
79072805 4116 if (strEQ(d,"qx")) return KEY_qx;
663a0e37 4117 }
a0d0e21e 4118 else if (strEQ(d,"quotemeta")) return -KEY_quotemeta;
79072805
LW
4119 break;
4120 case 'r':
4121 switch (len) {
4122 case 3:
a0d0e21e 4123 if (strEQ(d,"ref")) return -KEY_ref;
79072805
LW
4124 break;
4125 case 4:
a0d0e21e
LW
4126 if (strEQ(d,"read")) return -KEY_read;
4127 if (strEQ(d,"rand")) return -KEY_rand;
4128 if (strEQ(d,"recv")) return -KEY_recv;
79072805
LW
4129 if (strEQ(d,"redo")) return KEY_redo;
4130 break;
4131 case 5:
a0d0e21e
LW
4132 if (strEQ(d,"rmdir")) return -KEY_rmdir;
4133 if (strEQ(d,"reset")) return -KEY_reset;
79072805
LW
4134 break;
4135 case 6:
4136 if (strEQ(d,"return")) return KEY_return;
a0d0e21e
LW
4137 if (strEQ(d,"rename")) return -KEY_rename;
4138 if (strEQ(d,"rindex")) return -KEY_rindex;
79072805
LW
4139 break;
4140 case 7:
a0d0e21e
LW
4141 if (strEQ(d,"require")) return -KEY_require;
4142 if (strEQ(d,"reverse")) return -KEY_reverse;
4143 if (strEQ(d,"readdir")) return -KEY_readdir;
79072805
LW
4144 break;
4145 case 8:
a0d0e21e
LW
4146 if (strEQ(d,"readlink")) return -KEY_readlink;
4147 if (strEQ(d,"readline")) return -KEY_readline;
4148 if (strEQ(d,"readpipe")) return -KEY_readpipe;
79072805
LW
4149 break;
4150 case 9:
a0d0e21e 4151 if (strEQ(d,"rewinddir")) return -KEY_rewinddir;
79072805 4152 break;
a687059c 4153 }
79072805
LW
4154 break;
4155 case 's':
a687059c 4156 switch (d[1]) {
79072805 4157 case 0: return KEY_s;
a687059c 4158 case 'c':
79072805 4159 if (strEQ(d,"scalar")) return KEY_scalar;
a687059c
LW
4160 break;
4161 case 'e':
79072805
LW
4162 switch (len) {
4163 case 4:
a0d0e21e
LW
4164 if (strEQ(d,"seek")) return -KEY_seek;
4165 if (strEQ(d,"send")) return -KEY_send;
79072805
LW
4166 break;
4167 case 5:
a0d0e21e 4168 if (strEQ(d,"semop")) return -KEY_semop;
79072805
LW
4169 break;
4170 case 6:
a0d0e21e
LW
4171 if (strEQ(d,"select")) return -KEY_select;
4172 if (strEQ(d,"semctl")) return -KEY_semctl;
4173 if (strEQ(d,"semget")) return -KEY_semget;
79072805
LW
4174 break;
4175 case 7:
a0d0e21e
LW
4176 if (strEQ(d,"setpgrp")) return -KEY_setpgrp;
4177 if (strEQ(d,"seekdir")) return -KEY_seekdir;
79072805
LW
4178 break;
4179 case 8:
a0d0e21e
LW
4180 if (strEQ(d,"setpwent")) return -KEY_setpwent;
4181 if (strEQ(d,"setgrent")) return -KEY_setgrent;
79072805
LW
4182 break;
4183 case 9:
a0d0e21e 4184 if (strEQ(d,"setnetent")) return -KEY_setnetent;
79072805
LW
4185 break;
4186 case 10:
a0d0e21e
LW
4187 if (strEQ(d,"setsockopt")) return -KEY_setsockopt;
4188 if (strEQ(d,"sethostent")) return -KEY_sethostent;
4189 if (strEQ(d,"setservent")) return -KEY_setservent;
79072805
LW
4190 break;
4191 case 11:
a0d0e21e
LW
4192 if (strEQ(d,"setpriority")) return -KEY_setpriority;
4193 if (strEQ(d,"setprotoent")) return -KEY_setprotoent;
79072805
LW
4194 break;
4195 }
a687059c
LW
4196 break;
4197 case 'h':
79072805
LW
4198 switch (len) {
4199 case 5:
4200 if (strEQ(d,"shift")) return KEY_shift;
4201 break;
4202 case 6:
a0d0e21e
LW
4203 if (strEQ(d,"shmctl")) return -KEY_shmctl;
4204 if (strEQ(d,"shmget")) return -KEY_shmget;
79072805
LW
4205 break;
4206 case 7:
a0d0e21e 4207 if (strEQ(d,"shmread")) return -KEY_shmread;
79072805
LW
4208 break;
4209 case 8:
a0d0e21e
LW
4210 if (strEQ(d,"shmwrite")) return -KEY_shmwrite;
4211 if (strEQ(d,"shutdown")) return -KEY_shutdown;
79072805
LW
4212 break;
4213 }
a687059c
LW
4214 break;
4215 case 'i':
a0d0e21e 4216 if (strEQ(d,"sin")) return -KEY_sin;
a687059c
LW
4217 break;
4218 case 'l':
a0d0e21e 4219 if (strEQ(d,"sleep")) return -KEY_sleep;
a687059c
LW
4220 break;
4221 case 'o':
79072805 4222 if (strEQ(d,"sort")) return KEY_sort;
a0d0e21e
LW
4223 if (strEQ(d,"socket")) return -KEY_socket;
4224 if (strEQ(d,"socketpair")) return -KEY_socketpair;
a687059c
LW
4225 break;
4226 case 'p':
79072805 4227 if (strEQ(d,"split")) return KEY_split;
a0d0e21e 4228 if (strEQ(d,"sprintf")) return -KEY_sprintf;
79072805 4229 if (strEQ(d,"splice")) return KEY_splice;
a687059c
LW
4230 break;
4231 case 'q':
a0d0e21e 4232 if (strEQ(d,"sqrt")) return -KEY_sqrt;
a687059c
LW
4233 break;
4234 case 'r':
a0d0e21e 4235 if (strEQ(d,"srand")) return -KEY_srand;
a687059c
LW
4236 break;
4237 case 't':
a0d0e21e 4238 if (strEQ(d,"stat")) return -KEY_stat;
79072805 4239 if (strEQ(d,"study")) return KEY_study;
a687059c
LW
4240 break;
4241 case 'u':
a0d0e21e 4242 if (strEQ(d,"substr")) return -KEY_substr;
79072805 4243 if (strEQ(d,"sub")) return KEY_sub;
a687059c
LW
4244 break;
4245 case 'y':
79072805
LW
4246 switch (len) {
4247 case 6:
a0d0e21e 4248 if (strEQ(d,"system")) return -KEY_system;
79072805
LW
4249 break;
4250 case 7:
a0d0e21e
LW
4251 if (strEQ(d,"symlink")) return -KEY_symlink;
4252 if (strEQ(d,"syscall")) return -KEY_syscall;
137443ea 4253 if (strEQ(d,"sysopen")) return -KEY_sysopen;
4254 if (strEQ(d,"sysread")) return -KEY_sysread;
4255 if (strEQ(d,"sysseek")) return -KEY_sysseek;
79072805
LW
4256 break;
4257 case 8:
a0d0e21e 4258 if (strEQ(d,"syswrite")) return -KEY_syswrite;
79072805 4259 break;
a687059c 4260 }
a687059c
LW
4261 break;
4262 }
4263 break;
79072805
LW
4264 case 't':
4265 switch (len) {
4266 case 2:
4267 if (strEQ(d,"tr")) return KEY_tr;
4268 break;
463ee0b2
LW
4269 case 3:
4270 if (strEQ(d,"tie")) return KEY_tie;
4271 break;
79072805 4272 case 4:
a0d0e21e 4273 if (strEQ(d,"tell")) return -KEY_tell;
c07a80fd 4274 if (strEQ(d,"tied")) return KEY_tied;
a0d0e21e 4275 if (strEQ(d,"time")) return -KEY_time;
79072805
LW
4276 break;
4277 case 5:
a0d0e21e 4278 if (strEQ(d,"times")) return -KEY_times;
79072805
LW
4279 break;
4280 case 7:
a0d0e21e 4281 if (strEQ(d,"telldir")) return -KEY_telldir;
79072805
LW
4282 break;
4283 case 8:
a0d0e21e 4284 if (strEQ(d,"truncate")) return -KEY_truncate;
79072805 4285 break;
378cc40b 4286 }
a687059c 4287 break;
79072805
LW
4288 case 'u':
4289 switch (len) {
4290 case 2:
a0d0e21e
LW
4291 if (strEQ(d,"uc")) return -KEY_uc;
4292 break;
4293 case 3:
4294 if (strEQ(d,"use")) return KEY_use;
79072805
LW
4295 break;
4296 case 5:
4297 if (strEQ(d,"undef")) return KEY_undef;
4298 if (strEQ(d,"until")) return KEY_until;
463ee0b2 4299 if (strEQ(d,"untie")) return KEY_untie;
a0d0e21e
LW
4300 if (strEQ(d,"utime")) return -KEY_utime;
4301 if (strEQ(d,"umask")) return -KEY_umask;
79072805
LW
4302 break;
4303 case 6:
4304 if (strEQ(d,"unless")) return KEY_unless;
a0d0e21e
LW
4305 if (strEQ(d,"unpack")) return -KEY_unpack;
4306 if (strEQ(d,"unlink")) return -KEY_unlink;
79072805
LW
4307 break;
4308 case 7:
4309 if (strEQ(d,"unshift")) return KEY_unshift;
a0d0e21e 4310 if (strEQ(d,"ucfirst")) return -KEY_ucfirst;
79072805 4311 break;
a687059c
LW
4312 }
4313 break;
79072805 4314 case 'v':
a0d0e21e
LW
4315 if (strEQ(d,"values")) return -KEY_values;
4316 if (strEQ(d,"vec")) return -KEY_vec;
a687059c 4317 break;
79072805
LW
4318 case 'w':
4319 switch (len) {
4320 case 4:
a0d0e21e
LW
4321 if (strEQ(d,"warn")) return -KEY_warn;
4322 if (strEQ(d,"wait")) return -KEY_wait;
79072805
LW
4323 break;
4324 case 5:
4325 if (strEQ(d,"while")) return KEY_while;
a0d0e21e 4326 if (strEQ(d,"write")) return -KEY_write;
79072805
LW
4327 break;
4328 case 7:
a0d0e21e 4329 if (strEQ(d,"waitpid")) return -KEY_waitpid;
79072805
LW
4330 break;
4331 case 9:
a0d0e21e 4332 if (strEQ(d,"wantarray")) return -KEY_wantarray;
79072805 4333 break;
2f3197b3 4334 }
a687059c 4335 break;
79072805 4336 case 'x':
a0d0e21e
LW
4337 if (len == 1) return -KEY_x;
4338 if (strEQ(d,"xor")) return -KEY_xor;
a687059c 4339 break;
79072805
LW
4340 case 'y':
4341 if (len == 1) return KEY_y;
4342 break;
4343 case 'z':
a687059c
LW
4344 break;
4345 }
79072805 4346 return 0;
a687059c
LW
4347}
4348
8990e307 4349static void
2f3197b3 4350checkcomma(s,name,what)
a687059c 4351register char *s;
2f3197b3 4352char *name;
a687059c
LW
4353char *what;
4354{
2f3197b3
LW
4355 char *w;
4356
463ee0b2 4357 if (dowarn && *s == ' ' && s[1] == '(') { /* XXX gotta be a better way */
a0d0e21e
LW
4358 int level = 1;
4359 for (w = s+2; *w && level; w++) {
4360 if (*w == '(')
4361 ++level;
4362 else if (*w == ')')
4363 --level;
4364 }
4365 if (*w)
4366 for (; *w && isSPACE(*w); w++) ;
d1f3fb15 4367 if (!*w || !strchr(";|})]oaiuw!=", *w)) /* an advisory hack only... */
2f3197b3
LW
4368 warn("%s (...) interpreted as function",name);
4369 }
4370 while (s < bufend && isSPACE(*s))
4371 s++;
a687059c
LW
4372 if (*s == '(')
4373 s++;
de3bb511 4374 while (s < bufend && isSPACE(*s))
a687059c 4375 s++;
79072805 4376 if (isIDFIRST(*s)) {
2f3197b3 4377 w = s++;
de3bb511 4378 while (isALNUM(*s))
a687059c 4379 s++;
de3bb511 4380 while (s < bufend && isSPACE(*s))
a687059c 4381 s++;
e929a76b 4382 if (*s == ',') {
463ee0b2 4383 int kw;
e929a76b 4384 *s = '\0';
4633a7c4 4385 kw = keyword(w, s - w) || perl_get_cv(w, FALSE) != 0;
e929a76b 4386 *s = ',';
463ee0b2 4387 if (kw)
e929a76b 4388 return;
463ee0b2
LW
4389 croak("No comma allowed after %s", what);
4390 }
4391 }
4392}
4393
8990e307 4394static char *
8903cb82 4395scan_word(s, dest, destlen, allow_package, slp)
463ee0b2
LW
4396register char *s;
4397char *dest;
8903cb82 4398STRLEN destlen;
463ee0b2
LW
4399int allow_package;
4400STRLEN *slp;
4401{
4402 register char *d = dest;
8903cb82 4403 register char *e = d + destlen - 3; /* two-character token, ending NUL */
463ee0b2 4404 for (;;) {
8903cb82 4405 if (d >= e)
fc36a67e 4406 croak(ident_too_long);
463ee0b2
LW
4407 if (isALNUM(*s))
4408 *d++ = *s++;
4409 else if (*s == '\'' && allow_package && isIDFIRST(s[1])) {
4410 *d++ = ':';
4411 *d++ = ':';
4412 s++;
4413 }
4414 else if (*s == ':' && s[1] == ':' && allow_package && isIDFIRST(s[2])) {
4415 *d++ = *s++;
4416 *d++ = *s++;
4417 }
4418 else {
4419 *d = '\0';
4420 *slp = d - dest;
4421 return s;
e929a76b 4422 }
378cc40b
LW
4423 }
4424}
4425
8990e307 4426static char *
8903cb82 4427scan_ident(s, send, dest, destlen, ck_uni)
378cc40b 4428register char *s;
a687059c 4429register char *send;
378cc40b 4430char *dest;
8903cb82 4431STRLEN destlen;
79072805 4432I32 ck_uni;
378cc40b
LW
4433{
4434 register char *d;
8903cb82 4435 register char *e;
79072805 4436 char *bracket = 0;
748a9306 4437 char funny = *s++;
378cc40b 4438
79072805
LW
4439 if (lex_brackets == 0)
4440 lex_fakebrack = 0;
a0d0e21e
LW
4441 if (isSPACE(*s))
4442 s = skipspace(s);
378cc40b 4443 d = dest;
8903cb82 4444 e = d + destlen - 3; /* two-character token, ending NUL */
de3bb511 4445 if (isDIGIT(*s)) {
8903cb82 4446 while (isDIGIT(*s)) {
4447 if (d >= e)
fc36a67e 4448 croak(ident_too_long);
378cc40b 4449 *d++ = *s++;
8903cb82 4450 }
378cc40b
LW
4451 }
4452 else {
463ee0b2 4453 for (;;) {
8903cb82 4454 if (d >= e)
fc36a67e 4455 croak(ident_too_long);
463ee0b2
LW
4456 if (isALNUM(*s))
4457 *d++ = *s++;
4458 else if (*s == '\'' && isIDFIRST(s[1])) {
4459 *d++ = ':';
4460 *d++ = ':';
4461 s++;
4462 }
a0d0e21e 4463 else if (*s == ':' && s[1] == ':') {
463ee0b2
LW
4464 *d++ = *s++;
4465 *d++ = *s++;
4466 }
4467 else
4468 break;
4469 }
378cc40b
LW
4470 }
4471 *d = '\0';
4472 d = dest;
79072805
LW
4473 if (*d) {
4474 if (lex_state != LEX_NORMAL)
4475 lex_state = LEX_INTERPENDMAYBE;
4476 return s;
378cc40b 4477 }
748a9306 4478 if (*s == '$' && s[1] &&
ff0cee69 4479 (isALNUM(s[1]) || strchr("${", s[1]) || strnEQ(s+1,"::",2)) )
5cd24f17 4480 {
4481 if (isDIGIT(s[1]) && lex_state == LEX_INTERPNORMAL)
4482 deprecate("\"$$<digit>\" to mean \"${$}<digit>\"");
4483 else
4484 return s;
4485 }
79072805
LW
4486 if (*s == '{') {
4487 bracket = s;
4488 s++;
4489 }
4490 else if (ck_uni)
4491 check_uni();
93a17b20 4492 if (s < send)
79072805
LW
4493 *d = *s++;
4494 d[1] = '\0';
748a9306 4495 if (*d == '^' && *s && (isUPPER(*s) || strchr("[\\]^_?", *s))) {
bbce6d69 4496 *d = toCTRL(*s);
4497 s++;
de3bb511 4498 }
79072805 4499 if (bracket) {
748a9306 4500 if (isSPACE(s[-1])) {
fa83b5b6 4501 while (s < send) {
4502 char ch = *s++;
4503 if (ch != ' ' && ch != '\t') {
4504 *d = ch;
4505 break;
4506 }
4507 }
748a9306 4508 }
ff68c719 4509 if (isIDFIRST(*d)) {
79072805 4510 d++;
748a9306 4511 while (isALNUM(*s) || *s == ':')
79072805
LW
4512 *d++ = *s++;
4513 *d = '\0';
748a9306 4514 while (s < send && (*s == ' ' || *s == '\t')) s++;
ff68c719 4515 if ((*s == '[' || (*s == '{' && strNE(dest, "sub")))) {
748a9306
LW
4516 if (dowarn && keyword(dest, d - dest)) {
4517 char *brack = *s == '[' ? "[...]" : "{...}";
4518 warn("Ambiguous use of %c{%s%s} resolved to %c%s%s",
4519 funny, dest, brack, funny, dest, brack);
4520 }
4521 lex_fakebrack = lex_brackets+1;
79072805 4522 bracket++;
a0d0e21e 4523 lex_brackstack[lex_brackets++] = XOPERATOR;
79072805
LW
4524 return s;
4525 }
4526 }
4527 if (*s == '}') {
4528 s++;
4529 if (lex_state == LEX_INTERPNORMAL && !lex_brackets)
4530 lex_state = LEX_INTERPEND;
748a9306
LW
4531 if (funny == '#')
4532 funny = '@';
84902520 4533 if (dowarn && lex_state == LEX_NORMAL &&
748a9306
LW
4534 (keyword(dest, d - dest) || perl_get_cv(dest, FALSE)))
4535 warn("Ambiguous use of %c{%s} resolved to %c%s",
4536 funny, dest, funny, dest);
79072805
LW
4537 }
4538 else {
4539 s = bracket; /* let the parser handle it */
93a17b20 4540 *dest = '\0';
79072805
LW
4541 }
4542 }
4543 else if (lex_state == LEX_INTERPNORMAL && !lex_brackets && !intuit_more(s))
4544 lex_state = LEX_INTERPEND;
378cc40b
LW
4545 return s;
4546}
4547
a0d0e21e
LW
4548void pmflag(pmfl,ch)
4549U16* pmfl;
4550int ch;
4551{
bbce6d69 4552 if (ch == 'i')
a0d0e21e 4553 *pmfl |= PMf_FOLD;
a0d0e21e
LW
4554 else if (ch == 'g')
4555 *pmfl |= PMf_GLOBAL;
c90c0ff4 4556 else if (ch == 'c')
4557 *pmfl |= PMf_CONTINUE;
a0d0e21e
LW
4558 else if (ch == 'o')
4559 *pmfl |= PMf_KEEP;
4560 else if (ch == 'm')
4561 *pmfl |= PMf_MULTILINE;
4562 else if (ch == 's')
4563 *pmfl |= PMf_SINGLELINE;
4564 else if (ch == 'x')
4565 *pmfl |= PMf_EXTENDED;
4566}
378cc40b 4567
8990e307 4568static char *
79072805
LW
4569scan_pat(start)
4570char *start;
378cc40b 4571{
79072805
LW
4572 PMOP *pm;
4573 char *s;
378cc40b 4574
79072805
LW
4575 s = scan_str(start);
4576 if (!s) {
4577 if (lex_stuff)
8990e307 4578 SvREFCNT_dec(lex_stuff);
79072805 4579 lex_stuff = Nullsv;
463ee0b2 4580 croak("Search pattern not terminated");
378cc40b 4581 }
bbce6d69 4582
79072805 4583 pm = (PMOP*)newPMOP(OP_MATCH, 0);
a0d0e21e 4584 if (multi_open == '?')
79072805 4585 pm->op_pmflags |= PMf_ONCE;
c90c0ff4 4586 while (*s && strchr("iogcmsx", *s))
a0d0e21e 4587 pmflag(&pm->op_pmflags,*s++);
4633a7c4 4588 pm->op_pmpermflags = pm->op_pmflags;
bbce6d69 4589
79072805
LW
4590 lex_op = (OP*)pm;
4591 yylval.ival = OP_MATCH;
378cc40b
LW
4592 return s;
4593}
4594
8990e307 4595static char *
79072805 4596scan_subst(start)
2f3197b3 4597char *start;
79072805 4598{
a0d0e21e 4599 register char *s;
79072805 4600 register PMOP *pm;
4fdae800 4601 I32 first_start;
79072805
LW
4602 I32 es = 0;
4603
79072805
LW
4604 yylval.ival = OP_NULL;
4605
a0d0e21e 4606 s = scan_str(start);
79072805
LW
4607
4608 if (!s) {
4609 if (lex_stuff)
8990e307 4610 SvREFCNT_dec(lex_stuff);
79072805 4611 lex_stuff = Nullsv;
463ee0b2 4612 croak("Substitution pattern not terminated");
a687059c 4613 }
79072805 4614
a0d0e21e 4615 if (s[-1] == multi_open)
79072805
LW
4616 s--;
4617
4fdae800 4618 first_start = multi_start;
79072805
LW
4619 s = scan_str(s);
4620 if (!s) {
4621 if (lex_stuff)
8990e307 4622 SvREFCNT_dec(lex_stuff);
79072805
LW
4623 lex_stuff = Nullsv;
4624 if (lex_repl)
8990e307 4625 SvREFCNT_dec(lex_repl);
79072805 4626 lex_repl = Nullsv;
463ee0b2 4627 croak("Substitution replacement not terminated");
a687059c 4628 }
4fdae800 4629 multi_start = first_start; /* so whole substitution is taken together */
2f3197b3 4630
79072805 4631 pm = (PMOP*)newPMOP(OP_SUBST, 0);
c90c0ff4 4632 while (*s && strchr("iogcmsex", *s)) {
a687059c
LW
4633 if (*s == 'e') {
4634 s++;
2f3197b3 4635 es++;
a687059c 4636 }
a0d0e21e
LW
4637 else
4638 pmflag(&pm->op_pmflags,*s++);
378cc40b 4639 }
79072805
LW
4640
4641 if (es) {
4642 SV *repl;
4643 pm->op_pmflags |= PMf_EVAL;
463ee0b2
LW
4644 repl = newSVpv("",0);
4645 while (es-- > 0)
a0d0e21e 4646 sv_catpv(repl, es ? "eval " : "do ");
79072805
LW
4647 sv_catpvn(repl, "{ ", 2);
4648 sv_catsv(repl, lex_repl);
4649 sv_catpvn(repl, " };", 2);
4650 SvCOMPILED_on(repl);
8990e307 4651 SvREFCNT_dec(lex_repl);
79072805 4652 lex_repl = repl;
378cc40b 4653 }
79072805 4654
4633a7c4 4655 pm->op_pmpermflags = pm->op_pmflags;
79072805
LW
4656 lex_op = (OP*)pm;
4657 yylval.ival = OP_SUBST;
378cc40b
LW
4658 return s;
4659}
4660
1462b684 4661void
79072805
LW
4662hoistmust(pm)
4663register PMOP *pm;
378cc40b 4664{
79072805
LW
4665 if (!pm->op_pmshort && pm->op_pmregexp->regstart &&
4666 (!pm->op_pmregexp->regmust || pm->op_pmregexp->reganch & ROPT_ANCH)
d48672a2 4667 ) {
79072805
LW
4668 if (!(pm->op_pmregexp->reganch & ROPT_ANCH))
4669 pm->op_pmflags |= PMf_SCANFIRST;
8990e307 4670 pm->op_pmshort = SvREFCNT_inc(pm->op_pmregexp->regstart);
748a9306 4671 pm->op_pmslen = SvCUR(pm->op_pmshort);
d48672a2 4672 }
79072805
LW
4673 else if (pm->op_pmregexp->regmust) {/* is there a better short-circuit? */
4674 if (pm->op_pmshort &&
4675 sv_eq(pm->op_pmshort,pm->op_pmregexp->regmust))
a687059c 4676 {
79072805 4677 if (pm->op_pmflags & PMf_SCANFIRST) {
8990e307 4678 SvREFCNT_dec(pm->op_pmshort);
79072805 4679 pm->op_pmshort = Nullsv;
378cc40b
LW
4680 }
4681 else {
8990e307 4682 SvREFCNT_dec(pm->op_pmregexp->regmust);
79072805 4683 pm->op_pmregexp->regmust = Nullsv;
378cc40b
LW
4684 return;
4685 }
4686 }
774d564b 4687 /* promote the better string */
5cd24f17 4688 if ((!pm->op_pmshort &&
4689 !(pm->op_pmregexp->reganch & ROPT_ANCH_GPOS)) ||
774d564b 4690 ((pm->op_pmflags & PMf_SCANFIRST) &&
4691 (SvCUR(pm->op_pmshort) < SvCUR(pm->op_pmregexp->regmust)))) {
8990e307 4692 SvREFCNT_dec(pm->op_pmshort); /* ok if null */
79072805 4693 pm->op_pmshort = pm->op_pmregexp->regmust;
748a9306 4694 pm->op_pmslen = SvCUR(pm->op_pmshort);
79072805
LW
4695 pm->op_pmregexp->regmust = Nullsv;
4696 pm->op_pmflags |= PMf_SCANFIRST;
378cc40b
LW
4697 }
4698 }
4699}
4700
8990e307 4701static char *
79072805 4702scan_trans(start)
2f3197b3 4703char *start;
378cc40b 4704{
a0d0e21e 4705 register char* s;
79072805
LW
4706 OP *op;
4707 short *tbl;
4708 I32 squash;
4709 I32 delete;
4710 I32 complement;
4711
4712 yylval.ival = OP_NULL;
4713
a0d0e21e 4714 s = scan_str(start);
79072805
LW
4715 if (!s) {
4716 if (lex_stuff)
8990e307 4717 SvREFCNT_dec(lex_stuff);
79072805 4718 lex_stuff = Nullsv;
463ee0b2 4719 croak("Translation pattern not terminated");
a687059c 4720 }
a0d0e21e 4721 if (s[-1] == multi_open)
2f3197b3
LW
4722 s--;
4723
93a17b20 4724 s = scan_str(s);
79072805
LW
4725 if (!s) {
4726 if (lex_stuff)
8990e307 4727 SvREFCNT_dec(lex_stuff);
79072805
LW
4728 lex_stuff = Nullsv;
4729 if (lex_repl)
8990e307 4730 SvREFCNT_dec(lex_repl);
79072805 4731 lex_repl = Nullsv;
463ee0b2 4732 croak("Translation replacement not terminated");
a687059c 4733 }
79072805
LW
4734
4735 New(803,tbl,256,short);
4736 op = newPVOP(OP_TRANS, 0, (char*)tbl);
2f3197b3 4737
395c3793
LW
4738 complement = delete = squash = 0;
4739 while (*s == 'c' || *s == 'd' || *s == 's') {
4740 if (*s == 'c')
79072805 4741 complement = OPpTRANS_COMPLEMENT;
395c3793 4742 else if (*s == 'd')
79072805 4743 delete = OPpTRANS_DELETE;
395c3793 4744 else
79072805 4745 squash = OPpTRANS_SQUASH;
395c3793
LW
4746 s++;
4747 }
79072805
LW
4748 op->op_private = delete|squash|complement;
4749
4750 lex_op = op;
4751 yylval.ival = OP_TRANS;
4752 return s;
4753}
4754
/*
 * scan_heredoc
 *
 * Lex a here-document.  On entry s points at the introducing "<<".
 * The terminator is assembled in tokenbuf with a trailing newline (and
 * a leading newline as well when "outer" is false), the text that
 * follows the terminator spec on the introducing line is kept in
 * herewas, and the body is gathered into tmpstr.
 *
 * On return lex_stuff holds the body and yylval.ival holds OP_SCALAR,
 * OP_CONST (terminator quoted with ' or introduced by a backslash) or
 * OP_BACKTICK (terminator quoted with `).  multi_start / multi_end
 * record the line span.  Returns the updated scan position.
 */
8990e307 4755static char *
79072805
LW
4756scan_heredoc(s)
4757register char *s;
4758{
4759 SV *herewas;
4760 I32 op_type = OP_SCALAR;
4761 I32 len;
4762 SV *tmpstr;
4763 char term;
4764 register char *d;
fc36a67e 4765 register char *e;
4633a7c4 4766 char *peek;
/* outer is true when rsfp is set and lex_inwhat is not; in that case the
 * body is read line by line with filter_gets() further down */
fd2d0953 4767 int outer = (rsfp && !lex_inwhat);
79072805
LW
4768
/* step over the two-character "<<" */
4769 s += 2;
4770 d = tokenbuf;
fc36a67e 4771 e = tokenbuf + sizeof tokenbuf - 1;
fd2d0953 4772 if (!outer)
79072805 4773 *d++ = '\n';
/* a quoted terminator may be preceded by blanks or tabs */
4633a7c4
LW
4774 for (peek = s; *peek == ' ' || *peek == '\t'; peek++) ;
4775 if (*peek && strchr("`'\"",*peek)) {
4776 s = peek;
79072805 4777 term = *s++;
fc36a67e 4778 s = delimcpy(d, e, s, bufend, term, &len);
4779 d += len;
79072805
LW
4780 if (s < bufend)
4781 s++;
79072805
LW
4782 }
4783 else {
/* unquoted terminator: a leading backslash selects single-quote
 * behaviour, otherwise double-quote behaviour */
4784 if (*s == '\\')
4785 s++, term = '\'';
4786 else
4787 term = '"';
4633a7c4
LW
4788 if (!isALNUM(*s))
4789 deprecate("bare << to mean <<\"\"");
/* copy the word; characters beyond the buffer limit are dropped here
 * and the overlong case is reported just below */
fc36a67e 4790 for (; isALNUM(*s); s++) {
4791 if (d < e)
4792 *d++ = *s;
4793 }
4794 }
4795 if (d >= tokenbuf + sizeof tokenbuf - 1)
4796 croak("Delimiter for here document is too long");
79072805
LW
4797 *d++ = '\n';
4798 *d = '\0';
4799 len = d - tokenbuf;
/* herewas keeps the text following the terminator spec: everything up
 * to bufend when outer (or when no newline is found), otherwise the
 * text from one byte before s up to the next newline.  It is put back
 * into linestr below. */
4800 d = "\n";
fd2d0953 4801 if (outer || !(d=ninstr(s,bufend,d,d+1)))
79072805
LW
4802 herewas = newSVpv(s,bufend-s);
4803 else
4804 s--, herewas = newSVpv(s,d-s);
4805 s += SvCUR(herewas);
748a9306
LW
4806
/* tmpstr collects the body; its IV slot is set to -1 for the
 * single-quote form and to a backslash for the backtick form */
4807 tmpstr = NEWSV(87,80);
4808 sv_upgrade(tmpstr, SVt_PVIV);
4809 if (term == '\'') {
79072805 4810 op_type = OP_CONST;
748a9306
LW
4811 SvIVX(tmpstr) = -1;
4812 }
4813 else if (term == '`') {
79072805 4814 op_type = OP_BACKTICK;
748a9306
LW
4815 SvIVX(tmpstr) = '\\';
4816 }
79072805
LW
4817
4818 CLINE;
4819 multi_start = curcop->cop_line;
4820 multi_open = multi_close = '<';
/* from here on term is the first byte of the terminator, used as a
 * cheap pre-test before the full memNE / memEQ comparison */
79072805 4821 term = *tokenbuf;
fd2d0953 4822 if (!outer) {
/* the body is already in the current buffer: search forward for the
 * terminator, counting newlines as they are passed */
79072805
LW
4823 d = s;
4824 while (s < bufend &&
36477c24 4825 (*s != term || memNE(s,tokenbuf,len)) ) {
79072805
LW
4826 if (*s++ == '\n')
4827 curcop->cop_line++;
4828 }
4829 if (s >= bufend) {
4830 curcop->cop_line = multi_start;
8990e307 4831 missingterm(tokenbuf);
79072805
LW
4832 }
/* the line buffer is rebuilt as the saved remainder of the introducing
 * line followed by whatever came after the terminator */
4833 sv_setpvn(tmpstr,d+1,s-d);
4834 s += len - 1;
4835 sv_catpvn(herewas,s,bufend-s);
4836 sv_setsv(linestr,herewas);
fd049845 4837 oldoldbufptr = oldbufptr = bufptr = s = linestart = SvPVX(linestr);
463ee0b2 4838 bufend = SvPVX(linestr) + SvCUR(linestr);
79072805
LW
4839 }
4840 else
4841 sv_setpvn(tmpstr,"",0); /* avoid "uninitialized" warning */
4842 while (s >= bufend) { /* multiple line string? */
/* a further line is needed: when not outer, or when filter_gets()
 * yields nothing, the terminator is reported as missing */
fd2d0953 4843 if (!outer ||
fd049845 4844 !(oldoldbufptr = oldbufptr = s = linestart = filter_gets(linestr, rsfp, 0))) {
79072805 4845 curcop->cop_line = multi_start;
8990e307 4846 missingterm(tokenbuf);
79072805
LW
4847 }
4848 curcop->cop_line++;
/* with PERLDB_LINE on and outside debstash, store a copy of the new
 * line in the array of the current file glob, indexed by line number */
84902520 4849 if (PERLDB_LINE && curstash != debstash) {
79072805
LW
4850 SV *sv = NEWSV(88,0);
4851
93a17b20 4852 sv_upgrade(sv, SVt_PVMG);
79072805
LW
4853 sv_setsv(sv,linestr);
4854 av_store(GvAV(curcop->cop_filegv),
4855 (I32)curcop->cop_line,sv);
4856 }
463ee0b2 4857 bufend = SvPVX(linestr) + SvCUR(linestr);
/* terminator line: overwrite its final byte with a blank and append the
 * saved remainder of the introducing line; any other line is added to
 * the body and the loop reads on */
36477c24 4858 if (*s == term && memEQ(s,tokenbuf,len)) {
79072805
LW
4859 s = bufend - 1;
4860 *s = ' ';
4861 sv_catsv(linestr,herewas);
463ee0b2 4862 bufend = SvPVX(linestr) + SvCUR(linestr);
79072805
LW
4863 }
4864 else {
4865 s = bufend;
4866 sv_catsv(tmpstr,linestr);
395c3793
LW
4867 }
4868 }
79072805
LW
4869 multi_end = curcop->cop_line;
4870 s++;
/* shrink the body buffer when more than five bytes are spare */
4871 if (SvCUR(tmpstr) + 5 < SvLEN(tmpstr)) {
4872 SvLEN_set(tmpstr, SvCUR(tmpstr) + 1);
463ee0b2 4873 Renew(SvPVX(tmpstr), SvLEN(tmpstr), char);
79072805 4874 }
8990e307 4875 SvREFCNT_dec(herewas);
79072805
LW
4876 lex_stuff = tmpstr;
4877 yylval.ival = op_type;
4878 return s;
4879}
4880
8990e307 4881static char *
79072805
LW
4882scan_inputsymbol(start)
4883char *start;
4884{
4885 register char *s = start;
4886 register char *d;
fc36a67e 4887 register char *e;
79072805
LW
4888 I32 len;
4889
4890 d = tokenbuf;
fc36a67e 4891 e = tokenbuf + sizeof tokenbuf;
4892 s = delimcpy(d, e, s + 1, bufend, '>', &len);
4893 if (len >= sizeof tokenbuf)
4894 croak("Excessively long <> operator");
4895 if (s >= bufend)
463ee0b2 4896 croak("Unterminated <> operator");
fc36a67e 4897 s++;
4633a7c4 4898 if (*d == '$' && d[1]) d++;
a0d0e21e 4899 while (*d && (isALNUM(*d) || *d == '\'' || *d == ':'))
79072805
LW
4900 d++;
4901 if (d - tokenbuf != len) {
4902 yylval.ival = OP_GLOB;
4903 set_csh();
4904 s = scan_str(start);
4905 if (!s)
463ee0b2 4906 croak("Glob not terminated");
79072805
LW
4907 return s;
4908 }
395c3793 4909 else {
79072805
LW
4910 d = tokenbuf;
4911 if (!len)
4912 (void)strcpy(d,"ARGV");
4913 if (*d == '$') {
a0d0e21e
LW
4914 I32 tmp;
4915 if (tmp = pad_findmy(d)) {
4916 OP *op = newOP(OP_PADSV, 0);
4917 op->op_targ = tmp;
4918 lex_op = (OP*)newUNOP(OP_READLINE, 0, newUNOP(OP_RV2GV, 0, op));
4919 }
4920 else {
4921 GV *gv = gv_fetchpv(d+1,TRUE, SVt_PV);
4922 lex_op = (OP*)newUNOP(OP_READLINE, 0,
4923 newUNOP(OP_RV2GV, 0,
4924 newUNOP(OP_RV2SV, 0,
4925 newGVOP(OP_GV, 0, gv))));
4926 }
79072805
LW
4927 yylval.ival = OP_NULL;
4928 }
4929 else {
85e6fe83 4930 GV *gv = gv_fetchpv(d,TRUE, SVt_PVIO);
79072805
LW
4931 lex_op = (OP*)newUNOP(OP_READLINE, 0, newGVOP(OP_GV, 0, gv));
4932 yylval.ival = OP_NULL;
4933 }
4934 }
4935 return s;
4936}
4937
/*
 * scan_str
 *
 * Scan a delimited string.  start points at (optional whitespace
 * followed by) the opening delimiter.  The text between the delimiters
 * is copied into a new SV whose IV slot records the closing delimiter.
 * A backslash directly in front of a delimiter is dropped; every other
 * backslash is copied along with the character after it.  When the
 * opening delimiter is one of ( [ { < the matching closer ends the
 * string and nested pairs are counted.
 *
 * If the buffer runs out, further lines are read with filter_gets()
 * when rsfp is set; otherwise (or at end of input) the SV is freed,
 * the line number is reset to multi_start and Nullch is returned.
 *
 * On success the SV is stored in lex_stuff, or in lex_repl when
 * lex_stuff is already occupied, multi_start / multi_end / multi_open /
 * multi_close describe the string, and the position following the
 * closing delimiter is returned.
 */
8990e307 4938static char *
79072805
LW
4939scan_str(start)
4940char *start;
4941{
93a17b20 4942 SV *sv;
79072805
LW
4943 char *tmps;
4944 register char *s = start;
a0d0e21e 4945 register char term;
93a17b20
LW
4946 register char *to;
4947 I32 brackets = 1;
79072805 4948
84902520
TB
4949 if (isSPACE(*s)) {
4950 /* "#" is allowed as delimiter if on same line */
4951 while (*s == ' ' || *s == '\t')
4952 s++;
4953 if (isSPACE(*s))
4954 s = skipspace(s);
4955 }
79072805 4956 CLINE;
a0d0e21e 4957 term = *s;
79072805
LW
4958 multi_start = curcop->cop_line;
4959 multi_open = term;
/* the table is laid out so that the character five places after an
 * opening bracket is its closer, and five places after a closer (or
 * the blank) is that same character again */
93a17b20 4960 if (term && (tmps = strchr("([{< )]}> )]}>",term)))
79072805
LW
4961 term = tmps[5];
4962 multi_close = term;
4963
93a17b20 4964 sv = NEWSV(87,80);
ed6116ce
LW
4965 sv_upgrade(sv, SVt_PVIV);
4966 SvIVX(sv) = term;
a0d0e21e 4967 (void)SvPOK_only(sv); /* validate pointer */
/* step past the opening delimiter */
93a17b20
LW
4968 s++;
4969 for (;;) {
/* make room for everything left in the buffer plus a terminating NUL */
4970 SvGROW(sv, SvCUR(sv) + (bufend - s) + 1);
463ee0b2 4971 to = SvPVX(sv)+SvCUR(sv);
93a17b20
LW
4972 if (multi_open == multi_close) {
/* same character opens and closes: no nesting to track */
4973 for (; s < bufend; s++,to++) {
/* newlines are counted here only when rsfp is not set; with rsfp set
 * the line number is bumped once per filter_gets() call below */
463ee0b2
LW
4974 if (*s == '\n' && !rsfp)
4975 curcop->cop_line++;
84902520
TB
4976 if (*s == '\\' && s+1 < bufend && term != '\\') {
4977 if (s[1] == term)
a0d0e21e
LW
4978 s++;
4979 else
4980 *to++ = *s++;
4981 }
93a17b20
LW
4982 else if (*s == term)
4983 break;
4984 *to = *s;
4985 }
4986 }
4987 else {
/* bracketing delimiters: brackets starts at 1 for the opener already
 * consumed; the string ends when a closer brings it down to zero */
4988 for (; s < bufend; s++,to++) {
463ee0b2
LW
4989 if (*s == '\n' && !rsfp)
4990 curcop->cop_line++;
6d07e5e9
GS
4991 if (*s == '\\' && s+1 < bufend) {
4992 if ((s[1] == multi_open) || (s[1] == multi_close))
a0d0e21e
LW
4993 s++;
4994 else
4995 *to++ = *s++;
4996 }
6d07e5e9 4997 else if (*s == multi_close && --brackets <= 0)
93a17b20
LW
4998 break;
4999 else if (*s == multi_open)
5000 brackets++;
5001 *to = *s;
5002 }
5003 }
5004 *to = '\0';
463ee0b2 5005 SvCUR_set(sv, to - SvPVX(sv));
93a17b20
LW
5006
5007 if (s < bufend) break; /* string ends on this line? */
79072805 5008
/* buffer exhausted without a closer: fetch another line, or give up */
79072805 5009 if (!rsfp ||
fd049845 5010 !(oldoldbufptr = oldbufptr = s = linestart = filter_gets(linestr, rsfp, 0))) {
c07a80fd 5011 sv_free(sv);
79072805
LW
5012 curcop->cop_line = multi_start;
5013 return Nullch;
5014 }
5015 curcop->cop_line++;
/* with PERLDB_LINE on and outside debstash, store a copy of the new
 * line in the array of the current file glob; note that this inner sv
 * shadows the result sv declared at the top of the function */
84902520 5016 if (PERLDB_LINE && curstash != debstash) {
79072805
LW
5017 SV *sv = NEWSV(88,0);
5018
93a17b20 5019 sv_upgrade(sv, SVt_PVMG);
79072805
LW
5020 sv_setsv(sv,linestr);
5021 av_store(GvAV(curcop->cop_filegv),
5022 (I32)curcop->cop_line, sv);
395c3793 5023 }
463ee0b2 5024 bufend = SvPVX(linestr) + SvCUR(linestr);
378cc40b 5025 }
79072805
LW
5026 multi_end = curcop->cop_line;
/* step past the closing delimiter */
5027 s++;
/* shrink the string buffer when more than five bytes are spare */
93a17b20
LW
5028 if (SvCUR(sv) + 5 < SvLEN(sv)) {
5029 SvLEN_set(sv, SvCUR(sv) + 1);
463ee0b2 5030 Renew(SvPVX(sv), SvLEN(sv), char);
79072805
LW
5031 }
/* the first string scanned goes to lex_stuff; a second one scanned
 * while lex_stuff is still set goes to lex_repl */
5032 if (lex_stuff)
93a17b20 5033 lex_repl = sv;
79072805 5034 else
93a17b20 5035 lex_stuff = sv;
378cc40b
LW
5036 return s;
5037}
5038
/*
 * scan_num
 *
 * Scan a numeric literal beginning at start, which must point at a
 * digit or a '.', and leave an OP_CONST holding its value in
 * yylval.opval.  Returns the position following the literal.
 *
 * A leading "0x" selects hexadecimal, a leading "0." is handed to the
 * decimal code, and any other leading '0' selects octal.  Underscores
 * inside the digits are skipped.  Hex and octal values are accumulated
 * in a UV with a one-time overflow warning.  Decimal literals are
 * copied into tokenbuf and converted with atof(); the result is stored
 * as an integer when no fraction or exponent was seen and the value
 * survives a round trip through I_V(), otherwise as a double.
 */
5039char *
79072805 5040scan_num(start)
2f3197b3 5041char *start;
378cc40b 5042{
2f3197b3 5043 register char *s = start;
378cc40b 5044 register char *d;
fc36a67e 5045 register char *e;
1e422769 5046 I32 tryiv;
79072805
LW
5047 double value;
5048 SV *sv;
5049 I32 floatit;
/* lastub points just past the most recent underscore, if any */
93a17b20 5050 char *lastub = 0;
fc36a67e 5051 static char number_too_long[] = "Number too long";
378cc40b
LW
5052
5053 switch (*s) {
79072805 5054 default:
463ee0b2 5055 croak("panic: scan_num");
378cc40b
LW
5056 case '0':
5057 {
55497cff 5058 UV u;
79072805 5059 I32 shift;
55497cff 5060 bool overflowed = FALSE;
378cc40b 5061
/* shift is the number of bits per digit: 4 for hex, 3 for octal.  In
 * the octal case s is not advanced, so the leading '0' is processed as
 * an ordinary digit by the loop below. */
378cc40b
LW
5062 if (s[1] == 'x') {
5063 shift = 4;
5064 s += 2;
5065 }
5066 else if (s[1] == '.')
5067 goto decimal;
5068 else
5069 shift = 3;
55497cff 5070 u = 0;
378cc40b 5071 for (;;) {
55497cff 5072 UV n, b;
5073
378cc40b
LW
5074 switch (*s) {
5075 default:
5076 goto out;
de3bb511
LW
5077 case '_':
5078 s++;
5079 break;
/* 8 and 9 in an octal literal are reported through yyerror() but are
 * still folded into the value */
378cc40b
LW
5080 case '8': case '9':
5081 if (shift != 4)
a687059c 5082 yyerror("Illegal octal digit");
378cc40b
LW
5083 /* FALL THROUGH */
5084 case '0': case '1': case '2': case '3': case '4':
5085 case '5': case '6': case '7':
/* the low four bits of a digit character are its value */
55497cff 5086 b = *s++ & 15;
5087 goto digit;
378cc40b
LW
5088 case 'a': case 'b': case 'c': case 'd': case 'e': case 'f':
5089 case 'A': case 'B': case 'C': case 'D': case 'E': case 'F':
/* a letter ends an octal literal */
5090 if (shift != 4)
5091 goto out;
/* the low three bits of a..f and A..F are 1..6 (ASCII), so adding 9
 * gives 10..15 */
55497cff 5092 b = (*s++ & 7) + 9;
5093 digit:
/* overflow check: shifting the new value back down must give the old
 * value; the warning is issued once per literal */
5094 n = u << shift;
5095 if (!overflowed && (n >> shift) != u) {
5096 warn("Integer overflow in %s number",
5097 (shift == 4) ? "hex" : "octal");
5098 overflowed = TRUE;
5099 }
5100 u = n | b;
378cc40b
LW
5101 break;
5102 }
5103 }
5104 out:
79072805 5105 sv = NEWSV(92,0);
55497cff 5106 sv_setuv(sv, u);
378cc40b
LW
5107 }
5108 break;
5109 case '1': case '2': case '3': case '4': case '5':
5110 case '6': case '7': case '8': case '9': case '.':
5111 decimal:
378cc40b 5112 d = tokenbuf;
fc36a67e 5113 e = tokenbuf + sizeof tokenbuf - 6; /* room for various punctuation */
79072805 5114 floatit = FALSE;
/* integer part: digits are copied, underscores are dropped.  With
 * dowarn set, an underscore that is not exactly three characters after
 * the position following the previous underscore draws a warning. */
de3bb511 5115 while (isDIGIT(*s) || *s == '_') {
93a17b20
LW
5116 if (*s == '_') {
5117 if (dowarn && lastub && s - lastub != 3)
8990e307 5118 warn("Misplaced _ in number");
93a17b20
LW
5119 lastub = ++s;
5120 }
fc36a67e 5121 else {
5122 if (d >= e)
5123 croak(number_too_long);
378cc40b 5124 *d++ = *s++;
fc36a67e 5125 }
378cc40b 5126 }
93a17b20 5127 if (dowarn && lastub && s - lastub != 3)
8990e307 5128 warn("Misplaced _ in number");
/* fraction: a '.' counts only when it is not followed by another '.' */
2f3197b3 5129 if (*s == '.' && s[1] != '.') {
79072805 5130 floatit = TRUE;
378cc40b 5131 *d++ = *s++;
fc36a67e 5132 for (; isDIGIT(*s) || *s == '_'; s++) {
5133 if (d >= e)
5134 croak(number_too_long);
5135 if (*s != '_')
5136 *d++ = *s;
378cc40b
LW
5137 }
5138 }
/* exponent: e or E counts only when followed by a sign or a digit */
93a17b20 5139 if (*s && strchr("eE",*s) && strchr("+-0123456789",s[1])) {
79072805
LW
5140 floatit = TRUE;
5141 s++;
5142 *d++ = 'e'; /* At least some Mach atof()s don't grok 'E' */
378cc40b
LW
5143 if (*s == '+' || *s == '-')
5144 *d++ = *s++;
fc36a67e 5145 while (isDIGIT(*s)) {
5146 if (d >= e)
5147 croak(number_too_long);
378cc40b 5148 *d++ = *s++;
fc36a67e 5149 }
378cc40b
LW
5150 }
5151 *d = '\0';
79072805 5152 sv = NEWSV(92,0);
36477c24 5153 SET_NUMERIC_STANDARD();
79072805 5154 value = atof(tokenbuf);
/* store as an integer only when no fraction or exponent was seen and
 * the value is unchanged by conversion through I_V() */
1e422769 5155 tryiv = I_V(value);
5156 if (!floatit && (double)tryiv == value)
5157 sv_setiv(sv, tryiv);
2f3197b3 5158 else
1e422769 5159 sv_setnv(sv, value);
378cc40b 5160 break;
79072805 5161 }
a687059c 5162
79072805 5163 yylval.opval = newSVOP(OP_CONST, 0, sv);
a687059c 5164
378cc40b
LW
5165 return s;
5166}
5167
/*
 * scan_formline
 *
 * Collect lines of a format body, starting at s, into a new SV.
 * Collection stops after the first line that contains '@' or '^', at a
 * line consisting of '.' or '}' followed only by blanks or tabs, at a
 * "~~" found once something has already been collected, or when input
 * runs out.  Lines beginning with '#' are not collected.
 *
 * When something was collected, tokens are queued with force_next():
 * a ',' (only when the last line contained '@' or '^'), then a THING
 * carrying the collected text as an OP_CONST, then an LSTOP carrying
 * OP_FORMLINE.  NOTE(review): the order in which the queued tokens are
 * later delivered depends on force_next() -- confirm there.
 * When nothing was collected the SV is released, lex_formbrack is
 * cleared and bufptr is set to s.
 *
 * Returns the updated scan position.
 */
8990e307 5168static char *
79072805
LW
5169scan_formline(s)
5170register char *s;
378cc40b 5171{
79072805 5172 register char *eol;
378cc40b 5173 register char *t;
a0d0e21e 5174 SV *stuff = newSVpv("",0);
79072805 5175 bool needargs = FALSE;
378cc40b 5176
79072805 5177 while (!needargs) {
/* a '.' or '}' followed only by blanks or tabs up to the newline ends
 * the collection */
85e6fe83 5178 if (*s == '.' || *s == '}') {
79072805
LW
5179 /*SUPPRESS 530*/
5180 for (t = s+1; *t == ' ' || *t == '\t'; t++) ;
5181 if (*t == '\n')
5182 break;
5183 }
/* find the end of the current line: inside an eval with no rsfp it is
 * just past the next newline (or bufend when there is none); otherwise
 * it is the end of linestr */
0f85fab0 5184 if (in_eval && !rsfp) {
93a17b20 5185 eol = strchr(s,'\n');
0f85fab0
LW
5186 if (!eol++)
5187 eol = bufend;
5188 }
5189 else
463ee0b2 5190 eol = bufend = SvPVX(linestr) + SvCUR(linestr);
79072805 5191 if (*s != '#') {
/* scan the line before appending it, so that a "~~" line met after
 * earlier lines were collected is left for the next call */
a0d0e21e
LW
5192 for (t = s; t < eol; t++) {
5193 if (*t == '~' && t[1] == '~' && SvCUR(stuff)) {
5194 needargs = FALSE;
5195 goto enough; /* ~~ must be first line in formline */
378cc40b 5196 }
a0d0e21e
LW
5197 if (*t == '@' || *t == '^')
5198 needargs = TRUE;
378cc40b 5199 }
a0d0e21e 5200 sv_catpvn(stuff, s, eol-s);
79072805
LW
5201 }
5202 s = eol;
/* when reading from rsfp, fetch the next line and reset the buffer
 * pointers to the start of linestr */
5203 if (rsfp) {
fd049845 5204 s = filter_gets(linestr, rsfp, 0);
5205 oldoldbufptr = oldbufptr = bufptr = linestart = SvPVX(linestr);
a0d0e21e 5206 bufend = bufptr + SvCUR(linestr);
79072805
LW
5207 if (!s) {
5208 s = bufptr;
5209 yyerror("Format not terminated");
378cc40b
LW
5210 break;
5211 }
378cc40b 5212 }
463ee0b2 5213 incline(s);
79072805 5214 }
a0d0e21e
LW
5215 enough:
5216 if (SvCUR(stuff)) {
463ee0b2 5217 expect = XTERM;
/* a line with fields switches to LEX_NORMAL and queues a comma;
 * otherwise the lexer stays in LEX_FORMLINE */
79072805 5218 if (needargs) {
a0d0e21e 5219 lex_state = LEX_NORMAL;
79072805
LW
5220 nextval[nexttoke].ival = 0;
5221 force_next(',');
5222 }
a0d0e21e
LW
5223 else
5224 lex_state = LEX_FORMLINE;
79072805
LW
5225 nextval[nexttoke].opval = (OP*)newSVOP(OP_CONST, 0, stuff);
5226 force_next(THING);
5227 nextval[nexttoke].ival = OP_FORMLINE;
5228 force_next(LSTOP);
378cc40b 5229 }
79072805 5230 else {
8990e307 5231 SvREFCNT_dec(stuff);
85e6fe83 5232 lex_formbrack = 0;
79072805
LW
5233 bufptr = s;
5234 }
5235 return s;
378cc40b 5236}
a687059c 5237
/*
 * set_csh
 *
 * When CSH is defined, cache the length of cshname in cshlen the first
 * time it is needed (that is, while cshlen is still zero).  Without CSH
 * this routine does nothing.
 */
static void
set_csh()
{
#ifdef CSH
    if (cshlen == 0)
        cshlen = strlen(cshname);
#endif
}
463ee0b2 5246
ba6d6ac9 5247I32
774d564b 5248start_subparse(is_format, flags)
5249I32 is_format;
fa83b5b6 5250U32 flags;
8990e307 5251{
ba6d6ac9 5252 I32 oldsavestack_ix = savestack_ix;
748a9306
LW
5253 CV* outsidecv = compcv;
5254 AV* comppadlist;
8990e307 5255
e9a444f0
LW
5256 if (compcv) {
5257 assert(SvTYPE(compcv) == SVt_PVCV);
5258 }
8990e307
LW
5259 save_I32(&subline);
5260 save_item(subname);
55497cff 5261 SAVEI32(padix);
8990e307
LW
5262 SAVESPTR(curpad);
5263 SAVESPTR(comppad);
5264 SAVESPTR(comppad_name);
748a9306 5265 SAVESPTR(compcv);
55497cff 5266 SAVEI32(comppad_name_fill);
5267 SAVEI32(min_intro_pending);
5268 SAVEI32(max_intro_pending);
5269 SAVEI32(pad_reset_pending);
748a9306
LW
5270
5271 compcv = (CV*)NEWSV(1104,0);
774d564b 5272 sv_upgrade((SV *)compcv, is_format ? SVt_PVFM : SVt_PVCV);
fa83b5b6 5273 CvFLAGS(compcv) |= flags;
748a9306 5274
8990e307
LW
5275 comppad = newAV();
5276 comppad_name = newAV();
5277 comppad_name_fill = 0;
5278 min_intro_pending = 0;
5279 av_push(comppad, Nullsv);
5280 curpad = AvARRAY(comppad);
5281 padix = 0;
8990e307 5282 subline = curcop->cop_line;
748a9306
LW
5283
5284 comppadlist = newAV();
5285 AvREAL_off(comppadlist);
8e07c86e
AD
5286 av_store(comppadlist, 0, (SV*)comppad_name);
5287 av_store(comppadlist, 1, (SV*)comppad);
748a9306
LW
5288
5289 CvPADLIST(compcv) = comppadlist;
e9a444f0 5290 CvOUTSIDE(compcv) = (CV*)SvREFCNT_inc((SV*)outsidecv);
748a9306 5291
8990e307
LW
5292 return oldsavestack_ix;
5293}
5294
5295int
5296yywarn(s)
5297char *s;
5298{
5299 --error_count;
748a9306
LW
5300 in_eval |= 2;
5301 yyerror(s);
5302 in_eval &= ~2;
5303 return 0;
8990e307
LW
5304}
5305
/*
 * yyerror
 *
 * Build and deliver a parse error message for s.
 *
 * The message is s followed by " at FILE line N, " and then either
 * near "TEXT" (a stretch of recently scanned source) or a fixed
 * description of where the parser stopped.  A hint about a runaway
 * multi-line string is appended when the last such string ended on the
 * current line or the line before it.
 *
 * Delivery depends on in_eval: with the 2 bit set the message goes to
 * warn(); with any other bit set it is appended to the scalar of errgv;
 * otherwise it is written to the stderr handle.  Once error_count
 * reaches 10 the routine croaks.  in_my is cleared.  Always returns 0.
 */
5306int
463ee0b2
LW
5307yyerror(s)
5308char *s;
5309{
68dc0745 5310 char *where = NULL;
5311 char *context = NULL;
5312 int contlen = -1;
46fc3d4c 5313 SV *msg;
463ee0b2 5314
/* choose the location text: EOF first, then up to 200 bytes of source
 * starting at oldoldbufptr or, failing that, oldbufptr (leading
 * whitespace is skipped by advancing the global pointer itself), and
 * finally a description derived from yychar */
54310121 5315 if (!yychar || (yychar == ';' && !rsfp))
5316 where = "at EOF";
5317 else if (bufptr > oldoldbufptr && bufptr - oldoldbufptr < 200 &&
463ee0b2
LW
5318 oldoldbufptr != oldbufptr && oldbufptr != bufptr) {
5319 while (isSPACE(*oldoldbufptr))
5320 oldoldbufptr++;
68dc0745 5321 context = oldoldbufptr;
5322 contlen = bufptr - oldoldbufptr;
463ee0b2
LW
5323 }
5324 else if (bufptr > oldbufptr && bufptr - oldbufptr < 200 &&
5325 oldbufptr != bufptr) {
5326 while (isSPACE(*oldbufptr))
5327 oldbufptr++;
68dc0745 5328 context = oldbufptr;
5329 contlen = bufptr - oldbufptr;
463ee0b2
LW
5330 }
5331 else if (yychar > 255)
68dc0745 5332 where = "next token ???";
463ee0b2
LW
5333 else if ((yychar & 127) == 127) {
5334 if (lex_state == LEX_NORMAL ||
5335 (lex_state == LEX_KNOWNEXT && lex_defer == LEX_NORMAL))
68dc0745 5336 where = "at end of line";
4633a7c4 5337 else if (lex_inpat)
68dc0745 5338 where = "within pattern";
463ee0b2 5339 else
68dc0745 5340 where = "within string";
463ee0b2 5341 }
46fc3d4c 5342 else {
/* a single character: shown as ^X below 32, as itself when printable,
 * and as a backslash followed by three octal digits otherwise */
5343 SV *where_sv = sv_2mortal(newSVpv("next char ", 0));
5344 if (yychar < 32)
5345 sv_catpvf(where_sv, "^%c", toCTRL(yychar));
5346 else if (isPRINT_LC(yychar))
5347 sv_catpvf(where_sv, "%c", yychar);
5348 else
5349 sv_catpvf(where_sv, "\\%03o", yychar & 255);
5350 where = SvPVX(where_sv);
5351 }
5352 msg = sv_2mortal(newSVpv(s, 0));
fc36a67e 5353 sv_catpvf(msg, " at %_ line %ld, ",
46fc3d4c 5354 GvSV(curcop->cop_filegv), (long)curcop->cop_line);
68dc0745 5355 if (context)
46fc3d4c 5356 sv_catpvf(msg, "near \"%.*s\"\n", contlen, context);
463ee0b2 5357 else
46fc3d4c 5358 sv_catpvf(msg, "%s\n", where);
/* the unsigned cast makes the test true only when the current line is
 * multi_end or multi_end + 1; multi_end is then cleared so the hint is
 * not repeated for the same string */
4fdae800 5359 if (multi_start < multi_end && (U32)(curcop->cop_line - multi_end) <= 1) {
46fc3d4c 5360 sv_catpvf(msg,
4fdae800 5361 " (Might be a runaway multi-line %c%c string starting on line %ld)\n",
ff0cee69 5362 (int)multi_open,(int)multi_close,(long)multi_start);
a0d0e21e
LW
5363 multi_end = 0;
5364 }
/* in_eval & 2 is the marker yywarn() sets around its call */
748a9306 5365 if (in_eval & 2)
fc36a67e 5366 warn("%_", msg);
748a9306 5367 else if (in_eval)
46fc3d4c 5368 sv_catsv(GvSV(errgv), msg);
463ee0b2 5369 else
46fc3d4c 5370 PerlIO_write(PerlIO_stderr(), SvPVX(msg), SvCUR(msg));
463ee0b2 5371 if (++error_count >= 10)
fc36a67e 5372 croak("%_ has too many errors.\n", GvSV(curcop->cop_filegv));
4633a7c4 5373 in_my = 0;
463ee0b2
LW
5374 return 0;
5375}