This is a live mirror of the Perl 5 development currently hosted at https://github.com/perl/perl5
MANIFEST.SKIP is missing from the list of files that come
[perl5.git] / bytecode.pl
CommitLineData
73f0cc2d
GS
1BEGIN {
2 push @INC, './lib';
9ad884cb 3 require 'regen_lib.pl';
73f0cc2d 4}
a8a597b2
MB
5use strict;
# Maps each fundamental type to the C type names that are read and written
# exactly like it.  Only the fundamental type gets its own BGET_/PUT_/GET_
# name in the generated code; the aliases reuse it.
my %alias_to = (
    U32       => [qw(line_t)],
    PADOFFSET => [qw(STRLEN SSize_t)],
    U16       => [qw(OPCODE short)],
    U8        => [qw(char)],
);

# Op structure names; used for the optype_size[] table in byterun.c, the
# OPt_* enum in byterun.h and @optype in Asmdata.pm.
my @optype = qw(OP UNOP BINOP LOGOP LISTOP PMOP SVOP PADOP PVOP LOOP COP);

# Nullsv *must* come first in the following so that the condition
# ($$sv == 0) can continue to be used to test (sv == Nullsv).
my @specialsv = qw(Nullsv &PL_sv_undef &PL_sv_yes &PL_sv_no pWARN_ALL pWARN_NONE);

# Reverse lookup of %alias_to: alias type name => fundamental type name.
my %alias_from;
for my $fundamental (keys %alias_to) {
    for my $alias (@{ $alias_to{$fundamental} }) {
        $alias_from{$alias} = $fundamental;
    }
}
23
# Banner written at the top of every generated C file.
my $c_header = <<'EOT';
/*
 * Copyright (c) 1996-1999 Malcolm Beattie
 *
 * You may distribute under the terms of either the GNU General Public
 * License or the Artistic License, as specified in the README file.
 *
 */
/*
 * This file is autogenerated from bytecode.pl. Changes made here will be lost.
 */
EOT

# The same banner for generated Perl files: every C comment marker
# ("/*", " *", " */") is turned into a single "#".
my $perl_header = $c_header;
$perl_header =~ s{[/ ]?\*/?}{#}g;
39
# safer_unlink is provided by regen_lib.pl (required in the BEGIN block).
# NOTE(review): presumably it removes the previous copies of the three
# generated files -- confirm against regen_lib.pl.
safer_unlink(
    "ext/ByteLoader/byterun.c",
    "ext/ByteLoader/byterun.h",
    "ext/B/B/Asmdata.pm",
);

#
# Start with boilerplate for Asmdata.pm
#
my $asmdata_pm = "ext/B/B/Asmdata.pm";
open(ASMDATA_PM, ">$asmdata_pm") or die "$asmdata_pm: $!";
binmode ASMDATA_PM;

# Package preamble of the generated module.
print ASMDATA_PM $perl_header;
print ASMDATA_PM <<'EOT';
package B::Asmdata;

our $VERSION = '1.01';

use Exporter;
@ISA = qw(Exporter);
@EXPORT_OK = qw(%insn_data @insn_name @optype @specialsv_name);
our(%insn_data, @insn_name, @optype, @specialsv_name);

EOT

# Copy this script's @optype and @specialsv tables into the module,
# followed by the comment that introduces the %insn_data initialisers.
print ASMDATA_PM
    "\@optype = qw(@optype);\n",
    "\@specialsv_name = qw(@specialsv);\n",
    <<'EOT';

# XXX insn_data is initialised this way because with a large
# %insn_data = (foo => [...], bar => [...], ...) initialiser
# I get a hard-to-track-down stack underflow and segfault.
EOT
66
#
# Boilerplate for byterun.c
#
open(BYTERUN_C, ">ext/ByteLoader/byterun.c") or die "ext/ByteLoader/byterun.c: $!";
binmode BYTERUN_C;
print BYTERUN_C $c_header, <<'EOT';

#define PERL_NO_GET_CONTEXT
#include "EXTERN.h"
#include "perl.h"
#define NO_XSLOCKS
#include "XSUB.h"

#include "byterun.h"
#include "bytecode.h"


static const int optype_size[] = {
EOT

# Declared at file scope because later sections of this script reuse $i
# as their loop variable.
my $i = 0;

# One sizeof() initialiser per op type, comma-separated, with no comma
# after the last entry.
print BYTERUN_C join(",\n", map { " sizeof($_)" } @optype), "\n";

print BYTERUN_C <<'EOT';
};

void *
bset_obj_store(pTHX_ struct byteloader_state *bstate, void *obj, I32 ix)
{
 if (ix > bstate->bs_obj_list_fill) {
 Renew(bstate->bs_obj_list, ix + 32, void*);
 bstate->bs_obj_list_fill = ix + 31;
 }
 bstate->bs_obj_list[ix] = obj;
 return obj;
}

int
byterun(pTHX_ register struct byteloader_state *bstate)
{
 register int insn;
 U32 ix;
EOT

# Size the C array from @specialsv so that the declaration can never be
# smaller than the list of initialisers emitted below.
my $specialsv_count = @specialsv;
print BYTERUN_C " SV *specialsv_list[$specialsv_count];\n";

print BYTERUN_C <<'EOT';

 BYTECODE_HEADER_CHECK; /* croak if incorrect platform */
 New(666, bstate->bs_obj_list, 32, void*); /* set op objlist */
 bstate->bs_obj_list_fill = 31;
 bstate->bs_obj_list[0] = NULL; /* first is always Null */
 bstate->bs_ix = 1;

EOT

# Fill specialsv_list[] in the same order as @specialsv.
for my $idx (0 .. $#specialsv) {
    print BYTERUN_C " specialsv_list[$idx] = $specialsv[$idx];\n";
}

# Open the instruction dispatch loop; the case statements are appended
# while the instruction table is read.
print BYTERUN_C <<'EOT';

 while ((insn = BGET_FGETC()) != EOF) {
 switch (insn) {
EOT
129
130
my (@insn_name, $insn_num, $insn, $lvalue, $argtype, $flags, $fundtype);

# Read the instruction table that follows __END__.  Each instruction line is
#     opcode lvalue argtype [flags]
# where argtype is either a single type or "rightvaluecast/argtype".
# "%number N" lines set the number given to the next instruction.  For every
# instruction a case statement is appended to byterun.c and an %insn_data
# initialiser to Asmdata.pm.
while (<DATA>) {
    if (/^\s*#/) {
        # Comments are dropped, except C preprocessor conditionals, which
        # are copied into byterun.c so they wrap the generated cases.
        print BYTERUN_C if /^\s*#\s*(?:if|endif|el)/;
        next;
    }
    # chomp, not chop: a final line without a trailing newline must not
    # lose its last character.
    chomp;
    next unless /\S/;		# skip empty and whitespace-only lines
    if (/^%number\s+(.*)/) {
        $insn_num = $1;
        next;
    } elsif (/%enum\s+(.*?)\s+(.*)/) {
        # NOTE(review): create_enum is not defined in this file -- confirm
        # it is provided elsewhere before adding a %enum line to the table.
        create_enum($1, $2);	# must come before instructions
        next;
    }
    ($insn, $lvalue, $argtype, $flags) = split;
    die "bytecode.pl: malformed instruction line: $_\n"
        unless defined $argtype;
    $flags = '' unless defined $flags;	# the flags column is optional

    my $rvalcast = '';
    if ($argtype =~ m:(.+)/(.+):) {
        ($rvalcast, $argtype) = ("($1)", $2);
    }
    $insn_name[$insn_num] = $insn;
    $fundtype = $alias_from{$argtype} || $argtype;

    #
    # Add the case statement and code for the bytecode interpreter in byterun.c
    #
    printf BYTERUN_C "\t case INSN_%s:\t\t/* %d */\n\t {\n",
        uc($insn), $insn_num;
    my $optarg = $argtype eq "none" ? "" : ", arg";
    if ($optarg) {
        # The type is passed as a printf argument rather than interpolated
        # into the format, so it can never be read as a conversion.
        printf BYTERUN_C "\t\t%s arg;\n\t\tBGET_%s(arg);\n",
            $argtype, $fundtype;
    }
    if ($flags =~ /x/) {
        print BYTERUN_C "\t\tBSET_$insn($lvalue$optarg);\n";
    } elsif ($flags =~ /s/) {
        # Store instructions store to bytecode_obj_list[arg]. "lvalue" field is rvalue.
        print BYTERUN_C "\t\tBSET_OBJ_STORE($lvalue$optarg);\n";
    } elsif ($optarg && $lvalue ne "none") {
        print BYTERUN_C "\t\t$lvalue = ${rvalcast}arg;\n";
    }
    print BYTERUN_C "\t\tbreak;\n\t }\n";

    #
    # Add the initialiser line for %insn_data in Asmdata.pm
    #
    print ASMDATA_PM <<"EOT";
\$insn_data{$insn} = [$insn_num, \\&PUT_$fundtype, "GET_$fundtype"];
EOT

    # Find the next unused instruction number
    do { $insn_num++ } while $insn_name[$insn_num];
}
185
#
# Finish off byterun.c
#
print BYTERUN_C <<'EOT';
 default:
 Perl_croak(aTHX_ "Illegal bytecode instruction %d\n", insn);
 /* NOTREACHED */
 }
 }
 return 0;
}
EOT

#
# Write the instruction and optype enum constants into byterun.h
#
open(BYTERUN_H, ">ext/ByteLoader/byterun.h") or die "ext/ByteLoader/byterun.h: $!";
binmode BYTERUN_H;
print BYTERUN_H $c_header, <<'EOT';
struct byteloader_fdata {
 SV *datasv;
 int next_out;
 int idx;
};

struct byteloader_state {
 struct byteloader_fdata *bs_fdata;
 SV *bs_sv;
 void **bs_obj_list;
 int bs_obj_list_fill;
 int bs_ix;
 XPV bs_pv;
 int bs_iv_overflows;
};

int bl_getc(struct byteloader_fdata *);
int bl_read(struct byteloader_fdata *, char *, size_t, size_t);
extern int byterun(pTHX_ struct byteloader_state *);

enum {
EOT

# Emit one INSN_* constant per instruction number in use.  After a gap in
# the numbering the next constant is given an explicit value so that the
# C enum stays in step with the instruction numbers.
my $add_enum_value = 0;
my $max_insn;
for my $num (0 .. $#insn_name) {
    my $name = $insn_name[$num];

    # Test definedness before upper-casing: uc(undef) is a defined empty
    # string, which would hide the gap and emit a nameless "INSN_" entry.
    unless (defined $name) {
        $add_enum_value = 1;
        next;
    }

    my $const = uc $name;
    $max_insn = $num;
    if ($add_enum_value) {
        print BYTERUN_H " INSN_$const = $num,\t\t\t/* $num */\n";
        $add_enum_value = 0;
    } else {
        print BYTERUN_H " INSN_$const,\t\t\t/* $num */\n";
    }
}

print BYTERUN_H " MAX_INSN = $max_insn\n};\n";

# Emit the OPt_* enum in @optype order; the last entry takes no comma.
print BYTERUN_H "\nenum {\n";
for my $num (0 .. $#optype) {
    my $comma = $num < $#optype ? "," : "";
    printf BYTERUN_H " OPt_%s%s\t\t/* %d */\n", $optype[$num], $comma, $num;
}
print BYTERUN_H "};\n\n";
a8a597b2 252
a8a597b2
MB
#
# Finish off insn_data and create array initialisers in Asmdata.pm
#
# The text below is written verbatim into the generated module: code that
# derives @insn_name from %insn_data, then the module's POD.
print ASMDATA_PM <<'EOT';

my ($insn_name, $insn_data);
while (($insn_name, $insn_data) = each %insn_data) {
 $insn_name[$insn_data->[0]] = $insn_name;
}
# Fill in any gaps
@insn_name = map($_ || "unused", @insn_name);

1;

__END__

=head1 NAME

B::Asmdata - Autogenerated data about Perl ops, used to generate bytecode

=head1 SYNOPSIS

 use B::Asmdata qw(%insn_data @insn_name @optype @specialsv_name);

=head1 DESCRIPTION

Provides information about Perl ops in order to generate bytecode via
a bunch of exported variables. It's mostly used by B::Assembler and
B::Disassembler.

=over 4

=item %insn_data

 my($bytecode_num, $put_sub, $get_meth) = @{$insn_data{$op_name}};

For a given $op_name (for example, 'cop_label', 'sv_flags', etc...)
you get an array ref containing the bytecode number of the op, a
reference to the subroutine used to 'PUT', and the name of the method
used to 'GET'.

=for _private
Add more detail about what $put_sub and $get_meth are and how to use them.

=item @insn_name

 my $op_name = $insn_name[$bytecode_num];

A simple mapping of the bytecode number to the name of the op.
Suitable for using with %insn_data like so:

 my $op_info = $insn_data{$insn_name[$bytecode_num]};

=item @optype

 my $op_type = $optype[$op_type_num];

A simple mapping of the op type number to its type (like 'COP' or 'BINOP').

=item @specialsv_name

 my $sv_name = $specialsv_name[$sv_index];

Certain SV types are considered 'special'. They're represented by
B::SPECIAL and are referred to by a number from the specialsv_list.
This array maps that number back to the name of the SV (like 'Nullsv'
or '&PL_sv_undef').

=back

=head1 AUTHOR

Malcolm Beattie, C<mbeattie@sable.ox.ac.uk>

=cut
EOT

# Close every output handle and treat a failed close as fatal.
close ASMDATA_PM or die "Error closing ASMDATA_PM: $!";
close BYTERUN_H or die "Error closing BYTERUN_H: $!";
close BYTERUN_C or die "Error closing BYTERUN_C: $!";
334
a8a597b2
MB
335__END__
336# First set instruction ord("#") to read comment to end-of-line (sneaky)
337%number 35
fe3a57c4 338comment arg comment_t
a8a597b2
MB
339# Then make ord("\n") into a no-op
340%number 10
341nop none none
1df34986 342
a8a597b2
MB
343# Now for the rest of the ordinary ones, beginning with \0 which is
344# ret so that \0-terminated strings can be read properly as bytecode.
345%number 0
346#
b97332e7
JH
347# The argtype is either a single type or "rightvaluecast/argtype".
348#
92742e37 349#opcode lvalue argtype flags
a8a597b2 350#
92742e37 351ret none none x
059a8bb7 352ldsv bstate->bs_sv svindex
92742e37 353ldop PL_op opindex
059a8bb7 354stsv bstate->bs_sv U32 s
92742e37 355stop PL_op U32 s
059a8bb7
JH
356stpv bstate->bs_pv.xpv_pv U32 x
357ldspecsv bstate->bs_sv U8 x
566ece03 358ldspecsvx bstate->bs_sv U8 x
059a8bb7 359newsv bstate->bs_sv U8 x
566ece03 360newsvx bstate->bs_sv U32 x
92742e37 361newop PL_op U8 x
566ece03 362newopx PL_op U16 x
92742e37
GS
363newopn PL_op U8 x
364newpv none PV
059a8bb7
JH
365pv_cur bstate->bs_pv.xpv_cur STRLEN
366pv_free bstate->bs_pv none x
6e21dc91 367sv_upgrade bstate->bs_sv U8 x
059a8bb7
JH
368sv_refcnt SvREFCNT(bstate->bs_sv) U32
369sv_refcnt_add SvREFCNT(bstate->bs_sv) I32 x
370sv_flags SvFLAGS(bstate->bs_sv) U32
371xrv SvRV(bstate->bs_sv) svindex
372xpv bstate->bs_sv none x
1df34986
AE
373xpv_cur SvCUR(bstate->bs_sv) STRLEN
374xpv_len SvLEN(bstate->bs_sv) STRLEN
375xiv SvIVX(bstate->bs_sv) IV
059a8bb7
JH
376xnv SvNVX(bstate->bs_sv) NV
377xlv_targoff LvTARGOFF(bstate->bs_sv) STRLEN
378xlv_targlen LvTARGLEN(bstate->bs_sv) STRLEN
379xlv_targ LvTARG(bstate->bs_sv) svindex
380xlv_type LvTYPE(bstate->bs_sv) char
381xbm_useful BmUSEFUL(bstate->bs_sv) I32
382xbm_previous BmPREVIOUS(bstate->bs_sv) U16
383xbm_rare BmRARE(bstate->bs_sv) U8
11a7ac70
JH
384xfm_lines FmLINES(bstate->bs_sv) IV
385xio_lines IoLINES(bstate->bs_sv) IV
386xio_page IoPAGE(bstate->bs_sv) IV
387xio_page_len IoPAGE_LEN(bstate->bs_sv) IV
388xio_lines_left IoLINES_LEFT(bstate->bs_sv) IV
1df34986 389xio_top_name IoTOP_NAME(bstate->bs_sv) pvindex
059a8bb7 390xio_top_gv *(SV**)&IoTOP_GV(bstate->bs_sv) svindex
1df34986 391xio_fmt_name IoFMT_NAME(bstate->bs_sv) pvindex
059a8bb7 392xio_fmt_gv *(SV**)&IoFMT_GV(bstate->bs_sv) svindex
1df34986 393xio_bottom_name IoBOTTOM_NAME(bstate->bs_sv) pvindex
059a8bb7
JH
394xio_bottom_gv *(SV**)&IoBOTTOM_GV(bstate->bs_sv) svindex
395xio_subprocess IoSUBPROCESS(bstate->bs_sv) short
396xio_type IoTYPE(bstate->bs_sv) char
397xio_flags IoFLAGS(bstate->bs_sv) char
1df34986 398xcv_xsubany *(SV**)&CvXSUBANY(bstate->bs_sv).any_ptr svindex
059a8bb7
JH
399xcv_stash *(SV**)&CvSTASH(bstate->bs_sv) svindex
400xcv_start CvSTART(bstate->bs_sv) opindex
401xcv_root CvROOT(bstate->bs_sv) opindex
402xcv_gv *(SV**)&CvGV(bstate->bs_sv) svindex
403xcv_file CvFILE(bstate->bs_sv) pvindex
404xcv_depth CvDEPTH(bstate->bs_sv) long
405xcv_padlist *(SV**)&CvPADLIST(bstate->bs_sv) svindex
406xcv_outside *(SV**)&CvOUTSIDE(bstate->bs_sv) svindex
f52873be 407xcv_outside_seq CvOUTSIDE_SEQ(bstate->bs_sv) U32
059a8bb7
JH
408xcv_flags CvFLAGS(bstate->bs_sv) U16
409av_extend bstate->bs_sv SSize_t x
1df34986 410av_pushx bstate->bs_sv svindex x
059a8bb7
JH
411av_push bstate->bs_sv svindex x
412xav_fill AvFILLp(bstate->bs_sv) SSize_t
413xav_max AvMAX(bstate->bs_sv) SSize_t
414xav_flags AvFLAGS(bstate->bs_sv) U8
415xhv_riter HvRITER(bstate->bs_sv) I32
1df34986
AE
416xhv_name HvNAME(bstate->bs_sv) pvindex
417xhv_pmroot *(OP**)&HvPMROOT(bstate->bs_sv) opindex
059a8bb7
JH
418hv_store bstate->bs_sv svindex x
419sv_magic bstate->bs_sv char x
420mg_obj SvMAGIC(bstate->bs_sv)->mg_obj svindex
421mg_private SvMAGIC(bstate->bs_sv)->mg_private U16
422mg_flags SvMAGIC(bstate->bs_sv)->mg_flags U8
1df34986
AE
423mg_name SvMAGIC(bstate->bs_sv) pvcontents x
424mg_namex SvMAGIC(bstate->bs_sv) svindex x
059a8bb7
JH
425xmg_stash *(SV**)&SvSTASH(bstate->bs_sv) svindex
426gv_fetchpv bstate->bs_sv strconst x
566ece03 427gv_fetchpvx bstate->bs_sv strconst x
059a8bb7 428gv_stashpv bstate->bs_sv strconst x
566ece03 429gv_stashpvx bstate->bs_sv strconst x
059a8bb7
JH
430gp_sv GvSV(bstate->bs_sv) svindex
431gp_refcnt GvREFCNT(bstate->bs_sv) U32
432gp_refcnt_add GvREFCNT(bstate->bs_sv) I32 x
433gp_av *(SV**)&GvAV(bstate->bs_sv) svindex
434gp_hv *(SV**)&GvHV(bstate->bs_sv) svindex
435gp_cv *(SV**)&GvCV(bstate->bs_sv) svindex
436gp_file GvFILE(bstate->bs_sv) pvindex
437gp_io *(SV**)&GvIOp(bstate->bs_sv) svindex
438gp_form *(SV**)&GvFORM(bstate->bs_sv) svindex
439gp_cvgen GvCVGEN(bstate->bs_sv) U32
440gp_line GvLINE(bstate->bs_sv) line_t
441gp_share bstate->bs_sv svindex x
442xgv_flags GvFLAGS(bstate->bs_sv) U8
92742e37
GS
443op_next PL_op->op_next opindex
444op_sibling PL_op->op_sibling opindex
445op_ppaddr PL_op->op_ppaddr strconst x
446op_targ PL_op->op_targ PADOFFSET
447op_type PL_op OPCODE x
2814eb74
PJ
448op_opt PL_op->op_opt U8
449op_static PL_op->op_static U8
92742e37
GS
450op_flags PL_op->op_flags U8
451op_private PL_op->op_private U8
452op_first cUNOP->op_first opindex
453op_last cBINOP->op_last opindex
454op_other cLOGOP->op_other opindex
92742e37 455op_pmreplroot cPMOP->op_pmreplroot opindex
92742e37
GS
456op_pmreplstart cPMOP->op_pmreplstart opindex
457op_pmnext *(OP**)&cPMOP->op_pmnext opindex
1df34986 458#ifdef USE_ITHREADS
47682f07 459op_pmstashpv cPMOP pvindex x
b97332e7 460op_pmreplrootpo cPMOP->op_pmreplroot OP*/PADOFFSET
1df34986
AE
461#else
462op_pmstash *(SV**)&cPMOP->op_pmstash svindex
463op_pmreplrootgv *(SV**)&cPMOP->op_pmreplroot svindex
464#endif
92742e37
GS
465pregcomp PL_op pvcontents x
466op_pmflags cPMOP->op_pmflags U16
467op_pmpermflags cPMOP->op_pmpermflags U16
1df34986 468op_pmdynflags cPMOP->op_pmdynflags U8
92742e37 469op_sv cSVOP->op_sv svindex
7934575e 470op_padix cPADOP->op_padix PADOFFSET
92742e37
GS
471op_pv cPVOP->op_pv pvcontents
472op_pv_tr cPVOP->op_pv op_tr_array
473op_redoop cLOOP->op_redoop opindex
474op_nextop cLOOP->op_nextop opindex
475op_lastop cLOOP->op_lastop opindex
059a8bb7 476cop_label cCOP->cop_label pvindex
1df34986 477#ifdef USE_ITHREADS
059a8bb7
JH
478cop_stashpv cCOP pvindex x
479cop_file cCOP pvindex x
1df34986
AE
480#else
481cop_stash cCOP svindex x
482cop_filegv cCOP svindex x
483#endif
92742e37
GS
484cop_seq cCOP->cop_seq U32
485cop_arybase cCOP->cop_arybase I32
1df34986
AE
486cop_line cCOP->cop_line line_t
487cop_io cCOP->cop_io svindex
b295d113 488cop_warnings cCOP->cop_warnings svindex
92742e37
GS
489main_start PL_main_start opindex
490main_root PL_main_root opindex
1df34986 491main_cv *(SV**)&PL_main_cv svindex
92742e37 492curpad PL_curpad svindex x
059a8bb7
JH
493push_begin PL_beginav svindex x
494push_init PL_initav svindex x
495push_end PL_endav svindex x
1df34986
AE
496curstash *(SV**)&PL_curstash svindex
497defstash *(SV**)&PL_defstash svindex
498data none U8 x
0ac16f7c 499incav *(SV**)&GvAV(PL_incgv) svindex
1df34986
AE
500load_glob none svindex x
501#ifdef USE_ITHREADS
502regex_padav *(SV**)&PL_regex_padav svindex
503#endif
504dowarn PL_dowarn U8
505comppad_name *(SV**)&PL_comppad_name svindex
506xgv_stash *(SV**)&GvSTASH(bstate->bs_sv) svindex
507signal bstate->bs_sv strconst x
508# to be removed
509formfeed PL_formfeed svindex