This is a live mirror of the Perl 5 development currently hosted at https://github.com/perl/perl5
regcomp.sym: Make adjacent opcodes for 2 similar regnodes
[perl5.git] / regnodes.h
CommitLineData
37442d52
RGS
1/* -*- buffer-read-only: t -*-
2 !!!!!!! DO NOT EDIT THIS FILE !!!!!!!
eb2624c9 3 This file is built by regen/regcomp.pl from regcomp.sym.
d09b2d29 4 Any changes made here will be lost!
78102347 5 */
d09b2d29 6
6bda09f9
YO
7/* Regops and State definitions */
8
86451f01
KW
9#define REGNODE_MAX 109
10#define REGMATCH_STATE_MAX 149
03363afd 11
ce553cf5
KW
12/* -- For regexec.c to switch on target being utf8 (t8) or not (tb, b='byte');
13 * same with pattern (p8, pb) -- */
14#define with_tp_UTF8ness(op, t_utf8, p_utf8) \
15 (((op) << 2) + (cBOOL(t_utf8) << 1) + cBOOL(p_utf8))
16
17/* The #defines below give both the basic regnode and the expanded version for
18 switching on utf8ness */
19#define END 0 /* 0x00 End of program. */
20#define END_tb_pb 0 /* 0x000 */
21#define END_tb_p8 1 /* 0x001 */
22#define END_t8_pb 2 /* 0x002 */
23#define END_t8_p8 3 /* 0x003 */
24
25#define SUCCEED 1 /* 0x01 Return from a subroutine,
26 basically. */
27#define SUCCEED_tb_pb 4 /* 0x004 */
28#define SUCCEED_tb_p8 5 /* 0x005 */
29#define SUCCEED_t8_pb 6 /* 0x006 */
30#define SUCCEED_t8_p8 7 /* 0x007 */
31
32#define SBOL 2 /* 0x02 Match "" at beginning of
33 line: /^/, /\A/ */
34#define SBOL_tb_pb 8 /* 0x008 */
35#define SBOL_tb_p8 9 /* 0x009 */
36#define SBOL_t8_pb 10 /* 0x00a */
37#define SBOL_t8_p8 11 /* 0x00b */
38
39#define BOL 2 /* 0x02 Match "" at beginning of
40 line: /^/, /\A/ */
41#define BOL_tb_pb 8 /* 0x008 */
42#define BOL_tb_p8 9 /* 0x009 */
43#define BOL_t8_pb 10 /* 0x00a */
44#define BOL_t8_p8 11 /* 0x00b */
45
46#define MBOL 3 /* 0x03 Same, assuming multiline:
47 /^/m */
48#define MBOL_tb_pb 12 /* 0x00c */
49#define MBOL_tb_p8 13 /* 0x00d */
50#define MBOL_t8_pb 14 /* 0x00e */
51#define MBOL_t8_p8 15 /* 0x00f */
52
53#define SEOL 4 /* 0x04 Match "" at end of line:
54 /$/ */
55#define SEOL_tb_pb 16 /* 0x010 */
56#define SEOL_tb_p8 17 /* 0x011 */
57#define SEOL_t8_pb 18 /* 0x012 */
58#define SEOL_t8_p8 19 /* 0x013 */
59
60#define EOL 4 /* 0x04 Match "" at end of line:
61 /$/ */
62#define EOL_tb_pb 16 /* 0x010 */
63#define EOL_tb_p8 17 /* 0x011 */
64#define EOL_t8_pb 18 /* 0x012 */
65#define EOL_t8_p8 19 /* 0x013 */
66
67#define MEOL 5 /* 0x05 Same, assuming multiline:
68 /$/m */
69#define MEOL_tb_pb 20 /* 0x014 */
70#define MEOL_tb_p8 21 /* 0x015 */
71#define MEOL_t8_pb 22 /* 0x016 */
72#define MEOL_t8_p8 23 /* 0x017 */
73
74#define EOS 6 /* 0x06 Match "" at end of string:
75 /\z/ */
76#define EOS_tb_pb 24 /* 0x018 */
77#define EOS_tb_p8 25 /* 0x019 */
78#define EOS_t8_pb 26 /* 0x01a */
79#define EOS_t8_p8 27 /* 0x01b */
80
81#define GPOS 7 /* 0x07 Matches where last m//g
82 left off. */
83#define GPOS_tb_pb 28 /* 0x01c */
84#define GPOS_tb_p8 29 /* 0x01d */
85#define GPOS_t8_pb 30 /* 0x01e */
86#define GPOS_t8_p8 31 /* 0x01f */
87
88#define BOUND 8 /* 0x08 Like BOUNDA for non-utf8,
89 otherwise like BOUNDU */
90#define BOUND_tb_pb 32 /* 0x020 */
91#define BOUND_tb_p8 33 /* 0x021 */
92#define BOUND_t8_pb 34 /* 0x022 */
93#define BOUND_t8_p8 35 /* 0x023 */
94
95#define BOUNDL 9 /* 0x09 Like BOUND/BOUNDU, but \w
96 and \W are defined by current
97 locale */
98#define BOUNDL_tb_pb 36 /* 0x024 */
99#define BOUNDL_tb_p8 37 /* 0x025 */
100#define BOUNDL_t8_pb 38 /* 0x026 */
101#define BOUNDL_t8_p8 39 /* 0x027 */
102
103#define BOUNDU 10 /* 0x0a Match "" at any boundary of
104 a given type using /u rules. */
105#define BOUNDU_tb_pb 40 /* 0x028 */
106#define BOUNDU_tb_p8 41 /* 0x029 */
107#define BOUNDU_t8_pb 42 /* 0x02a */
108#define BOUNDU_t8_p8 43 /* 0x02b */
109
110#define BOUNDA 11 /* 0x0b Match "" at any boundary
111 between \w\W or \W\w, where \w
112 is [_a-zA-Z0-9] */
113#define BOUNDA_tb_pb 44 /* 0x02c */
114#define BOUNDA_tb_p8 45 /* 0x02d */
115#define BOUNDA_t8_pb 46 /* 0x02e */
116#define BOUNDA_t8_p8 47 /* 0x02f */
117
118#define NBOUND 12 /* 0x0c Like NBOUNDA for non-utf8,
119 otherwise like BOUNDU */
120#define NBOUND_tb_pb 48 /* 0x030 */
121#define NBOUND_tb_p8 49 /* 0x031 */
122#define NBOUND_t8_pb 50 /* 0x032 */
123#define NBOUND_t8_p8 51 /* 0x033 */
124
125#define NBOUNDL 13 /* 0x0d Like NBOUND/NBOUNDU, but \w
126 and \W are defined by current
127 locale */
128#define NBOUNDL_tb_pb 52 /* 0x034 */
129#define NBOUNDL_tb_p8 53 /* 0x035 */
130#define NBOUNDL_t8_pb 54 /* 0x036 */
131#define NBOUNDL_t8_p8 55 /* 0x037 */
132
133#define NBOUNDU 14 /* 0x0e Match "" at any
134 non-boundary of a given type
135 using using /u rules. */
136#define NBOUNDU_tb_pb 56 /* 0x038 */
137#define NBOUNDU_tb_p8 57 /* 0x039 */
138#define NBOUNDU_t8_pb 58 /* 0x03a */
139#define NBOUNDU_t8_p8 59 /* 0x03b */
140
141#define NBOUNDA 15 /* 0x0f Match "" betweeen any \w\w
142 or \W\W, where \w is
143 [_a-zA-Z0-9] */
144#define NBOUNDA_tb_pb 60 /* 0x03c */
145#define NBOUNDA_tb_p8 61 /* 0x03d */
146#define NBOUNDA_t8_pb 62 /* 0x03e */
147#define NBOUNDA_t8_p8 63 /* 0x03f */
148
149#define REG_ANY 16 /* 0x10 Match any one character
150 (except newline). */
151#define REG_ANY_tb_pb 64 /* 0x040 */
152#define REG_ANY_tb_p8 65 /* 0x041 */
153#define REG_ANY_t8_pb 66 /* 0x042 */
154#define REG_ANY_t8_p8 67 /* 0x043 */
155
156#define SANY 17 /* 0x11 Match any one character. */
157#define SANY_tb_pb 68 /* 0x044 */
158#define SANY_tb_p8 69 /* 0x045 */
159#define SANY_t8_pb 70 /* 0x046 */
160#define SANY_t8_p8 71 /* 0x047 */
161
162#define ANYOF 18 /* 0x12 Match character in (or not
163 in) this class, single char
164 match only */
165#define ANYOF_tb_pb 72 /* 0x048 */
166#define ANYOF_tb_p8 73 /* 0x049 */
167#define ANYOF_t8_pb 74 /* 0x04a */
168#define ANYOF_t8_p8 75 /* 0x04b */
169
170#define ANYOFD 19 /* 0x13 Like ANYOF, but /d is in
171 effect */
172#define ANYOFD_tb_pb 76 /* 0x04c */
173#define ANYOFD_tb_p8 77 /* 0x04d */
174#define ANYOFD_t8_pb 78 /* 0x04e */
175#define ANYOFD_t8_p8 79 /* 0x04f */
176
177#define ANYOFL 20 /* 0x14 Like ANYOF, but /l is in
178 effect */
179#define ANYOFL_tb_pb 80 /* 0x050 */
180#define ANYOFL_tb_p8 81 /* 0x051 */
181#define ANYOFL_t8_pb 82 /* 0x052 */
182#define ANYOFL_t8_p8 83 /* 0x053 */
183
184#define ANYOFPOSIXL 21 /* 0x15 Like ANYOFL, but matches
185 [[:posix:]] classes */
186#define ANYOFPOSIXL_tb_pb 84 /* 0x054 */
187#define ANYOFPOSIXL_tb_p8 85 /* 0x055 */
188#define ANYOFPOSIXL_t8_pb 86 /* 0x056 */
189#define ANYOFPOSIXL_t8_p8 87 /* 0x057 */
190
191#define ANYOFH 22 /* 0x16 Like ANYOF, but only has
192 "High" matches, none in the
193 bitmap; the flags field contains
194 the lowest matchable UTF-8 start
195 byte */
196#define ANYOFH_tb_pb 88 /* 0x058 */
197#define ANYOFH_tb_p8 89 /* 0x059 */
198#define ANYOFH_t8_pb 90 /* 0x05a */
199#define ANYOFH_t8_p8 91 /* 0x05b */
200
201#define ANYOFHb 23 /* 0x17 Like ANYOFH, but all
202 matches share the same UTF-8
203 start byte, given in the flags
204 field */
205#define ANYOFHb_tb_pb 92 /* 0x05c */
206#define ANYOFHb_tb_p8 93 /* 0x05d */
207#define ANYOFHb_t8_pb 94 /* 0x05e */
208#define ANYOFHb_t8_p8 95 /* 0x05f */
209
210#define ANYOFHr 24 /* 0x18 Like ANYOFH, but the flags
211 field contains packed bounds for
212 all matchable UTF-8 start bytes.
213 */
214#define ANYOFHr_tb_pb 96 /* 0x060 */
215#define ANYOFHr_tb_p8 97 /* 0x061 */
216#define ANYOFHr_t8_pb 98 /* 0x062 */
217#define ANYOFHr_t8_p8 99 /* 0x063 */
218
219#define ANYOFHs 25 /* 0x19 Like ANYOFHb, but has a
220 string field that gives the
221 leading matchable UTF-8 bytes;
222 flags field is len */
223#define ANYOFHs_tb_pb 100 /* 0x064 */
224#define ANYOFHs_tb_p8 101 /* 0x065 */
225#define ANYOFHs_t8_pb 102 /* 0x066 */
226#define ANYOFHs_t8_p8 103 /* 0x067 */
227
228#define ANYOFR 26 /* 0x1a Matches any character in
229 the range given by its packed
230 args: upper 12 bits is the max
231 delta from the base lower 20;
232 the flags field contains the
233 lowest matchable UTF-8 start
234 byte */
235#define ANYOFR_tb_pb 104 /* 0x068 */
236#define ANYOFR_tb_p8 105 /* 0x069 */
237#define ANYOFR_t8_pb 106 /* 0x06a */
238#define ANYOFR_t8_p8 107 /* 0x06b */
239
240#define ANYOFRb 27 /* 0x1b Like ANYOFR, but all
241 matches share the same UTF-8
242 start byte, given in the flags
243 field */
244#define ANYOFRb_tb_pb 108 /* 0x06c */
245#define ANYOFRb_tb_p8 109 /* 0x06d */
246#define ANYOFRb_t8_pb 110 /* 0x06e */
247#define ANYOFRb_t8_p8 111 /* 0x06f */
248
249#define ANYOFM 28 /* 0x1c Like ANYOF, but matches an
250 invariant byte as determined by
251 the mask and arg */
252#define ANYOFM_tb_pb 112 /* 0x070 */
253#define ANYOFM_tb_p8 113 /* 0x071 */
254#define ANYOFM_t8_pb 114 /* 0x072 */
255#define ANYOFM_t8_p8 115 /* 0x073 */
256
257#define NANYOFM 29 /* 0x1d complement of ANYOFM */
258#define NANYOFM_tb_pb 116 /* 0x074 */
259#define NANYOFM_tb_p8 117 /* 0x075 */
260#define NANYOFM_t8_pb 118 /* 0x076 */
261#define NANYOFM_t8_p8 119 /* 0x077 */
262
263#define POSIXD 30 /* 0x1e Some [[:class:]] under /d;
264 the FLAGS field gives which one
265 */
266#define POSIXD_tb_pb 120 /* 0x078 */
267#define POSIXD_tb_p8 121 /* 0x079 */
268#define POSIXD_t8_pb 122 /* 0x07a */
269#define POSIXD_t8_p8 123 /* 0x07b */
270
271#define POSIXL 31 /* 0x1f Some [[:class:]] under /l;
272 the FLAGS field gives which one
273 */
274#define POSIXL_tb_pb 124 /* 0x07c */
275#define POSIXL_tb_p8 125 /* 0x07d */
276#define POSIXL_t8_pb 126 /* 0x07e */
277#define POSIXL_t8_p8 127 /* 0x07f */
278
279#define POSIXU 32 /* 0x20 Some [[:class:]] under /u;
280 the FLAGS field gives which one
281 */
282#define POSIXU_tb_pb 128 /* 0x080 */
283#define POSIXU_tb_p8 129 /* 0x081 */
284#define POSIXU_t8_pb 130 /* 0x082 */
285#define POSIXU_t8_p8 131 /* 0x083 */
286
287#define POSIXA 33 /* 0x21 Some [[:class:]] under /a;
288 the FLAGS field gives which one
289 */
290#define POSIXA_tb_pb 132 /* 0x084 */
291#define POSIXA_tb_p8 133 /* 0x085 */
292#define POSIXA_t8_pb 134 /* 0x086 */
293#define POSIXA_t8_p8 135 /* 0x087 */
294
295#define NPOSIXD 34 /* 0x22 complement of POSIXD,
296 [[:^class:]] */
297#define NPOSIXD_tb_pb 136 /* 0x088 */
298#define NPOSIXD_tb_p8 137 /* 0x089 */
299#define NPOSIXD_t8_pb 138 /* 0x08a */
300#define NPOSIXD_t8_p8 139 /* 0x08b */
301
302#define NPOSIXL 35 /* 0x23 complement of POSIXL,
303 [[:^class:]] */
304#define NPOSIXL_tb_pb 140 /* 0x08c */
305#define NPOSIXL_tb_p8 141 /* 0x08d */
306#define NPOSIXL_t8_pb 142 /* 0x08e */
307#define NPOSIXL_t8_p8 143 /* 0x08f */
308
309#define NPOSIXU 36 /* 0x24 complement of POSIXU,
310 [[:^class:]] */
311#define NPOSIXU_tb_pb 144 /* 0x090 */
312#define NPOSIXU_tb_p8 145 /* 0x091 */
313#define NPOSIXU_t8_pb 146 /* 0x092 */
314#define NPOSIXU_t8_p8 147 /* 0x093 */
315
316#define NPOSIXA 37 /* 0x25 complement of POSIXA,
317 [[:^class:]] */
318#define NPOSIXA_tb_pb 148 /* 0x094 */
319#define NPOSIXA_tb_p8 149 /* 0x095 */
320#define NPOSIXA_t8_pb 150 /* 0x096 */
321#define NPOSIXA_t8_p8 151 /* 0x097 */
322
323#define CLUMP 38 /* 0x26 Match any extended grapheme
324 cluster sequence */
325#define CLUMP_tb_pb 152 /* 0x098 */
326#define CLUMP_tb_p8 153 /* 0x099 */
327#define CLUMP_t8_pb 154 /* 0x09a */
328#define CLUMP_t8_p8 155 /* 0x09b */
329
330#define BRANCH 39 /* 0x27 Match this alternative, or
331 the next... */
332#define BRANCH_tb_pb 156 /* 0x09c */
333#define BRANCH_tb_p8 157 /* 0x09d */
334#define BRANCH_t8_pb 158 /* 0x09e */
335#define BRANCH_t8_p8 159 /* 0x09f */
336
337#define EXACT 40 /* 0x28 Match this string (flags
338 field is the length). */
339#define EXACT_tb_pb 160 /* 0x0a0 */
340#define EXACT_tb_p8 161 /* 0x0a1 */
341#define EXACT_t8_pb 162 /* 0x0a2 */
342#define EXACT_t8_p8 163 /* 0x0a3 */
343
344#define LEXACT 41 /* 0x29 Match this long string
345 (preceded by length; flags
346 unused). */
347#define LEXACT_tb_pb 164 /* 0x0a4 */
348#define LEXACT_tb_p8 165 /* 0x0a5 */
349#define LEXACT_t8_pb 166 /* 0x0a6 */
350#define LEXACT_t8_p8 167 /* 0x0a7 */
351
352#define EXACTL 42 /* 0x2a Like EXACT, but /l is in
353 effect (used so locale-related
354 warnings can be checked for) */
355#define EXACTL_tb_pb 168 /* 0x0a8 */
356#define EXACTL_tb_p8 169 /* 0x0a9 */
357#define EXACTL_t8_pb 170 /* 0x0aa */
358#define EXACTL_t8_p8 171 /* 0x0ab */
359
360#define EXACTF 43 /* 0x2b Like EXACT, but match using
361 /id rules; (string not UTF-8,
362 ASCII folded; non-ASCII not) */
363#define EXACTF_tb_pb 172 /* 0x0ac */
364#define EXACTF_tb_p8 173 /* 0x0ad */
365#define EXACTF_t8_pb 174 /* 0x0ae */
366#define EXACTF_t8_p8 175 /* 0x0af */
367
368#define EXACTFL 44 /* 0x2c Like EXACT, but match using
369 /il rules; (string not likely to
370 be folded) */
371#define EXACTFL_tb_pb 176 /* 0x0b0 */
372#define EXACTFL_tb_p8 177 /* 0x0b1 */
373#define EXACTFL_t8_pb 178 /* 0x0b2 */
374#define EXACTFL_t8_p8 179 /* 0x0b3 */
375
376#define EXACTFU 45 /* 0x2d Like EXACT, but match using
377 /iu rules; (string folded) */
378#define EXACTFU_tb_pb 180 /* 0x0b4 */
379#define EXACTFU_tb_p8 181 /* 0x0b5 */
380#define EXACTFU_t8_pb 182 /* 0x0b6 */
381#define EXACTFU_t8_p8 183 /* 0x0b7 */
382
383#define EXACTFAA 46 /* 0x2e Like EXACT, but match using
384 /iaa rules; (string folded
5f162c35
KW
385 except MICRO in non-UTF8
386 patterns; doesn't contain SHARP
387 S unless UTF-8; folded length <=
ce553cf5
KW
388 unfolded) */
389#define EXACTFAA_tb_pb 184 /* 0x0b8 */
390#define EXACTFAA_tb_p8 185 /* 0x0b9 */
391#define EXACTFAA_t8_pb 186 /* 0x0ba */
392#define EXACTFAA_t8_p8 187 /* 0x0bb */
393
f97d9711
KW
394#define EXACTFAA_NO_TRIE 47 /* 0x2f Like EXACTFAA, (string not
395 UTF-8, folded except: MICRO,
396 SHARP S; folded length <=
397 unfolded, not currently
398 trie-able) */
399#define EXACTFAA_NO_TRIE_tb_pb 188 /* 0x0bc */
400#define EXACTFAA_NO_TRIE_tb_p8 189 /* 0x0bd */
401#define EXACTFAA_NO_TRIE_t8_pb 190 /* 0x0be */
402#define EXACTFAA_NO_TRIE_t8_p8 191 /* 0x0bf */
403
404#define EXACTFUP 48 /* 0x30 Like EXACT, but match using
ce553cf5 405 /iu rules; (string not UTF-8,
5f162c35
KW
406 folded except MICRO: hence
407 Problematic) */
f97d9711
KW
408#define EXACTFUP_tb_pb 192 /* 0x0c0 */
409#define EXACTFUP_tb_p8 193 /* 0x0c1 */
410#define EXACTFUP_t8_pb 194 /* 0x0c2 */
411#define EXACTFUP_t8_p8 195 /* 0x0c3 */
ce553cf5 412
f97d9711 413#define EXACTFLU8 49 /* 0x31 Like EXACTFU, but use /il,
ce553cf5
KW
414 UTF-8, (string is folded, and
415 everything in it is above 255 */
f97d9711
KW
416#define EXACTFLU8_tb_pb 196 /* 0x0c4 */
417#define EXACTFLU8_tb_p8 197 /* 0x0c5 */
418#define EXACTFLU8_t8_pb 198 /* 0x0c6 */
419#define EXACTFLU8_t8_p8 199 /* 0x0c7 */
ce553cf5
KW
420
421#define EXACT_REQ8 50 /* 0x32 Like EXACT, but only UTF-8
422 encoded targets can match */
423#define EXACT_REQ8_tb_pb 200 /* 0x0c8 */
424#define EXACT_REQ8_tb_p8 201 /* 0x0c9 */
425#define EXACT_REQ8_t8_pb 202 /* 0x0ca */
426#define EXACT_REQ8_t8_p8 203 /* 0x0cb */
427
428#define LEXACT_REQ8 51 /* 0x33 Like LEXACT, but only UTF-8
429 encoded targets can match */
430#define LEXACT_REQ8_tb_pb 204 /* 0x0cc */
431#define LEXACT_REQ8_tb_p8 205 /* 0x0cd */
432#define LEXACT_REQ8_t8_pb 206 /* 0x0ce */
433#define LEXACT_REQ8_t8_p8 207 /* 0x0cf */
434
435#define EXACTFU_REQ8 52 /* 0x34 Like EXACTFU, but only
436 UTF-8 encoded targets can match
437 */
438#define EXACTFU_REQ8_tb_pb 208 /* 0x0d0 */
439#define EXACTFU_REQ8_tb_p8 209 /* 0x0d1 */
440#define EXACTFU_REQ8_t8_pb 210 /* 0x0d2 */
441#define EXACTFU_REQ8_t8_p8 211 /* 0x0d3 */
442
443#define EXACTFU_S_EDGE 53 /* 0x35 /di rules, but nothing in
444 it precludes /ui, except begins
445 and/or ends with [Ss]; (string
446 not UTF-8; compile-time only) */
447#define EXACTFU_S_EDGE_tb_pb 212 /* 0x0d4 */
448#define EXACTFU_S_EDGE_tb_p8 213 /* 0x0d5 */
449#define EXACTFU_S_EDGE_t8_pb 214 /* 0x0d6 */
450#define EXACTFU_S_EDGE_t8_p8 215 /* 0x0d7 */
451
452#define LNBREAK 54 /* 0x36 generic newline pattern */
453#define LNBREAK_tb_pb 216 /* 0x0d8 */
454#define LNBREAK_tb_p8 217 /* 0x0d9 */
455#define LNBREAK_t8_pb 218 /* 0x0da */
456#define LNBREAK_t8_p8 219 /* 0x0db */
457
458#define TRIE 55 /* 0x37 Match many EXACT(F[ALU]?)?
459 at once. flags==type */
460#define TRIE_tb_pb 220 /* 0x0dc */
461#define TRIE_tb_p8 221 /* 0x0dd */
462#define TRIE_t8_pb 222 /* 0x0de */
463#define TRIE_t8_p8 223 /* 0x0df */
464
465#define TRIEC 56 /* 0x38 Same as TRIE, but with
466 embedded charclass data */
467#define TRIEC_tb_pb 224 /* 0x0e0 */
468#define TRIEC_tb_p8 225 /* 0x0e1 */
469#define TRIEC_t8_pb 226 /* 0x0e2 */
470#define TRIEC_t8_p8 227 /* 0x0e3 */
471
472#define AHOCORASICK 57 /* 0x39 Aho Corasick stclass.
473 flags==type */
474#define AHOCORASICK_tb_pb 228 /* 0x0e4 */
475#define AHOCORASICK_tb_p8 229 /* 0x0e5 */
476#define AHOCORASICK_t8_pb 230 /* 0x0e6 */
477#define AHOCORASICK_t8_p8 231 /* 0x0e7 */
478
479#define AHOCORASICKC 58 /* 0x3a Same as AHOCORASICK, but
480 with embedded charclass data */
481#define AHOCORASICKC_tb_pb 232 /* 0x0e8 */
482#define AHOCORASICKC_tb_p8 233 /* 0x0e9 */
483#define AHOCORASICKC_t8_pb 234 /* 0x0ea */
484#define AHOCORASICKC_t8_p8 235 /* 0x0eb */
485
486#define NOTHING 59 /* 0x3b Match empty string. */
487#define NOTHING_tb_pb 236 /* 0x0ec */
488#define NOTHING_tb_p8 237 /* 0x0ed */
489#define NOTHING_t8_pb 238 /* 0x0ee */
490#define NOTHING_t8_p8 239 /* 0x0ef */
491
492#define TAIL 60 /* 0x3c Match empty string. Can
493 jump here from outside. */
494#define TAIL_tb_pb 240 /* 0x0f0 */
495#define TAIL_tb_p8 241 /* 0x0f1 */
496#define TAIL_t8_pb 242 /* 0x0f2 */
497#define TAIL_t8_p8 243 /* 0x0f3 */
498
499#define STAR 61 /* 0x3d Match this (simple) thing 0
500 or more times. */
501#define STAR_tb_pb 244 /* 0x0f4 */
502#define STAR_tb_p8 245 /* 0x0f5 */
503#define STAR_t8_pb 246 /* 0x0f6 */
504#define STAR_t8_p8 247 /* 0x0f7 */
505
506#define PLUS 62 /* 0x3e Match this (simple) thing 1
507 or more times. */
508#define PLUS_tb_pb 248 /* 0x0f8 */
509#define PLUS_tb_p8 249 /* 0x0f9 */
510#define PLUS_t8_pb 250 /* 0x0fa */
511#define PLUS_t8_p8 251 /* 0x0fb */
512
513#define CURLY 63 /* 0x3f Match this simple thing
514 {n,m} times. */
515#define CURLY_tb_pb 252 /* 0x0fc */
516#define CURLY_tb_p8 253 /* 0x0fd */
517#define CURLY_t8_pb 254 /* 0x0fe */
518#define CURLY_t8_p8 255 /* 0x0ff */
519
520#define CURLYN 64 /* 0x40 Capture next-after-this
521 simple thing */
522#define CURLYN_tb_pb 256 /* 0x100 */
523#define CURLYN_tb_p8 257 /* 0x101 */
524#define CURLYN_t8_pb 258 /* 0x102 */
525#define CURLYN_t8_p8 259 /* 0x103 */
526
527#define CURLYM 65 /* 0x41 Capture this medium-complex
528 thing {n,m} times. */
529#define CURLYM_tb_pb 260 /* 0x104 */
530#define CURLYM_tb_p8 261 /* 0x105 */
531#define CURLYM_t8_pb 262 /* 0x106 */
532#define CURLYM_t8_p8 263 /* 0x107 */
533
534#define CURLYX 66 /* 0x42 Match this complex thing
535 {n,m} times. */
536#define CURLYX_tb_pb 264 /* 0x108 */
537#define CURLYX_tb_p8 265 /* 0x109 */
538#define CURLYX_t8_pb 266 /* 0x10a */
539#define CURLYX_t8_p8 267 /* 0x10b */
540
541#define WHILEM 67 /* 0x43 Do curly processing and see
542 if rest matches. */
543#define WHILEM_tb_pb 268 /* 0x10c */
544#define WHILEM_tb_p8 269 /* 0x10d */
545#define WHILEM_t8_pb 270 /* 0x10e */
546#define WHILEM_t8_p8 271 /* 0x10f */
547
548#define OPEN 68 /* 0x44 Mark this point in input as
549 start of #n. */
550#define OPEN_tb_pb 272 /* 0x110 */
551#define OPEN_tb_p8 273 /* 0x111 */
552#define OPEN_t8_pb 274 /* 0x112 */
553#define OPEN_t8_p8 275 /* 0x113 */
554
555#define CLOSE 69 /* 0x45 Close corresponding OPEN of
556 #n. */
557#define CLOSE_tb_pb 276 /* 0x114 */
558#define CLOSE_tb_p8 277 /* 0x115 */
559#define CLOSE_t8_pb 278 /* 0x116 */
560#define CLOSE_t8_p8 279 /* 0x117 */
561
562#define SROPEN 70 /* 0x46 Same as OPEN, but for
563 script run */
564#define SROPEN_tb_pb 280 /* 0x118 */
565#define SROPEN_tb_p8 281 /* 0x119 */
566#define SROPEN_t8_pb 282 /* 0x11a */
567#define SROPEN_t8_p8 283 /* 0x11b */
568
569#define SRCLOSE 71 /* 0x47 Close preceding SROPEN */
570#define SRCLOSE_tb_pb 284 /* 0x11c */
571#define SRCLOSE_tb_p8 285 /* 0x11d */
572#define SRCLOSE_t8_pb 286 /* 0x11e */
573#define SRCLOSE_t8_p8 287 /* 0x11f */
574
575#define REF 72 /* 0x48 Match some already matched
576 string */
577#define REF_tb_pb 288 /* 0x120 */
578#define REF_tb_p8 289 /* 0x121 */
579#define REF_t8_pb 290 /* 0x122 */
580#define REF_t8_p8 291 /* 0x123 */
581
582#define REFF 73 /* 0x49 Match already matched
583 string, using /di rules. */
584#define REFF_tb_pb 292 /* 0x124 */
585#define REFF_tb_p8 293 /* 0x125 */
586#define REFF_t8_pb 294 /* 0x126 */
587#define REFF_t8_p8 295 /* 0x127 */
588
589#define REFFL 74 /* 0x4a Match already matched
590 string, using /li rules. */
591#define REFFL_tb_pb 296 /* 0x128 */
592#define REFFL_tb_p8 297 /* 0x129 */
593#define REFFL_t8_pb 298 /* 0x12a */
594#define REFFL_t8_p8 299 /* 0x12b */
595
596#define REFFU 75 /* 0x4b Match already matched
597 string, usng /ui. */
598#define REFFU_tb_pb 300 /* 0x12c */
599#define REFFU_tb_p8 301 /* 0x12d */
600#define REFFU_t8_pb 302 /* 0x12e */
601#define REFFU_t8_p8 303 /* 0x12f */
602
603#define REFFA 76 /* 0x4c Match already matched
604 string, using /aai rules. */
605#define REFFA_tb_pb 304 /* 0x130 */
606#define REFFA_tb_p8 305 /* 0x131 */
607#define REFFA_t8_pb 306 /* 0x132 */
608#define REFFA_t8_p8 307 /* 0x133 */
609
610#define REFN 77 /* 0x4d Match some already matched
611 string */
612#define REFN_tb_pb 308 /* 0x134 */
613#define REFN_tb_p8 309 /* 0x135 */
614#define REFN_t8_pb 310 /* 0x136 */
615#define REFN_t8_p8 311 /* 0x137 */
616
617#define REFFN 78 /* 0x4e Match already matched
618 string, using /di rules. */
619#define REFFN_tb_pb 312 /* 0x138 */
620#define REFFN_tb_p8 313 /* 0x139 */
621#define REFFN_t8_pb 314 /* 0x13a */
622#define REFFN_t8_p8 315 /* 0x13b */
623
624#define REFFLN 79 /* 0x4f Match already matched
625 string, using /li rules. */
626#define REFFLN_tb_pb 316 /* 0x13c */
627#define REFFLN_tb_p8 317 /* 0x13d */
628#define REFFLN_t8_pb 318 /* 0x13e */
629#define REFFLN_t8_p8 319 /* 0x13f */
630
631#define REFFUN 80 /* 0x50 Match already matched
632 string, using /ui rules. */
633#define REFFUN_tb_pb 320 /* 0x140 */
634#define REFFUN_tb_p8 321 /* 0x141 */
635#define REFFUN_t8_pb 322 /* 0x142 */
636#define REFFUN_t8_p8 323 /* 0x143 */
637
638#define REFFAN 81 /* 0x51 Match already matched
639 string, using /aai rules. */
640#define REFFAN_tb_pb 324 /* 0x144 */
641#define REFFAN_tb_p8 325 /* 0x145 */
642#define REFFAN_t8_pb 326 /* 0x146 */
643#define REFFAN_t8_p8 327 /* 0x147 */
644
645#define LONGJMP 82 /* 0x52 Jump far away. */
646#define LONGJMP_tb_pb 328 /* 0x148 */
647#define LONGJMP_tb_p8 329 /* 0x149 */
648#define LONGJMP_t8_pb 330 /* 0x14a */
649#define LONGJMP_t8_p8 331 /* 0x14b */
650
651#define BRANCHJ 83 /* 0x53 BRANCH with long offset. */
652#define BRANCHJ_tb_pb 332 /* 0x14c */
653#define BRANCHJ_tb_p8 333 /* 0x14d */
654#define BRANCHJ_t8_pb 334 /* 0x14e */
655#define BRANCHJ_t8_p8 335 /* 0x14f */
656
657#define IFMATCH 84 /* 0x54 Succeeds if the following
658 matches; non-zero flags "f",
659 next_off "o" means lookbehind
660 assertion starting "f..(f-o)"
661 characters before current */
662#define IFMATCH_tb_pb 336 /* 0x150 */
663#define IFMATCH_tb_p8 337 /* 0x151 */
664#define IFMATCH_t8_pb 338 /* 0x152 */
665#define IFMATCH_t8_p8 339 /* 0x153 */
666
667#define UNLESSM 85 /* 0x55 Fails if the following
668 matches; non-zero flags "f",
669 next_off "o" means lookbehind
670 assertion starting "f..(f-o)"
671 characters before current */
672#define UNLESSM_tb_pb 340 /* 0x154 */
673#define UNLESSM_tb_p8 341 /* 0x155 */
674#define UNLESSM_t8_pb 342 /* 0x156 */
675#define UNLESSM_t8_p8 343 /* 0x157 */
676
677#define SUSPEND 86 /* 0x56 "Independent" sub-RE. */
678#define SUSPEND_tb_pb 344 /* 0x158 */
679#define SUSPEND_tb_p8 345 /* 0x159 */
680#define SUSPEND_t8_pb 346 /* 0x15a */
681#define SUSPEND_t8_p8 347 /* 0x15b */
682
683#define IFTHEN 87 /* 0x57 Switch, should be preceded
684 by switcher. */
685#define IFTHEN_tb_pb 348 /* 0x15c */
686#define IFTHEN_tb_p8 349 /* 0x15d */
687#define IFTHEN_t8_pb 350 /* 0x15e */
688#define IFTHEN_t8_p8 351 /* 0x15f */
689
690#define GROUPP 88 /* 0x58 Whether the group matched.
691 */
692#define GROUPP_tb_pb 352 /* 0x160 */
693#define GROUPP_tb_p8 353 /* 0x161 */
694#define GROUPP_t8_pb 354 /* 0x162 */
695#define GROUPP_t8_p8 355 /* 0x163 */
696
697#define EVAL 89 /* 0x59 Execute some Perl code. */
698#define EVAL_tb_pb 356 /* 0x164 */
699#define EVAL_tb_p8 357 /* 0x165 */
700#define EVAL_t8_pb 358 /* 0x166 */
701#define EVAL_t8_p8 359 /* 0x167 */
702
703#define MINMOD 90 /* 0x5a Next operator is not
704 greedy. */
705#define MINMOD_tb_pb 360 /* 0x168 */
706#define MINMOD_tb_p8 361 /* 0x169 */
707#define MINMOD_t8_pb 362 /* 0x16a */
708#define MINMOD_t8_p8 363 /* 0x16b */
709
710#define LOGICAL 91 /* 0x5b Next opcode should set the
711 flag only. */
712#define LOGICAL_tb_pb 364 /* 0x16c */
713#define LOGICAL_tb_p8 365 /* 0x16d */
714#define LOGICAL_t8_pb 366 /* 0x16e */
715#define LOGICAL_t8_p8 367 /* 0x16f */
716
717#define RENUM 92 /* 0x5c Group with independently
718 numbered parens. */
719#define RENUM_tb_pb 368 /* 0x170 */
720#define RENUM_tb_p8 369 /* 0x171 */
721#define RENUM_t8_pb 370 /* 0x172 */
722#define RENUM_t8_p8 371 /* 0x173 */
723
724#define GOSUB 93 /* 0x5d recurse to paren arg1 at
725 (signed) ofs arg2 */
726#define GOSUB_tb_pb 372 /* 0x174 */
727#define GOSUB_tb_p8 373 /* 0x175 */
728#define GOSUB_t8_pb 374 /* 0x176 */
729#define GOSUB_t8_p8 375 /* 0x177 */
730
731#define GROUPPN 94 /* 0x5e Whether the group matched.
732 */
733#define GROUPPN_tb_pb 376 /* 0x178 */
734#define GROUPPN_tb_p8 377 /* 0x179 */
735#define GROUPPN_t8_pb 378 /* 0x17a */
736#define GROUPPN_t8_p8 379 /* 0x17b */
737
738#define INSUBP 95 /* 0x5f Whether we are in a
739 specific recurse. */
740#define INSUBP_tb_pb 380 /* 0x17c */
741#define INSUBP_tb_p8 381 /* 0x17d */
742#define INSUBP_t8_pb 382 /* 0x17e */
743#define INSUBP_t8_p8 383 /* 0x17f */
744
745#define DEFINEP 96 /* 0x60 Never execute directly. */
746#define DEFINEP_tb_pb 384 /* 0x180 */
747#define DEFINEP_tb_p8 385 /* 0x181 */
748#define DEFINEP_t8_pb 386 /* 0x182 */
749#define DEFINEP_t8_p8 387 /* 0x183 */
750
751#define ENDLIKE 97 /* 0x61 Used only for the type
752 field of verbs */
753#define ENDLIKE_tb_pb 388 /* 0x184 */
754#define ENDLIKE_tb_p8 389 /* 0x185 */
755#define ENDLIKE_t8_pb 390 /* 0x186 */
756#define ENDLIKE_t8_p8 391 /* 0x187 */
757
758#define OPFAIL 98 /* 0x62 Same as (?!), but with verb
759 arg */
760#define OPFAIL_tb_pb 392 /* 0x188 */
761#define OPFAIL_tb_p8 393 /* 0x189 */
762#define OPFAIL_t8_pb 394 /* 0x18a */
763#define OPFAIL_t8_p8 395 /* 0x18b */
764
765#define ACCEPT 99 /* 0x63 Accepts the current matched
766 string, with verbar */
767#define ACCEPT_tb_pb 396 /* 0x18c */
768#define ACCEPT_tb_p8 397 /* 0x18d */
769#define ACCEPT_t8_pb 398 /* 0x18e */
770#define ACCEPT_t8_p8 399 /* 0x18f */
771
772#define VERB 100 /* 0x64 Used only for the type
773 field of verbs */
774#define VERB_tb_pb 400 /* 0x190 */
775#define VERB_tb_p8 401 /* 0x191 */
776#define VERB_t8_pb 402 /* 0x192 */
777#define VERB_t8_p8 403 /* 0x193 */
778
779#define PRUNE 101 /* 0x65 Pattern fails at this
780 startpoint if no-backtracking
781 through this */
782#define PRUNE_tb_pb 404 /* 0x194 */
783#define PRUNE_tb_p8 405 /* 0x195 */
784#define PRUNE_t8_pb 406 /* 0x196 */
785#define PRUNE_t8_p8 407 /* 0x197 */
786
787#define MARKPOINT 102 /* 0x66 Push the current location
788 for rollback by cut. */
789#define MARKPOINT_tb_pb 408 /* 0x198 */
790#define MARKPOINT_tb_p8 409 /* 0x199 */
791#define MARKPOINT_t8_pb 410 /* 0x19a */
792#define MARKPOINT_t8_p8 411 /* 0x19b */
793
794#define SKIP 103 /* 0x67 On failure skip forward (to
795 the mark) before retrying */
796#define SKIP_tb_pb 412 /* 0x19c */
797#define SKIP_tb_p8 413 /* 0x19d */
798#define SKIP_t8_pb 414 /* 0x19e */
799#define SKIP_t8_p8 415 /* 0x19f */
800
801#define COMMIT 104 /* 0x68 Pattern fails outright if
802 backtracking through this */
803#define COMMIT_tb_pb 416 /* 0x1a0 */
804#define COMMIT_tb_p8 417 /* 0x1a1 */
805#define COMMIT_t8_pb 418 /* 0x1a2 */
806#define COMMIT_t8_p8 419 /* 0x1a3 */
807
808#define CUTGROUP 105 /* 0x69 On failure go to the next
809 alternation in the group */
810#define CUTGROUP_tb_pb 420 /* 0x1a4 */
811#define CUTGROUP_tb_p8 421 /* 0x1a5 */
812#define CUTGROUP_t8_pb 422 /* 0x1a6 */
813#define CUTGROUP_t8_p8 423 /* 0x1a7 */
814
815#define KEEPS 106 /* 0x6a $& begins here. */
816#define KEEPS_tb_pb 424 /* 0x1a8 */
817#define KEEPS_tb_p8 425 /* 0x1a9 */
818#define KEEPS_t8_pb 426 /* 0x1aa */
819#define KEEPS_t8_p8 427 /* 0x1ab */
820
821#define OPTIMIZED 107 /* 0x6b Placeholder for dump. */
822#define OPTIMIZED_tb_pb 428 /* 0x1ac */
823#define OPTIMIZED_tb_p8 429 /* 0x1ad */
824#define OPTIMIZED_t8_pb 430 /* 0x1ae */
825#define OPTIMIZED_t8_p8 431 /* 0x1af */
826
827#define PSEUDO 108 /* 0x6c Pseudo opcode for internal
828 use. */
829#define PSEUDO_tb_pb 432 /* 0x1b0 */
830#define PSEUDO_tb_p8 433 /* 0x1b1 */
831#define PSEUDO_t8_pb 434 /* 0x1b2 */
832#define PSEUDO_t8_p8 435 /* 0x1b3 */
833
834#define REGEX_SET 109 /* 0x6d Regex set, temporary node
835 used in pre-optimization
836 compilation */
837#define REGEX_SET_tb_pb 436 /* 0x1b4 */
838#define REGEX_SET_tb_p8 437 /* 0x1b5 */
839#define REGEX_SET_t8_pb 438 /* 0x1b6 */
840#define REGEX_SET_t8_p8 439 /* 0x1b7 */
841
03363afd 842 /* ------------ States ------------- */
ce553cf5
KW
843#define TRIE_next 110 /* 0x6e state for TRIE */
844#define TRIE_next_tb_pb 440 /* 0x1b8 */
845#define TRIE_next_tb_p8 441 /* 0x1b9 */
846#define TRIE_next_t8_pb 442 /* 0x1ba */
847#define TRIE_next_t8_p8 443 /* 0x1bb */
848
849#define TRIE_next_fail 111 /* 0x6f state for TRIE */
850#define TRIE_next_fail_tb_pb 444 /* 0x1bc */
851#define TRIE_next_fail_tb_p8 445 /* 0x1bd */
852#define TRIE_next_fail_t8_pb 446 /* 0x1be */
853#define TRIE_next_fail_t8_p8 447 /* 0x1bf */
854
855#define EVAL_B 112 /* 0x70 state for EVAL */
856#define EVAL_B_tb_pb 448 /* 0x1c0 */
857#define EVAL_B_tb_p8 449 /* 0x1c1 */
858#define EVAL_B_t8_pb 450 /* 0x1c2 */
859#define EVAL_B_t8_p8 451 /* 0x1c3 */
860
861#define EVAL_B_fail 113 /* 0x71 state for EVAL */
862#define EVAL_B_fail_tb_pb 452 /* 0x1c4 */
863#define EVAL_B_fail_tb_p8 453 /* 0x1c5 */
864#define EVAL_B_fail_t8_pb 454 /* 0x1c6 */
865#define EVAL_B_fail_t8_p8 455 /* 0x1c7 */
866
867#define EVAL_postponed_AB 114 /* 0x72 state for EVAL */
868#define EVAL_postponed_AB_tb_pb 456 /* 0x1c8 */
869#define EVAL_postponed_AB_tb_p8 457 /* 0x1c9 */
870#define EVAL_postponed_AB_t8_pb 458 /* 0x1ca */
871#define EVAL_postponed_AB_t8_p8 459 /* 0x1cb */
872
873#define EVAL_postponed_AB_fail 115 /* 0x73 state for EVAL */
874#define EVAL_postponed_AB_fail_tb_pb 460 /* 0x1cc */
875#define EVAL_postponed_AB_fail_tb_p8 461 /* 0x1cd */
876#define EVAL_postponed_AB_fail_t8_pb 462 /* 0x1ce */
877#define EVAL_postponed_AB_fail_t8_p8 463 /* 0x1cf */
878
879#define CURLYX_end 116 /* 0x74 state for CURLYX */
880#define CURLYX_end_tb_pb 464 /* 0x1d0 */
881#define CURLYX_end_tb_p8 465 /* 0x1d1 */
882#define CURLYX_end_t8_pb 466 /* 0x1d2 */
883#define CURLYX_end_t8_p8 467 /* 0x1d3 */
884
885#define CURLYX_end_fail 117 /* 0x75 state for CURLYX */
886#define CURLYX_end_fail_tb_pb 468 /* 0x1d4 */
887#define CURLYX_end_fail_tb_p8 469 /* 0x1d5 */
888#define CURLYX_end_fail_t8_pb 470 /* 0x1d6 */
889#define CURLYX_end_fail_t8_p8 471 /* 0x1d7 */
890
891#define WHILEM_A_pre 118 /* 0x76 state for WHILEM */
892#define WHILEM_A_pre_tb_pb 472 /* 0x1d8 */
893#define WHILEM_A_pre_tb_p8 473 /* 0x1d9 */
894#define WHILEM_A_pre_t8_pb 474 /* 0x1da */
895#define WHILEM_A_pre_t8_p8 475 /* 0x1db */
896
897#define WHILEM_A_pre_fail 119 /* 0x77 state for WHILEM */
898#define WHILEM_A_pre_fail_tb_pb 476 /* 0x1dc */
899#define WHILEM_A_pre_fail_tb_p8 477 /* 0x1dd */
900#define WHILEM_A_pre_fail_t8_pb 478 /* 0x1de */
901#define WHILEM_A_pre_fail_t8_p8 479 /* 0x1df */
902
903#define WHILEM_A_min 120 /* 0x78 state for WHILEM */
904#define WHILEM_A_min_tb_pb 480 /* 0x1e0 */
905#define WHILEM_A_min_tb_p8 481 /* 0x1e1 */
906#define WHILEM_A_min_t8_pb 482 /* 0x1e2 */
907#define WHILEM_A_min_t8_p8 483 /* 0x1e3 */
908
909#define WHILEM_A_min_fail 121 /* 0x79 state for WHILEM */
910#define WHILEM_A_min_fail_tb_pb 484 /* 0x1e4 */
911#define WHILEM_A_min_fail_tb_p8 485 /* 0x1e5 */
912#define WHILEM_A_min_fail_t8_pb 486 /* 0x1e6 */
913#define WHILEM_A_min_fail_t8_p8 487 /* 0x1e7 */
914
915#define WHILEM_A_max 122 /* 0x7a state for WHILEM */
916#define WHILEM_A_max_tb_pb 488 /* 0x1e8 */
917#define WHILEM_A_max_tb_p8 489 /* 0x1e9 */
918#define WHILEM_A_max_t8_pb 490 /* 0x1ea */
919#define WHILEM_A_max_t8_p8 491 /* 0x1eb */
920
921#define WHILEM_A_max_fail 123 /* 0x7b state for WHILEM */
922#define WHILEM_A_max_fail_tb_pb 492 /* 0x1ec */
923#define WHILEM_A_max_fail_tb_p8 493 /* 0x1ed */
924#define WHILEM_A_max_fail_t8_pb 494 /* 0x1ee */
925#define WHILEM_A_max_fail_t8_p8 495 /* 0x1ef */
926
927#define WHILEM_B_min 124 /* 0x7c state for WHILEM */
928#define WHILEM_B_min_tb_pb 496 /* 0x1f0 */
929#define WHILEM_B_min_tb_p8 497 /* 0x1f1 */
930#define WHILEM_B_min_t8_pb 498 /* 0x1f2 */
931#define WHILEM_B_min_t8_p8 499 /* 0x1f3 */
932
933#define WHILEM_B_min_fail 125 /* 0x7d state for WHILEM */
934#define WHILEM_B_min_fail_tb_pb 500 /* 0x1f4 */
935#define WHILEM_B_min_fail_tb_p8 501 /* 0x1f5 */
936#define WHILEM_B_min_fail_t8_pb 502 /* 0x1f6 */
937#define WHILEM_B_min_fail_t8_p8 503 /* 0x1f7 */
938
939#define WHILEM_B_max 126 /* 0x7e state for WHILEM */
940#define WHILEM_B_max_tb_pb 504 /* 0x1f8 */
941#define WHILEM_B_max_tb_p8 505 /* 0x1f9 */
942#define WHILEM_B_max_t8_pb 506 /* 0x1fa */
943#define WHILEM_B_max_t8_p8 507 /* 0x1fb */
944
945#define WHILEM_B_max_fail 127 /* 0x7f state for WHILEM */
946#define WHILEM_B_max_fail_tb_pb 508 /* 0x1fc */
947#define WHILEM_B_max_fail_tb_p8 509 /* 0x1fd */
948#define WHILEM_B_max_fail_t8_pb 510 /* 0x1fe */
949#define WHILEM_B_max_fail_t8_p8 511 /* 0x1ff */
950
951#define BRANCH_next 128 /* 0x80 state for BRANCH */
952#define BRANCH_next_tb_pb 512 /* 0x200 */
953#define BRANCH_next_tb_p8 513 /* 0x201 */
954#define BRANCH_next_t8_pb 514 /* 0x202 */
955#define BRANCH_next_t8_p8 515 /* 0x203 */
956
957#define BRANCH_next_fail 129 /* 0x81 state for BRANCH */
958#define BRANCH_next_fail_tb_pb 516 /* 0x204 */
959#define BRANCH_next_fail_tb_p8 517 /* 0x205 */
960#define BRANCH_next_fail_t8_pb 518 /* 0x206 */
961#define BRANCH_next_fail_t8_p8 519 /* 0x207 */
962
963#define CURLYM_A 130 /* 0x82 state for CURLYM */
964#define CURLYM_A_tb_pb 520 /* 0x208 */
965#define CURLYM_A_tb_p8 521 /* 0x209 */
966#define CURLYM_A_t8_pb 522 /* 0x20a */
967#define CURLYM_A_t8_p8 523 /* 0x20b */
968
969#define CURLYM_A_fail 131 /* 0x83 state for CURLYM */
970#define CURLYM_A_fail_tb_pb 524 /* 0x20c */
971#define CURLYM_A_fail_tb_p8 525 /* 0x20d */
972#define CURLYM_A_fail_t8_pb 526 /* 0x20e */
973#define CURLYM_A_fail_t8_p8 527 /* 0x20f */
974
975#define CURLYM_B 132 /* 0x84 state for CURLYM */
976#define CURLYM_B_tb_pb 528 /* 0x210 */
977#define CURLYM_B_tb_p8 529 /* 0x211 */
978#define CURLYM_B_t8_pb 530 /* 0x212 */
979#define CURLYM_B_t8_p8 531 /* 0x213 */
980
981#define CURLYM_B_fail 133 /* 0x85 state for CURLYM */
982#define CURLYM_B_fail_tb_pb 532 /* 0x214 */
983#define CURLYM_B_fail_tb_p8 533 /* 0x215 */
984#define CURLYM_B_fail_t8_pb 534 /* 0x216 */
985#define CURLYM_B_fail_t8_p8 535 /* 0x217 */
986
987#define IFMATCH_A 134 /* 0x86 state for IFMATCH */
988#define IFMATCH_A_tb_pb 536 /* 0x218 */
989#define IFMATCH_A_tb_p8 537 /* 0x219 */
990#define IFMATCH_A_t8_pb 538 /* 0x21a */
991#define IFMATCH_A_t8_p8 539 /* 0x21b */
992
993#define IFMATCH_A_fail 135 /* 0x87 state for IFMATCH */
994#define IFMATCH_A_fail_tb_pb 540 /* 0x21c */
995#define IFMATCH_A_fail_tb_p8 541 /* 0x21d */
996#define IFMATCH_A_fail_t8_pb 542 /* 0x21e */
997#define IFMATCH_A_fail_t8_p8 543 /* 0x21f */
998
999#define CURLY_B_min 136 /* 0x88 state for CURLY */
1000#define CURLY_B_min_tb_pb 544 /* 0x220 */
1001#define CURLY_B_min_tb_p8 545 /* 0x221 */
1002#define CURLY_B_min_t8_pb 546 /* 0x222 */
1003#define CURLY_B_min_t8_p8 547 /* 0x223 */
1004
1005#define CURLY_B_min_fail 137 /* 0x89 state for CURLY */
1006#define CURLY_B_min_fail_tb_pb 548 /* 0x224 */
1007#define CURLY_B_min_fail_tb_p8 549 /* 0x225 */
1008#define CURLY_B_min_fail_t8_pb 550 /* 0x226 */
1009#define CURLY_B_min_fail_t8_p8 551 /* 0x227 */
1010
1011#define CURLY_B_max 138 /* 0x8a state for CURLY */
1012#define CURLY_B_max_tb_pb 552 /* 0x228 */
1013#define CURLY_B_max_tb_p8 553 /* 0x229 */
1014#define CURLY_B_max_t8_pb 554 /* 0x22a */
1015#define CURLY_B_max_t8_p8 555 /* 0x22b */
1016
1017#define CURLY_B_max_fail 139 /* 0x8b state for CURLY */
1018#define CURLY_B_max_fail_tb_pb 556 /* 0x22c */
1019#define CURLY_B_max_fail_tb_p8 557 /* 0x22d */
1020#define CURLY_B_max_fail_t8_pb 558 /* 0x22e */
1021#define CURLY_B_max_fail_t8_p8 559 /* 0x22f */
1022
1023#define COMMIT_next 140 /* 0x8c state for COMMIT */
1024#define COMMIT_next_tb_pb 560 /* 0x230 */
1025#define COMMIT_next_tb_p8 561 /* 0x231 */
1026#define COMMIT_next_t8_pb 562 /* 0x232 */
1027#define COMMIT_next_t8_p8 563 /* 0x233 */
1028
1029#define COMMIT_next_fail 141 /* 0x8d state for COMMIT */
1030#define COMMIT_next_fail_tb_pb 564 /* 0x234 */
1031#define COMMIT_next_fail_tb_p8 565 /* 0x235 */
1032#define COMMIT_next_fail_t8_pb 566 /* 0x236 */
1033#define COMMIT_next_fail_t8_p8 567 /* 0x237 */
1034
1035#define MARKPOINT_next 142 /* 0x8e state for MARKPOINT */
1036#define MARKPOINT_next_tb_pb 568 /* 0x238 */
1037#define MARKPOINT_next_tb_p8 569 /* 0x239 */
1038#define MARKPOINT_next_t8_pb 570 /* 0x23a */
1039#define MARKPOINT_next_t8_p8 571 /* 0x23b */
1040
1041#define MARKPOINT_next_fail 143 /* 0x8f state for MARKPOINT */
1042#define MARKPOINT_next_fail_tb_pb 572 /* 0x23c */
1043#define MARKPOINT_next_fail_tb_p8 573 /* 0x23d */
1044#define MARKPOINT_next_fail_t8_pb 574 /* 0x23e */
1045#define MARKPOINT_next_fail_t8_p8 575 /* 0x23f */
1046
1047#define SKIP_next 144 /* 0x90 state for SKIP */
1048#define SKIP_next_tb_pb 576 /* 0x240 */
1049#define SKIP_next_tb_p8 577 /* 0x241 */
1050#define SKIP_next_t8_pb 578 /* 0x242 */
1051#define SKIP_next_t8_p8 579 /* 0x243 */
1052
1053#define SKIP_next_fail 145 /* 0x91 state for SKIP */
1054#define SKIP_next_fail_tb_pb 580 /* 0x244 */
1055#define SKIP_next_fail_tb_p8 581 /* 0x245 */
1056#define SKIP_next_fail_t8_pb 582 /* 0x246 */
1057#define SKIP_next_fail_t8_p8 583 /* 0x247 */
1058
1059#define CUTGROUP_next 146 /* 0x92 state for CUTGROUP */
1060#define CUTGROUP_next_tb_pb 584 /* 0x248 */
1061#define CUTGROUP_next_tb_p8 585 /* 0x249 */
1062#define CUTGROUP_next_t8_pb 586 /* 0x24a */
1063#define CUTGROUP_next_t8_p8 587 /* 0x24b */
1064
1065#define CUTGROUP_next_fail 147 /* 0x93 state for CUTGROUP */
1066#define CUTGROUP_next_fail_tb_pb 588 /* 0x24c */
1067#define CUTGROUP_next_fail_tb_p8 589 /* 0x24d */
1068#define CUTGROUP_next_fail_t8_pb 590 /* 0x24e */
1069#define CUTGROUP_next_fail_t8_p8 591 /* 0x24f */
1070
1071#define KEEPS_next 148 /* 0x94 state for KEEPS */
1072#define KEEPS_next_tb_pb 592 /* 0x250 */
1073#define KEEPS_next_tb_p8 593 /* 0x251 */
1074#define KEEPS_next_t8_pb 594 /* 0x252 */
1075#define KEEPS_next_t8_p8 595 /* 0x253 */
1076
1077#define KEEPS_next_fail 149 /* 0x95 state for KEEPS */
1078#define KEEPS_next_fail_tb_pb 596 /* 0x254 */
1079#define KEEPS_next_fail_tb_p8 597 /* 0x255 */
1080#define KEEPS_next_fail_t8_pb 598 /* 0x256 */
1081#define KEEPS_next_fail_t8_p8 599 /* 0x257 */
1082
03363afd 1083
6bda09f9 1084/* PL_regkind[] What type of regop or state is this. */
d09b2d29
IZ
1085
1086#ifndef DOINIT
22c35a8c 1087EXTCONST U8 PL_regkind[];
d09b2d29 1088#else
22c35a8c 1089EXTCONST U8 PL_regkind[] = {
e2e6a0f1
YO
1090 END, /* END */
1091 END, /* SUCCEED */
e2e6a0f1 1092 BOL, /* SBOL */
d3d47aac 1093 BOL, /* MBOL */
e2e6a0f1 1094 EOL, /* SEOL */
d3d47aac
YO
1095 EOL, /* MEOL */
1096 EOL, /* EOS */
1097 GPOS, /* GPOS */
e2e6a0f1
YO
1098 BOUND, /* BOUND */
1099 BOUND, /* BOUNDL */
1e355c70 1100 BOUND, /* BOUNDU */
0c6e81eb 1101 BOUND, /* BOUNDA */
e2e6a0f1
YO
1102 NBOUND, /* NBOUND */
1103 NBOUND, /* NBOUNDL */
1e355c70 1104 NBOUND, /* NBOUNDU */
0c6e81eb 1105 NBOUND, /* NBOUNDA */
e2e6a0f1
YO
1106 REG_ANY, /* REG_ANY */
1107 REG_ANY, /* SANY */
e2e6a0f1 1108 ANYOF, /* ANYOF */
ac44c12e 1109 ANYOF, /* ANYOFD */
a4525e78 1110 ANYOF, /* ANYOFL */
3edce4f5 1111 ANYOF, /* ANYOFPOSIXL */
c316b824 1112 ANYOF, /* ANYOFH */
6966a05b 1113 ANYOF, /* ANYOFHb */
3146c00a 1114 ANYOF, /* ANYOFHr */
34924db0 1115 ANYOF, /* ANYOFHs */
13fcf652 1116 ANYOFR, /* ANYOFR */
2d5613be 1117 ANYOFR, /* ANYOFRb */
67a1b5f9 1118 ANYOFM, /* ANYOFM */
3db0bccc 1119 ANYOFM, /* NANYOFM */
3615ea58
KW
1120 POSIXD, /* POSIXD */
1121 POSIXD, /* POSIXL */
1122 POSIXD, /* POSIXU */
1123 POSIXD, /* POSIXA */
9e84774b
KW
1124 NPOSIXD, /* NPOSIXD */
1125 NPOSIXD, /* NPOSIXL */
1126 NPOSIXD, /* NPOSIXU */
1127 NPOSIXD, /* NPOSIXA */
e2e6a0f1
YO
1128 CLUMP, /* CLUMP */
1129 BRANCH, /* BRANCH */
e2e6a0f1 1130 EXACT, /* EXACT */
ae06e581 1131 EXACT, /* LEXACT */
a4525e78 1132 EXACT, /* EXACTL */
e2e6a0f1
YO
1133 EXACT, /* EXACTF */
1134 EXACT, /* EXACTFL */
01f98ec2 1135 EXACT, /* EXACTFU */
89829bb5 1136 EXACT, /* EXACTFAA */
f97d9711 1137 EXACT, /* EXACTFAA_NO_TRIE */
627a7895 1138 EXACT, /* EXACTFUP */
a4525e78 1139 EXACT, /* EXACTFLU8 */
3f2416ae
KW
1140 EXACT, /* EXACT_REQ8 */
1141 EXACT, /* LEXACT_REQ8 */
1142 EXACT, /* EXACTFU_REQ8 */
95fb0a6e 1143 EXACT, /* EXACTFU_S_EDGE */
7af55186
KW
1144 LNBREAK, /* LNBREAK */
1145 TRIE, /* TRIE */
1146 TRIE, /* TRIEC */
1147 TRIE, /* AHOCORASICK */
1148 TRIE, /* AHOCORASICKC */
e2e6a0f1
YO
1149 NOTHING, /* NOTHING */
1150 NOTHING, /* TAIL */
1151 STAR, /* STAR */
1152 PLUS, /* PLUS */
1153 CURLY, /* CURLY */
1154 CURLY, /* CURLYN */
1155 CURLY, /* CURLYM */
1156 CURLY, /* CURLYX */
1157 WHILEM, /* WHILEM */
1158 OPEN, /* OPEN */
1159 CLOSE, /* CLOSE */
07093db4
KW
1160 SROPEN, /* SROPEN */
1161 SRCLOSE, /* SRCLOSE */
e2e6a0f1
YO
1162 REF, /* REF */
1163 REF, /* REFF */
1164 REF, /* REFFL */
01f98ec2 1165 REF, /* REFFU */
781aab5c 1166 REF, /* REFFA */
016b7209
KW
1167 REF, /* REFN */
1168 REF, /* REFFN */
1169 REF, /* REFFLN */
1170 REF, /* REFFUN */
1171 REF, /* REFFAN */
d3d47aac
YO
1172 LONGJMP, /* LONGJMP */
1173 BRANCHJ, /* BRANCHJ */
e2e6a0f1
YO
1174 BRANCHJ, /* IFMATCH */
1175 BRANCHJ, /* UNLESSM */
1176 BRANCHJ, /* SUSPEND */
1177 BRANCHJ, /* IFTHEN */
1178 GROUPP, /* GROUPP */
e2e6a0f1
YO
1179 EVAL, /* EVAL */
1180 MINMOD, /* MINMOD */
1181 LOGICAL, /* LOGICAL */
1182 BRANCHJ, /* RENUM */
e2e6a0f1 1183 GOSUB, /* GOSUB */
016b7209 1184 GROUPPN, /* GROUPPN */
e2e6a0f1
YO
1185 INSUBP, /* INSUBP */
1186 DEFINEP, /* DEFINEP */
1187 ENDLIKE, /* ENDLIKE */
1188 ENDLIKE, /* OPFAIL */
1189 ENDLIKE, /* ACCEPT */
1190 VERB, /* VERB */
5d458dd8 1191 VERB, /* PRUNE */
e2e6a0f1 1192 VERB, /* MARKPOINT */
5d458dd8 1193 VERB, /* SKIP */
e2e6a0f1 1194 VERB, /* COMMIT */
5d458dd8 1195 VERB, /* CUTGROUP */
ee9b8eae 1196 KEEPS, /* KEEPS */
e2e6a0f1
YO
1197 NOTHING, /* OPTIMIZED */
1198 PSEUDO, /* PSEUDO */
86451f01 1199 REGEX_SET, /* REGEX_SET */
03363afd 1200 /* ------------ States ------------- */
e2e6a0f1
YO
1201 TRIE, /* TRIE_next */
1202 TRIE, /* TRIE_next_fail */
4ee16520
DM
1203 EVAL, /* EVAL_B */
1204 EVAL, /* EVAL_B_fail */
1205 EVAL, /* EVAL_postponed_AB */
1206 EVAL, /* EVAL_postponed_AB_fail */
e2e6a0f1
YO
1207 CURLYX, /* CURLYX_end */
1208 CURLYX, /* CURLYX_end_fail */
1209 WHILEM, /* WHILEM_A_pre */
1210 WHILEM, /* WHILEM_A_pre_fail */
1211 WHILEM, /* WHILEM_A_min */
1212 WHILEM, /* WHILEM_A_min_fail */
1213 WHILEM, /* WHILEM_A_max */
1214 WHILEM, /* WHILEM_A_max_fail */
1215 WHILEM, /* WHILEM_B_min */
1216 WHILEM, /* WHILEM_B_min_fail */
1217 WHILEM, /* WHILEM_B_max */
1218 WHILEM, /* WHILEM_B_max_fail */
1219 BRANCH, /* BRANCH_next */
1220 BRANCH, /* BRANCH_next_fail */
1221 CURLYM, /* CURLYM_A */
1222 CURLYM, /* CURLYM_A_fail */
1223 CURLYM, /* CURLYM_B */
1224 CURLYM, /* CURLYM_B_fail */
1225 IFMATCH, /* IFMATCH_A */
1226 IFMATCH, /* IFMATCH_A_fail */
e2e6a0f1
YO
1227 CURLY, /* CURLY_B_min */
1228 CURLY, /* CURLY_B_min_fail */
1229 CURLY, /* CURLY_B_max */
1230 CURLY, /* CURLY_B_max_fail */
1231 COMMIT, /* COMMIT_next */
1232 COMMIT, /* COMMIT_next_fail */
1233 MARKPOINT, /* MARKPOINT_next */
1234 MARKPOINT, /* MARKPOINT_next_fail */
5d458dd8
YO
1235 SKIP, /* SKIP_next */
1236 SKIP, /* SKIP_next_fail */
1237 CUTGROUP, /* CUTGROUP_next */
1238 CUTGROUP, /* CUTGROUP_next_fail */
ee9b8eae
YO
1239 KEEPS, /* KEEPS_next */
1240 KEEPS, /* KEEPS_next_fail */
d09b2d29
IZ
1241};
1242#endif
1243
f83e001e
YO
1244#ifdef REG_COMP_C
1245
6bda09f9 1246/* regarglen[] - How large is the argument part of the node (in regnodes) */
d09b2d29 1247
29de9391 1248static const U8 regarglen[] = {
03363afd
YO
1249 0, /* END */
1250 0, /* SUCCEED */
03363afd 1251 0, /* SBOL */
d3d47aac 1252 0, /* MBOL */
03363afd 1253 0, /* SEOL */
d3d47aac
YO
1254 0, /* MEOL */
1255 0, /* EOS */
1256 0, /* GPOS */
03363afd
YO
1257 0, /* BOUND */
1258 0, /* BOUNDL */
1e355c70 1259 0, /* BOUNDU */
0c6e81eb 1260 0, /* BOUNDA */
03363afd
YO
1261 0, /* NBOUND */
1262 0, /* NBOUNDL */
1e355c70 1263 0, /* NBOUNDU */
0c6e81eb 1264 0, /* NBOUNDA */
03363afd
YO
1265 0, /* REG_ANY */
1266 0, /* SANY */
46fc0c43
KW
1267 EXTRA_SIZE(struct regnode_charclass), /* ANYOF */
1268 EXTRA_SIZE(struct regnode_charclass), /* ANYOFD */
1269 EXTRA_SIZE(struct regnode_charclass), /* ANYOFL */
1270 EXTRA_SIZE(struct regnode_charclass_posixl), /* ANYOFPOSIXL */
c316b824 1271 EXTRA_SIZE(struct regnode_1), /* ANYOFH */
6966a05b 1272 EXTRA_SIZE(struct regnode_1), /* ANYOFHb */
3146c00a 1273 EXTRA_SIZE(struct regnode_1), /* ANYOFHr */
53d42e43 1274 EXTRA_SIZE(struct regnode_1), /* ANYOFHs */
13fcf652 1275 EXTRA_SIZE(struct regnode_1), /* ANYOFR */
2d5613be 1276 EXTRA_SIZE(struct regnode_1), /* ANYOFRb */
67a1b5f9 1277 EXTRA_SIZE(struct regnode_1), /* ANYOFM */
3db0bccc 1278 EXTRA_SIZE(struct regnode_1), /* NANYOFM */
3615ea58
KW
1279 0, /* POSIXD */
1280 0, /* POSIXL */
1281 0, /* POSIXU */
1282 0, /* POSIXA */
1283 0, /* NPOSIXD */
1284 0, /* NPOSIXL */
1285 0, /* NPOSIXU */
1286 0, /* NPOSIXA */
03363afd
YO
1287 0, /* CLUMP */
1288 0, /* BRANCH */
03363afd 1289 0, /* EXACT */
ae06e581 1290 EXTRA_SIZE(struct regnode_1), /* LEXACT */
a4525e78 1291 0, /* EXACTL */
03363afd
YO
1292 0, /* EXACTF */
1293 0, /* EXACTFL */
01f98ec2 1294 0, /* EXACTFU */
89829bb5 1295 0, /* EXACTFAA */
f97d9711 1296 0, /* EXACTFAA_NO_TRIE */
627a7895 1297 0, /* EXACTFUP */
a4525e78 1298 0, /* EXACTFLU8 */
3f2416ae
KW
1299 0, /* EXACT_REQ8 */
1300 EXTRA_SIZE(struct regnode_1), /* LEXACT_REQ8 */
1301 0, /* EXACTFU_REQ8 */
95fb0a6e 1302 0, /* EXACTFU_S_EDGE */
7af55186
KW
1303 0, /* LNBREAK */
1304 EXTRA_SIZE(struct regnode_1), /* TRIE */
1305 EXTRA_SIZE(struct regnode_charclass), /* TRIEC */
1306 EXTRA_SIZE(struct regnode_1), /* AHOCORASICK */
1307 EXTRA_SIZE(struct regnode_charclass), /* AHOCORASICKC */
03363afd
YO
1308 0, /* NOTHING */
1309 0, /* TAIL */
1310 0, /* STAR */
1311 0, /* PLUS */
1312 EXTRA_SIZE(struct regnode_2), /* CURLY */
1313 EXTRA_SIZE(struct regnode_2), /* CURLYN */
1314 EXTRA_SIZE(struct regnode_2), /* CURLYM */
1315 EXTRA_SIZE(struct regnode_2), /* CURLYX */
1316 0, /* WHILEM */
1317 EXTRA_SIZE(struct regnode_1), /* OPEN */
1318 EXTRA_SIZE(struct regnode_1), /* CLOSE */
07093db4
KW
1319 0, /* SROPEN */
1320 0, /* SRCLOSE */
03363afd
YO
1321 EXTRA_SIZE(struct regnode_1), /* REF */
1322 EXTRA_SIZE(struct regnode_1), /* REFF */
1323 EXTRA_SIZE(struct regnode_1), /* REFFL */
01f98ec2 1324 EXTRA_SIZE(struct regnode_1), /* REFFU */
781aab5c 1325 EXTRA_SIZE(struct regnode_1), /* REFFA */
016b7209
KW
1326 EXTRA_SIZE(struct regnode_1), /* REFN */
1327 EXTRA_SIZE(struct regnode_1), /* REFFN */
1328 EXTRA_SIZE(struct regnode_1), /* REFFLN */
1329 EXTRA_SIZE(struct regnode_1), /* REFFUN */
1330 EXTRA_SIZE(struct regnode_1), /* REFFAN */
d3d47aac
YO
1331 EXTRA_SIZE(struct regnode_1), /* LONGJMP */
1332 EXTRA_SIZE(struct regnode_1), /* BRANCHJ */
03363afd
YO
1333 EXTRA_SIZE(struct regnode_1), /* IFMATCH */
1334 EXTRA_SIZE(struct regnode_1), /* UNLESSM */
1335 EXTRA_SIZE(struct regnode_1), /* SUSPEND */
1336 EXTRA_SIZE(struct regnode_1), /* IFTHEN */
1337 EXTRA_SIZE(struct regnode_1), /* GROUPP */
13f27704 1338 EXTRA_SIZE(struct regnode_2L), /* EVAL */
03363afd
YO
1339 0, /* MINMOD */
1340 0, /* LOGICAL */
1341 EXTRA_SIZE(struct regnode_1), /* RENUM */
1a147d38 1342 EXTRA_SIZE(struct regnode_2L), /* GOSUB */
016b7209 1343 EXTRA_SIZE(struct regnode_1), /* GROUPPN */
1a147d38 1344 EXTRA_SIZE(struct regnode_1), /* INSUBP */
0a4db386 1345 EXTRA_SIZE(struct regnode_1), /* DEFINEP */
e2e6a0f1 1346 0, /* ENDLIKE */
fee50582
YO
1347 EXTRA_SIZE(struct regnode_1), /* OPFAIL */
1348 EXTRA_SIZE(struct regnode_2L), /* ACCEPT */
20832bc5 1349 EXTRA_SIZE(struct regnode_1), /* VERB */
5d458dd8 1350 EXTRA_SIZE(struct regnode_1), /* PRUNE */
e2e6a0f1 1351 EXTRA_SIZE(struct regnode_1), /* MARKPOINT */
5d458dd8 1352 EXTRA_SIZE(struct regnode_1), /* SKIP */
e2e6a0f1 1353 EXTRA_SIZE(struct regnode_1), /* COMMIT */
5d458dd8 1354 EXTRA_SIZE(struct regnode_1), /* CUTGROUP */
ee9b8eae 1355 0, /* KEEPS */
03363afd
YO
1356 0, /* OPTIMIZED */
1357 0, /* PSEUDO */
86451f01 1358 EXTRA_SIZE(struct regnode_p), /* REGEX_SET */
d09b2d29
IZ
1359};
1360
6bda09f9
YO
1361/* reg_off_by_arg[] - Which argument holds the offset to the next node */
1362
29de9391 1363static const char reg_off_by_arg[] = {
03363afd
YO
1364 0, /* END */
1365 0, /* SUCCEED */
03363afd 1366 0, /* SBOL */
d3d47aac 1367 0, /* MBOL */
03363afd 1368 0, /* SEOL */
d3d47aac
YO
1369 0, /* MEOL */
1370 0, /* EOS */
1371 0, /* GPOS */
03363afd
YO
1372 0, /* BOUND */
1373 0, /* BOUNDL */
1e355c70 1374 0, /* BOUNDU */
0c6e81eb 1375 0, /* BOUNDA */
03363afd
YO
1376 0, /* NBOUND */
1377 0, /* NBOUNDL */
1e355c70 1378 0, /* NBOUNDU */
0c6e81eb 1379 0, /* NBOUNDA */
03363afd
YO
1380 0, /* REG_ANY */
1381 0, /* SANY */
03363afd 1382 0, /* ANYOF */
ac44c12e 1383 0, /* ANYOFD */
a4525e78 1384 0, /* ANYOFL */
3edce4f5 1385 0, /* ANYOFPOSIXL */
c316b824 1386 0, /* ANYOFH */
6966a05b 1387 0, /* ANYOFHb */
3146c00a 1388 0, /* ANYOFHr */
34924db0 1389 0, /* ANYOFHs */
13fcf652 1390 0, /* ANYOFR */
2d5613be 1391 0, /* ANYOFRb */
67a1b5f9 1392 0, /* ANYOFM */
3db0bccc 1393 0, /* NANYOFM */
3615ea58
KW
1394 0, /* POSIXD */
1395 0, /* POSIXL */
1396 0, /* POSIXU */
1397 0, /* POSIXA */
1398 0, /* NPOSIXD */
1399 0, /* NPOSIXL */
1400 0, /* NPOSIXU */
1401 0, /* NPOSIXA */
03363afd
YO
1402 0, /* CLUMP */
1403 0, /* BRANCH */
03363afd 1404 0, /* EXACT */
ae06e581 1405 0, /* LEXACT */
a4525e78 1406 0, /* EXACTL */
03363afd
YO
1407 0, /* EXACTF */
1408 0, /* EXACTFL */
01f98ec2 1409 0, /* EXACTFU */
89829bb5 1410 0, /* EXACTFAA */
f97d9711 1411 0, /* EXACTFAA_NO_TRIE */
627a7895 1412 0, /* EXACTFUP */
a4525e78 1413 0, /* EXACTFLU8 */
3f2416ae
KW
1414 0, /* EXACT_REQ8 */
1415 0, /* LEXACT_REQ8 */
1416 0, /* EXACTFU_REQ8 */
95fb0a6e 1417 0, /* EXACTFU_S_EDGE */
7af55186
KW
1418 0, /* LNBREAK */
1419 0, /* TRIE */
1420 0, /* TRIEC */
1421 0, /* AHOCORASICK */
1422 0, /* AHOCORASICKC */
03363afd
YO
1423 0, /* NOTHING */
1424 0, /* TAIL */
1425 0, /* STAR */
1426 0, /* PLUS */
1427 0, /* CURLY */
1428 0, /* CURLYN */
1429 0, /* CURLYM */
1430 0, /* CURLYX */
1431 0, /* WHILEM */
1432 0, /* OPEN */
1433 0, /* CLOSE */
07093db4
KW
1434 0, /* SROPEN */
1435 0, /* SRCLOSE */
03363afd
YO
1436 0, /* REF */
1437 0, /* REFF */
1438 0, /* REFFL */
01f98ec2 1439 0, /* REFFU */
781aab5c 1440 0, /* REFFA */
016b7209
KW
1441 0, /* REFN */
1442 0, /* REFFN */
1443 0, /* REFFLN */
1444 0, /* REFFUN */
1445 0, /* REFFAN */
d3d47aac
YO
1446 1, /* LONGJMP */
1447 1, /* BRANCHJ */
46167d76
KW
1448 1, /* IFMATCH */
1449 1, /* UNLESSM */
03363afd
YO
1450 1, /* SUSPEND */
1451 1, /* IFTHEN */
1452 0, /* GROUPP */
03363afd
YO
1453 0, /* EVAL */
1454 0, /* MINMOD */
1455 0, /* LOGICAL */
1456 1, /* RENUM */
1a147d38 1457 0, /* GOSUB */
016b7209 1458 0, /* GROUPPN */
1a147d38 1459 0, /* INSUBP */
0a4db386 1460 0, /* DEFINEP */
e2e6a0f1 1461 0, /* ENDLIKE */
7f69552c 1462 0, /* OPFAIL */
e2e6a0f1
YO
1463 0, /* ACCEPT */
1464 0, /* VERB */
5d458dd8 1465 0, /* PRUNE */
e2e6a0f1 1466 0, /* MARKPOINT */
5d458dd8 1467 0, /* SKIP */
e2e6a0f1 1468 0, /* COMMIT */
5d458dd8 1469 0, /* CUTGROUP */
ee9b8eae 1470 0, /* KEEPS */
03363afd
YO
1471 0, /* OPTIMIZED */
1472 0, /* PSEUDO */
86451f01 1473 0, /* REGEX_SET */
d09b2d29 1474};
885f9e59 1475
13d6edb4
NC
1476#endif /* REG_COMP_C */
1477
f83e001e 1478
6bda09f9
YO
1479/* reg_name[] - Opcode/state names in string form, for debugging */
1480
22429478 1481#ifndef DOINIT
13d6edb4 1482EXTCONST char * PL_reg_name[];
22429478 1483#else
4764e399 1484EXTCONST char * const PL_reg_name[] = {
03363afd
YO
1485 "END", /* 0000 */
1486 "SUCCEED", /* 0x01 */
d3d47aac 1487 "SBOL", /* 0x02 */
03363afd 1488 "MBOL", /* 0x03 */
d3d47aac
YO
1489 "SEOL", /* 0x04 */
1490 "MEOL", /* 0x05 */
1491 "EOS", /* 0x06 */
1492 "GPOS", /* 0x07 */
1493 "BOUND", /* 0x08 */
1494 "BOUNDL", /* 0x09 */
1495 "BOUNDU", /* 0x0a */
1496 "BOUNDA", /* 0x0b */
1497 "NBOUND", /* 0x0c */
1498 "NBOUNDL", /* 0x0d */
1499 "NBOUNDU", /* 0x0e */
1500 "NBOUNDA", /* 0x0f */
1501 "REG_ANY", /* 0x10 */
1502 "SANY", /* 0x11 */
33c28ab2 1503 "ANYOF", /* 0x12 */
ac44c12e
KW
1504 "ANYOFD", /* 0x13 */
1505 "ANYOFL", /* 0x14 */
3edce4f5 1506 "ANYOFPOSIXL", /* 0x15 */
c316b824 1507 "ANYOFH", /* 0x16 */
6966a05b 1508 "ANYOFHb", /* 0x17 */
3146c00a 1509 "ANYOFHr", /* 0x18 */
34924db0
KW
1510 "ANYOFHs", /* 0x19 */
1511 "ANYOFR", /* 0x1a */
1512 "ANYOFRb", /* 0x1b */
1513 "ANYOFM", /* 0x1c */
1514 "NANYOFM", /* 0x1d */
1515 "POSIXD", /* 0x1e */
1516 "POSIXL", /* 0x1f */
1517 "POSIXU", /* 0x20 */
1518 "POSIXA", /* 0x21 */
1519 "NPOSIXD", /* 0x22 */
1520 "NPOSIXL", /* 0x23 */
1521 "NPOSIXU", /* 0x24 */
1522 "NPOSIXA", /* 0x25 */
1523 "CLUMP", /* 0x26 */
1524 "BRANCH", /* 0x27 */
1525 "EXACT", /* 0x28 */
1526 "LEXACT", /* 0x29 */
1527 "EXACTL", /* 0x2a */
1528 "EXACTF", /* 0x2b */
1529 "EXACTFL", /* 0x2c */
1530 "EXACTFU", /* 0x2d */
1531 "EXACTFAA", /* 0x2e */
f97d9711
KW
1532 "EXACTFAA_NO_TRIE", /* 0x2f */
1533 "EXACTFUP", /* 0x30 */
1534 "EXACTFLU8", /* 0x31 */
34924db0
KW
1535 "EXACT_REQ8", /* 0x32 */
1536 "LEXACT_REQ8", /* 0x33 */
1537 "EXACTFU_REQ8", /* 0x34 */
1538 "EXACTFU_S_EDGE", /* 0x35 */
7af55186
KW
1539 "LNBREAK", /* 0x36 */
1540 "TRIE", /* 0x37 */
1541 "TRIEC", /* 0x38 */
1542 "AHOCORASICK", /* 0x39 */
1543 "AHOCORASICKC", /* 0x3a */
1544 "NOTHING", /* 0x3b */
1545 "TAIL", /* 0x3c */
1546 "STAR", /* 0x3d */
1547 "PLUS", /* 0x3e */
1548 "CURLY", /* 0x3f */
1549 "CURLYN", /* 0x40 */
1550 "CURLYM", /* 0x41 */
1551 "CURLYX", /* 0x42 */
1552 "WHILEM", /* 0x43 */
1553 "OPEN", /* 0x44 */
1554 "CLOSE", /* 0x45 */
1555 "SROPEN", /* 0x46 */
1556 "SRCLOSE", /* 0x47 */
1557 "REF", /* 0x48 */
1558 "REFF", /* 0x49 */
1559 "REFFL", /* 0x4a */
1560 "REFFU", /* 0x4b */
1561 "REFFA", /* 0x4c */
1562 "REFN", /* 0x4d */
1563 "REFFN", /* 0x4e */
1564 "REFFLN", /* 0x4f */
1565 "REFFUN", /* 0x50 */
1566 "REFFAN", /* 0x51 */
1567 "LONGJMP", /* 0x52 */
1568 "BRANCHJ", /* 0x53 */
1569 "IFMATCH", /* 0x54 */
1570 "UNLESSM", /* 0x55 */
1571 "SUSPEND", /* 0x56 */
1572 "IFTHEN", /* 0x57 */
1573 "GROUPP", /* 0x58 */
1574 "EVAL", /* 0x59 */
1575 "MINMOD", /* 0x5a */
1576 "LOGICAL", /* 0x5b */
1577 "RENUM", /* 0x5c */
1578 "GOSUB", /* 0x5d */
1579 "GROUPPN", /* 0x5e */
1580 "INSUBP", /* 0x5f */
1581 "DEFINEP", /* 0x60 */
1582 "ENDLIKE", /* 0x61 */
1583 "OPFAIL", /* 0x62 */
1584 "ACCEPT", /* 0x63 */
1585 "VERB", /* 0x64 */
1586 "PRUNE", /* 0x65 */
1587 "MARKPOINT", /* 0x66 */
1588 "SKIP", /* 0x67 */
1589 "COMMIT", /* 0x68 */
1590 "CUTGROUP", /* 0x69 */
1591 "KEEPS", /* 0x6a */
34924db0
KW
1592 "OPTIMIZED", /* 0x6b */
1593 "PSEUDO", /* 0x6c */
86451f01 1594 "REGEX_SET", /* 0x6d */
03363afd 1595 /* ------------ States ------------- */
24b23f37
YO
1596 "TRIE_next", /* REGNODE_MAX +0x01 */
1597 "TRIE_next_fail", /* REGNODE_MAX +0x02 */
4ee16520
DM
1598 "EVAL_B", /* REGNODE_MAX +0x03 */
1599 "EVAL_B_fail", /* REGNODE_MAX +0x04 */
1600 "EVAL_postponed_AB", /* REGNODE_MAX +0x05 */
1601 "EVAL_postponed_AB_fail", /* REGNODE_MAX +0x06 */
1602 "CURLYX_end", /* REGNODE_MAX +0x07 */
1603 "CURLYX_end_fail", /* REGNODE_MAX +0x08 */
1604 "WHILEM_A_pre", /* REGNODE_MAX +0x09 */
1605 "WHILEM_A_pre_fail", /* REGNODE_MAX +0x0a */
1606 "WHILEM_A_min", /* REGNODE_MAX +0x0b */
1607 "WHILEM_A_min_fail", /* REGNODE_MAX +0x0c */
1608 "WHILEM_A_max", /* REGNODE_MAX +0x0d */
1609 "WHILEM_A_max_fail", /* REGNODE_MAX +0x0e */
1610 "WHILEM_B_min", /* REGNODE_MAX +0x0f */
1611 "WHILEM_B_min_fail", /* REGNODE_MAX +0x10 */
1612 "WHILEM_B_max", /* REGNODE_MAX +0x11 */
1613 "WHILEM_B_max_fail", /* REGNODE_MAX +0x12 */
1614 "BRANCH_next", /* REGNODE_MAX +0x13 */
1615 "BRANCH_next_fail", /* REGNODE_MAX +0x14 */
1616 "CURLYM_A", /* REGNODE_MAX +0x15 */
1617 "CURLYM_A_fail", /* REGNODE_MAX +0x16 */
1618 "CURLYM_B", /* REGNODE_MAX +0x17 */
1619 "CURLYM_B_fail", /* REGNODE_MAX +0x18 */
1620 "IFMATCH_A", /* REGNODE_MAX +0x19 */
1621 "IFMATCH_A_fail", /* REGNODE_MAX +0x1a */
21cbe009
DM
1622 "CURLY_B_min", /* REGNODE_MAX +0x1b */
1623 "CURLY_B_min_fail", /* REGNODE_MAX +0x1c */
1624 "CURLY_B_max", /* REGNODE_MAX +0x1d */
1625 "CURLY_B_max_fail", /* REGNODE_MAX +0x1e */
1626 "COMMIT_next", /* REGNODE_MAX +0x1f */
1627 "COMMIT_next_fail", /* REGNODE_MAX +0x20 */
1628 "MARKPOINT_next", /* REGNODE_MAX +0x21 */
1629 "MARKPOINT_next_fail", /* REGNODE_MAX +0x22 */
1630 "SKIP_next", /* REGNODE_MAX +0x23 */
1631 "SKIP_next_fail", /* REGNODE_MAX +0x24 */
1632 "CUTGROUP_next", /* REGNODE_MAX +0x25 */
1633 "CUTGROUP_next_fail", /* REGNODE_MAX +0x26 */
1634 "KEEPS_next", /* REGNODE_MAX +0x27 */
1635 "KEEPS_next_fail", /* REGNODE_MAX +0x28 */
885f9e59 1636};
22429478 1637#endif /* DOINIT */
d09b2d29 1638
f7819f85
A
1639/* PL_reg_extflags_name[] - Opcode/state names in string form, for debugging */
1640
1641#ifndef DOINIT
1642EXTCONST char * PL_reg_extflags_name[];
1643#else
1644EXTCONST char * const PL_reg_extflags_name[] = {
d262c0c7 1645 /* Bits in extflags defined: 11111111111111110000111111111111 */
52d81aa8
NC
1646 "MULTILINE", /* 0x00000001 */
1647 "SINGLELINE", /* 0x00000002 */
1648 "FOLD", /* 0x00000004 */
1649 "EXTENDED", /* 0x00000008 */
334afb3e 1650 "EXTENDED_MORE", /* 0x00000010 */
e3b64d84
KW
1651 "NOCAPTURE", /* 0x00000020 */
1652 "KEEPCOPY", /* 0x00000040 */
1653 "CHARSET0", /* 0x00000080 : "CHARSET" - 0x00000380 */
1654 "CHARSET1", /* 0x00000100 : "CHARSET" - 0x00000380 */
1655 "CHARSET2", /* 0x00000200 : "CHARSET" - 0x00000380 */
d262c0c7
KW
1656 "STRICT", /* 0x00000400 */
1657 "SPLIT", /* 0x00000800 */
1d32d911
KW
1658 "UNUSED_BIT_12", /* 0x00001000 */
1659 "UNUSED_BIT_13", /* 0x00002000 */
1660 "UNUSED_BIT_14", /* 0x00004000 */
a3b51d37
KW
1661 "UNUSED_BIT_15", /* 0x00008000 */
1662 "NO_INPLACE_SUBST", /* 0x00010000 */
1663 "EVAL_SEEN", /* 0x00020000 */
ee273784 1664 "UNBOUNDED_QUANTIFIER_SEEN",/* 0x00040000 */
e795e964 1665 "CHECK_ALL", /* 0x00080000 */
52d81aa8
NC
1666 "MATCH_UTF8", /* 0x00100000 */
1667 "USE_INTUIT_NOML", /* 0x00200000 */
1668 "USE_INTUIT_ML", /* 0x00400000 */
1669 "INTUIT_TAIL", /* 0x00800000 */
a3b51d37 1670 "IS_ANCHORED", /* 0x01000000 */
52d81aa8
NC
1671 "COPY_DONE", /* 0x02000000 */
1672 "TAINTED_SEEN", /* 0x04000000 */
1673 "TAINTED", /* 0x08000000 */
1674 "START_ONLY", /* 0x10000000 */
dbc200c5 1675 "SKIPWHITE", /* 0x20000000 */
52d81aa8
NC
1676 "WHITE", /* 0x40000000 */
1677 "NULL", /* 0x80000000 */
f7819f85
A
1678};
1679#endif /* DOINIT */
1680
adc2d0c9
JH
1681#ifdef DEBUGGING
1682# define REG_EXTFLAGS_NAME_SIZE 32
1683#endif
1684
337ff307
YO
1685/* PL_reg_intflags_name[] - Opcode/state names in string form, for debugging */
1686
1687#ifndef DOINIT
1688EXTCONST char * PL_reg_intflags_name[];
1689#else
1690EXTCONST char * const PL_reg_intflags_name[] = {
b8f6efdd
YO
1691 "SKIP", /* 0x00000001 - PREGf_SKIP */
1692 "IMPLICIT", /* 0x00000002 - PREGf_IMPLICIT - Converted .* to ^.* */
1693 "NAUGHTY", /* 0x00000004 - PREGf_NAUGHTY - how exponential is this pattern? */
1694 "VERBARG_SEEN", /* 0x00000008 - PREGf_VERBARG_SEEN */
1695 "CUTGROUP_SEEN", /* 0x00000010 - PREGf_CUTGROUP_SEEN */
1696 "USE_RE_EVAL", /* 0x00000020 - PREGf_USE_RE_EVAL - compiled with "use re 'eval'" */
58430ea8 1697 "NOSCAN", /* 0x00000040 - PREGf_NOSCAN */
58430ea8
YO
1698 "GPOS_SEEN", /* 0x00000100 - PREGf_GPOS_SEEN */
1699 "GPOS_FLOAT", /* 0x00000200 - PREGf_GPOS_FLOAT */
d3d47aac
YO
1700 "ANCH_MBOL", /* 0x00000400 - PREGf_ANCH_MBOL */
1701 "ANCH_SBOL", /* 0x00000800 - PREGf_ANCH_SBOL */
1702 "ANCH_GPOS", /* 0x00001000 - PREGf_ANCH_GPOS */
d5a00e4a 1703 "RECURSE_SEEN", /* 0x00002000 - PREGf_RECURSE_SEEN */
337ff307
YO
1704};
1705#endif /* DOINIT */
1706
adc2d0c9 1707#ifdef DEBUGGING
d5a00e4a 1708# define REG_INTFLAGS_NAME_SIZE 13
adc2d0c9
JH
1709#endif
1710
f9ef50a7 1711/* The following have no fixed length. U8 so we can do strchr() on it. */
ded4dd2a 1712#define REGNODE_VARIES(node) (PL_varies_bitmask[(node) >> 3] & (1 << ((node) & 7)))
e52fc539 1713
f9ef50a7 1714#ifndef DOINIT
ded4dd2a 1715EXTCONST U8 PL_varies[] __attribute__deprecated__;
f9ef50a7 1716#else
ded4dd2a 1717EXTCONST U8 PL_varies[] __attribute__deprecated__ = {
62e6ef33 1718 CLUMP, BRANCH, STAR, PLUS, CURLY, CURLYN, CURLYM, CURLYX, WHILEM, REF,
016b7209 1719 REFF, REFFL, REFFU, REFFA, REFN, REFFN, REFFLN, REFFUN, REFFAN,
d3d47aac 1720 BRANCHJ, SUSPEND, IFTHEN,
f9ef50a7
NC
1721 0
1722};
1723#endif /* DOINIT */
1724
ded4dd2a
NC
1725#ifndef DOINIT
1726EXTCONST U8 PL_varies_bitmask[];
1727#else
1728EXTCONST U8 PL_varies_bitmask[] = {
7af55186 1729 0x00, 0x00, 0x00, 0x00, 0xC0, 0x00, 0x00, 0xE0, 0x0F, 0xFF, 0xCB, 0x00, 0x00, 0x00
ded4dd2a
NC
1730};
1731#endif /* DOINIT */
1732
f9ef50a7
NC
1733/* The following always have a length of 1. U8 we can do strchr() on it. */
1734/* (Note that length 1 means "one character" under UTF8, not "one octet".) */
ded4dd2a 1735#define REGNODE_SIMPLE(node) (PL_simple_bitmask[(node) >> 3] & (1 << ((node) & 7)))
e52fc539 1736
f9ef50a7 1737#ifndef DOINIT
ded4dd2a 1738EXTCONST U8 PL_simple[] __attribute__deprecated__;
f9ef50a7 1739#else
ded4dd2a 1740EXTCONST U8 PL_simple[] __attribute__deprecated__ = {
6966a05b 1741 REG_ANY, SANY, ANYOF, ANYOFD, ANYOFL, ANYOFPOSIXL, ANYOFH, ANYOFHb,
34924db0 1742 ANYOFHr, ANYOFHs, ANYOFR, ANYOFRb, ANYOFM, NANYOFM, POSIXD, POSIXL,
86451f01 1743 POSIXU, POSIXA, NPOSIXD, NPOSIXL, NPOSIXU, NPOSIXA, REGEX_SET,
f9ef50a7
NC
1744 0
1745};
1746#endif /* DOINIT */
1747
ded4dd2a
NC
1748#ifndef DOINIT
1749EXTCONST U8 PL_simple_bitmask[];
1750#else
1751EXTCONST U8 PL_simple_bitmask[] = {
86451f01 1752 0x00, 0x00, 0xFF, 0xFF, 0x3F, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x20
ded4dd2a
NC
1753};
1754#endif /* DOINIT */
1755
37442d52 1756/* ex: set ro: */