This is a live mirror of the Perl 5 development currently hosted at https://github.com/perl/perl5
Revert bogus fix for bug #27940, which wasn't really a bug,
[perl5.git] / sv.c
CommitLineData
a0d0e21e 1/* sv.c
79072805 2 *
4bb101f2 3 * Copyright (C) 1991, 1992, 1993, 1994, 1995, 1996, 1997, 1998, 1999,
b94e2f88 4 * 2000, 2001, 2002, 2003, 2004, 2005, 2006, by Larry Wall and others
79072805
LW
5 *
6 * You may distribute under the terms of either the GNU General Public
7 * License or the Artistic License, as specified in the README file.
8 *
a0d0e21e 9 * "I wonder what the Entish is for 'yes' and 'no'," he thought.
645c22ef
DM
10 *
11 *
5e045b90
AMS
12 * This file contains the code that creates, manipulates and destroys
13 * scalar values (SVs). The other types (AV, HV, GV, etc.) reuse the
14 * structure of an SV, so their creation and destruction is handled
15 * here; higher-level functions are in av.c, hv.c, and so on. Opcode
16 * level functions (eg. substr, split, join) for each of the types are
17 * in the pp*.c files.
79072805
LW
18 */
19
20#include "EXTERN.h"
864dbfa3 21#define PERL_IN_SV_C
79072805 22#include "perl.h"
d2f185dc 23#include "regcomp.h"
79072805 24
51371543 25#define FCALL *f
2c5424a7 26
2f8ed50e
OS
27#ifdef __Lynx__
28/* Missing proto on LynxOS */
29 char *gconvert(double, int, int, char *);
30#endif
31
e23c8137 32#ifdef PERL_UTF8_CACHE_ASSERT
ab455f60 33/* if adding more checks watch out for the following tests:
e23c8137
JH
34 * t/op/index.t t/op/length.t t/op/pat.t t/op/substr.t
35 * lib/utf8.t lib/Unicode/Collate/t/index.t
36 * --jhi
37 */
6f207bd3 38# define ASSERT_UTF8_CACHE(cache) \
ab455f60
NC
39 STMT_START { if (cache) { assert((cache)[0] <= (cache)[1]); \
40 assert((cache)[2] <= (cache)[3]); \
41 assert((cache)[3] <= (cache)[1]);} \
42 } STMT_END
e23c8137 43#else
6f207bd3 44# define ASSERT_UTF8_CACHE(cache) NOOP
e23c8137
JH
45#endif
46
f8c7b90f 47#ifdef PERL_OLD_COPY_ON_WRITE
765f542d 48#define SV_COW_NEXT_SV(sv) INT2PTR(SV *,SvUVX(sv))
607fa7f2 49#define SV_COW_NEXT_SV_SET(current,next) SvUV_set(current, PTR2UV(next))
b5ccf5f2 50/* This is a pessimistic view. Scalar must be purely a read-write PV to copy-
765f542d 51 on-write. */
765f542d 52#endif
645c22ef
DM
53
54/* ============================================================================
55
56=head1 Allocation and deallocation of SVs.
57
d2a0f284
JC
58An SV (or AV, HV, etc.) is allocated in two parts: the head (struct
59sv, av, hv...) contains type and reference count information, and for
60many types, a pointer to the body (struct xrv, xpv, xpviv...), which
61contains fields specific to each type. Some types store all they need
62in the head, so don't have a body.
63
64In all but the most memory-paranoid configurations (ex: PURIFY), heads
65and bodies are allocated out of arenas, which by default are
66approximately 4K chunks of memory parcelled up into N heads or bodies.
93e68bfb
JC
67Sv-bodies are allocated by their sv-type, guaranteeing size
68consistency needed to allocate safely from arrays.
69
d2a0f284
JC
70For SV-heads, the first slot in each arena is reserved, and holds a
71link to the next arena, some flags, and a note of the number of slots.
72Snaked through each arena chain is a linked list of free items; when
73this becomes empty, an extra arena is allocated and divided up into N
74items which are threaded into the free list.
75
76SV-bodies are similar, but they use arena-sets by default, which
77separate the link and info from the arena itself, and reclaim the 1st
78slot in the arena. SV-bodies are further described later.
645c22ef
DM
79
80The following global variables are associated with arenas:
81
82 PL_sv_arenaroot pointer to list of SV arenas
83 PL_sv_root pointer to list of free SV structures
84
d2a0f284
JC
85 PL_body_arenas head of linked-list of body arenas
86 PL_body_roots[] array of pointers to list of free bodies of svtype
87 arrays are indexed by the svtype needed
93e68bfb 88
d2a0f284
JC
89A few special SV heads are not allocated from an arena, but are
90instead directly created in the interpreter structure, eg PL_sv_undef.
93e68bfb
JC
91The size of arenas can be changed from the default by setting
92PERL_ARENA_SIZE appropriately at compile time.
645c22ef
DM
93
94The SV arena serves the secondary purpose of allowing still-live SVs
95to be located and destroyed during final cleanup.
96
97At the lowest level, the macros new_SV() and del_SV() grab and free
98an SV head. (If debugging with -DD, del_SV() calls the function S_del_sv()
99to return the SV to the free list with error checking.) new_SV() calls
100more_sv() / sv_add_arena() to add an extra arena if the free list is empty.
101SVs in the free list have their SvTYPE field set to all ones.
102
ff276b08 103At the time of very final cleanup, sv_free_arenas() is called from
645c22ef 104perl_destruct() to physically free all the arenas allocated since the
6a93a7e5 105start of the interpreter.
645c22ef
DM
106
107Manipulation of any of the PL_*root pointers is protected by enclosing
108LOCK_SV_MUTEX; ... UNLOCK_SV_MUTEX calls which should Do the Right Thing
109if threads are enabled.
110
111The function visit() scans the SV arenas list, and calls a specified
112function for each SV it finds which is still live - ie which has an SvTYPE
113other than all 1's, and a non-zero SvREFCNT. visit() is used by the
114following functions (specified as [function that calls visit()] / [function
115called by visit() for each SV]):
116
117 sv_report_used() / do_report_used()
f2524eef 118 dump all remaining SVs (debugging aid)
645c22ef
DM
119
120 sv_clean_objs() / do_clean_objs(),do_clean_named_objs()
121 Attempt to free all objects pointed to by RVs,
122 and, unless DISABLE_DESTRUCTOR_KLUDGE is defined,
123 try to do the same for all objects indirectly
124 referenced by typeglobs too. Called once from
125 perl_destruct(), prior to calling sv_clean_all()
126 below.
127
128 sv_clean_all() / do_clean_all()
129 SvREFCNT_dec(sv) each remaining SV, possibly
130 triggering an sv_free(). It also sets the
131 SVf_BREAK flag on the SV to indicate that the
132 refcnt has been artificially lowered, and thus
133 stopping sv_free() from giving spurious warnings
134 about SVs which unexpectedly have a refcnt
135 of zero. called repeatedly from perl_destruct()
136 until there are no SVs left.
137
93e68bfb 138=head2 Arena allocator API Summary
645c22ef
DM
139
140Private API to rest of sv.c
141
142 new_SV(), del_SV(),
143
144 new_XIV(), del_XIV(),
145 new_XNV(), del_XNV(),
146 etc
147
148Public API:
149
8cf8f3d1 150 sv_report_used(), sv_clean_objs(), sv_clean_all(), sv_free_arenas()
645c22ef 151
645c22ef
DM
152=cut
153
154============================================================================ */
155
4561caa4
CS
156/*
157 * "A time to plant, and a time to uproot what was planted..."
158 */
159
77354fb4
NC
160/*
161 * nice_chunk and nice_chunk size need to be set
162 * and queried under the protection of sv_mutex
163 */
164void
165Perl_offer_nice_chunk(pTHX_ void *chunk, U32 chunk_size)
166{
97aff369 167 dVAR;
77354fb4
NC
168 void *new_chunk;
169 U32 new_chunk_size;
170 LOCK_SV_MUTEX;
171 new_chunk = (void *)(chunk);
172 new_chunk_size = (chunk_size);
173 if (new_chunk_size > PL_nice_chunk_size) {
174 Safefree(PL_nice_chunk);
175 PL_nice_chunk = (char *) new_chunk;
176 PL_nice_chunk_size = new_chunk_size;
177 } else {
178 Safefree(chunk);
179 }
180 UNLOCK_SV_MUTEX;
181}
cac9b346 182
/* FREE_SV_DEBUG_FILE(sv): release the sv_debug_file string attached to an
   SV head.  The field only exists under DEBUG_LEAKING_SCALARS; otherwise
   the macro expands to nothing. */
#ifndef DEBUG_LEAKING_SCALARS
#  define FREE_SV_DEBUG_FILE(sv)
#else
#  define FREE_SV_DEBUG_FILE(sv) Safefree((sv)->sv_debug_file)
#endif

/* SvARENA_CHAIN(sv): the lvalue through which free SV heads are linked.
   POSION_SV_HEAD(sv): poison parts of a head that is being freed (a no-op
   unless PERL_POISON is defined).  Under PERL_POISON the chain lives in
   sv_u.svu_rv, because the SvANY slot is one of the poisoned fields. */
#ifndef PERL_POISON
#  define SvARENA_CHAIN(sv)     SvANY(sv)
#  define POSION_SV_HEAD(sv)
#else
#  define SvARENA_CHAIN(sv)     ((sv)->sv_u.svu_rv)
/* Whilst I'd love to do this, it seems that things like to check on
   unreferenced scalars
#  define POSION_SV_HEAD(sv)    PoisonNew(sv, 1, struct STRUCT_SV)
*/
#  define POSION_SV_HEAD(sv)    PoisonNew(&SvANY(sv), 1, void *), \
                                PoisonNew(&SvREFCNT(sv), 1, U32)
#endif
201
053fc874
GS
/* plant_SV(p): push the SV head p onto the front of the free list rooted
   at PL_sv_root.  The head's flags are set to SVTYPEMASK, which is how a
   free slot is recognised when the arenas are walked, and PL_sv_count is
   decremented. */
#define plant_SV(p) \
    STMT_START {                                        \
        FREE_SV_DEBUG_FILE(p);                          \
        POSION_SV_HEAD(p);                              \
        SvARENA_CHAIN(p) = (void *)PL_sv_root;          \
        SvFLAGS(p) = SVTYPEMASK;                        \
        PL_sv_root = (p);                               \
        --PL_sv_count;                                  \
    } STMT_END

/* uproot_SV(p): pop the first head off the free list into p and count it
   as in use.  PL_sv_root must be non-NULL, and sv_mutex must be held
   while calling uproot_SV(). */
#define uproot_SV(p) \
    STMT_START {                                        \
        (p) = PL_sv_root;                               \
        PL_sv_root = (SV*)SvARENA_CHAIN(p);             \
        ++PL_sv_count;                                  \
    } STMT_END
219
645c22ef 220
cac9b346
NC
221/* make some more SVs by adding another arena */
222
223/* sv_mutex must be held while calling more_sv() */
224STATIC SV*
225S_more_sv(pTHX)
226{
97aff369 227 dVAR;
cac9b346
NC
228 SV* sv;
229
230 if (PL_nice_chunk) {
231 sv_add_arena(PL_nice_chunk, PL_nice_chunk_size, 0);
bd61b366 232 PL_nice_chunk = NULL;
cac9b346
NC
233 PL_nice_chunk_size = 0;
234 }
235 else {
236 char *chunk; /* must use New here to match call to */
d2a0f284 237 Newx(chunk,PERL_ARENA_SIZE,char); /* Safefree() in sv_free_arenas() */
2e7ed132 238 sv_add_arena(chunk, PERL_ARENA_SIZE, 0);
cac9b346
NC
239 }
240 uproot_SV(sv);
241 return sv;
242}
243
645c22ef
DM
/* new_SV(p): set p to a new, empty SV head.
 *
 * The head comes off the free list at PL_sv_root, or from a newly added
 * arena when the list is empty; that part runs under sv_mutex.  The head
 * is returned with SvANY == 0, SvREFCNT == 1 and SvFLAGS == 0.
 */

#ifdef DEBUG_LEAKING_SCALARS
/* provide a real function for a debugger to play with; it also records
   where the SV was created in the sv_debug_* fields */
STATIC SV*
S_new_SV(pTHX)
{
    /* This function touches PL_* variables, so declare dVAR like every
       other function in this file that does. */
    dVAR;
    SV* sv;

    LOCK_SV_MUTEX;
    if (PL_sv_root)
        uproot_SV(sv);
    else
        sv = S_more_sv(aTHX);
    UNLOCK_SV_MUTEX;

    SvANY(sv) = 0;
    SvREFCNT(sv) = 1;
    SvFLAGS(sv) = 0;

    /* creation-site bookkeeping */
    sv->sv_debug_optype = PL_op ? PL_op->op_type : 0;
    /* prefer PL_copline when it is set, else the line of the current cop */
    sv->sv_debug_line = (U16) ((PL_copline == NOLINE) ?
        (PL_curcop ? CopLINE(PL_curcop) : 0) : PL_copline);
    sv->sv_debug_inpad = 0;
    sv->sv_debug_cloned = 0;
    /* private copy of the file name; released by FREE_SV_DEBUG_FILE() */
    sv->sv_debug_file = PL_curcop ? savepv(CopFILE(PL_curcop)): NULL;

    return sv;
}
#  define new_SV(p) (p)=S_new_SV(aTHX)

#else
#  define new_SV(p) \
    STMT_START {                                        \
        LOCK_SV_MUTEX;                                  \
        if (PL_sv_root)                                 \
            uproot_SV(p);                               \
        else                                            \
            (p) = S_more_sv(aTHX);                      \
        UNLOCK_SV_MUTEX;                                \
        SvANY(p) = 0;                                   \
        SvREFCNT(p) = 1;                                \
        SvFLAGS(p) = 0;                                 \
    } STMT_END
#endif
463ee0b2 287
645c22ef
DM
288
/* del_SV(p): return an empty SV head to the free list.
 *
 * Without DEBUGGING this is plant_SV() and nothing more.
 * NOTE(review): that variant does not take sv_mutex itself, whereas the
 * DEBUGGING variant does - confirm callers hold it where it matters.
 *
 * With DEBUGGING, and the D debug flag on, the head is first checked by
 * S_del_sv() to make sure it really lives inside one of the SV arenas.
 */

#ifndef DEBUGGING

#define del_SV(p)   plant_SV(p)

#else /* DEBUGGING */

#define del_SV(p) \
    STMT_START {                                        \
        LOCK_SV_MUTEX;                                  \
        if (DEBUG_D_TEST)                               \
            del_sv(p);                                  \
        else                                            \
            plant_SV(p);                                \
        UNLOCK_SV_MUTEX;                                \
    } STMT_END

/* Free the head p, but when the D debug flag is on refuse (with an
   optional internal warning) any pointer that does not fall inside an
   arena on the PL_sv_arenaroot list. */
STATIC void
S_del_sv(pTHX_ SV *p)
{
    dVAR;
    if (DEBUG_D_TEST) {
        SV* arena = PL_sv_arenaroot;

        /* Stop at the first arena whose usable slots [1, count) contain p;
           slot 0 of each arena is the bookkeeping header. */
        while (arena) {
            const SV * const first = arena + 1;
            const SV * const limit = &arena[SvREFCNT(arena)];
            if (p >= first && p < limit)
                break;
            arena = (SV *) SvANY(arena);
        }

        if (!arena) {
            /* ran off the end of the list: p is not arena memory */
            if (ckWARN_d(WARN_INTERNAL))
                Perl_warner(aTHX_ packWARN(WARN_INTERNAL),
                            "Attempt to free non-arena SV: 0x%"UVxf
                            pTHX__FORMAT, PTR2UV(p) pTHX__VALUE);
            return;
        }
    }
    plant_SV(p);
}

#endif /* DEBUGGING */
463ee0b2 334
645c22ef
DM
335
336/*
ccfc67b7
JH
337=head1 SV Manipulation Functions
338
645c22ef
DM
339=for apidoc sv_add_arena
340
341Given a chunk of memory, link it to the head of the list of arenas,
342and split it into a list of free SVs.
343
344=cut
345*/
346
4633a7c4 347void
864dbfa3 348Perl_sv_add_arena(pTHX_ char *ptr, U32 size, U32 flags)
463ee0b2 349{
97aff369 350 dVAR;
0bd48802 351 SV* const sva = (SV*)ptr;
463ee0b2
LW
352 register SV* sv;
353 register SV* svend;
4633a7c4
LW
354
355 /* The first SV in an arena isn't an SV. */
3280af22 356 SvANY(sva) = (void *) PL_sv_arenaroot; /* ptr to next arena */
4633a7c4
LW
357 SvREFCNT(sva) = size / sizeof(SV); /* number of SV slots */
358 SvFLAGS(sva) = flags; /* FAKE if not to be freed */
359
3280af22
NIS
360 PL_sv_arenaroot = sva;
361 PL_sv_root = sva + 1;
4633a7c4
LW
362
363 svend = &sva[SvREFCNT(sva) - 1];
364 sv = sva + 1;
463ee0b2 365 while (sv < svend) {
48614a46 366 SvARENA_CHAIN(sv) = (void *)(SV*)(sv + 1);
03e36789 367#ifdef DEBUGGING
978b032e 368 SvREFCNT(sv) = 0;
03e36789
NC
369#endif
370 /* Must always set typemask because it's awlays checked in on cleanup
371 when the arenas are walked looking for objects. */
8990e307 372 SvFLAGS(sv) = SVTYPEMASK;
463ee0b2
LW
373 sv++;
374 }
48614a46 375 SvARENA_CHAIN(sv) = 0;
03e36789
NC
376#ifdef DEBUGGING
377 SvREFCNT(sv) = 0;
378#endif
4633a7c4
LW
379 SvFLAGS(sv) = SVTYPEMASK;
380}
381
055972dc
DM
382/* visit(): call the named function for each non-free SV in the arenas
383 * whose flags field matches the flags/mask args. */
645c22ef 384
5226ed68 385STATIC I32
055972dc 386S_visit(pTHX_ SVFUNC_t f, U32 flags, U32 mask)
8990e307 387{
97aff369 388 dVAR;
4633a7c4 389 SV* sva;
5226ed68 390 I32 visited = 0;
8990e307 391
3280af22 392 for (sva = PL_sv_arenaroot; sva; sva = (SV*)SvANY(sva)) {
53c1dcc0 393 register const SV * const svend = &sva[SvREFCNT(sva)];
a3b680e6 394 register SV* sv;
4561caa4 395 for (sv = sva + 1; sv < svend; ++sv) {
055972dc
DM
396 if (SvTYPE(sv) != SVTYPEMASK
397 && (sv->sv_flags & mask) == flags
398 && SvREFCNT(sv))
399 {
acfe0abc 400 (FCALL)(aTHX_ sv);
5226ed68
JH
401 ++visited;
402 }
8990e307
LW
403 }
404 }
5226ed68 405 return visited;
8990e307
LW
406}
407
758a08c3
JH
#ifdef DEBUGGING

/* called by sv_report_used() for each live SV: print a separator line to
   Perl_debug_log, then dump the SV */

static void
do_report_used(pTHX_ SV *sv)
{
    if (SvTYPE(sv) == SVTYPEMASK)
        return;                 /* free slot, nothing to show */

    PerlIO_printf(Perl_debug_log, "****\n");
    sv_dump(sv);
}
#endif
645c22ef
DM
421
422/*
423=for apidoc sv_report_used
424
425Dump the contents of all SVs not yet freed. (Debugging aid).
426
427=cut
428*/
429
8990e307 430void
864dbfa3 431Perl_sv_report_used(pTHX)
4561caa4 432{
ff270d3a 433#ifdef DEBUGGING
055972dc 434 visit(do_report_used, 0, 0);
96a5add6
AL
435#else
436 PERL_UNUSED_CONTEXT;
ff270d3a 437#endif
4561caa4
CS
438}
439
645c22ef
DM
440/* called by sv_clean_objs() for each live SV */
441
442static void
e15faf7d 443do_clean_objs(pTHX_ SV *ref)
645c22ef 444{
97aff369 445 dVAR;
823a54a3
AL
446 if (SvROK(ref)) {
447 SV * const target = SvRV(ref);
448 if (SvOBJECT(target)) {
449 DEBUG_D((PerlIO_printf(Perl_debug_log, "Cleaning object ref:\n "), sv_dump(ref)));
450 if (SvWEAKREF(ref)) {
451 sv_del_backref(target, ref);
452 SvWEAKREF_off(ref);
453 SvRV_set(ref, NULL);
454 } else {
455 SvROK_off(ref);
456 SvRV_set(ref, NULL);
457 SvREFCNT_dec(target);
458 }
645c22ef
DM
459 }
460 }
461
462 /* XXX Might want to check arrays, etc. */
463}
464
465/* called by sv_clean_objs() for each live SV */
466
467#ifndef DISABLE_DESTRUCTOR_KLUDGE
468static void
acfe0abc 469do_clean_named_objs(pTHX_ SV *sv)
645c22ef 470{
97aff369 471 dVAR;
f7877b28 472 if (SvTYPE(sv) == SVt_PVGV && isGV_with_GP(sv) && GvGP(sv)) {
c69033f2
NC
473 if ((
474#ifdef PERL_DONT_CREATE_GVSV
475 GvSV(sv) &&
476#endif
477 SvOBJECT(GvSV(sv))) ||
645c22ef
DM
478 (GvAV(sv) && SvOBJECT(GvAV(sv))) ||
479 (GvHV(sv) && SvOBJECT(GvHV(sv))) ||
480 (GvIO(sv) && SvOBJECT(GvIO(sv))) ||
481 (GvCV(sv) && SvOBJECT(GvCV(sv))) )
482 {
483 DEBUG_D((PerlIO_printf(Perl_debug_log, "Cleaning named glob object:\n "), sv_dump(sv)));
ec5f3c78 484 SvFLAGS(sv) |= SVf_BREAK;
645c22ef
DM
485 SvREFCNT_dec(sv);
486 }
487 }
488}
489#endif
490
491/*
492=for apidoc sv_clean_objs
493
494Attempt to destroy all objects not yet freed
495
496=cut
497*/
498
4561caa4 499void
864dbfa3 500Perl_sv_clean_objs(pTHX)
4561caa4 501{
97aff369 502 dVAR;
3280af22 503 PL_in_clean_objs = TRUE;
055972dc 504 visit(do_clean_objs, SVf_ROK, SVf_ROK);
4561caa4 505#ifndef DISABLE_DESTRUCTOR_KLUDGE
2d0f3c12 506 /* some barnacles may yet remain, clinging to typeglobs */
055972dc 507 visit(do_clean_named_objs, SVt_PVGV, SVTYPEMASK);
4561caa4 508#endif
3280af22 509 PL_in_clean_objs = FALSE;
4561caa4
CS
510}
511
645c22ef
DM
512/* called by sv_clean_all() for each live SV */
513
514static void
acfe0abc 515do_clean_all(pTHX_ SV *sv)
645c22ef 516{
97aff369 517 dVAR;
645c22ef
DM
518 DEBUG_D((PerlIO_printf(Perl_debug_log, "Cleaning loops: SV at 0x%"UVxf"\n", PTR2UV(sv)) ));
519 SvFLAGS(sv) |= SVf_BREAK;
0e705b3b 520 if (PL_comppad == (AV*)sv) {
7d49f689 521 PL_comppad = NULL;
4608196e 522 PL_curpad = NULL;
0e705b3b 523 }
645c22ef
DM
524 SvREFCNT_dec(sv);
525}
526
527/*
528=for apidoc sv_clean_all
529
530Decrement the refcnt of each remaining SV, possibly triggering a
531cleanup. This function may have to be called multiple times to free
ff276b08 532SVs which are in complex self-referential hierarchies.
645c22ef
DM
533
534=cut
535*/
536
5226ed68 537I32
864dbfa3 538Perl_sv_clean_all(pTHX)
8990e307 539{
97aff369 540 dVAR;
5226ed68 541 I32 cleaned;
3280af22 542 PL_in_clean_all = TRUE;
055972dc 543 cleaned = visit(do_clean_all, 0,0);
3280af22 544 PL_in_clean_all = FALSE;
5226ed68 545 return cleaned;
8990e307 546}
463ee0b2 547
5e258f8c
JC
548/*
549 ARENASETS: a meta-arena implementation which separates arena-info
550 into struct arena_set, which contains an array of struct
551 arena_descs, each holding info for a single arena. By separating
552 the meta-info from the arena, we recover the 1st slot, formerly
553 borrowed for list management. The arena_set is about the size of an
554 arena, avoiding the needless malloc overhead of a naive linked-list
555
556 The cost is 1 arena-set malloc per ~320 arena-mallocs, + the unused
557 memory in the last arena-set (1/2 on average). In trade, we get
558 back the 1st slot in each arena (ie 1.7% of a CV-arena, less for
d2a0f284
JC
559 smaller types). The recovery of the wasted space allows use of
560 small arenas for large, rare body types,
5e258f8c 561*/
5e258f8c 562struct arena_desc {
398c677b
NC
563 char *arena; /* the raw storage, allocated aligned */
564 size_t size; /* its size ~4k typ */
565 int unit_type; /* useful for arena audits */
5e258f8c
JC
566 /* info for sv-heads (eventually)
567 int count, flags;
568 */
569};
570
e6148039
NC
571struct arena_set;
572
573/* Get the maximum number of elements in set[] such that struct arena_set
574 will fit within PERL_ARENA_SIZE, which is probabably just under 4K, and
575 therefore likely to be 1 aligned memory page. */
576
577#define ARENAS_PER_SET ((PERL_ARENA_SIZE - sizeof(struct arena_set*) \
578 - 2 * sizeof(int)) / sizeof (struct arena_desc))
5e258f8c
JC
579
580struct arena_set {
581 struct arena_set* next;
582 int set_size; /* ie ARENAS_PER_SET */
583 int curr; /* index of next available arena-desc */
584 struct arena_desc set[ARENAS_PER_SET];
585};
586
645c22ef
DM
587/*
588=for apidoc sv_free_arenas
589
590Deallocate the memory used by all arenas. Note that all the individual SV
591heads and bodies within the arenas must already have been freed.
592
593=cut
594*/
4633a7c4 595void
864dbfa3 596Perl_sv_free_arenas(pTHX)
4633a7c4 597{
97aff369 598 dVAR;
4633a7c4
LW
599 SV* sva;
600 SV* svanext;
93e68bfb 601 int i;
4633a7c4
LW
602
603 /* Free arenas here, but be careful about fake ones. (We assume
604 contiguity of the fake ones with the corresponding real ones.) */
605
3280af22 606 for (sva = PL_sv_arenaroot; sva; sva = svanext) {
4633a7c4
LW
607 svanext = (SV*) SvANY(sva);
608 while (svanext && SvFAKE(svanext))
609 svanext = (SV*) SvANY(svanext);
610
611 if (!SvFAKE(sva))
1df70142 612 Safefree(sva);
4633a7c4 613 }
93e68bfb 614
5e258f8c
JC
615 {
616 struct arena_set *next, *aroot = (struct arena_set*) PL_body_arenas;
617
618 for (; aroot; aroot = next) {
96a5add6 619 const int max = aroot->curr;
5e258f8c
JC
620 for (i=0; i<max; i++) {
621 assert(aroot->set[i].arena);
622 Safefree(aroot->set[i].arena);
623 }
624 next = aroot->next;
625 Safefree(aroot);
626 }
627 }
dc8220bf 628 PL_body_arenas = 0;
fdda85ca 629
232d1c15 630 for (i=0; i<PERL_ARENA_ROOTS_SIZE; i++)
93e68bfb 631 PL_body_roots[i] = 0;
93e68bfb 632
43c5f42d 633 Safefree(PL_nice_chunk);
bd61b366 634 PL_nice_chunk = NULL;
3280af22
NIS
635 PL_nice_chunk_size = 0;
636 PL_sv_arenaroot = 0;
637 PL_sv_root = 0;
4633a7c4
LW
638}
639
bd81e77b
NC
640/*
641 Here are mid-level routines that manage the allocation of bodies out
642 of the various arenas. There are 5 kinds of arenas:
29489e7c 643
bd81e77b
NC
644 1. SV-head arenas, which are discussed and handled above
645 2. regular body arenas
646 3. arenas for reduced-size bodies
647 4. Hash-Entry arenas
648 5. pte arenas (thread related)
29489e7c 649
bd81e77b
NC
650 Arena types 2 & 3 are chained by body-type off an array of
651 arena-root pointers, which is indexed by svtype. Some of the
652 larger/less used body types are malloced singly, since a large
653 unused block of them is wasteful. Also, several svtypes dont have
654 bodies; the data fits into the sv-head itself. The arena-root
655 pointer thus has a few unused root-pointers (which may be hijacked
656 later for arena types 4,5)
29489e7c 657
bd81e77b
NC
658 3 differs from 2 as an optimization; some body types have several
659 unused fields in the front of the structure (which are kept in-place
660 for consistency). These bodies can be allocated in smaller chunks,
661 because the leading fields arent accessed. Pointers to such bodies
662 are decremented to point at the unused 'ghost' memory, knowing that
663 the pointers are used with offsets to the real memory.
29489e7c 664
bd81e77b
NC
665 HE, HEK arenas are managed separately, with separate code, but may
666 be merge-able later..
667
668 PTE arenas are not sv-bodies, but they share these mid-level
669 mechanics, so are considered here. The new mid-level mechanics rely
670 on the sv_type of the body being allocated, so we just reserve one
671 of the unused body-slots for PTEs, then use it in those (2) PTE
672 contexts below (line ~10k)
673*/
674
bd26d9a3 675/* get_arena(size): this creates custom-sized arenas
5e258f8c
JC
676 TBD: export properly for hv.c: S_more_he().
677*/
678void*
679Perl_get_arena(pTHX_ int arena_size)
680{
7a89be66 681 dVAR;
5e258f8c 682 struct arena_desc* adesc;
476a1e16 683 struct arena_set *newroot, **aroot = (struct arena_set**) &PL_body_arenas;
5e258f8c
JC
684 int curr;
685
476a1e16
JC
686 /* shouldnt need this
687 if (!arena_size) arena_size = PERL_ARENA_SIZE;
688 */
5e258f8c
JC
689
690 /* may need new arena-set to hold new arena */
476a1e16 691 if (!*aroot || (*aroot)->curr >= (*aroot)->set_size) {
5e258f8c
JC
692 Newxz(newroot, 1, struct arena_set);
693 newroot->set_size = ARENAS_PER_SET;
476a1e16
JC
694 newroot->next = *aroot;
695 *aroot = newroot;
ca0270c4 696 DEBUG_m(PerlIO_printf(Perl_debug_log, "new arenaset %p\n", (void*)*aroot));
5e258f8c
JC
697 }
698
699 /* ok, now have arena-set with at least 1 empty/available arena-desc */
476a1e16
JC
700 curr = (*aroot)->curr++;
701 adesc = &((*aroot)->set[curr]);
5e258f8c
JC
702 assert(!adesc->arena);
703
5e258f8c
JC
704 Newxz(adesc->arena, arena_size, char);
705 adesc->size = arena_size;
d2a0f284
JC
706 DEBUG_m(PerlIO_printf(Perl_debug_log, "arena %d added: %p size %d\n",
707 curr, adesc->arena, arena_size));
5e258f8c
JC
708
709 return adesc->arena;
5e258f8c
JC
710}
711
53c1dcc0 712
/* del_body(thing, root): return a body to the free list.
 *
 * thing - pointer to the body being released; its first pointer-sized
 *         word is overwritten with the link to the previous list head
 * root  - address of the free-list head pointer (a void **)
 *
 * The push is done under sv_mutex.  Both arguments are parenthesized in
 * the expansion so that expressions such as `roots + n' can be passed.
 */

#define del_body(thing, root)                   \
    STMT_START {                                \
        void ** const thing_copy = (void **)(thing);\
        LOCK_SV_MUTEX;                          \
        *thing_copy = *(root);                  \
        *(root) = (void*)thing_copy;            \
        UNLOCK_SV_MUTEX;                        \
    } STMT_END
29489e7c 723
bd81e77b 724/*
d2a0f284
JC
725
726=head1 SV-Body Allocation
727
728Allocation of SV-bodies is similar to SV-heads, differing as follows;
729the allocation mechanism is used for many body types, so is somewhat
730more complicated, it uses arena-sets, and has no need for still-live
731SV detection.
732
733At the outermost level, (new|del)_X*V macros return bodies of the
734appropriate type. These macros call either (new|del)_body_type or
735(new|del)_body_allocated macro pairs, depending on specifics of the
736type. Most body types use the former pair, the latter pair is used to
737allocate body types with "ghost fields".
738
739"ghost fields" are fields that are unused in certain types, and
740consequently dont need to actually exist. They are declared because
741they're part of a "base type", which allows use of functions as
742methods. The simplest examples are AVs and HVs, 2 aggregate types
743which don't use the fields which support SCALAR semantics.
744
745For these types, the arenas are carved up into *_allocated size
746chunks, we thus avoid wasted memory for those unaccessed members.
747When bodies are allocated, we adjust the pointer back in memory by the
748size of the bit not allocated, so it's as if we allocated the full
749structure. (But things will all go boom if you write to the part that
750is "not there", because you'll be overwriting the last members of the
751preceding structure in memory.)
752
753We calculate the correction using the STRUCT_OFFSET macro. For
754example, if xpv_allocated is the same structure as XPV then the two
755OFFSETs sum to zero, and the pointer is unchanged. If the allocated
756structure is smaller (no initial NV actually allocated) then the net
757effect is to subtract the size of the NV from the pointer, to return a
758new pointer as if an initial NV were actually allocated.
759
760This is the same trick as was used for NV and IV bodies. Ironically it
761doesn't need to be used for NV bodies any more, because NV is now at
762the start of the structure. IV bodies don't need it either, because
763they are no longer allocated.
764
765In turn, the new_body_* allocators call S_new_body(), which invokes
766new_body_inline macro, which takes a lock, and takes a body off the
767linked list at PL_body_roots[sv_type], calling S_more_bodies() if
768necessary to refresh an empty list. Then the lock is released, and
769the body is returned.
770
771S_more_bodies calls get_arena(), and carves it up into an array of N
772bodies, which it strings into a linked list. It looks up arena-size
773and body-size from the body_details table described below, thus
774supporting the multiple body-types.
775
776If PURIFY is defined, or PERL_ARENA_SIZE=0, arenas are not used, and
777the (new|del)_X*V macros are mapped directly to malloc/free.
778
779*/
780
781/*
782
783For each sv-type, struct body_details bodies_by_type[] carries
784parameters which control these aspects of SV handling:
785
786Arena_size determines whether arenas are used for this body type, and if
787so, how big they are. PURIFY or PERL_ARENA_SIZE=0 set this field to
788zero, forcing individual mallocs and frees.
789
790Body_size determines how big a body is, and therefore how many fit into
791each arena. Offset carries the body-pointer adjustment needed for
792*_allocated body types, and is used in *_allocated macros.
793
794But its main purpose is to parameterize info needed in
795Perl_sv_upgrade(). The info here dramatically simplifies the function
796vs the implementation in 5.8.7, making it table-driven. All fields
797are used for this, except for arena_size.
798
799For the sv-types that have no bodies, arenas are not used, so those
800PL_body_roots[sv_type] are unused, and can be overloaded. In
801something of a special case, SVt_NULL is borrowed for HE arenas;
802PL_body_roots[SVt_NULL] is filled by S_more_he, but the
803bodies_by_type[SVt_NULL] slot is not used, as the table is not
804available in hv.c,
805
806PTEs also use arenas, but are never seen in Perl_sv_upgrade.
807Nonetheless, they get their own slot in bodies_by_type[SVt_IV], so
808they can just use the same allocation semantics. At first, PTEs were
809also overloaded to a non-body sv-type, but this yielded hard-to-find
810malloc bugs, so was simplified by claiming a new slot. This choice
811has no consequence at this time.
812
29489e7c
DM
813*/
814
bd81e77b 815struct body_details {
0fb58b32 816 U8 body_size; /* Size to allocate */
10666ae3 817 U8 copy; /* Size of structure to copy (may be shorter) */
0fb58b32 818 U8 offset;
10666ae3
NC
819 unsigned int type : 4; /* We have space for a sanity check. */
820 unsigned int cant_upgrade : 1; /* Cannot upgrade this type */
821 unsigned int zero_nv : 1; /* zero the NV when upgrading from this */
822 unsigned int arena : 1; /* Allocated from an arena */
823 size_t arena_size; /* Size of arena to allocate */
bd81e77b 824};
29489e7c 825
bd81e77b
NC
826#define HADNV FALSE
827#define NONV TRUE
29489e7c 828
d2a0f284 829
bd81e77b
NC
830#ifdef PURIFY
831/* With -DPURFIY we allocate everything directly, and don't use arenas.
832 This seems a rather elegant way to simplify some of the code below. */
833#define HASARENA FALSE
834#else
835#define HASARENA TRUE
836#endif
837#define NOARENA FALSE
29489e7c 838
d2a0f284
JC
/* Size the arenas to exactly fit a given number of bodies.  A count
   of 0 fits the max number bodies into a PERL_ARENA_SIZE block,
   simplifying the default.  If count > 0, the arena is sized to fit
   only that many bodies, allowing arenas to be used for large, rare
   bodies (XPVFM, XPVIO) without undue waste.  The arena size is
   limited by PERL_ARENA_SIZE, so we can safely oversize the
   declarations.

   Every argument and every expansion is fully parenthesized, so the
   macros can take arbitrary expressions and be used inside larger
   expressions.  Arguments may be evaluated more than once.
 */
/* largest multiple of body_size that fits in PERL_ARENA_SIZE */
#define FIT_ARENA0(body_size)                           \
    ((size_t)(PERL_ARENA_SIZE / (body_size)) * (body_size))
/* count bodies if that fits in PERL_ARENA_SIZE, else as many as fit */
#define FIT_ARENAn(count,body_size)                     \
    (((count) * (body_size) <= PERL_ARENA_SIZE)         \
     ? (count) * (body_size)                            \
     : FIT_ARENA0 (body_size))
/* count == 0 selects the default "as many as fit" sizing */
#define FIT_ARENA(count,body_size)                      \
    ((count)                                            \
     ? FIT_ARENAn (count, body_size)                    \
     : FIT_ARENA0 (body_size))
d2a0f284 857
bd81e77b 858/* A macro to work out the offset needed to subtract from a pointer to (say)
29489e7c 859
bd81e77b
NC
860typedef struct {
861 STRLEN xpv_cur;
862 STRLEN xpv_len;
863} xpv_allocated;
29489e7c 864
bd81e77b 865to make its members accessible via a pointer to (say)
29489e7c 866
bd81e77b
NC
867struct xpv {
868 NV xnv_nv;
869 STRLEN xpv_cur;
870 STRLEN xpv_len;
871};
29489e7c 872
bd81e77b 873*/
29489e7c 874
bd81e77b
NC
/* Offset of `member' in the shorter struct minus its offset in the longer
   one.  The operands are unsigned, so when the member sits further into
   the longer struct the result wraps around. */
#define relative_STRUCT_OFFSET(longer, shorter, member)                 \
    (STRUCT_OFFSET(shorter, member) - STRUCT_OFFSET(longer, member))
29489e7c 877
bd81e77b
NC
/* Calculate the length to copy. Specifically work out the length less any
   final padding the compiler needed to add.  See the comment in sv_upgrade
   for why copying the padding proved to be a bug.

   The result is the offset of last_member plus its size.  The sizeof
   operand is never evaluated, so the null pointer in it is harmless.  The
   whole expansion is parenthesized so it can be used safely inside a
   larger expression.  */

#define copy_length(type, last_member)                          \
        (STRUCT_OFFSET(type, last_member)                       \
         + sizeof (((type*)SvANY((SV*)0))->last_member))
29489e7c 885
bd81e77b 886static const struct body_details bodies_by_type[] = {
10666ae3
NC
887 { sizeof(HE), 0, 0, SVt_NULL,
888 FALSE, NONV, NOARENA, FIT_ARENA(0, sizeof(HE)) },
d2a0f284
JC
889
890 /* IVs are in the head, so the allocation size is 0.
891 However, the slot is overloaded for PTEs. */
892 { sizeof(struct ptr_tbl_ent), /* This is used for PTEs. */
893 sizeof(IV), /* This is used to copy out the IV body. */
10666ae3 894 STRUCT_OFFSET(XPVIV, xiv_iv), SVt_IV, FALSE, NONV,
d2a0f284
JC
895 NOARENA /* IVS don't need an arena */,
896 /* But PTEs need to know the size of their arena */
897 FIT_ARENA(0, sizeof(struct ptr_tbl_ent))
898 },
899
bd81e77b 900 /* 8 bytes on most ILP32 with IEEE doubles */
10666ae3 901 { sizeof(NV), sizeof(NV), 0, SVt_NV, FALSE, HADNV, HASARENA,
d2a0f284
JC
902 FIT_ARENA(0, sizeof(NV)) },
903
904 /* RVs are in the head now. */
10666ae3 905 { 0, 0, 0, SVt_RV, FALSE, NONV, NOARENA, 0 },
d2a0f284 906
bd81e77b 907 /* 8 bytes on most ILP32 with IEEE doubles */
d2a0f284
JC
908 { sizeof(xpv_allocated),
909 copy_length(XPV, xpv_len)
910 - relative_STRUCT_OFFSET(xpv_allocated, XPV, xpv_cur),
911 + relative_STRUCT_OFFSET(xpv_allocated, XPV, xpv_cur),
10666ae3 912 SVt_PV, FALSE, NONV, HASARENA, FIT_ARENA(0, sizeof(xpv_allocated)) },
d2a0f284 913
bd81e77b 914 /* 12 */
d2a0f284
JC
915 { sizeof(xpviv_allocated),
916 copy_length(XPVIV, xiv_u)
917 - relative_STRUCT_OFFSET(xpviv_allocated, XPVIV, xpv_cur),
918 + relative_STRUCT_OFFSET(xpviv_allocated, XPVIV, xpv_cur),
10666ae3 919 SVt_PVIV, FALSE, NONV, HASARENA, FIT_ARENA(0, sizeof(xpviv_allocated)) },
d2a0f284 920
bd81e77b 921 /* 20 */
10666ae3 922 { sizeof(XPVNV), copy_length(XPVNV, xiv_u), 0, SVt_PVNV, FALSE, HADNV,
d2a0f284
JC
923 HASARENA, FIT_ARENA(0, sizeof(XPVNV)) },
924
bd81e77b 925 /* 28 */
10666ae3 926 { sizeof(XPVMG), copy_length(XPVMG, xmg_stash), 0, SVt_PVMG, FALSE, HADNV,
d2a0f284
JC
927 HASARENA, FIT_ARENA(0, sizeof(XPVMG)) },
928
bd81e77b 929 /* 36 */
10666ae3 930 { sizeof(XPVBM), sizeof(XPVBM), 0, SVt_PVBM, TRUE, HADNV,
d2a0f284
JC
931 HASARENA, FIT_ARENA(0, sizeof(XPVBM)) },
932
bd81e77b 933 /* 48 */
10666ae3 934 { sizeof(XPVGV), sizeof(XPVGV), 0, SVt_PVGV, TRUE, HADNV,
d2a0f284
JC
935 HASARENA, FIT_ARENA(0, sizeof(XPVGV)) },
936
bd81e77b 937 /* 64 */
10666ae3 938 { sizeof(XPVLV), sizeof(XPVLV), 0, SVt_PVLV, TRUE, HADNV,
d2a0f284
JC
939 HASARENA, FIT_ARENA(0, sizeof(XPVLV)) },
940
941 { sizeof(xpvav_allocated),
942 copy_length(XPVAV, xmg_stash)
943 - relative_STRUCT_OFFSET(xpvav_allocated, XPVAV, xav_fill),
944 + relative_STRUCT_OFFSET(xpvav_allocated, XPVAV, xav_fill),
10666ae3 945 SVt_PVAV, TRUE, HADNV, HASARENA, FIT_ARENA(0, sizeof(xpvav_allocated)) },
d2a0f284
JC
946
947 { sizeof(xpvhv_allocated),
948 copy_length(XPVHV, xmg_stash)
949 - relative_STRUCT_OFFSET(xpvhv_allocated, XPVHV, xhv_fill),
950 + relative_STRUCT_OFFSET(xpvhv_allocated, XPVHV, xhv_fill),
10666ae3 951 SVt_PVHV, TRUE, HADNV, HASARENA, FIT_ARENA(0, sizeof(xpvhv_allocated)) },
d2a0f284 952
c84c4652 953 /* 56 */
4115f141 954 { sizeof(xpvcv_allocated), sizeof(xpvcv_allocated),
c84c4652 955 + relative_STRUCT_OFFSET(xpvcv_allocated, XPVCV, xpv_cur),
10666ae3 956 SVt_PVCV, TRUE, NONV, HASARENA, FIT_ARENA(0, sizeof(xpvcv_allocated)) },
d2a0f284 957
4115f141 958 { sizeof(xpvfm_allocated), sizeof(xpvfm_allocated),
3038937b 959 + relative_STRUCT_OFFSET(xpvfm_allocated, XPVFM, xpv_cur),
10666ae3 960 SVt_PVFM, TRUE, NONV, NOARENA, FIT_ARENA(20, sizeof(xpvfm_allocated)) },
d2a0f284
JC
961
962 /* XPVIO is 84 bytes, fits 48x */
10666ae3 963 { sizeof(XPVIO), sizeof(XPVIO), 0, SVt_PVIO, TRUE, HADNV,
d2a0f284 964 HASARENA, FIT_ARENA(24, sizeof(XPVIO)) },
bd81e77b 965};
29489e7c 966
d2a0f284
JC
/* Allocate a body for a type whose complete structure is stored.  */
#define new_body_type(sv_type)		\
    (void *)((char *)S_new_body(aTHX_ sv_type))

/* Return such a body to the free list of its type.  */
#define del_body_type(p, sv_type)	\
    del_body(p, &PL_body_roots[sv_type])


/* Allocate a body for a type that only stores the tail of its structure:
   the pointer handed back is moved down by the type's offset so that member
   accesses through the complete structure type land inside the allocated
   part.  */
#define new_body_allocated(sv_type)		\
    (void *)((char *)S_new_body(aTHX_ sv_type)	\
	     - bodies_by_type[sv_type].offset)

/* Undo the adjustment made by new_body_allocated() and free the body.
   The offset is a byte count, so the arithmetic is done explicitly on a
   char pointer: this is independent of the static type of `p' (arithmetic
   on void * is not standard C, and a typed pointer would scale the offset)
   and the argument is parenthesized so any expression may be passed.  */
#define del_body_allocated(p, sv_type)					\
    del_body((void *)((char *)(p) + bodies_by_type[sv_type].offset),	\
	     &PL_body_roots[sv_type])
29489e7c 980
29489e7c 981
bd81e77b
NC
/* Thin wrappers over the safe allocator used for bodies that do not come
   from an arena.  Arguments are parenthesized so that the casts and calls
   apply to the whole argument expression.  */
#define my_safemalloc(s)	(void*)safemalloc((s))
#define my_safecalloc(s)	(void*)safecalloc((s), 1)
#define my_safefree(p)	safefree((char*)(p))
29489e7c 985
#ifdef PURIFY

/* Under PURIFY each body is an individual block from the safe allocator,
   always sized for the complete structure.  */

#define new_XNV()	my_safemalloc(sizeof(XPVNV))
#define del_XNV(p)	my_safefree(p)

#define new_XPVNV()	my_safemalloc(sizeof(XPVNV))
#define del_XPVNV(p)	my_safefree(p)

#define new_XPVAV()	my_safemalloc(sizeof(XPVAV))
#define del_XPVAV(p)	my_safefree(p)

#define new_XPVHV()	my_safemalloc(sizeof(XPVHV))
#define del_XPVHV(p)	my_safefree(p)

#define new_XPVMG()	my_safemalloc(sizeof(XPVMG))
#define del_XPVMG(p)	my_safefree(p)

#define new_XPVGV()	my_safemalloc(sizeof(XPVGV))
#define del_XPVGV(p)	my_safefree(p)

#else /* !PURIFY */

/* Otherwise bodies are taken from, and returned to, the per-type free
   lists.  AV and HV bodies use the offset-adjusted "allocated" variants.  */

#define new_XNV()	new_body_type(SVt_NV)
#define del_XNV(p)	del_body_type(p, SVt_NV)

#define new_XPVNV()	new_body_type(SVt_PVNV)
#define del_XPVNV(p)	del_body_type(p, SVt_PVNV)

#define new_XPVAV()	new_body_allocated(SVt_PVAV)
#define del_XPVAV(p)	del_body_allocated(p, SVt_PVAV)

#define new_XPVHV()	new_body_allocated(SVt_PVHV)
#define del_XPVHV(p)	del_body_allocated(p, SVt_PVHV)

#define new_XPVMG()	new_body_type(SVt_PVMG)
#define del_XPVMG(p)	del_body_type(p, SVt_PVMG)

#define new_XPVGV()	new_body_type(SVt_PVGV)
#define del_XPVGV(p)	del_body_type(p, SVt_PVGV)

#endif /* PURIFY */
93e68bfb 1027
bd81e77b 1028/* no arena for you! */
93e68bfb 1029
/* Allocate a body directly from the safe allocator instead of an arena.
   The request is body_size plus offset bytes; the Z variant returns zeroed
   memory.  */
#define new_NOARENA(details)					\
    my_safemalloc((details)->body_size + (details)->offset)

#define new_NOARENAZ(details)					\
    my_safecalloc((details)->body_size + (details)->offset)
1034
10666ae3
NC
1035#ifdef DEBUGGING
1036static bool done_sanity_check;
1037#endif
1038
d2a0f284
JC
1039STATIC void *
1040S_more_bodies (pTHX_ svtype sv_type)
1041{
1042 dVAR;
1043 void ** const root = &PL_body_roots[sv_type];
96a5add6 1044 const struct body_details * const bdp = &bodies_by_type[sv_type];
d2a0f284
JC
1045 const size_t body_size = bdp->body_size;
1046 char *start;
1047 const char *end;
1048
1049 assert(bdp->arena_size);
10666ae3
NC
1050
1051#ifdef DEBUGGING
1052 if (!done_sanity_check) {
ea471437 1053 unsigned int i = SVt_LAST;
10666ae3
NC
1054
1055 done_sanity_check = TRUE;
1056
1057 while (i--)
1058 assert (bodies_by_type[i].type == i);
1059 }
1060#endif
1061
d2a0f284
JC
1062 start = (char*) Perl_get_arena(aTHX_ bdp->arena_size);
1063
1064 end = start + bdp->arena_size - body_size;
1065
d2a0f284
JC
1066 /* computed count doesnt reflect the 1st slot reservation */
1067 DEBUG_m(PerlIO_printf(Perl_debug_log,
1068 "arena %p end %p arena-size %d type %d size %d ct %d\n",
0e84aef4
JH
1069 start, end,
1070 (int)bdp->arena_size, sv_type, (int)body_size,
1071 (int)bdp->arena_size / (int)body_size));
d2a0f284
JC
1072
1073 *root = (void *)start;
1074
1075 while (start < end) {
1076 char * const next = start + body_size;
1077 *(void**) start = (void *)next;
1078 start = next;
1079 }
1080 *(void **)start = 0;
1081
1082 return *root;
1083}
1084
1085/* grab a new thing from the free list, allocating more if necessary.
1086 The inline version is used for speed in hot routines, and the
1087 function using it serves the rest (unless PURIFY).
1088*/
/* Pop the first free body of sv_type into `xpv', refilling the free list
   through more_bodies() when it is empty.  The whole operation runs between
   LOCK_SV_MUTEX and UNLOCK_SV_MUTEX.  `xpv' must be an lvalue and is
   evaluated more than once.  */
#define new_body_inline(xpv, sv_type) \
    STMT_START { \
	void ** const r3wt = &PL_body_roots[sv_type]; \
	LOCK_SV_MUTEX; \
	xpv = *r3wt ? *r3wt : more_bodies(sv_type); \
	*r3wt = *(void**)(xpv); \
	UNLOCK_SV_MUTEX; \
    } STMT_END
1098
1099#ifndef PURIFY
1100
1101STATIC void *
1102S_new_body(pTHX_ svtype sv_type)
1103{
1104 dVAR;
1105 void *xpv;
1106 new_body_inline(xpv, sv_type);
1107 return xpv;
1108}
1109
1110#endif
93e68bfb 1111
bd81e77b
NC
1112/*
1113=for apidoc sv_upgrade
93e68bfb 1114
bd81e77b
NC
1115Upgrade an SV to a more complex form. Generally adds a new body type to the
1116SV, then copies across as much information as possible from the old body.
1117You generally want to use the C<SvUPGRADE> macro wrapper. See also C<svtype>.
93e68bfb 1118
bd81e77b 1119=cut
93e68bfb 1120*/
93e68bfb 1121
bd81e77b 1122void
42d0e0b7 1123Perl_sv_upgrade(pTHX_ register SV *sv, svtype new_type)
cac9b346 1124{
97aff369 1125 dVAR;
bd81e77b
NC
1126 void* old_body;
1127 void* new_body;
42d0e0b7 1128 const svtype old_type = SvTYPE(sv);
d2a0f284 1129 const struct body_details *new_type_details;
bd81e77b
NC
1130 const struct body_details *const old_type_details
1131 = bodies_by_type + old_type;
cac9b346 1132
bd81e77b
NC
1133 if (new_type != SVt_PV && SvIsCOW(sv)) {
1134 sv_force_normal_flags(sv, 0);
1135 }
cac9b346 1136
bd81e77b
NC
1137 if (old_type == new_type)
1138 return;
cac9b346 1139
bd81e77b
NC
1140 if (old_type > new_type)
1141 Perl_croak(aTHX_ "sv_upgrade from type %d down to type %d",
1142 (int)old_type, (int)new_type);
cac9b346 1143
cac9b346 1144
bd81e77b 1145 old_body = SvANY(sv);
de042e1d 1146
bd81e77b
NC
1147 /* Copying structures onto other structures that have been neatly zeroed
1148 has a subtle gotcha. Consider XPVMG
cac9b346 1149
bd81e77b
NC
1150 +------+------+------+------+------+-------+-------+
1151 | NV | CUR | LEN | IV | MAGIC | STASH |
1152 +------+------+------+------+------+-------+-------+
1153 0 4 8 12 16 20 24 28
645c22ef 1154
bd81e77b
NC
1155 where NVs are aligned to 8 bytes, so that sizeof that structure is
1156 actually 32 bytes long, with 4 bytes of padding at the end:
08742458 1157
bd81e77b
NC
1158 +------+------+------+------+------+-------+-------+------+
1159 | NV | CUR | LEN | IV | MAGIC | STASH | ??? |
1160 +------+------+------+------+------+-------+-------+------+
1161 0 4 8 12 16 20 24 28 32
08742458 1162
bd81e77b 1163 so what happens if you allocate memory for this structure:
30f9da9e 1164
bd81e77b
NC
1165 +------+------+------+------+------+-------+-------+------+------+...
1166 | NV | CUR | LEN | IV | MAGIC | STASH | GP | NAME |
1167 +------+------+------+------+------+-------+-------+------+------+...
1168 0 4 8 12 16 20 24 28 32 36
bfc44f79 1169
bd81e77b
NC
1170 zero it, then copy sizeof(XPVMG) bytes on top of it? Not quite what you
1171 expect, because you copy the area marked ??? onto GP. Now, ??? may have
1172 started out as zero once, but it's quite possible that it isn't. So now,
1173 rather than a nicely zeroed GP, you have it pointing somewhere random.
1174 Bugs ensue.
bfc44f79 1175
bd81e77b
NC
1176 (In fact, GP ends up pointing at a previous GP structure, because the
1177 principle cause of the padding in XPVMG getting garbage is a copy of
1178 sizeof(XPVMG) bytes from a XPVGV structure in sv_unglob)
30f9da9e 1179
bd81e77b
NC
1180 So we are careful and work out the size of used parts of all the
1181 structures. */
bfc44f79 1182
bd81e77b
NC
1183 switch (old_type) {
1184 case SVt_NULL:
1185 break;
1186 case SVt_IV:
1187 if (new_type < SVt_PVIV) {
1188 new_type = (new_type == SVt_NV)
1189 ? SVt_PVNV : SVt_PVIV;
bd81e77b
NC
1190 }
1191 break;
1192 case SVt_NV:
1193 if (new_type < SVt_PVNV) {
1194 new_type = SVt_PVNV;
bd81e77b
NC
1195 }
1196 break;
1197 case SVt_RV:
1198 break;
1199 case SVt_PV:
1200 assert(new_type > SVt_PV);
1201 assert(SVt_IV < SVt_PV);
1202 assert(SVt_NV < SVt_PV);
1203 break;
1204 case SVt_PVIV:
1205 break;
1206 case SVt_PVNV:
1207 break;
1208 case SVt_PVMG:
1209 /* Because the XPVMG of PL_mess_sv isn't allocated from the arena,
1210 there's no way that it can be safely upgraded, because perl.c
1211 expects to Safefree(SvANY(PL_mess_sv)) */
1212 assert(sv != PL_mess_sv);
1213 /* This flag bit is used to mean other things in other scalar types.
1214 Given that it only has meaning inside the pad, it shouldn't be set
1215 on anything that can get upgraded. */
00b1698f 1216 assert(!SvPAD_TYPED(sv));
bd81e77b
NC
1217 break;
1218 default:
1219 if (old_type_details->cant_upgrade)
c81225bc
NC
1220 Perl_croak(aTHX_ "Can't upgrade %s (%" UVuf ") to %" UVuf,
1221 sv_reftype(sv, 0), (UV) old_type, (UV) new_type);
bd81e77b 1222 }
2fa1109b 1223 new_type_details = bodies_by_type + new_type;
645c22ef 1224
bd81e77b
NC
1225 SvFLAGS(sv) &= ~SVTYPEMASK;
1226 SvFLAGS(sv) |= new_type;
932e9ff9 1227
ab4416c0
NC
1228 /* This can't happen, as SVt_NULL is <= all values of new_type, so one of
1229 the return statements above will have triggered. */
1230 assert (new_type != SVt_NULL);
bd81e77b 1231 switch (new_type) {
bd81e77b
NC
1232 case SVt_IV:
1233 assert(old_type == SVt_NULL);
1234 SvANY(sv) = (XPVIV*)((char*)&(sv->sv_u.svu_iv) - STRUCT_OFFSET(XPVIV, xiv_iv));
1235 SvIV_set(sv, 0);
1236 return;
1237 case SVt_NV:
1238 assert(old_type == SVt_NULL);
1239 SvANY(sv) = new_XNV();
1240 SvNV_set(sv, 0);
1241 return;
1242 case SVt_RV:
1243 assert(old_type == SVt_NULL);
1244 SvANY(sv) = &sv->sv_u.svu_rv;
1245 SvRV_set(sv, 0);
1246 return;
1247 case SVt_PVHV:
bd81e77b 1248 case SVt_PVAV:
d2a0f284 1249 assert(new_type_details->body_size);
c1ae03ae
NC
1250
1251#ifndef PURIFY
1252 assert(new_type_details->arena);
d2a0f284 1253 assert(new_type_details->arena_size);
c1ae03ae 1254 /* This points to the start of the allocated area. */
d2a0f284
JC
1255 new_body_inline(new_body, new_type);
1256 Zero(new_body, new_type_details->body_size, char);
c1ae03ae
NC
1257 new_body = ((char *)new_body) - new_type_details->offset;
1258#else
1259 /* We always allocated the full length item with PURIFY. To do this
1260 we fake things so that arena is false for all 16 types.. */
1261 new_body = new_NOARENAZ(new_type_details);
1262#endif
1263 SvANY(sv) = new_body;
1264 if (new_type == SVt_PVAV) {
1265 AvMAX(sv) = -1;
1266 AvFILLp(sv) = -1;
1267 AvREAL_only(sv);
1268 }
aeb18a1e 1269
bd81e77b
NC
1270 /* SVt_NULL isn't the only thing upgraded to AV or HV.
1271 The target created by newSVrv also is, and it can have magic.
1272 However, it never has SvPVX set.
1273 */
1274 if (old_type >= SVt_RV) {
1275 assert(SvPVX_const(sv) == 0);
1276 }
aeb18a1e 1277
bd81e77b
NC
1278 /* Could put this in the else clause below, as PVMG must have SvPVX
1279 0 already (the assertion above) */
6136c704 1280 SvPV_set(sv, NULL);
93e68bfb 1281
bd81e77b 1282 if (old_type >= SVt_PVMG) {
e736a858 1283 SvMAGIC_set(sv, ((XPVMG*)old_body)->xmg_u.xmg_magic);
bd81e77b 1284 SvSTASH_set(sv, ((XPVMG*)old_body)->xmg_stash);
bd81e77b
NC
1285 }
1286 break;
93e68bfb 1287
93e68bfb 1288
bd81e77b
NC
1289 case SVt_PVIV:
1290 /* XXX Is this still needed? Was it ever needed? Surely as there is
1291 no route from NV to PVIV, NOK can never be true */
1292 assert(!SvNOKp(sv));
1293 assert(!SvNOK(sv));
1294 case SVt_PVIO:
1295 case SVt_PVFM:
1296 case SVt_PVBM:
1297 case SVt_PVGV:
1298 case SVt_PVCV:
1299 case SVt_PVLV:
1300 case SVt_PVMG:
1301 case SVt_PVNV:
1302 case SVt_PV:
93e68bfb 1303
d2a0f284 1304 assert(new_type_details->body_size);
bd81e77b
NC
1305 /* We always allocated the full length item with PURIFY. To do this
1306 we fake things so that arena is false for all 16 types.. */
1307 if(new_type_details->arena) {
1308 /* This points to the start of the allocated area. */
d2a0f284
JC
1309 new_body_inline(new_body, new_type);
1310 Zero(new_body, new_type_details->body_size, char);
bd81e77b
NC
1311 new_body = ((char *)new_body) - new_type_details->offset;
1312 } else {
1313 new_body = new_NOARENAZ(new_type_details);
1314 }
1315 SvANY(sv) = new_body;
5e2fc214 1316
bd81e77b 1317 if (old_type_details->copy) {
f9ba3d20
NC
1318 /* There is now the potential for an upgrade from something without
1319 an offset (PVNV or PVMG) to something with one (PVCV, PVFM) */
1320 int offset = old_type_details->offset;
1321 int length = old_type_details->copy;
1322
1323 if (new_type_details->offset > old_type_details->offset) {
d4c19fe8 1324 const int difference
f9ba3d20
NC
1325 = new_type_details->offset - old_type_details->offset;
1326 offset += difference;
1327 length -= difference;
1328 }
1329 assert (length >= 0);
1330
1331 Copy((char *)old_body + offset, (char *)new_body + offset, length,
1332 char);
bd81e77b
NC
1333 }
1334
1335#ifndef NV_ZERO_IS_ALLBITS_ZERO
f2524eef 1336 /* If NV 0.0 is stores as all bits 0 then Zero() already creates a
e5ce394c
NC
1337 * correct 0.0 for us. Otherwise, if the old body didn't have an
1338 * NV slot, but the new one does, then we need to initialise the
1339 * freshly created NV slot with whatever the correct bit pattern is
1340 * for 0.0 */
1341 if (old_type_details->zero_nv && !new_type_details->zero_nv)
bd81e77b 1342 SvNV_set(sv, 0);
82048762 1343#endif
5e2fc214 1344
bd81e77b 1345 if (new_type == SVt_PVIO)
f2524eef 1346 IoPAGE_LEN(sv) = 60;
bd81e77b 1347 if (old_type < SVt_RV)
6136c704 1348 SvPV_set(sv, NULL);
bd81e77b
NC
1349 break;
1350 default:
afd78fd5
JH
1351 Perl_croak(aTHX_ "panic: sv_upgrade to unknown type %lu",
1352 (unsigned long)new_type);
bd81e77b 1353 }
73171d91 1354
d2a0f284
JC
1355 if (old_type_details->arena) {
1356 /* If there was an old body, then we need to free it.
1357 Note that there is an assumption that all bodies of types that
1358 can be upgraded came from arenas. Only the more complex non-
1359 upgradable types are allowed to be directly malloc()ed. */
bd81e77b
NC
1360#ifdef PURIFY
1361 my_safefree(old_body);
1362#else
1363 del_body((void*)((char*)old_body + old_type_details->offset),
1364 &PL_body_roots[old_type]);
1365#endif
1366 }
1367}
73171d91 1368
bd81e77b
NC
1369/*
1370=for apidoc sv_backoff
73171d91 1371
bd81e77b
NC
1372Remove any string offset. You should normally use the C<SvOOK_off> macro
1373wrapper instead.
73171d91 1374
bd81e77b 1375=cut
73171d91
NC
1376*/
1377
bd81e77b
NC
1378int
1379Perl_sv_backoff(pTHX_ register SV *sv)
1380{
96a5add6 1381 PERL_UNUSED_CONTEXT;
bd81e77b
NC
1382 assert(SvOOK(sv));
1383 assert(SvTYPE(sv) != SVt_PVHV);
1384 assert(SvTYPE(sv) != SVt_PVAV);
1385 if (SvIVX(sv)) {
1386 const char * const s = SvPVX_const(sv);
1387 SvLEN_set(sv, SvLEN(sv) + SvIVX(sv));
1388 SvPV_set(sv, SvPVX(sv) - SvIVX(sv));
1389 SvIV_set(sv, 0);
1390 Move(s, SvPVX(sv), SvCUR(sv)+1, char);
1391 }
1392 SvFLAGS(sv) &= ~SVf_OOK;
1393 return 0;
1394}
73171d91 1395
bd81e77b
NC
1396/*
1397=for apidoc sv_grow
73171d91 1398
bd81e77b
NC
1399Expands the character buffer in the SV. If necessary, uses C<sv_unref> and
1400upgrades the SV to C<SVt_PV>. Returns a pointer to the character buffer.
1401Use the C<SvGROW> wrapper instead.
93e68bfb 1402
bd81e77b
NC
1403=cut
1404*/
93e68bfb 1405
bd81e77b
NC
1406char *
1407Perl_sv_grow(pTHX_ register SV *sv, register STRLEN newlen)
1408{
1409 register char *s;
93e68bfb 1410
5db06880
NC
1411 if (PL_madskills && newlen >= 0x100000) {
1412 PerlIO_printf(Perl_debug_log,
1413 "Allocation too large: %"UVxf"\n", (UV)newlen);
1414 }
bd81e77b
NC
1415#ifdef HAS_64K_LIMIT
1416 if (newlen >= 0x10000) {
1417 PerlIO_printf(Perl_debug_log,
1418 "Allocation too large: %"UVxf"\n", (UV)newlen);
1419 my_exit(1);
1420 }
1421#endif /* HAS_64K_LIMIT */
1422 if (SvROK(sv))
1423 sv_unref(sv);
1424 if (SvTYPE(sv) < SVt_PV) {
1425 sv_upgrade(sv, SVt_PV);
1426 s = SvPVX_mutable(sv);
1427 }
1428 else if (SvOOK(sv)) { /* pv is offset? */
1429 sv_backoff(sv);
1430 s = SvPVX_mutable(sv);
1431 if (newlen > SvLEN(sv))
1432 newlen += 10 * (newlen - SvCUR(sv)); /* avoid copy each time */
1433#ifdef HAS_64K_LIMIT
1434 if (newlen >= 0x10000)
1435 newlen = 0xFFFF;
1436#endif
1437 }
1438 else
1439 s = SvPVX_mutable(sv);
aeb18a1e 1440
bd81e77b
NC
1441 if (newlen > SvLEN(sv)) { /* need more room? */
1442 newlen = PERL_STRLEN_ROUNDUP(newlen);
1443 if (SvLEN(sv) && s) {
1444#ifdef MYMALLOC
1445 const STRLEN l = malloced_size((void*)SvPVX_const(sv));
1446 if (newlen <= l) {
1447 SvLEN_set(sv, l);
1448 return s;
1449 } else
1450#endif
1451 s = saferealloc(s, newlen);
1452 }
1453 else {
1454 s = safemalloc(newlen);
1455 if (SvPVX_const(sv) && SvCUR(sv)) {
1456 Move(SvPVX_const(sv), s, (newlen < SvCUR(sv)) ? newlen : SvCUR(sv), char);
1457 }
1458 }
1459 SvPV_set(sv, s);
1460 SvLEN_set(sv, newlen);
1461 }
1462 return s;
1463}
aeb18a1e 1464
bd81e77b
NC
1465/*
1466=for apidoc sv_setiv
932e9ff9 1467
bd81e77b
NC
1468Copies an integer into the given SV, upgrading first if necessary.
1469Does not handle 'set' magic. See also C<sv_setiv_mg>.
463ee0b2 1470
bd81e77b
NC
1471=cut
1472*/
463ee0b2 1473
bd81e77b
NC
1474void
1475Perl_sv_setiv(pTHX_ register SV *sv, IV i)
1476{
97aff369 1477 dVAR;
bd81e77b
NC
1478 SV_CHECK_THINKFIRST_COW_DROP(sv);
1479 switch (SvTYPE(sv)) {
1480 case SVt_NULL:
1481 sv_upgrade(sv, SVt_IV);
1482 break;
1483 case SVt_NV:
1484 sv_upgrade(sv, SVt_PVNV);
1485 break;
1486 case SVt_RV:
1487 case SVt_PV:
1488 sv_upgrade(sv, SVt_PVIV);
1489 break;
463ee0b2 1490
bd81e77b
NC
1491 case SVt_PVGV:
1492 case SVt_PVAV:
1493 case SVt_PVHV:
1494 case SVt_PVCV:
1495 case SVt_PVFM:
1496 case SVt_PVIO:
1497 Perl_croak(aTHX_ "Can't coerce %s to integer in %s", sv_reftype(sv,0),
1498 OP_DESC(PL_op));
42d0e0b7 1499 default: NOOP;
bd81e77b
NC
1500 }
1501 (void)SvIOK_only(sv); /* validate number */
1502 SvIV_set(sv, i);
1503 SvTAINT(sv);
1504}
932e9ff9 1505
bd81e77b
NC
1506/*
1507=for apidoc sv_setiv_mg
d33b2eba 1508
bd81e77b 1509Like C<sv_setiv>, but also handles 'set' magic.
1c846c1f 1510
bd81e77b
NC
1511=cut
1512*/
d33b2eba 1513
bd81e77b
NC
1514void
1515Perl_sv_setiv_mg(pTHX_ register SV *sv, IV i)
1516{
1517 sv_setiv(sv,i);
1518 SvSETMAGIC(sv);
1519}
727879eb 1520
bd81e77b
NC
1521/*
1522=for apidoc sv_setuv
d33b2eba 1523
bd81e77b
NC
1524Copies an unsigned integer into the given SV, upgrading first if necessary.
1525Does not handle 'set' magic. See also C<sv_setuv_mg>.
9b94d1dd 1526
bd81e77b
NC
1527=cut
1528*/
d33b2eba 1529
bd81e77b
NC
1530void
1531Perl_sv_setuv(pTHX_ register SV *sv, UV u)
1532{
1533 /* With these two if statements:
1534 u=1.49 s=0.52 cu=72.49 cs=10.64 scripts=270 tests=20865
d33b2eba 1535
bd81e77b
NC
1536 without
1537 u=1.35 s=0.47 cu=73.45 cs=11.43 scripts=270 tests=20865
1c846c1f 1538
bd81e77b
NC
1539 If you wish to remove them, please benchmark to see what the effect is
1540 */
1541 if (u <= (UV)IV_MAX) {
1542 sv_setiv(sv, (IV)u);
1543 return;
1544 }
1545 sv_setiv(sv, 0);
1546 SvIsUV_on(sv);
1547 SvUV_set(sv, u);
1548}
d33b2eba 1549
bd81e77b
NC
1550/*
1551=for apidoc sv_setuv_mg
727879eb 1552
bd81e77b 1553Like C<sv_setuv>, but also handles 'set' magic.
9b94d1dd 1554
bd81e77b
NC
1555=cut
1556*/
5e2fc214 1557
bd81e77b
NC
1558void
1559Perl_sv_setuv_mg(pTHX_ register SV *sv, UV u)
1560{
1561 sv_setiv(sv, 0);
1562 SvIsUV_on(sv);
1563 sv_setuv(sv,u);
1564 SvSETMAGIC(sv);
1565}
5e2fc214 1566
954c1994 1567/*
bd81e77b 1568=for apidoc sv_setnv
954c1994 1569
bd81e77b
NC
1570Copies a double into the given SV, upgrading first if necessary.
1571Does not handle 'set' magic. See also C<sv_setnv_mg>.
954c1994
GS
1572
1573=cut
1574*/
1575
63f97190 1576void
bd81e77b 1577Perl_sv_setnv(pTHX_ register SV *sv, NV num)
79072805 1578{
97aff369 1579 dVAR;
bd81e77b
NC
1580 SV_CHECK_THINKFIRST_COW_DROP(sv);
1581 switch (SvTYPE(sv)) {
79072805 1582 case SVt_NULL:
79072805 1583 case SVt_IV:
bd81e77b 1584 sv_upgrade(sv, SVt_NV);
79072805 1585 break;
ed6116ce 1586 case SVt_RV:
79072805 1587 case SVt_PV:
79072805 1588 case SVt_PVIV:
bd81e77b 1589 sv_upgrade(sv, SVt_PVNV);
79072805 1590 break;
bd4b1eb5 1591
bd4b1eb5 1592 case SVt_PVGV:
bd81e77b
NC
1593 case SVt_PVAV:
1594 case SVt_PVHV:
79072805 1595 case SVt_PVCV:
bd81e77b
NC
1596 case SVt_PVFM:
1597 case SVt_PVIO:
1598 Perl_croak(aTHX_ "Can't coerce %s to number in %s", sv_reftype(sv,0),
1599 OP_NAME(PL_op));
42d0e0b7 1600 default: NOOP;
2068cd4d 1601 }
bd81e77b
NC
1602 SvNV_set(sv, num);
1603 (void)SvNOK_only(sv); /* validate number */
1604 SvTAINT(sv);
79072805
LW
1605}
1606
645c22ef 1607/*
bd81e77b 1608=for apidoc sv_setnv_mg
645c22ef 1609
bd81e77b 1610Like C<sv_setnv>, but also handles 'set' magic.
645c22ef
DM
1611
1612=cut
1613*/
1614
bd81e77b
NC
1615void
1616Perl_sv_setnv_mg(pTHX_ register SV *sv, NV num)
79072805 1617{
bd81e77b
NC
1618 sv_setnv(sv,num);
1619 SvSETMAGIC(sv);
79072805
LW
1620}
1621
bd81e77b
NC
1622/* Print an "isn't numeric" warning, using a cleaned-up,
1623 * printable version of the offending string
1624 */
954c1994 1625
bd81e77b
NC
1626STATIC void
1627S_not_a_number(pTHX_ SV *sv)
79072805 1628{
97aff369 1629 dVAR;
bd81e77b
NC
1630 SV *dsv;
1631 char tmpbuf[64];
1632 const char *pv;
94463019
JH
1633
1634 if (DO_UTF8(sv)) {
396482e1 1635 dsv = sv_2mortal(newSVpvs(""));
94463019
JH
1636 pv = sv_uni_display(dsv, sv, 10, 0);
1637 } else {
1638 char *d = tmpbuf;
551405c4 1639 const char * const limit = tmpbuf + sizeof(tmpbuf) - 8;
94463019
JH
1640 /* each *s can expand to 4 chars + "...\0",
1641 i.e. need room for 8 chars */
ecdeb87c 1642
00b6aa41
AL
1643 const char *s = SvPVX_const(sv);
1644 const char * const end = s + SvCUR(sv);
1645 for ( ; s < end && d < limit; s++ ) {
94463019
JH
1646 int ch = *s & 0xFF;
1647 if (ch & 128 && !isPRINT_LC(ch)) {
1648 *d++ = 'M';
1649 *d++ = '-';
1650 ch &= 127;
1651 }
1652 if (ch == '\n') {
1653 *d++ = '\\';
1654 *d++ = 'n';
1655 }
1656 else if (ch == '\r') {
1657 *d++ = '\\';
1658 *d++ = 'r';
1659 }
1660 else if (ch == '\f') {
1661 *d++ = '\\';
1662 *d++ = 'f';
1663 }
1664 else if (ch == '\\') {
1665 *d++ = '\\';
1666 *d++ = '\\';
1667 }
1668 else if (ch == '\0') {
1669 *d++ = '\\';
1670 *d++ = '0';
1671 }
1672 else if (isPRINT_LC(ch))
1673 *d++ = ch;
1674 else {
1675 *d++ = '^';
1676 *d++ = toCTRL(ch);
1677 }
1678 }
1679 if (s < end) {
1680 *d++ = '.';
1681 *d++ = '.';
1682 *d++ = '.';
1683 }
1684 *d = '\0';
1685 pv = tmpbuf;
a0d0e21e 1686 }
a0d0e21e 1687
533c011a 1688 if (PL_op)
9014280d 1689 Perl_warner(aTHX_ packWARN(WARN_NUMERIC),
94463019
JH
1690 "Argument \"%s\" isn't numeric in %s", pv,
1691 OP_DESC(PL_op));
a0d0e21e 1692 else
9014280d 1693 Perl_warner(aTHX_ packWARN(WARN_NUMERIC),
94463019 1694 "Argument \"%s\" isn't numeric", pv);
a0d0e21e
LW
1695}
1696
c2988b20
NC
1697/*
1698=for apidoc looks_like_number
1699
645c22ef
DM
1700Test if the content of an SV looks like a number (or is a number).
1701C<Inf> and C<Infinity> are treated as numbers (so will not issue a
1702non-numeric warning), even if your atof() doesn't grok them.
c2988b20
NC
1703
1704=cut
1705*/
1706
1707I32
1708Perl_looks_like_number(pTHX_ SV *sv)
1709{
a3b680e6 1710 register const char *sbegin;
c2988b20
NC
1711 STRLEN len;
1712
1713 if (SvPOK(sv)) {
3f7c398e 1714 sbegin = SvPVX_const(sv);
c2988b20
NC
1715 len = SvCUR(sv);
1716 }
1717 else if (SvPOKp(sv))
83003860 1718 sbegin = SvPV_const(sv, len);
c2988b20 1719 else
e0ab1c0e 1720 return SvFLAGS(sv) & (SVf_NOK|SVp_NOK|SVf_IOK|SVp_IOK);
c2988b20
NC
1721 return grok_number(sbegin, len, NULL);
1722}
25da4f38 1723
19f6321d
NC
1724STATIC bool
1725S_glob_2number(pTHX_ GV * const gv)
180488f8
NC
1726{
1727 const U32 wasfake = SvFLAGS(gv) & SVf_FAKE;
1728 SV *const buffer = sv_newmortal();
1729
1730 /* FAKE globs can get coerced, so need to turn this off temporarily if it
1731 is on. */
1732 SvFAKE_off(gv);
1733 gv_efullname3(buffer, gv, "*");
1734 SvFLAGS(gv) |= wasfake;
1735
675c862f
AL
1736 /* We know that all GVs stringify to something that is not-a-number,
1737 so no need to test that. */
1738 if (ckWARN(WARN_NUMERIC))
1739 not_a_number(buffer);
1740 /* We just want something true to return, so that S_sv_2iuv_common
1741 can tail call us and return true. */
19f6321d 1742 return TRUE;
675c862f
AL
1743}
1744
1745STATIC char *
19f6321d 1746S_glob_2pv(pTHX_ GV * const gv, STRLEN * const len)
675c862f
AL
1747{
1748 const U32 wasfake = SvFLAGS(gv) & SVf_FAKE;
1749 SV *const buffer = sv_newmortal();
1750
1751 /* FAKE globs can get coerced, so need to turn this off temporarily if it
1752 is on. */
1753 SvFAKE_off(gv);
1754 gv_efullname3(buffer, gv, "*");
1755 SvFLAGS(gv) |= wasfake;
1756
1757 assert(SvPOK(buffer));
a6d61a6c
NC
1758 if (len) {
1759 *len = SvCUR(buffer);
1760 }
675c862f 1761 return SvPVX(buffer);
180488f8
NC
1762}
1763
25da4f38
IZ
1764/* Actually, ISO C leaves conversion of UV to IV undefined, but
1765 until proven guilty, assume that things are not that bad... */
1766
645c22ef
DM
1767/*
1768 NV_PRESERVES_UV:
1769
1770 As 64 bit platforms often have an NV that doesn't preserve all bits of
28e5dec8
JH
1771 an IV (an assumption perl has been based on to date) it becomes necessary
1772 to remove the assumption that the NV always carries enough precision to
1773 recreate the IV whenever needed, and that the NV is the canonical form.
1774 Instead, IV/UV and NV need to be given equal rights. So as to not lose
645c22ef 1775 precision as a side effect of conversion (which would lead to insanity
28e5dec8
JH
1776 and the dragon(s) in t/op/numconvert.t getting very angry) the intent is
1777 1) to distinguish between IV/UV/NV slots that have cached a valid
1778 conversion where precision was lost and IV/UV/NV slots that have a
1779 valid conversion which has lost no precision
645c22ef 1780 2) to ensure that if a numeric conversion to one form is requested that
28e5dec8
JH
1781 would lose precision, the precise conversion (or differently
1782 imprecise conversion) is also performed and cached, to prevent
1783 requests for different numeric formats on the same SV causing
1784 lossy conversion chains. (lossless conversion chains are perfectly
1785 acceptable (still))
1786
1787
1788 flags are used:
1789 SvIOKp is true if the IV slot contains a valid value
1790 SvIOK is true only if the IV value is accurate (UV if SvIOK_UV true)
1791 SvNOKp is true if the NV slot contains a valid value
1792 SvNOK is true only if the NV value is accurate
1793
1794 so
645c22ef 1795 while converting from PV to NV, check to see if converting that NV to an
28e5dec8
JH
1796 IV(or UV) would lose accuracy over a direct conversion from PV to
1797 IV(or UV). If it would, cache both conversions, return NV, but mark
1798 SV as IOK NOKp (ie not NOK).
1799
645c22ef 1800 While converting from PV to IV, check to see if converting that IV to an
28e5dec8
JH
1801 NV would lose accuracy over a direct conversion from PV to NV. If it
1802 would, cache both conversions, flag similarly.
1803
1804 Before, the SV value "3.2" could become NV=3.2 IV=3 NOK, IOK quite
1805 correctly because if IV & NV were set NV *always* overruled.
645c22ef
DM
1806 Now, "3.2" will become NV=3.2 IV=3 NOK, IOKp, because the flag's meaning
1807 changes - now IV and NV together means that the two are interchangeable:
28e5dec8 1808 SvIVX == (IV) SvNVX && SvNVX == (NV) SvIVX;
d460ef45 1809
645c22ef
DM
1810 The benefit of this is that operations such as pp_add know that if
1811 SvIOK is true for both left and right operands, then integer addition
1812 can be used instead of floating point (for cases where the result won't
1813 overflow). Before, floating point was always used, which could lead to
28e5dec8
JH
1814 loss of precision compared with integer addition.
1815
1816 * making IV and NV equal status should make maths accurate on 64 bit
1817 platforms
1818 * may speed up maths somewhat if pp_add and friends start to use
645c22ef 1819 integers when possible instead of fp. (Hopefully the overhead in
28e5dec8
JH
1820 looking for SvIOK and checking for overflow will not outweigh the
1821 fp to integer speedup)
1822 * will slow down integer operations (callers of SvIV) on "inaccurate"
1823 values, as the change from SvIOK to SvIOKp will cause a call into
1824 sv_2iv each time rather than a macro access direct to the IV slot
1825 * should speed up number->string conversion on integers as IV is
645c22ef 1826 favoured when IV and NV are equally accurate
28e5dec8
JH
1827
1828 ####################################################################
645c22ef
DM
1829 You had better be using SvIOK_notUV if you want an IV for arithmetic:
1830 SvIOK is true if (IV or UV), so you might be getting (IV)SvUV.
1831 On the other hand, SvUOK is true iff UV.
28e5dec8
JH
1832 ####################################################################
1833
645c22ef 1834 Your mileage will vary depending on your CPU's relative fp to integer
28e5dec8
JH
1835 performance ratio.
1836*/
1837
1838#ifndef NV_PRESERVES_UV
645c22ef
DM
1839# define IS_NUMBER_UNDERFLOW_IV 1
1840# define IS_NUMBER_UNDERFLOW_UV 2
1841# define IS_NUMBER_IV_AND_UV 2
1842# define IS_NUMBER_OVERFLOW_IV 4
1843# define IS_NUMBER_OVERFLOW_UV 5
1844
1845/* sv_2iuv_non_preserve(): private routine for use by sv_2iv() and sv_2uv() */
28e5dec8
JH
1846
1847/* For sv_2nv these three cases are "SvNOK and don't bother casting" */
1848STATIC int
645c22ef 1849S_sv_2iuv_non_preserve(pTHX_ register SV *sv, I32 numtype)
28e5dec8 1850{
97aff369 1851 dVAR;
3f7c398e 1852 DEBUG_c(PerlIO_printf(Perl_debug_log,"sv_2iuv_non '%s', IV=0x%"UVxf" NV=%"NVgf" inttype=%"UVXf"\n", SvPVX_const(sv), SvIVX(sv), SvNVX(sv), (UV)numtype));
28e5dec8
JH
1853 if (SvNVX(sv) < (NV)IV_MIN) {
1854 (void)SvIOKp_on(sv);
1855 (void)SvNOK_on(sv);
45977657 1856 SvIV_set(sv, IV_MIN);
28e5dec8
JH
1857 return IS_NUMBER_UNDERFLOW_IV;
1858 }
1859 if (SvNVX(sv) > (NV)UV_MAX) {
1860 (void)SvIOKp_on(sv);
1861 (void)SvNOK_on(sv);
1862 SvIsUV_on(sv);
607fa7f2 1863 SvUV_set(sv, UV_MAX);
28e5dec8
JH
1864 return IS_NUMBER_OVERFLOW_UV;
1865 }
c2988b20
NC
1866 (void)SvIOKp_on(sv);
1867 (void)SvNOK_on(sv);
1868 /* Can't use strtol etc to convert this string. (See truth table in
1869 sv_2iv */
1870 if (SvNVX(sv) <= (UV)IV_MAX) {
45977657 1871 SvIV_set(sv, I_V(SvNVX(sv)));
c2988b20
NC
1872 if ((NV)(SvIVX(sv)) == SvNVX(sv)) {
1873 SvIOK_on(sv); /* Integer is precise. NOK, IOK */
1874 } else {
1875 /* Integer is imprecise. NOK, IOKp */
1876 }
1877 return SvNVX(sv) < 0 ? IS_NUMBER_UNDERFLOW_UV : IS_NUMBER_IV_AND_UV;
1878 }
1879 SvIsUV_on(sv);
607fa7f2 1880 SvUV_set(sv, U_V(SvNVX(sv)));
c2988b20
NC
1881 if ((NV)(SvUVX(sv)) == SvNVX(sv)) {
1882 if (SvUVX(sv) == UV_MAX) {
1883 /* As we know that NVs don't preserve UVs, UV_MAX cannot
1884 possibly be preserved by NV. Hence, it must be overflow.
1885 NOK, IOKp */
1886 return IS_NUMBER_OVERFLOW_UV;
1887 }
1888 SvIOK_on(sv); /* Integer is precise. NOK, UOK */
1889 } else {
1890 /* Integer is imprecise. NOK, IOKp */
28e5dec8 1891 }
c2988b20 1892 return IS_NUMBER_OVERFLOW_IV;
28e5dec8 1893}
645c22ef
DM
1894#endif /* !NV_PRESERVES_UV*/
1895
af359546
NC
1896STATIC bool
1897S_sv_2iuv_common(pTHX_ SV *sv) {
97aff369 1898 dVAR;
af359546 1899 if (SvNOKp(sv)) {
28e5dec8
JH
1900 /* erm. not sure. *should* never get NOKp (without NOK) from sv_2nv
1901 * without also getting a cached IV/UV from it at the same time
1902 * (ie PV->NV conversion should detect loss of accuracy and cache
af359546
NC
1903 * IV or UV at same time to avoid this. */
1904 /* IV-over-UV optimisation - choose to cache IV if possible */
25da4f38
IZ
1905
1906 if (SvTYPE(sv) == SVt_NV)
1907 sv_upgrade(sv, SVt_PVNV);
1908
28e5dec8
JH
1909 (void)SvIOKp_on(sv); /* Must do this first, to clear any SvOOK */
1910 /* < not <= as for NV doesn't preserve UV, ((NV)IV_MAX+1) will almost
1911 certainly cast into the IV range at IV_MAX, whereas the correct
1912 answer is the UV IV_MAX +1. Hence < ensures that dodgy boundary
1913 cases go to UV */
cab190d4
JD
1914#if defined(NAN_COMPARE_BROKEN) && defined(Perl_isnan)
1915 if (Perl_isnan(SvNVX(sv))) {
1916 SvUV_set(sv, 0);
1917 SvIsUV_on(sv);
fdbe6d7c 1918 return FALSE;
cab190d4 1919 }
cab190d4 1920#endif
28e5dec8 1921 if (SvNVX(sv) < (NV)IV_MAX + 0.5) {
45977657 1922 SvIV_set(sv, I_V(SvNVX(sv)));
28e5dec8
JH
1923 if (SvNVX(sv) == (NV) SvIVX(sv)
1924#ifndef NV_PRESERVES_UV
1925 && (((UV)1 << NV_PRESERVES_UV_BITS) >
1926 (UV)(SvIVX(sv) > 0 ? SvIVX(sv) : -SvIVX(sv)))
1927 /* Don't flag it as "accurately an integer" if the number
1928 came from a (by definition imprecise) NV operation, and
1929 we're outside the range of NV integer precision */
1930#endif
1931 ) {
1932 SvIOK_on(sv); /* Can this go wrong with rounding? NWC */
1933 DEBUG_c(PerlIO_printf(Perl_debug_log,
7234c960 1934 "0x%"UVxf" iv(%"NVgf" => %"IVdf") (precise)\n",
28e5dec8
JH
1935 PTR2UV(sv),
1936 SvNVX(sv),
1937 SvIVX(sv)));
1938
1939 } else {
1940 /* IV not precise. No need to convert from PV, as NV
1941 conversion would already have cached IV if it detected
1942 that PV->IV would be better than PV->NV->IV
1943 flags already correct - don't set public IOK. */
1944 DEBUG_c(PerlIO_printf(Perl_debug_log,
7234c960 1945 "0x%"UVxf" iv(%"NVgf" => %"IVdf") (imprecise)\n",
28e5dec8
JH
1946 PTR2UV(sv),
1947 SvNVX(sv),
1948 SvIVX(sv)));
1949 }
1950 /* Can the above go wrong if SvIVX == IV_MIN and SvNVX < IV_MIN,
1951 but the cast (NV)IV_MIN rounds to a the value less (more
1952 negative) than IV_MIN which happens to be equal to SvNVX ??
1953 Analogous to 0xFFFFFFFFFFFFFFFF rounding up to NV (2**64) and
1954 NV rounding back to 0xFFFFFFFFFFFFFFFF, so UVX == UV(NVX) and
1955 (NV)UVX == NVX are both true, but the values differ. :-(
1956 Hopefully for 2s complement IV_MIN is something like
1957 0x8000000000000000 which will be exact. NWC */
d460ef45 1958 }
25da4f38 1959 else {
607fa7f2 1960 SvUV_set(sv, U_V(SvNVX(sv)));
28e5dec8
JH
1961 if (
1962 (SvNVX(sv) == (NV) SvUVX(sv))
1963#ifndef NV_PRESERVES_UV
1964 /* Make sure it's not 0xFFFFFFFFFFFFFFFF */
1965 /*&& (SvUVX(sv) != UV_MAX) irrelevant with code below */
1966 && (((UV)1 << NV_PRESERVES_UV_BITS) > SvUVX(sv))
1967 /* Don't flag it as "accurately an integer" if the number
1968 came from a (by definition imprecise) NV operation, and
1969 we're outside the range of NV integer precision */
1970#endif
1971 )
1972 SvIOK_on(sv);
25da4f38 1973 SvIsUV_on(sv);
1c846c1f 1974 DEBUG_c(PerlIO_printf(Perl_debug_log,
57def98f 1975 "0x%"UVxf" 2iv(%"UVuf" => %"IVdf") (as unsigned)\n",
56431972 1976 PTR2UV(sv),
57def98f
JH
1977 SvUVX(sv),
1978 SvUVX(sv)));
25da4f38 1979 }
748a9306
LW
1980 }
1981 else if (SvPOKp(sv) && SvLEN(sv)) {
c2988b20 1982 UV value;
504618e9 1983 const int numtype = grok_number(SvPVX_const(sv), SvCUR(sv), &value);
af359546 1984 /* We want to avoid a possible problem when we cache an IV/ a UV which
25da4f38 1985 may be later translated to an NV, and the resulting NV is not
c2988b20
NC
1986 the same as the direct translation of the initial string
1987 (eg 123.456 can shortcut to the IV 123 with atol(), but we must
1988 be careful to ensure that the value with the .456 is around if the
1989 NV value is requested in the future).
1c846c1f 1990
af359546 1991 This means that if we cache such an IV/a UV, we need to cache the
25da4f38 1992 NV as well. Moreover, we trade speed for space, and do not
28e5dec8 1993 cache the NV if we are sure it's not needed.
25da4f38 1994 */
16b7a9a4 1995
c2988b20
NC
1996 /* SVt_PVNV is one higher than SVt_PVIV, hence this order */
1997 if ((numtype & (IS_NUMBER_IN_UV | IS_NUMBER_NOT_INT))
1998 == IS_NUMBER_IN_UV) {
5e045b90 1999 /* It's definitely an integer, only upgrade to PVIV */
28e5dec8
JH
2000 if (SvTYPE(sv) < SVt_PVIV)
2001 sv_upgrade(sv, SVt_PVIV);
f7bbb42a 2002 (void)SvIOK_on(sv);
c2988b20
NC
2003 } else if (SvTYPE(sv) < SVt_PVNV)
2004 sv_upgrade(sv, SVt_PVNV);
28e5dec8 2005
f2524eef 2006 /* If NVs preserve UVs then we only use the UV value if we know that
c2988b20
NC
2007 we aren't going to call atof() below. If NVs don't preserve UVs
2008 then the value returned may have more precision than atof() will
2009 return, even though value isn't perfectly accurate. */
2010 if ((numtype & (IS_NUMBER_IN_UV
2011#ifdef NV_PRESERVES_UV
2012 | IS_NUMBER_NOT_INT
2013#endif
2014 )) == IS_NUMBER_IN_UV) {
2015 /* This won't turn off the public IOK flag if it was set above */
2016 (void)SvIOKp_on(sv);
2017
2018 if (!(numtype & IS_NUMBER_NEG)) {
2019 /* positive */;
2020 if (value <= (UV)IV_MAX) {
45977657 2021 SvIV_set(sv, (IV)value);
c2988b20 2022 } else {
af359546 2023 /* it didn't overflow, and it was positive. */
607fa7f2 2024 SvUV_set(sv, value);
c2988b20
NC
2025 SvIsUV_on(sv);
2026 }
2027 } else {
2028 /* 2s complement assumption */
2029 if (value <= (UV)IV_MIN) {
45977657 2030 SvIV_set(sv, -(IV)value);
c2988b20
NC
2031 } else {
2032 /* Too negative for an IV. This is a double upgrade, but
d1be9408 2033 I'm assuming it will be rare. */
c2988b20
NC
2034 if (SvTYPE(sv) < SVt_PVNV)
2035 sv_upgrade(sv, SVt_PVNV);
2036 SvNOK_on(sv);
2037 SvIOK_off(sv);
2038 SvIOKp_on(sv);
9d6ce603 2039 SvNV_set(sv, -(NV)value);
45977657 2040 SvIV_set(sv, IV_MIN);
c2988b20
NC
2041 }
2042 }
2043 }
2044 /* For !NV_PRESERVES_UV and IS_NUMBER_IN_UV and IS_NUMBER_NOT_INT we
2045 will be in the previous block to set the IV slot, and the next
2046 block to set the NV slot. So no else here. */
2047
2048 if ((numtype & (IS_NUMBER_IN_UV | IS_NUMBER_NOT_INT))
2049 != IS_NUMBER_IN_UV) {
2050 /* It wasn't an (integer that doesn't overflow the UV). */
3f7c398e 2051 SvNV_set(sv, Atof(SvPVX_const(sv)));
28e5dec8 2052
c2988b20
NC
2053 if (! numtype && ckWARN(WARN_NUMERIC))
2054 not_a_number(sv);
28e5dec8 2055
65202027 2056#if defined(USE_LONG_DOUBLE)
c2988b20
NC
2057 DEBUG_c(PerlIO_printf(Perl_debug_log, "0x%"UVxf" 2iv(%" PERL_PRIgldbl ")\n",
2058 PTR2UV(sv), SvNVX(sv)));
65202027 2059#else
1779d84d 2060 DEBUG_c(PerlIO_printf(Perl_debug_log, "0x%"UVxf" 2iv(%"NVgf")\n",
c2988b20 2061 PTR2UV(sv), SvNVX(sv)));
65202027 2062#endif
28e5dec8 2063
28e5dec8 2064#ifdef NV_PRESERVES_UV
af359546
NC
2065 (void)SvIOKp_on(sv);
2066 (void)SvNOK_on(sv);
2067 if (SvNVX(sv) < (NV)IV_MAX + 0.5) {
2068 SvIV_set(sv, I_V(SvNVX(sv)));
2069 if ((NV)(SvIVX(sv)) == SvNVX(sv)) {
2070 SvIOK_on(sv);
2071 } else {
6f207bd3 2072 NOOP; /* Integer is imprecise. NOK, IOKp */
af359546
NC
2073 }
2074 /* UV will not work better than IV */
2075 } else {
2076 if (SvNVX(sv) > (NV)UV_MAX) {
2077 SvIsUV_on(sv);
2078 /* Integer is inaccurate. NOK, IOKp, is UV */
2079 SvUV_set(sv, UV_MAX);
af359546
NC
2080 } else {
2081 SvUV_set(sv, U_V(SvNVX(sv)));
2082 /* 0xFFFFFFFFFFFFFFFF not an issue in here, NVs
2083 NV preservse UV so can do correct comparison. */
2084 if ((NV)(SvUVX(sv)) == SvNVX(sv)) {
2085 SvIOK_on(sv);
af359546 2086 } else {
6f207bd3 2087 NOOP; /* Integer is imprecise. NOK, IOKp, is UV */
af359546
NC
2088 }
2089 }
4b0c9573 2090 SvIsUV_on(sv);
af359546 2091 }
28e5dec8 2092#else /* NV_PRESERVES_UV */
c2988b20
NC
2093 if ((numtype & (IS_NUMBER_IN_UV | IS_NUMBER_NOT_INT))
2094 == (IS_NUMBER_IN_UV | IS_NUMBER_NOT_INT)) {
af359546 2095 /* The IV/UV slot will have been set from value returned by
c2988b20
NC
2096 grok_number above. The NV slot has just been set using
2097 Atof. */
560b0c46 2098 SvNOK_on(sv);
c2988b20
NC
2099 assert (SvIOKp(sv));
2100 } else {
2101 if (((UV)1 << NV_PRESERVES_UV_BITS) >
2102 U_V(SvNVX(sv) > 0 ? SvNVX(sv) : -SvNVX(sv))) {
2103 /* Small enough to preserve all bits. */
2104 (void)SvIOKp_on(sv);
2105 SvNOK_on(sv);
45977657 2106 SvIV_set(sv, I_V(SvNVX(sv)));
c2988b20
NC
2107 if ((NV)(SvIVX(sv)) == SvNVX(sv))
2108 SvIOK_on(sv);
2109 /* Assumption: first non-preserved integer is < IV_MAX,
2110 this NV is in the preserved range, therefore: */
2111 if (!(U_V(SvNVX(sv) > 0 ? SvNVX(sv) : -SvNVX(sv))
2112 < (UV)IV_MAX)) {
32fdb065 2113 Perl_croak(aTHX_ "sv_2iv assumed (U_V(fabs((double)SvNVX(sv))) < (UV)IV_MAX) but SvNVX(sv)=%"NVgf" U_V is 0x%"UVxf", IV_MAX is 0x%"UVxf"\n", SvNVX(sv), U_V(SvNVX(sv)), (UV)IV_MAX);
c2988b20
NC
2114 }
2115 } else {
2116 /* IN_UV NOT_INT
2117 0 0 already failed to read UV.
2118 0 1 already failed to read UV.
2119 1 0 you won't get here in this case. IV/UV
2120 slot set, public IOK, Atof() unneeded.
2121 1 1 already read UV.
2122 so there's no point in sv_2iuv_non_preserve() attempting
2123 to use atol, strtol, strtoul etc. */
40a17c4c 2124 sv_2iuv_non_preserve (sv, numtype);
c2988b20
NC
2125 }
2126 }
28e5dec8 2127#endif /* NV_PRESERVES_UV */
25da4f38 2128 }
af359546
NC
2129 }
2130 else {
675c862f 2131 if (isGV_with_GP(sv))
a0933d07 2132 return glob_2number((GV *)sv);
180488f8 2133
af359546
NC
2134 if (!(SvFLAGS(sv) & SVs_PADTMP)) {
2135 if (!PL_localizing && ckWARN(WARN_UNINITIALIZED))
2136 report_uninit(sv);
2137 }
25da4f38
IZ
2138 if (SvTYPE(sv) < SVt_IV)
2139 /* Typically the caller expects that sv_any is not NULL now. */
2140 sv_upgrade(sv, SVt_IV);
af359546
NC
2141 /* Return 0 from the caller. */
2142 return TRUE;
2143 }
2144 return FALSE;
2145}
2146
2147/*
2148=for apidoc sv_2iv_flags
2149
2150Return the integer value of an SV, doing any necessary string
2151conversion. If flags includes SV_GMAGIC, does an mg_get() first.
2152Normally used via the C<SvIV(sv)> and C<SvIVx(sv)> macros.
2153
2154=cut
2155*/
2156
2157IV
2158Perl_sv_2iv_flags(pTHX_ register SV *sv, I32 flags)
2159{
97aff369 2160 dVAR;
af359546 2161 if (!sv)
a0d0e21e 2162 return 0;
af359546
NC
2163 if (SvGMAGICAL(sv)) {
2164 if (flags & SV_GMAGIC)
2165 mg_get(sv);
2166 if (SvIOKp(sv))
2167 return SvIVX(sv);
2168 if (SvNOKp(sv)) {
2169 return I_V(SvNVX(sv));
2170 }
71c558c3
NC
2171 if (SvPOKp(sv) && SvLEN(sv)) {
2172 UV value;
2173 const int numtype
2174 = grok_number(SvPVX_const(sv), SvCUR(sv), &value);
2175
2176 if ((numtype & (IS_NUMBER_IN_UV | IS_NUMBER_NOT_INT))
2177 == IS_NUMBER_IN_UV) {
2178 /* It's definitely an integer */
2179 if (numtype & IS_NUMBER_NEG) {
2180 if (value < (UV)IV_MIN)
2181 return -(IV)value;
2182 } else {
2183 if (value < (UV)IV_MAX)
2184 return (IV)value;
2185 }
2186 }
2187 if (!numtype) {
2188 if (ckWARN(WARN_NUMERIC))
2189 not_a_number(sv);
2190 }
2191 return I_V(Atof(SvPVX_const(sv)));
2192 }
1c7ff15e
NC
2193 if (SvROK(sv)) {
2194 goto return_rok;
af359546 2195 }
1c7ff15e
NC
2196 assert(SvTYPE(sv) >= SVt_PVMG);
2197 /* This falls through to the report_uninit inside S_sv_2iuv_common. */
4cb1ec55 2198 } else if (SvTHINKFIRST(sv)) {
af359546 2199 if (SvROK(sv)) {
1c7ff15e 2200 return_rok:
af359546
NC
2201 if (SvAMAGIC(sv)) {
2202 SV * const tmpstr=AMG_CALLun(sv,numer);
2203 if (tmpstr && (!SvROK(tmpstr) || (SvRV(tmpstr) != SvRV(sv)))) {
2204 return SvIV(tmpstr);
2205 }
2206 }
2207 return PTR2IV(SvRV(sv));
2208 }
2209 if (SvIsCOW(sv)) {
2210 sv_force_normal_flags(sv, 0);
2211 }
2212 if (SvREADONLY(sv) && !SvOK(sv)) {
2213 if (ckWARN(WARN_UNINITIALIZED))
2214 report_uninit(sv);
2215 return 0;
2216 }
2217 }
2218 if (!SvIOKp(sv)) {
2219 if (S_sv_2iuv_common(aTHX_ sv))
2220 return 0;
79072805 2221 }
1d7c1841
GS
2222 DEBUG_c(PerlIO_printf(Perl_debug_log, "0x%"UVxf" 2iv(%"IVdf")\n",
2223 PTR2UV(sv),SvIVX(sv)));
25da4f38 2224 return SvIsUV(sv) ? (IV)SvUVX(sv) : SvIVX(sv);
79072805
LW
2225}
2226
645c22ef 2227/*
891f9566 2228=for apidoc sv_2uv_flags
645c22ef
DM
2229
2230Return the unsigned integer value of an SV, doing any necessary string
891f9566
YST
2231conversion. If flags includes SV_GMAGIC, does an mg_get() first.
2232Normally used via the C<SvUV(sv)> and C<SvUVx(sv)> macros.
645c22ef
DM
2233
2234=cut
2235*/
2236
ff68c719 2237UV
891f9566 2238Perl_sv_2uv_flags(pTHX_ register SV *sv, I32 flags)
ff68c719 2239{
97aff369 2240 dVAR;
ff68c719 2241 if (!sv)
2242 return 0;
2243 if (SvGMAGICAL(sv)) {
891f9566
YST
2244 if (flags & SV_GMAGIC)
2245 mg_get(sv);
ff68c719 2246 if (SvIOKp(sv))
2247 return SvUVX(sv);
2248 if (SvNOKp(sv))
2249 return U_V(SvNVX(sv));
71c558c3
NC
2250 if (SvPOKp(sv) && SvLEN(sv)) {
2251 UV value;
2252 const int numtype
2253 = grok_number(SvPVX_const(sv), SvCUR(sv), &value);
2254
2255 if ((numtype & (IS_NUMBER_IN_UV | IS_NUMBER_NOT_INT))
2256 == IS_NUMBER_IN_UV) {
2257 /* It's definitely an integer */
2258 if (!(numtype & IS_NUMBER_NEG))
2259 return value;
2260 }
2261 if (!numtype) {
2262 if (ckWARN(WARN_NUMERIC))
2263 not_a_number(sv);
2264 }
2265 return U_V(Atof(SvPVX_const(sv)));
2266 }
1c7ff15e
NC
2267 if (SvROK(sv)) {
2268 goto return_rok;
3fe9a6f1 2269 }
1c7ff15e
NC
2270 assert(SvTYPE(sv) >= SVt_PVMG);
2271 /* This falls through to the report_uninit inside S_sv_2iuv_common. */
4cb1ec55 2272 } else if (SvTHINKFIRST(sv)) {
ff68c719 2273 if (SvROK(sv)) {
1c7ff15e 2274 return_rok:
deb46114
NC
2275 if (SvAMAGIC(sv)) {
2276 SV *const tmpstr = AMG_CALLun(sv,numer);
2277 if (tmpstr && (!SvROK(tmpstr) || (SvRV(tmpstr) != SvRV(sv)))) {
2278 return SvUV(tmpstr);
2279 }
2280 }
2281 return PTR2UV(SvRV(sv));
ff68c719 2282 }
765f542d
NC
2283 if (SvIsCOW(sv)) {
2284 sv_force_normal_flags(sv, 0);
8a818333 2285 }
0336b60e 2286 if (SvREADONLY(sv) && !SvOK(sv)) {
0336b60e 2287 if (ckWARN(WARN_UNINITIALIZED))
29489e7c 2288 report_uninit(sv);
ff68c719 2289 return 0;
2290 }
2291 }
af359546
NC
2292 if (!SvIOKp(sv)) {
2293 if (S_sv_2iuv_common(aTHX_ sv))
2294 return 0;
ff68c719 2295 }
25da4f38 2296
1d7c1841
GS
2297 DEBUG_c(PerlIO_printf(Perl_debug_log, "0x%"UVxf" 2uv(%"UVuf")\n",
2298 PTR2UV(sv),SvUVX(sv)));
25da4f38 2299 return SvIsUV(sv) ? SvUVX(sv) : (UV)SvIVX(sv);
ff68c719 2300}
2301
645c22ef
DM
2302/*
2303=for apidoc sv_2nv
2304
2305Return the num value of an SV, doing any necessary string or integer
2306conversion, magic etc. Normally used via the C<SvNV(sv)> and C<SvNVx(sv)>
2307macros.
2308
2309=cut
2310*/
2311
65202027 2312NV
864dbfa3 2313Perl_sv_2nv(pTHX_ register SV *sv)
79072805 2314{
97aff369 2315 dVAR;
79072805
LW
2316 if (!sv)
2317 return 0.0;
8990e307 2318 if (SvGMAGICAL(sv)) {
463ee0b2
LW
2319 mg_get(sv);
2320 if (SvNOKp(sv))
2321 return SvNVX(sv);
0aa395f8 2322 if ((SvPOKp(sv) && SvLEN(sv)) && !SvIOKp(sv)) {
041457d9 2323 if (!SvIOKp(sv) && ckWARN(WARN_NUMERIC) &&
504618e9 2324 !grok_number(SvPVX_const(sv), SvCUR(sv), NULL))
a0d0e21e 2325 not_a_number(sv);
3f7c398e 2326 return Atof(SvPVX_const(sv));
a0d0e21e 2327 }
25da4f38 2328 if (SvIOKp(sv)) {
1c846c1f 2329 if (SvIsUV(sv))
65202027 2330 return (NV)SvUVX(sv);
25da4f38 2331 else
65202027 2332 return (NV)SvIVX(sv);
47a72cb8
NC
2333 }
2334 if (SvROK(sv)) {
2335 goto return_rok;
2336 }
2337 assert(SvTYPE(sv) >= SVt_PVMG);
2338 /* This falls through to the report_uninit near the end of the
2339 function. */
2340 } else if (SvTHINKFIRST(sv)) {
a0d0e21e 2341 if (SvROK(sv)) {
47a72cb8 2342 return_rok:
deb46114
NC
2343 if (SvAMAGIC(sv)) {
2344 SV *const tmpstr = AMG_CALLun(sv,numer);
2345 if (tmpstr && (!SvROK(tmpstr) || (SvRV(tmpstr) != SvRV(sv)))) {
2346 return SvNV(tmpstr);
2347 }
2348 }
2349 return PTR2NV(SvRV(sv));
a0d0e21e 2350 }
765f542d
NC
2351 if (SvIsCOW(sv)) {
2352 sv_force_normal_flags(sv, 0);
8a818333 2353 }
0336b60e 2354 if (SvREADONLY(sv) && !SvOK(sv)) {
599cee73 2355 if (ckWARN(WARN_UNINITIALIZED))
29489e7c 2356 report_uninit(sv);
ed6116ce
LW
2357 return 0.0;
2358 }
79072805
LW
2359 }
2360 if (SvTYPE(sv) < SVt_NV) {
7e25a7e9
NC
2361 /* The logic to use SVt_PVNV if necessary is in sv_upgrade. */
2362 sv_upgrade(sv, SVt_NV);
906f284f 2363#ifdef USE_LONG_DOUBLE
097ee67d 2364 DEBUG_c({
f93f4e46 2365 STORE_NUMERIC_LOCAL_SET_STANDARD();
1d7c1841
GS
2366 PerlIO_printf(Perl_debug_log,
2367 "0x%"UVxf" num(%" PERL_PRIgldbl ")\n",
2368 PTR2UV(sv), SvNVX(sv));
572bbb43
GS
2369 RESTORE_NUMERIC_LOCAL();
2370 });
65202027 2371#else
572bbb43 2372 DEBUG_c({
f93f4e46 2373 STORE_NUMERIC_LOCAL_SET_STANDARD();
1779d84d 2374 PerlIO_printf(Perl_debug_log, "0x%"UVxf" num(%"NVgf")\n",
1d7c1841 2375 PTR2UV(sv), SvNVX(sv));
097ee67d
JH
2376 RESTORE_NUMERIC_LOCAL();
2377 });
572bbb43 2378#endif
79072805
LW
2379 }
2380 else if (SvTYPE(sv) < SVt_PVNV)
2381 sv_upgrade(sv, SVt_PVNV);
59d8ce62
NC
2382 if (SvNOKp(sv)) {
2383 return SvNVX(sv);
61604483 2384 }
59d8ce62 2385 if (SvIOKp(sv)) {
9d6ce603 2386 SvNV_set(sv, SvIsUV(sv) ? (NV)SvUVX(sv) : (NV)SvIVX(sv));
28e5dec8
JH
2387#ifdef NV_PRESERVES_UV
2388 SvNOK_on(sv);
2389#else
2390 /* Only set the public NV OK flag if this NV preserves the IV */
2391 /* Check it's not 0xFFFFFFFFFFFFFFFF */
2392 if (SvIsUV(sv) ? ((SvUVX(sv) != UV_MAX)&&(SvUVX(sv) == U_V(SvNVX(sv))))
2393 : (SvIVX(sv) == I_V(SvNVX(sv))))
2394 SvNOK_on(sv);
2395 else
2396 SvNOKp_on(sv);
2397#endif
93a17b20 2398 }
748a9306 2399 else if (SvPOKp(sv) && SvLEN(sv)) {
c2988b20 2400 UV value;
3f7c398e 2401 const int numtype = grok_number(SvPVX_const(sv), SvCUR(sv), &value);
041457d9 2402 if (!SvIOKp(sv) && !numtype && ckWARN(WARN_NUMERIC))
a0d0e21e 2403 not_a_number(sv);
28e5dec8 2404#ifdef NV_PRESERVES_UV
c2988b20
NC
2405 if ((numtype & (IS_NUMBER_IN_UV | IS_NUMBER_NOT_INT))
2406 == IS_NUMBER_IN_UV) {
5e045b90 2407 /* It's definitely an integer */
9d6ce603 2408 SvNV_set(sv, (numtype & IS_NUMBER_NEG) ? -(NV)value : (NV)value);
c2988b20 2409 } else
3f7c398e 2410 SvNV_set(sv, Atof(SvPVX_const(sv)));
28e5dec8
JH
2411 SvNOK_on(sv);
2412#else
3f7c398e 2413 SvNV_set(sv, Atof(SvPVX_const(sv)));
28e5dec8
JH
2414 /* Only set the public NV OK flag if this NV preserves the value in
2415 the PV at least as well as an IV/UV would.
2416 Not sure how to do this 100% reliably. */
2417 /* if that shift count is out of range then Configure's test is
2418 wonky. We shouldn't be in here with NV_PRESERVES_UV_BITS ==
2419 UV_BITS */
2420 if (((UV)1 << NV_PRESERVES_UV_BITS) >
c2988b20 2421 U_V(SvNVX(sv) > 0 ? SvNVX(sv) : -SvNVX(sv))) {
28e5dec8 2422 SvNOK_on(sv); /* Definitely small enough to preserve all bits */
c2988b20
NC
2423 } else if (!(numtype & IS_NUMBER_IN_UV)) {
2424 /* Can't use strtol etc to convert this string, so don't try.
2425 sv_2iv and sv_2uv will use the NV to convert, not the PV. */
2426 SvNOK_on(sv);
2427 } else {
2428 /* value has been set. It may not be precise. */
2429 if ((numtype & IS_NUMBER_NEG) && (value > (UV)IV_MIN)) {
2430 /* 2s complement assumption for (UV)IV_MIN */
2431 SvNOK_on(sv); /* Integer is too negative. */
2432 } else {
2433 SvNOKp_on(sv);
2434 SvIOKp_on(sv);
6fa402ec 2435
c2988b20 2436 if (numtype & IS_NUMBER_NEG) {
45977657 2437 SvIV_set(sv, -(IV)value);
c2988b20 2438 } else if (value <= (UV)IV_MAX) {
45977657 2439 SvIV_set(sv, (IV)value);
c2988b20 2440 } else {
607fa7f2 2441 SvUV_set(sv, value);
c2988b20
NC
2442 SvIsUV_on(sv);
2443 }
2444
2445 if (numtype & IS_NUMBER_NOT_INT) {
2446 /* I believe that even if the original PV had decimals,
2447 they are lost beyond the limit of the FP precision.
2448 However, neither is canonical, so both only get p
2449 flags. NWC, 2000/11/25 */
2450 /* Both already have p flags, so do nothing */
2451 } else {
66a1b24b 2452 const NV nv = SvNVX(sv);
c2988b20
NC
2453 if (SvNVX(sv) < (NV)IV_MAX + 0.5) {
2454 if (SvIVX(sv) == I_V(nv)) {
2455 SvNOK_on(sv);
c2988b20 2456 } else {
c2988b20
NC
2457 /* It had no "." so it must be integer. */
2458 }
00b6aa41 2459 SvIOK_on(sv);
c2988b20
NC
2460 } else {
2461 /* between IV_MAX and NV(UV_MAX).
2462 Could be slightly > UV_MAX */
6fa402ec 2463
c2988b20
NC
2464 if (numtype & IS_NUMBER_NOT_INT) {
2465 /* UV and NV both imprecise. */
2466 } else {
66a1b24b 2467 const UV nv_as_uv = U_V(nv);
c2988b20
NC
2468
2469 if (value == nv_as_uv && SvUVX(sv) != UV_MAX) {
2470 SvNOK_on(sv);
c2988b20 2471 }
00b6aa41 2472 SvIOK_on(sv);
c2988b20
NC
2473 }
2474 }
2475 }
2476 }
2477 }
28e5dec8 2478#endif /* NV_PRESERVES_UV */
93a17b20 2479 }
79072805 2480 else {
f7877b28 2481 if (isGV_with_GP(sv)) {
19f6321d 2482 glob_2number((GV *)sv);
180488f8
NC
2483 return 0.0;
2484 }
2485
041457d9 2486 if (!PL_localizing && !(SvFLAGS(sv) & SVs_PADTMP) && ckWARN(WARN_UNINITIALIZED))
29489e7c 2487 report_uninit(sv);
7e25a7e9
NC
2488 assert (SvTYPE(sv) >= SVt_NV);
2489 /* Typically the caller expects that sv_any is not NULL now. */
2490 /* XXX Ilya implies that this is a bug in callers that assume this
2491 and ideally should be fixed. */
a0d0e21e 2492 return 0.0;
79072805 2493 }
572bbb43 2494#if defined(USE_LONG_DOUBLE)
097ee67d 2495 DEBUG_c({
f93f4e46 2496 STORE_NUMERIC_LOCAL_SET_STANDARD();
1d7c1841
GS
2497 PerlIO_printf(Perl_debug_log, "0x%"UVxf" 2nv(%" PERL_PRIgldbl ")\n",
2498 PTR2UV(sv), SvNVX(sv));
572bbb43
GS
2499 RESTORE_NUMERIC_LOCAL();
2500 });
65202027 2501#else
572bbb43 2502 DEBUG_c({
f93f4e46 2503 STORE_NUMERIC_LOCAL_SET_STANDARD();
1779d84d 2504 PerlIO_printf(Perl_debug_log, "0x%"UVxf" 1nv(%"NVgf")\n",
1d7c1841 2505 PTR2UV(sv), SvNVX(sv));
097ee67d
JH
2506 RESTORE_NUMERIC_LOCAL();
2507 });
572bbb43 2508#endif
463ee0b2 2509 return SvNVX(sv);
79072805
LW
2510}
2511
645c22ef
DM
2512/* uiv_2buf(): private routine for use by sv_2pv_flags(): print an IV or
2513 * UV as a string towards the end of buf, and return pointers to start and
2514 * end of it.
2515 *
2516 * We assume that buf is at least TYPE_CHARS(UV) long.
2517 */
2518
864dbfa3 2519static char *
aec46f14 2520S_uiv_2buf(char *buf, IV iv, UV uv, int is_uv, char **peob)
25da4f38 2521{
25da4f38 2522 char *ptr = buf + TYPE_CHARS(UV);
823a54a3 2523 char * const ebuf = ptr;
25da4f38 2524 int sign;
25da4f38
IZ
2525
2526 if (is_uv)
2527 sign = 0;
2528 else if (iv >= 0) {
2529 uv = iv;
2530 sign = 0;
2531 } else {
2532 uv = -iv;
2533 sign = 1;
2534 }
2535 do {
eb160463 2536 *--ptr = '0' + (char)(uv % 10);
25da4f38
IZ
2537 } while (uv /= 10);
2538 if (sign)
2539 *--ptr = '-';
2540 *peob = ebuf;
2541 return ptr;
2542}
2543
9af30d34
NC
2544/* stringify_regexp(): private routine for use by sv_2pv_flags(): converts
2545 * a regexp to its stringified form.
2546 */
2547
2548static char *
2549S_stringify_regexp(pTHX_ SV *sv, MAGIC *mg, STRLEN *lp) {
97aff369 2550 dVAR;
00b6aa41 2551 const regexp * const re = (regexp *)mg->mg_obj;
9af30d34
NC
2552
2553 if (!mg->mg_ptr) {
2554 const char *fptr = "msix";
2555 char reflags[6];
2556 char ch;
2557 int left = 0;
2558 int right = 4;
00b6aa41 2559 bool need_newline = 0;
9af30d34
NC
2560 U16 reganch = (U16)((re->reganch & PMf_COMPILETIME) >> 12);
2561
2562 while((ch = *fptr++)) {
2563 if(reganch & 1) {
2564 reflags[left++] = ch;
2565 }
2566 else {
2567 reflags[right--] = ch;
2568 }
2569 reganch >>= 1;
2570 }
2571 if(left != 4) {
2572 reflags[left] = '-';
2573 left = 5;
2574 }
2575
2576 mg->mg_len = re->prelen + 4 + left;
2577 /*
2578 * If /x was used, we have to worry about a regex ending with a
2579 * comment later being embedded within another regex. If so, we don't
2580 * want this regex's "commentization" to leak out to the right part of
2581 * the enclosing regex, we must cap it with a newline.
2582 *
2583 * So, if /x was used, we scan backwards from the end of the regex. If
2584 * we find a '#' before we find a newline, we need to add a newline
2585 * ourself. If we find a '\n' first (or if we don't find '#' or '\n'),
2586 * we don't need to add anything. -jfriedl
2587 */
2588 if (PMf_EXTENDED & re->reganch) {
2589 const char *endptr = re->precomp + re->prelen;
2590 while (endptr >= re->precomp) {
2591 const char c = *(endptr--);
2592 if (c == '\n')
2593 break; /* don't need another */
2594 if (c == '#') {
2595 /* we end while in a comment, so we need a newline */
2596 mg->mg_len++; /* save space for it */
2597 need_newline = 1; /* note to add it */
2598 break;
2599 }
2600 }
2601 }
2602
2603 Newx(mg->mg_ptr, mg->mg_len + 1 + left, char);
2604 mg->mg_ptr[0] = '(';
2605 mg->mg_ptr[1] = '?';
2606 Copy(reflags, mg->mg_ptr+2, left, char);
2607 *(mg->mg_ptr+left+2) = ':';
2608 Copy(re->precomp, mg->mg_ptr+3+left, re->prelen, char);
2609 if (need_newline)
2610 mg->mg_ptr[mg->mg_len - 2] = '\n';
2611 mg->mg_ptr[mg->mg_len - 1] = ')';
2612 mg->mg_ptr[mg->mg_len] = 0;
2613 }
2614 PL_reginterp_cnt += re->program[0].next_off;
2615
2616 if (re->reganch & ROPT_UTF8)
2617 SvUTF8_on(sv);
2618 else
2619 SvUTF8_off(sv);
2620 if (lp)
2621 *lp = mg->mg_len;
2622 return mg->mg_ptr;
2623}
2624
645c22ef
DM
2625/*
2626=for apidoc sv_2pv_flags
2627
ff276b08 2628Returns a pointer to the string value of an SV, and sets *lp to its length.
645c22ef
DM
2629If flags includes SV_GMAGIC, does an mg_get() first. Coerces sv to a string
2630if necessary.
2631Normally invoked via the C<SvPV_flags> macro. C<sv_2pv()> and C<sv_2pv_nomg>
2632usually end up here too.
2633
2634=cut
2635*/
2636
8d6d96c1
HS
2637char *
2638Perl_sv_2pv_flags(pTHX_ register SV *sv, STRLEN *lp, I32 flags)
2639{
97aff369 2640 dVAR;
79072805 2641 register char *s;
79072805 2642
463ee0b2 2643 if (!sv) {
cdb061a3
NC
2644 if (lp)
2645 *lp = 0;
73d840c0 2646 return (char *)"";
463ee0b2 2647 }
8990e307 2648 if (SvGMAGICAL(sv)) {
8d6d96c1
HS
2649 if (flags & SV_GMAGIC)
2650 mg_get(sv);
463ee0b2 2651 if (SvPOKp(sv)) {
cdb061a3
NC
2652 if (lp)
2653 *lp = SvCUR(sv);
10516c54
NC
2654 if (flags & SV_MUTABLE_RETURN)
2655 return SvPVX_mutable(sv);
4d84ee25
NC
2656 if (flags & SV_CONST_RETURN)
2657 return (char *)SvPVX_const(sv);
463ee0b2
LW
2658 return SvPVX(sv);
2659 }
75dfc8ec
NC
2660 if (SvIOKp(sv) || SvNOKp(sv)) {
2661 char tbuf[64]; /* Must fit sprintf/Gconvert of longest IV/NV */
75dfc8ec
NC
2662 STRLEN len;
2663
2664 if (SvIOKp(sv)) {
e80fed9d 2665 len = SvIsUV(sv)
d9fad198
JH
2666 ? my_snprintf(tbuf, sizeof(tbuf), "%"UVuf, (UV)SvUVX(sv))
2667 : my_snprintf(tbuf, sizeof(tbuf), "%"IVdf, (IV)SvIVX(sv));
75dfc8ec 2668 } else {
e8ada2d0
NC
2669 Gconvert(SvNVX(sv), NV_DIG, 0, tbuf);
2670 len = strlen(tbuf);
75dfc8ec 2671 }
b5b886f0
NC
2672 assert(!SvROK(sv));
2673 {
75dfc8ec
NC
2674 dVAR;
2675
2676#ifdef FIXNEGATIVEZERO
e8ada2d0
NC
2677 if (len == 2 && tbuf[0] == '-' && tbuf[1] == '0') {
2678 tbuf[0] = '0';
2679 tbuf[1] = 0;
75dfc8ec
NC
2680 len = 1;
2681 }
2682#endif
2683 SvUPGRADE(sv, SVt_PV);
2684 if (lp)
2685 *lp = len;
2686 s = SvGROW_mutable(sv, len + 1);
2687 SvCUR_set(sv, len);
2688 SvPOKp_on(sv);
e8ada2d0 2689 return memcpy(s, tbuf, len + 1);
75dfc8ec 2690 }
463ee0b2 2691 }
1c7ff15e
NC
2692 if (SvROK(sv)) {
2693 goto return_rok;
2694 }
2695 assert(SvTYPE(sv) >= SVt_PVMG);
2696 /* This falls through to the report_uninit near the end of the
2697 function. */
2698 } else if (SvTHINKFIRST(sv)) {
ed6116ce 2699 if (SvROK(sv)) {
1c7ff15e 2700 return_rok:
deb46114
NC
2701 if (SvAMAGIC(sv)) {
2702 SV *const tmpstr = AMG_CALLun(sv,string);
2703 if (tmpstr && (!SvROK(tmpstr) || (SvRV(tmpstr) != SvRV(sv)))) {
2704 /* Unwrap this: */
2705 /* char *pv = lp ? SvPV(tmpstr, *lp) : SvPV_nolen(tmpstr);
2706 */
2707
2708 char *pv;
2709 if ((SvFLAGS(tmpstr) & (SVf_POK)) == SVf_POK) {
2710 if (flags & SV_CONST_RETURN) {
2711 pv = (char *) SvPVX_const(tmpstr);
2712 } else {
2713 pv = (flags & SV_MUTABLE_RETURN)
2714 ? SvPVX_mutable(tmpstr) : SvPVX(tmpstr);
2715 }
2716 if (lp)
2717 *lp = SvCUR(tmpstr);
50adf7d2 2718 } else {
deb46114 2719 pv = sv_2pv_flags(tmpstr, lp, flags);
50adf7d2 2720 }
deb46114
NC
2721 if (SvUTF8(tmpstr))
2722 SvUTF8_on(sv);
2723 else
2724 SvUTF8_off(sv);
2725 return pv;
50adf7d2 2726 }
deb46114
NC
2727 }
2728 {
75dfc8ec 2729 SV *tsv;
f9277f47 2730 MAGIC *mg;
d8eae41e
NC
2731 const SV *const referent = (SV*)SvRV(sv);
2732
2733 if (!referent) {
396482e1 2734 tsv = sv_2mortal(newSVpvs("NULLREF"));
042dae7a
NC
2735 } else if (SvTYPE(referent) == SVt_PVMG
2736 && ((SvFLAGS(referent) &
2737 (SVs_OBJECT|SVf_OK|SVs_GMG|SVs_SMG|SVs_RMG))
2738 == (SVs_OBJECT|SVs_SMG))
2739 && (mg = mg_find(referent, PERL_MAGIC_qr))) {
c445ea15 2740 return stringify_regexp(sv, mg, lp);
d8eae41e
NC
2741 } else {
2742 const char *const typestr = sv_reftype(referent, 0);
2743
2744 tsv = sv_newmortal();
2745 if (SvOBJECT(referent)) {
2746 const char *const name = HvNAME_get(SvSTASH(referent));
2747 Perl_sv_setpvf(aTHX_ tsv, "%s=%s(0x%"UVxf")",
2748 name ? name : "__ANON__" , typestr,
2749 PTR2UV(referent));
2750 }
2751 else
2752 Perl_sv_setpvf(aTHX_ tsv, "%s(0x%"UVxf")", typestr,
2753 PTR2UV(referent));
c080367d 2754 }
042dae7a
NC
2755 if (lp)
2756 *lp = SvCUR(tsv);
2757 return SvPVX(tsv);
463ee0b2 2758 }
79072805 2759 }
0336b60e 2760 if (SvREADONLY(sv) && !SvOK(sv)) {
0336b60e 2761 if (ckWARN(WARN_UNINITIALIZED))
29489e7c 2762 report_uninit(sv);
cdb061a3
NC
2763 if (lp)
2764 *lp = 0;
73d840c0 2765 return (char *)"";
79072805 2766 }
79072805 2767 }
28e5dec8
JH
2768 if (SvIOK(sv) || ((SvIOKp(sv) && !SvNOKp(sv)))) {
2769 /* I'm assuming that if both IV and NV are equally valid then
2770 converting the IV is going to be more efficient */
e1ec3a88
AL
2771 const U32 isIOK = SvIOK(sv);
2772 const U32 isUIOK = SvIsUV(sv);
28e5dec8
JH
2773 char buf[TYPE_CHARS(UV)];
2774 char *ebuf, *ptr;
2775
2776 if (SvTYPE(sv) < SVt_PVIV)
2777 sv_upgrade(sv, SVt_PVIV);
4ea1d550 2778 ptr = uiv_2buf(buf, SvIVX(sv), SvUVX(sv), isUIOK, &ebuf);
5902b6a9
NC
2779 /* inlined from sv_setpvn */
2780 SvGROW_mutable(sv, (STRLEN)(ebuf - ptr + 1));
4d84ee25 2781 Move(ptr,SvPVX_mutable(sv),ebuf - ptr,char);
28e5dec8
JH
2782 SvCUR_set(sv, ebuf - ptr);
2783 s = SvEND(sv);
2784 *s = '\0';
2785 if (isIOK)
2786 SvIOK_on(sv);
2787 else
2788 SvIOKp_on(sv);
2789 if (isUIOK)
2790 SvIsUV_on(sv);
2791 }
2792 else if (SvNOKp(sv)) {
c81271c3 2793 const int olderrno = errno;
79072805
LW
2794 if (SvTYPE(sv) < SVt_PVNV)
2795 sv_upgrade(sv, SVt_PVNV);
1c846c1f 2796 /* The +20 is pure guesswork. Configure test needed. --jhi */
5902b6a9 2797 s = SvGROW_mutable(sv, NV_DIG + 20);
c81271c3 2798 /* some Xenix systems wipe out errno here */
79072805 2799#ifdef apollo
463ee0b2 2800 if (SvNVX(sv) == 0.0)
79072805
LW
2801 (void)strcpy(s,"0");
2802 else
2803#endif /*apollo*/
bbce6d69 2804 {
2d4389e4 2805 Gconvert(SvNVX(sv), NV_DIG, 0, s);
bbce6d69 2806 }
79072805 2807 errno = olderrno;
a0d0e21e
LW
2808#ifdef FIXNEGATIVEZERO
2809 if (*s == '-' && s[1] == '0' && !s[2])
2810 strcpy(s,"0");
2811#endif
79072805
LW
2812 while (*s) s++;
2813#ifdef hcx
2814 if (s[-1] == '.')
46fc3d4c 2815 *--s = '\0';
79072805
LW
2816#endif
2817 }
79072805 2818 else {
675c862f 2819 if (isGV_with_GP(sv))
19f6321d 2820 return glob_2pv((GV *)sv, lp);
180488f8 2821
041457d9 2822 if (!PL_localizing && !(SvFLAGS(sv) & SVs_PADTMP) && ckWARN(WARN_UNINITIALIZED))
29489e7c 2823 report_uninit(sv);
cdb061a3 2824 if (lp)
00b6aa41 2825 *lp = 0;
25da4f38
IZ
2826 if (SvTYPE(sv) < SVt_PV)
2827 /* Typically the caller expects that sv_any is not NULL now. */
2828 sv_upgrade(sv, SVt_PV);
73d840c0 2829 return (char *)"";
79072805 2830 }
cdb061a3 2831 {
823a54a3 2832 const STRLEN len = s - SvPVX_const(sv);
cdb061a3
NC
2833 if (lp)
2834 *lp = len;
2835 SvCUR_set(sv, len);
2836 }
79072805 2837 SvPOK_on(sv);
1d7c1841 2838 DEBUG_c(PerlIO_printf(Perl_debug_log, "0x%"UVxf" 2pv(%s)\n",
3f7c398e 2839 PTR2UV(sv),SvPVX_const(sv)));
4d84ee25
NC
2840 if (flags & SV_CONST_RETURN)
2841 return (char *)SvPVX_const(sv);
10516c54
NC
2842 if (flags & SV_MUTABLE_RETURN)
2843 return SvPVX_mutable(sv);
463ee0b2
LW
2844 return SvPVX(sv);
2845}
2846
645c22ef 2847/*
6050d10e
JP
2848=for apidoc sv_copypv
2849
2850Copies a stringified representation of the source SV into the
2851destination SV. Automatically performs any necessary mg_get and
54f0641b 2852coercion of numeric values into strings. Guaranteed to preserve
6050d10e 2853UTF-8 flag even from overloaded objects. Similar in nature to
54f0641b
NIS
2854sv_2pv[_flags] but operates directly on an SV instead of just the
2855string. Mostly uses sv_2pv_flags to do its work, except when that
6050d10e
JP
2856would lose the UTF-8'ness of the PV.
2857
2858=cut
2859*/
2860
2861void
2862Perl_sv_copypv(pTHX_ SV *dsv, register SV *ssv)
2863{
446eaa42 2864 STRLEN len;
53c1dcc0 2865 const char * const s = SvPV_const(ssv,len);
cb50f42d 2866 sv_setpvn(dsv,s,len);
446eaa42 2867 if (SvUTF8(ssv))
cb50f42d 2868 SvUTF8_on(dsv);
446eaa42 2869 else
cb50f42d 2870 SvUTF8_off(dsv);
6050d10e
JP
2871}
2872
2873/*
645c22ef
DM
2874=for apidoc sv_2pvbyte
2875
2876Return a pointer to the byte-encoded representation of the SV, and set *lp
1e54db1a 2877to its length. May cause the SV to be downgraded from UTF-8 as a
645c22ef
DM
2878side-effect.
2879
2880Usually accessed via the C<SvPVbyte> macro.
2881
2882=cut
2883*/
2884
7340a771
GS
2885char *
2886Perl_sv_2pvbyte(pTHX_ register SV *sv, STRLEN *lp)
2887{
0875d2fe 2888 sv_utf8_downgrade(sv,0);
97972285 2889 return lp ? SvPV(sv,*lp) : SvPV_nolen(sv);
7340a771
GS
2890}
2891
645c22ef 2892/*
035cbb0e
RGS
2893=for apidoc sv_2pvutf8
2894
2895Return a pointer to the UTF-8-encoded representation of the SV, and set *lp
2896to its length. May cause the SV to be upgraded to UTF-8 as a side-effect.
2897
2898Usually accessed via the C<SvPVutf8> macro.
2899
2900=cut
2901*/
645c22ef 2902
7340a771
GS
2903char *
2904Perl_sv_2pvutf8(pTHX_ register SV *sv, STRLEN *lp)
2905{
035cbb0e
RGS
2906 sv_utf8_upgrade(sv);
2907 return lp ? SvPV(sv,*lp) : SvPV_nolen(sv);
7340a771 2908}
1c846c1f 2909
7ee2227d 2910
645c22ef
DM
2911/*
2912=for apidoc sv_2bool
2913
2914This function is only called on magical items, and is only used by
8cf8f3d1 2915sv_true() or its macro equivalent.
645c22ef
DM
2916
2917=cut
2918*/
2919
463ee0b2 2920bool
864dbfa3 2921Perl_sv_2bool(pTHX_ register SV *sv)
463ee0b2 2922{
97aff369 2923 dVAR;
5b295bef 2924 SvGETMAGIC(sv);
463ee0b2 2925
a0d0e21e
LW
2926 if (!SvOK(sv))
2927 return 0;
2928 if (SvROK(sv)) {
fabdb6c0
AL
2929 if (SvAMAGIC(sv)) {
2930 SV * const tmpsv = AMG_CALLun(sv,bool_);
2931 if (tmpsv && (!SvROK(tmpsv) || (SvRV(tmpsv) != SvRV(sv))))
2932 return (bool)SvTRUE(tmpsv);
2933 }
2934 return SvRV(sv) != 0;
a0d0e21e 2935 }
463ee0b2 2936 if (SvPOKp(sv)) {
53c1dcc0
AL
2937 register XPV* const Xpvtmp = (XPV*)SvANY(sv);
2938 if (Xpvtmp &&
339049b0 2939 (*sv->sv_u.svu_pv > '0' ||
11343788 2940 Xpvtmp->xpv_cur > 1 ||
339049b0 2941 (Xpvtmp->xpv_cur && *sv->sv_u.svu_pv != '0')))
463ee0b2
LW
2942 return 1;
2943 else
2944 return 0;
2945 }
2946 else {
2947 if (SvIOKp(sv))
2948 return SvIVX(sv) != 0;
2949 else {
2950 if (SvNOKp(sv))
2951 return SvNVX(sv) != 0.0;
180488f8 2952 else {
f7877b28 2953 if (isGV_with_GP(sv))
180488f8
NC
2954 return TRUE;
2955 else
2956 return FALSE;
2957 }
463ee0b2
LW
2958 }
2959 }
79072805
LW
2960}
2961
c461cf8f
JH
2962/*
2963=for apidoc sv_utf8_upgrade
2964
78ea37eb 2965Converts the PV of an SV to its UTF-8-encoded form.
645c22ef 2966Forces the SV to string form if it is not already.
4411f3b6
NIS
2967Always sets the SvUTF8 flag to avoid future validity checks even
2968if all the bytes have hibit clear.
c461cf8f 2969
13a6c0e0
JH
2970This is not a general purpose byte encoding to Unicode interface:
2971use the Encode extension for that.
2972
8d6d96c1
HS
2973=for apidoc sv_utf8_upgrade_flags
2974
78ea37eb 2975Converts the PV of an SV to its UTF-8-encoded form.
645c22ef 2976Forces the SV to string form if it is not already.
8d6d96c1
HS
2977Always sets the SvUTF8 flag to avoid future validity checks even
2978if all the bytes have hibit clear. If C<flags> has C<SV_GMAGIC> bit set,
2979will C<mg_get> on C<sv> if appropriate, else not. C<sv_utf8_upgrade> and
2980C<sv_utf8_upgrade_nomg> are implemented in terms of this function.
2981
13a6c0e0
JH
2982This is not a general purpose byte encoding to Unicode interface:
2983use the Encode extension for that.
2984
8d6d96c1
HS
2985=cut
2986*/
2987
2988STRLEN
2989Perl_sv_utf8_upgrade_flags(pTHX_ register SV *sv, I32 flags)
2990{
97aff369 2991 dVAR;
808c356f
RGS
2992 if (sv == &PL_sv_undef)
2993 return 0;
e0e62c2a
NIS
2994 if (!SvPOK(sv)) {
2995 STRLEN len = 0;
d52b7888
NC
2996 if (SvREADONLY(sv) && (SvPOKp(sv) || SvIOKp(sv) || SvNOKp(sv))) {
2997 (void) sv_2pv_flags(sv,&len, flags);
2998 if (SvUTF8(sv))
2999 return len;
3000 } else {
3001 (void) SvPV_force(sv,len);
3002 }
e0e62c2a 3003 }
4411f3b6 3004
f5cee72b 3005 if (SvUTF8(sv)) {
5fec3b1d 3006 return SvCUR(sv);
f5cee72b 3007 }
5fec3b1d 3008
765f542d
NC
3009 if (SvIsCOW(sv)) {
3010 sv_force_normal_flags(sv, 0);
db42d148
NIS
3011 }
3012
88632417 3013 if (PL_encoding && !(flags & SV_UTF8_NO_ENCODING))
799ef3cb 3014 sv_recode_to_utf8(sv, PL_encoding);
9f4817db 3015 else { /* Assume Latin-1/EBCDIC */
c4e7c712
NC
3016 /* This function could be much more efficient if we
3017 * had a FLAG in SVs to signal if there are any hibit
3018 * chars in the PV. Given that there isn't such a flag
3019 * make the loop as fast as possible. */
00b6aa41 3020 const U8 * const s = (U8 *) SvPVX_const(sv);
c4420975 3021 const U8 * const e = (U8 *) SvEND(sv);
93524f2b 3022 const U8 *t = s;
c4e7c712
NC
3023
3024 while (t < e) {
53c1dcc0 3025 const U8 ch = *t++;
00b6aa41
AL
3026 /* Check for hi bit */
3027 if (!NATIVE_IS_INVARIANT(ch)) {
3028 STRLEN len = SvCUR(sv) + 1; /* Plus the \0 */
3029 U8 * const recoded = bytes_to_utf8((U8*)s, &len);
3030
3031 SvPV_free(sv); /* No longer using what was there before. */
3032 SvPV_set(sv, (char*)recoded);
3033 SvCUR_set(sv, len - 1);
3034 SvLEN_set(sv, len); /* No longer know the real size. */
c4e7c712 3035 break;
00b6aa41 3036 }
c4e7c712
NC
3037 }
3038 /* Mark as UTF-8 even if no hibit - saves scanning loop */
3039 SvUTF8_on(sv);
560a288e 3040 }
4411f3b6 3041 return SvCUR(sv);
560a288e
GS
3042}
3043
c461cf8f
JH
3044/*
3045=for apidoc sv_utf8_downgrade
3046
78ea37eb
TS
3047Attempts to convert the PV of an SV from characters to bytes.
3048If the PV contains a character beyond byte, this conversion will fail;
3049in this case, either returns false or, if C<fail_ok> is not
c461cf8f
JH
3050true, croaks.
3051
13a6c0e0
JH
3052This is not a general purpose Unicode to byte encoding interface:
3053use the Encode extension for that.
3054
c461cf8f
JH
3055=cut
3056*/
3057
560a288e
GS
3058bool
3059Perl_sv_utf8_downgrade(pTHX_ register SV* sv, bool fail_ok)
3060{
97aff369 3061 dVAR;
78ea37eb 3062 if (SvPOKp(sv) && SvUTF8(sv)) {
fa301091 3063 if (SvCUR(sv)) {
03cfe0ae 3064 U8 *s;
652088fc 3065 STRLEN len;
fa301091 3066
765f542d
NC
3067 if (SvIsCOW(sv)) {
3068 sv_force_normal_flags(sv, 0);
3069 }
03cfe0ae
NIS
3070 s = (U8 *) SvPV(sv, len);
3071 if (!utf8_to_bytes(s, &len)) {
fa301091
JH
3072 if (fail_ok)
3073 return FALSE;
3074 else {
3075 if (PL_op)
3076 Perl_croak(aTHX_ "Wide character in %s",
53e06cf0 3077 OP_DESC(PL_op));
fa301091
JH
3078 else
3079 Perl_croak(aTHX_ "Wide character");
3080 }
4b3603a4 3081 }
b162af07 3082 SvCUR_set(sv, len);
67e989fb 3083 }
560a288e 3084 }
ffebcc3e 3085 SvUTF8_off(sv);
560a288e
GS
3086 return TRUE;
3087}
3088
c461cf8f
JH
3089/*
3090=for apidoc sv_utf8_encode
3091
78ea37eb
TS
3092Converts the PV of an SV to UTF-8, but then turns the C<SvUTF8>
3093flag off so that it looks like octets again.
c461cf8f
JH
3094
3095=cut
3096*/
3097
560a288e
GS
3098void
3099Perl_sv_utf8_encode(pTHX_ register SV *sv)
3100{
4c94c214
NC
3101 if (SvIsCOW(sv)) {
3102 sv_force_normal_flags(sv, 0);
3103 }
3104 if (SvREADONLY(sv)) {
3105 Perl_croak(aTHX_ PL_no_modify);
3106 }
a5f5288a 3107 (void) sv_utf8_upgrade(sv);
560a288e
GS
3108 SvUTF8_off(sv);
3109}
3110
4411f3b6
NIS
3111/*
3112=for apidoc sv_utf8_decode
3113
78ea37eb
TS
3114If the PV of the SV is an octet sequence in UTF-8
3115and contains a multiple-byte character, the C<SvUTF8> flag is turned on
3116so that it looks like a character. If the PV contains only single-byte
3117characters, the C<SvUTF8> flag stays off.
3118Scans PV for validity and returns false if the PV is invalid UTF-8.
4411f3b6
NIS
3119
3120=cut
3121*/
3122
560a288e
GS
3123bool
3124Perl_sv_utf8_decode(pTHX_ register SV *sv)
3125{
78ea37eb 3126 if (SvPOKp(sv)) {
93524f2b
NC
3127 const U8 *c;
3128 const U8 *e;
9cbac4c7 3129
645c22ef
DM
3130 /* The octets may have got themselves encoded - get them back as
3131 * bytes
3132 */
3133 if (!sv_utf8_downgrade(sv, TRUE))
560a288e
GS
3134 return FALSE;
3135
3136 /* it is actually just a matter of turning the utf8 flag on, but
3137 * we want to make sure everything inside is valid utf8 first.
3138 */
93524f2b 3139 c = (const U8 *) SvPVX_const(sv);
63cd0674 3140 if (!is_utf8_string(c, SvCUR(sv)+1))
67e989fb 3141 return FALSE;
93524f2b 3142 e = (const U8 *) SvEND(sv);
511c2ff0 3143 while (c < e) {
b64e5050 3144 const U8 ch = *c++;
c4d5f83a 3145 if (!UTF8_IS_INVARIANT(ch)) {
67e989fb
JH
3146 SvUTF8_on(sv);
3147 break;
3148 }
560a288e 3149 }
560a288e
GS
3150 }
3151 return TRUE;
3152}
3153
954c1994
GS
3154/*
3155=for apidoc sv_setsv
3156
645c22ef
DM
3157Copies the contents of the source SV C<ssv> into the destination SV
3158C<dsv>. The source SV may be destroyed if it is mortal, so don't use this
3159function if the source SV needs to be reused. Does not handle 'set' magic.
3160Loosely speaking, it performs a copy-by-value, obliterating any previous
3161content of the destination.
3162
3163You probably want to use one of the assortment of wrappers, such as
3164C<SvSetSV>, C<SvSetSV_nosteal>, C<SvSetMagicSV> and
3165C<SvSetMagicSV_nosteal>.
3166
8d6d96c1
HS
3167=for apidoc sv_setsv_flags
3168
645c22ef
DM
3169Copies the contents of the source SV C<ssv> into the destination SV
3170C<dsv>. The source SV may be destroyed if it is mortal, so don't use this
3171function if the source SV needs to be reused. Does not handle 'set' magic.
3172Loosely speaking, it performs a copy-by-value, obliterating any previous
3173content of the destination.
3174If the C<flags> parameter has the C<SV_GMAGIC> bit set, will C<mg_get> on
5fcdf167
NC
3175C<ssv> if appropriate, else not. If the C<flags> parameter has the
3176C<SV_NOSTEAL> bit set then the buffers of temps will not be stolen. C<sv_setsv>
3177and C<sv_setsv_nomg> are implemented in terms of this function.
645c22ef
DM
3178
3179You probably want to use one of the assortment of wrappers, such as
3180C<SvSetSV>, C<SvSetSV_nosteal>, C<SvSetMagicSV> and
3181C<SvSetMagicSV_nosteal>.
3182
3183This is the primary function for copying scalars, and most other
3184copy-ish functions and macros use this underneath.
8d6d96c1
HS
3185
3186=cut
3187*/
3188
5d0301b7 3189static void
2eb42952 3190S_glob_assign_glob(pTHX_ SV *dstr, SV *sstr, const int dtype)
5d0301b7
NC
3191{
3192 if (dtype != SVt_PVGV) {
3193 const char * const name = GvNAME(sstr);
3194 const STRLEN len = GvNAMELEN(sstr);
3195 /* don't upgrade SVt_PVLV: it can hold a glob */
f7877b28
NC
3196 if (dtype != SVt_PVLV) {
3197 if (dtype >= SVt_PV) {
3198 SvPV_free(dstr);
3199 SvPV_set(dstr, 0);
3200 SvLEN_set(dstr, 0);
3201 SvCUR_set(dstr, 0);
3202 }
5d0301b7 3203 sv_upgrade(dstr, SVt_PVGV);
dedf8e73
NC
3204 (void)SvOK_off(dstr);
3205 SvSCREAM_on(dstr);
f7877b28 3206 }
5d0301b7
NC
3207 GvSTASH(dstr) = GvSTASH(sstr);
3208 if (GvSTASH(dstr))
3209 Perl_sv_add_backref(aTHX_ (SV*)GvSTASH(dstr), dstr);
ae8cc45f 3210 gv_name_set((GV *)dstr, name, len, GV_ADD);
5d0301b7
NC
3211 SvFAKE_on(dstr); /* can coerce to non-glob */
3212 }
3213
3214#ifdef GV_UNIQUE_CHECK
3215 if (GvUNIQUE((GV*)dstr)) {
3216 Perl_croak(aTHX_ PL_no_modify);
3217 }
3218#endif
3219
f7877b28
NC
3220 gp_free((GV*)dstr);
3221 SvSCREAM_off(dstr);
5d0301b7 3222 (void)SvOK_off(dstr);
f7877b28 3223 SvSCREAM_on(dstr);
dedf8e73 3224 GvINTRO_off(dstr); /* one-shot flag */
5d0301b7
NC
3225 GvGP(dstr) = gp_ref(GvGP(sstr));
3226 if (SvTAINTED(sstr))
3227 SvTAINT(dstr);
3228 if (GvIMPORTED(dstr) != GVf_IMPORTED
3229 && CopSTASH_ne(PL_curcop, GvSTASH(dstr)))
3230 {
3231 GvIMPORTED_on(dstr);
3232 }
3233 GvMULTI_on(dstr);
3234 return;
3235}
3236
b8473700 3237static void
2eb42952 3238S_glob_assign_ref(pTHX_ SV *dstr, SV *sstr) {
b8473700
NC
3239 SV * const sref = SvREFCNT_inc(SvRV(sstr));
3240 SV *dref = NULL;
3241 const int intro = GvINTRO(dstr);
2440974c 3242 SV **location;
3386d083 3243 U8 import_flag = 0;
27242d61
NC
3244 const U32 stype = SvTYPE(sref);
3245
b8473700
NC
3246
3247#ifdef GV_UNIQUE_CHECK
3248 if (GvUNIQUE((GV*)dstr)) {
3249 Perl_croak(aTHX_ PL_no_modify);
3250 }
3251#endif
3252
3253 if (intro) {
3254 GvINTRO_off(dstr); /* one-shot flag */
3255 GvLINE(dstr) = CopLINE(PL_curcop);
3256 GvEGV(dstr) = (GV*)dstr;
3257 }
3258 GvMULTI_on(dstr);
27242d61 3259 switch (stype) {
b8473700 3260 case SVt_PVCV:
27242d61
NC
3261 location = (SV **) &GvCV(dstr);
3262 import_flag = GVf_IMPORTED_CV;
3263 goto common;
3264 case SVt_PVHV:
3265 location = (SV **) &GvHV(dstr);
3266 import_flag = GVf_IMPORTED_HV;
3267 goto common;
3268 case SVt_PVAV:
3269 location = (SV **) &GvAV(dstr);
3270 import_flag = GVf_IMPORTED_AV;
3271 goto common;
3272 case SVt_PVIO:
3273 location = (SV **) &GvIOp(dstr);
3274 goto common;
3275 case SVt_PVFM:
3276 location = (SV **) &GvFORM(dstr);
3277 default:
3278 location = &GvSV(dstr);
3279 import_flag = GVf_IMPORTED_SV;
3280 common:
b8473700 3281 if (intro) {
27242d61
NC
3282 if (stype == SVt_PVCV) {
3283 if (GvCVGEN(dstr) && GvCV(dstr) != (CV*)sref) {
3284 SvREFCNT_dec(GvCV(dstr));
3285 GvCV(dstr) = NULL;
3286 GvCVGEN(dstr) = 0; /* Switch off cacheness. */
3287 PL_sub_generation++;
3288 }
b8473700 3289 }
27242d61 3290 SAVEGENERICSV(*location);
b8473700
NC
3291 }
3292 else
27242d61
NC
3293 dref = *location;
3294 if (stype == SVt_PVCV && *location != sref) {
3295 CV* const cv = (CV*)*location;
b8473700
NC
3296 if (cv) {
3297 if (!GvCVGEN((GV*)dstr) &&
3298 (CvROOT(cv) || CvXSUB(cv)))
3299 {
3300 /* Redefining a sub - warning is mandatory if
3301 it was a const and its value changed. */
3302 if (CvCONST(cv) && CvCONST((CV*)sref)
3303 && cv_const_sv(cv) == cv_const_sv((CV*)sref)) {
6f207bd3 3304 NOOP;
b8473700
NC
3305 /* They are 2 constant subroutines generated from
3306 the same constant. This probably means that
3307 they are really the "same" proxy subroutine
3308 instantiated in 2 places. Most likely this is
3309 when a constant is exported twice. Don't warn.
3310 */
3311 }
3312 else if (ckWARN(WARN_REDEFINE)
3313 || (CvCONST(cv)
3314 && (!CvCONST((CV*)sref)
3315 || sv_cmp(cv_const_sv(cv),
3316 cv_const_sv((CV*)sref))))) {
3317 Perl_warner(aTHX_ packWARN(WARN_REDEFINE),
3318 CvCONST(cv)
3319 ? "Constant subroutine %s::%s redefined"
3320 : "Subroutine %s::%s redefined",
3321 HvNAME_get(GvSTASH((GV*)dstr)),
3322 GvENAME((GV*)dstr));
3323 }
3324 }
3325 if (!intro)
cbf82dd0
NC
3326 cv_ckproto_len(cv, (GV*)dstr,
3327 SvPOK(sref) ? SvPVX_const(sref) : NULL,
3328 SvPOK(sref) ? SvCUR(sref) : 0);
b8473700 3329 }
b8473700
NC
3330 GvCVGEN(dstr) = 0; /* Switch off cacheness. */
3331 GvASSUMECV_on(dstr);
3332 PL_sub_generation++;
3333 }
2440974c 3334 *location = sref;
3386d083
NC
3335 if (import_flag && !(GvFLAGS(dstr) & import_flag)
3336 && CopSTASH_ne(PL_curcop, GvSTASH(dstr))) {
3337 GvFLAGS(dstr) |= import_flag;
b8473700
NC
3338 }
3339 break;
3340 }
b37c2d43 3341 SvREFCNT_dec(dref);
b8473700
NC
3342 if (SvTAINTED(sstr))
3343 SvTAINT(dstr);
3344 return;
3345}
3346
8d6d96c1
HS
/* Copy the value of sstr into dstr.
 *
 * Outline of the body below:
 *  1. Nothing is done when source and destination are the same SV; a NULL
 *     source is treated as &PL_sv_undef.
 *  2. The switch on the source type upgrades dstr as needed.  Plain IV and
 *     NV sources are copied and returned from right there; glob-to-glob
 *     assignment is handed to glob_assign_glob(); types that cannot be
 *     copied croak with "Bizarre copy".
 *  3. The remaining work is selected by the source flags: references,
 *     assignment to a glob, strings (copied, shared or stolen), plain
 *     numbers, and finally globs-as-strings / undef.
 *  4. Taint is propagated from sstr to dstr.
 */
3347void
3348Perl_sv_setsv_flags(pTHX_ SV *dstr, register SV *sstr, I32 flags)
3349{
97aff369 3350 dVAR;
8990e307
LW
3351 register U32 sflags;
3352 register int dtype;
42d0e0b7 3353 register svtype stype;
463ee0b2 3354
79072805
LW
3355 if (sstr == dstr)
3356 return;
765f542d 3357 SV_CHECK_THINKFIRST_COW_DROP(dstr);
79072805 3358 if (!sstr)
3280af22 3359 sstr = &PL_sv_undef;
8990e307
LW
3360 stype = SvTYPE(sstr);
3361 dtype = SvTYPE(dstr);
79072805 3362
a0d0e21e 3363 SvAMAGIC_off(dstr);
7a5fa8a2 3364 if ( SvVOK(dstr) )
ece467f9
JP
3365 {
3366 /* need to nuke the magic */
3367 mg_free(dstr);
3368 SvRMAGICAL_off(dstr);
3369 }
9e7bc3e8 3370
463ee0b2 3371 /* There's a lot of redundancy below but we're going for speed here */
79072805 3372
/* Step 2: make dstr big enough for the source type; the simple numeric
   cases finish and return inside the switch. */
8990e307 3373 switch (stype) {
79072805 3374 case SVt_NULL:
aece5585 3375 undef_sstr:
20408e3c
GS
3376 if (dtype != SVt_PVGV) {
3377 (void)SvOK_off(dstr);
3378 return;
3379 }
3380 break;
463ee0b2 3381 case SVt_IV:
aece5585
GA
3382 if (SvIOK(sstr)) {
3383 switch (dtype) {
3384 case SVt_NULL:
8990e307 3385 sv_upgrade(dstr, SVt_IV);
aece5585
GA
3386 break;
3387 case SVt_NV:
aece5585
GA
3388 case SVt_RV:
3389 case SVt_PV:
a0d0e21e 3390 sv_upgrade(dstr, SVt_PVIV);
aece5585
GA
3391 break;
3392 }
3393 (void)SvIOK_only(dstr);
45977657 3394 SvIV_set(dstr, SvIVX(sstr));
25da4f38
IZ
3395 if (SvIsUV(sstr))
3396 SvIsUV_on(dstr);
37c25af0
NC
3397 /* SvTAINTED can only be true if the SV has taint magic, which in
3398 turn means that the SV type is PVMG (or greater). This is the
3399 case statement for SVt_IV, so this cannot be true (whatever gcov
3400 may say). */
3401 assert(!SvTAINTED(sstr));
aece5585 3402 return;
8990e307 3403 }
aece5585
GA
3404 goto undef_sstr;
3405
463ee0b2 3406 case SVt_NV:
aece5585
GA
3407 if (SvNOK(sstr)) {
3408 switch (dtype) {
3409 case SVt_NULL:
3410 case SVt_IV:
8990e307 3411 sv_upgrade(dstr, SVt_NV);
aece5585
GA
3412 break;
3413 case SVt_RV:
3414 case SVt_PV:
3415 case SVt_PVIV:
a0d0e21e 3416 sv_upgrade(dstr, SVt_PVNV);
aece5585
GA
3417 break;
3418 }
9d6ce603 3419 SvNV_set(dstr, SvNVX(sstr));
aece5585 3420 (void)SvNOK_only(dstr);
37c25af0
NC
3421 /* SvTAINTED can only be true if the SV has taint magic, which in
3422 turn means that the SV type is PVMG (or greater). This is the
3423 case statement for SVt_NV, so this cannot be true (whatever gcov
3424 may say). */
3425 assert(!SvTAINTED(sstr));
aece5585 3426 return;
8990e307 3427 }
aece5585
GA
3428 goto undef_sstr;
3429
ed6116ce 3430 case SVt_RV:
8990e307 3431 if (dtype < SVt_RV)
ed6116ce 3432 sv_upgrade(dstr, SVt_RV);
ed6116ce 3433 break;
fc36a67e 3434 case SVt_PVFM:
f8c7b90f 3435#ifdef PERL_OLD_COPY_ON_WRITE
d89fc664
NC
3436 if ((SvFLAGS(sstr) & CAN_COW_MASK) == CAN_COW_FLAGS) {
3437 if (dtype < SVt_PVIV)
3438 sv_upgrade(dstr, SVt_PVIV);
3439 break;
3440 }
3441 /* Fall through */
3442#endif
3443 case SVt_PV:
8990e307 3444 if (dtype < SVt_PV)
463ee0b2 3445 sv_upgrade(dstr, SVt_PV);
463ee0b2
LW
3446 break;
3447 case SVt_PVIV:
8990e307 3448 if (dtype < SVt_PVIV)
463ee0b2 3449 sv_upgrade(dstr, SVt_PVIV);
463ee0b2
LW
3450 break;
3451 case SVt_PVNV:
8990e307 3452 if (dtype < SVt_PVNV)
463ee0b2 3453 sv_upgrade(dstr, SVt_PVNV);
463ee0b2 3454 break;
489f7bfe 3455 default:
a3b680e6
AL
3456 {
3457 const char * const type = sv_reftype(sstr,0);
533c011a 3458 if (PL_op)
a3b680e6 3459 Perl_croak(aTHX_ "Bizarre copy of %s in %s", type, OP_NAME(PL_op));
4633a7c4 3460 else
a3b680e6
AL
3461 Perl_croak(aTHX_ "Bizarre copy of %s", type);
3462 }
4633a7c4
LW
3463 break;
3464
79072805 3465 case SVt_PVGV:
8990e307 3466 if (dtype <= SVt_PVGV) {
d4c19fe8 3467 glob_assign_glob(dstr, sstr, dtype);
b8c701c1 3468 return;
79072805 3469 }
5f66b61c 3470 /*FALLTHROUGH*/
79072805 3471
489f7bfe
NC
3472 case SVt_PVMG:
3473 case SVt_PVLV:
3474 case SVt_PVBM:
/* Get-magic may change the type of the source, so the type is re-read
   afterwards and the glob case is checked again. */
8d6d96c1 3475 if (SvGMAGICAL(sstr) && (flags & SV_GMAGIC)) {
973f89ab 3476 mg_get(sstr);
eb160463 3477 if ((int)SvTYPE(sstr) != stype) {
973f89ab 3478 stype = SvTYPE(sstr);
b8c701c1 3479 if (stype == SVt_PVGV && dtype <= SVt_PVGV) {
d4c19fe8 3480 glob_assign_glob(dstr, sstr, dtype);
b8c701c1
NC
3481 return;
3482 }
973f89ab
CS
3483 }
3484 }
ded42b9f 3485 if (stype == SVt_PVLV)
862a34c6 3486 SvUPGRADE(dstr, SVt_PVNV);
ded42b9f 3487 else
42d0e0b7 3488 SvUPGRADE(dstr, (svtype)stype);
79072805
LW
3489 }
3490
ff920335
NC
3491 /* dstr may have been upgraded. */
3492 dtype = SvTYPE(dstr);
8990e307
LW
3493 sflags = SvFLAGS(sstr);
3494
/* Step 3a: the source is a reference. */
3495 if (sflags & SVf_ROK) {
acaa9288
NC
3496 if (dtype == SVt_PVGV &&
3497 SvROK(sstr) && SvTYPE(SvRV(sstr)) == SVt_PVGV) {
3498 sstr = SvRV(sstr);
3499 if (sstr == dstr) {
3500 if (GvIMPORTED(dstr) != GVf_IMPORTED
3501 && CopSTASH_ne(PL_curcop, GvSTASH(dstr)))
3502 {
3503 GvIMPORTED_on(dstr);
3504 }
3505 GvMULTI_on(dstr);
3506 return;
3507 }
d4c19fe8 3508 glob_assign_glob(dstr, sstr, dtype);
acaa9288
NC
3509 return;
3510 }
3511
8990e307 3512 if (dtype >= SVt_PV) {
b8c701c1 3513 if (dtype == SVt_PVGV) {
d4c19fe8 3514 glob_assign_ref(dstr, sstr);
b8c701c1
NC
3515 return;
3516 }
3f7c398e 3517 if (SvPVX_const(dstr)) {
8bd4d4c5 3518 SvPV_free(dstr);
b162af07
SP
3519 SvLEN_set(dstr, 0);
3520 SvCUR_set(dstr, 0);
a0d0e21e 3521 }
8990e307 3522 }
a0d0e21e 3523 (void)SvOK_off(dstr);
b162af07 3524 SvRV_set(dstr, SvREFCNT_inc(SvRV(sstr)));
dfd48732
NC
3525 SvFLAGS(dstr) |= sflags & (SVf_ROK|SVf_AMAGIC);
3526 assert(!(sflags & SVp_NOK));
3527 assert(!(sflags & SVp_IOK));
3528 assert(!(sflags & SVf_NOK));
3529 assert(!(sflags & SVf_IOK));
ed6116ce 3530 }
/* Step 3b: a non-reference assigned to a glob: the source is looked up
   as a glob via gv_fetchsv() and its GP is shared. */
c0c44674
NC
3531 else if (dtype == SVt_PVGV) {
3532 if (!(sflags & SVf_OK)) {
3533 if (ckWARN(WARN_MISC))
3534 Perl_warner(aTHX_ packWARN(WARN_MISC),
3535 "Undefined value assigned to typeglob");
3536 }
3537 else {
3538 GV *gv = gv_fetchsv(sstr, GV_ADD, SVt_PVGV);
3539 if (dstr != (SV*)gv) {
3540 if (GvGP(dstr))
3541 gp_free((GV*)dstr);
3542 GvGP(dstr) = gp_ref(GvGP(gv));
3543 }
3544 }
3545 }
/* Step 3c: the source has a string value. */
8990e307 3546 else if (sflags & SVp_POK) {
765f542d 3547 bool isSwipe = 0;
79072805
LW
3548
3549 /*
3550 * Check to see if we can just swipe the string. If so, it's a
3551 * possible small lose on short strings, but a big win on long ones.
3f7c398e
SP
3552 * It might even be a win on short strings if SvPVX_const(dstr)
3553 * has to be allocated and SvPVX_const(sstr) has to be freed.
79072805
LW
3554 */
3555
120fac95
NC
3556 /* Whichever path we take through the next code, we want this true,
3557 and doing it now facilitates the COW check. */
3558 (void)SvPOK_only(dstr);
3559
765f542d 3560 if (
b8f9541a
NC
3561 /* We're not already COW */
3562 ((sflags & (SVf_FAKE | SVf_READONLY)) != (SVf_FAKE | SVf_READONLY)
f8c7b90f 3563#ifndef PERL_OLD_COPY_ON_WRITE
b8f9541a
NC
3564 /* or we are, but dstr isn't a suitable target. */
3565 || (SvFLAGS(dstr) & CAN_COW_MASK) != CAN_COW_FLAGS
3566#endif
3567 )
765f542d 3568 &&
765f542d
NC
3569 !(isSwipe =
3570 (sflags & SVs_TEMP) && /* slated for free anyway? */
3571 !(sflags & SVf_OOK) && /* and not involved in OOK hack? */
5fcdf167
NC
3572 (!(flags & SV_NOSTEAL)) &&
3573 /* and we're allowed to steal temps */
765f542d
NC
3574 SvREFCNT(sstr) == 1 && /* and no other references to it? */
3575 SvLEN(sstr) && /* and really is a string */
645c22ef 3576 /* and won't be needed again, potentially */
765f542d 3577 !(PL_op && PL_op->op_type == OP_AASSIGN))
f8c7b90f 3578#ifdef PERL_OLD_COPY_ON_WRITE
765f542d 3579 && !((sflags & CAN_COW_MASK) == CAN_COW_FLAGS
120fac95 3580 && (SvFLAGS(dstr) & CAN_COW_MASK) == CAN_COW_FLAGS
765f542d
NC
3581 && SvTYPE(sstr) >= SVt_PVIV)
3582#endif
3583 ) {
3584 /* Failed the swipe test, and it's not a shared hash key either.
3585 Have to copy the string. */
3586 STRLEN len = SvCUR(sstr);
3587 SvGROW(dstr, len + 1); /* inlined from sv_setpvn */
3f7c398e 3588 Move(SvPVX_const(sstr),SvPVX(dstr),len,char);
765f542d
NC
3589 SvCUR_set(dstr, len);
3590 *SvEND(dstr) = '\0';
765f542d 3591 } else {
f8c7b90f 3592 /* If PERL_OLD_COPY_ON_WRITE is not defined, then isSwipe will always
765f542d 3593 be true in here. */
765f542d
NC
3594 /* Either it's a shared hash key, or it's suitable for
3595 copy-on-write or we can swipe the string. */
46187eeb 3596 if (DEBUG_C_TEST) {
ed252734 3597 PerlIO_printf(Perl_debug_log, "Copy on write: sstr --> dstr\n");
e419cbc5
NC
3598 sv_dump(sstr);
3599 sv_dump(dstr);
46187eeb 3600 }
f8c7b90f 3601#ifdef PERL_OLD_COPY_ON_WRITE
765f542d
NC
3602 if (!isSwipe) {
3603 /* I believe I should acquire a global SV mutex if
3604 it's a COW sv (not a shared hash key) to stop
3605 it going un copy-on-write.
3606 If the source SV has gone un copy on write between up there
3607 and down here, then (assert() that) it is of the correct
3608 form to make it copy on write again */
3609 if ((sflags & (SVf_FAKE | SVf_READONLY))
3610 != (SVf_FAKE | SVf_READONLY)) {
3611 SvREADONLY_on(sstr);
3612 SvFAKE_on(sstr);
3613 /* Make the source SV into a loop of 1.
3614 (about to become 2) */
a29f6d03 3615 SV_COW_NEXT_SV_SET(sstr, sstr);
765f542d
NC
3616 }
3617 }
3618#endif
3619 /* Initial code is common. */
94010e71
NC
3620 if (SvPVX_const(dstr)) { /* we know that dtype >= SVt_PV */
3621 SvPV_free(dstr);
79072805 3622 }
765f542d 3623
765f542d
NC
3624 if (!isSwipe) {
3625 /* making another shared SV. */
3626 STRLEN cur = SvCUR(sstr);
3627 STRLEN len = SvLEN(sstr);
f8c7b90f 3628#ifdef PERL_OLD_COPY_ON_WRITE
765f542d 3629 if (len) {
b8f9541a 3630 assert (SvTYPE(dstr) >= SVt_PVIV);
765f542d
NC
3631 /* SvIsCOW_normal */
3632 /* splice us in between source and next-after-source. */
a29f6d03
NC
3633 SV_COW_NEXT_SV_SET(dstr, SV_COW_NEXT_SV(sstr));
3634 SV_COW_NEXT_SV_SET(sstr, dstr);
940132f3 3635 SvPV_set(dstr, SvPVX_mutable(sstr));
a604c751
NC
3636 } else
3637#endif
3638 {
765f542d 3639 /* SvIsCOW_shared_hash */
46187eeb
NC
3640 DEBUG_C(PerlIO_printf(Perl_debug_log,
3641 "Copy on write: Sharing hash\n"));
b8f9541a 3642
bdd68bc3 3643 assert (SvTYPE(dstr) >= SVt_PV);
765f542d 3644 SvPV_set(dstr,
d1db91c6 3645 HEK_KEY(share_hek_hek(SvSHARED_HEK_FROM_PV(SvPVX_const(sstr)))));
bdd68bc3 3646 }
87a1ef3d
SP
3647 SvLEN_set(dstr, len);
3648 SvCUR_set(dstr, cur);
765f542d
NC
3649 SvREADONLY_on(dstr);
3650 SvFAKE_on(dstr);
3651 /* Release a global SV mutex. */
3652 }
3653 else
765f542d 3654 { /* Passes the swipe test. */
/* The buffer moves from sstr to dstr; sstr is left without a buffer,
   with zero length and with its OK and TEMP flags cleared. */
78d1e721 3655 SvPV_set(dstr, SvPVX_mutable(sstr));
765f542d
NC
3656 SvLEN_set(dstr, SvLEN(sstr));
3657 SvCUR_set(dstr, SvCUR(sstr));
3658
3659 SvTEMP_off(dstr);
3660 (void)SvOK_off(sstr); /* NOTE: nukes most SvFLAGS on sstr */
6136c704 3661 SvPV_set(sstr, NULL);
765f542d
NC
3662 SvLEN_set(sstr, 0);
3663 SvCUR_set(sstr, 0);
3664 SvTEMP_off(sstr);
3665 }
3666 }
/* Numeric values and flags that accompany the string are carried over,
   using the flags sampled before any swipe. */
8990e307 3667 if (sflags & SVp_NOK) {
9d6ce603 3668 SvNV_set(dstr, SvNVX(sstr));
79072805 3669 }
8990e307 3670 if (sflags & SVp_IOK) {
23525414
NC
3671 SvRELEASE_IVX(dstr);
3672 SvIV_set(dstr, SvIVX(sstr));
3673 /* Must do this otherwise some other overloaded use of 0x80000000
3674 gets confused. I guess SVpbm_VALID */
2b1c7e3e 3675 if (sflags & SVf_IVisUV)
25da4f38 3676 SvIsUV_on(dstr);
79072805 3677 }
dd2eae66
NC
3678 SvFLAGS(dstr) |= sflags & (SVf_IOK|SVp_IOK|SVf_NOK|SVp_NOK|SVf_UTF8
3679 |SVf_AMAGIC);
4f2da183 3680 {
b0a11fe1 3681 const MAGIC * const smg = SvVSTRING_mg(sstr);
4f2da183
NC
3682 if (smg) {
3683 sv_magic(dstr, NULL, PERL_MAGIC_vstring,
3684 smg->mg_ptr, smg->mg_len);
3685 SvRMAGICAL_on(dstr);
3686 }
7a5fa8a2 3687 }
79072805 3688 }
/* Step 3d: the source is numeric only. */
5d581361 3689 else if (sflags & (SVp_IOK|SVp_NOK)) {
c2468cc7 3690 (void)SvOK_off(dstr);
dd2eae66
NC
3691 SvFLAGS(dstr) |= sflags & (SVf_IOK|SVp_IOK|SVf_IVisUV|SVf_NOK|SVp_NOK
3692 |SVf_AMAGIC);
5d581361
NC
3693 if (sflags & SVp_IOK) {
3694 /* XXXX Do we want to set IsUV for IV(ROK)? Be extra safe... */
3695 SvIV_set(dstr, SvIVX(sstr));
3696 }
3332b3c1 3697 if (sflags & SVp_NOK) {
9d6ce603 3698 SvNV_set(dstr, SvNVX(sstr));
3332b3c1
JH
3699 }
3700 }
/* Step 3e: a glob copied into a non-glob is stringified as its full name
   prefixed with "*"; anything else leaves dstr undefined. */
79072805 3701 else {
f7877b28 3702 if (isGV_with_GP(sstr)) {
180488f8
NC
3703 /* This stringification rule for globs is spread in 3 places.
3704 This feels bad. FIXME. */
3705 const U32 wasfake = sflags & SVf_FAKE;
3706
3707 /* FAKE globs can get coerced, so need to turn this off
3708 temporarily if it is on. */
3709 SvFAKE_off(sstr);
3710 gv_efullname3(dstr, (GV *)sstr, "*");
3711 SvFLAGS(sstr) |= wasfake;
dd2eae66 3712 SvFLAGS(dstr) |= sflags & SVf_AMAGIC;
180488f8 3713 }
20408e3c
GS
3714 else
3715 (void)SvOK_off(dstr);
a0d0e21e 3716 }
/* Step 4: propagate taint. */
27c9684d
AP
3717 if (SvTAINTED(sstr))
3718 SvTAINT(dstr);
79072805
LW
3719}
3720
954c1994
GS
3721/*
3722=for apidoc sv_setsv_mg
3723
3724Like C<sv_setsv>, but also handles 'set' magic.
3725
3726=cut
3727*/
3728
79072805 3729void
864dbfa3 3730Perl_sv_setsv_mg(pTHX_ SV *dstr, register SV *sstr)
ef50df4b
GS
3731{
3732 sv_setsv(dstr,sstr);
3733 SvSETMAGIC(dstr);
3734}
3735
f8c7b90f 3736#ifdef PERL_OLD_COPY_ON_WRITE
ed252734
NC
3737SV *
3738Perl_sv_setsv_cow(pTHX_ SV *dstr, SV *sstr)
3739{
3740 STRLEN cur = SvCUR(sstr);
3741 STRLEN len = SvLEN(sstr);
3742 register char *new_pv;
3743
3744 if (DEBUG_C_TEST) {
3745 PerlIO_printf(Perl_debug_log, "Fast copy on write: %p -> %p\n",
3746 sstr, dstr);
3747 sv_dump(sstr);
3748 if (dstr)
3749 sv_dump(dstr);
3750 }
3751
3752 if (dstr) {
3753 if (SvTHINKFIRST(dstr))
3754 sv_force_normal_flags(dstr, SV_COW_DROP_PV);
3f7c398e
SP
3755 else if (SvPVX_const(dstr))
3756 Safefree(SvPVX_const(dstr));
ed252734
NC
3757 }
3758 else
3759 new_SV(dstr);
862a34c6 3760 SvUPGRADE(dstr, SVt_PVIV);
ed252734
NC
3761
3762 assert (SvPOK(sstr));
3763 assert (SvPOKp(sstr));
3764 assert (!SvIOK(sstr));
3765 assert (!SvIOKp(sstr));
3766 assert (!SvNOK(sstr));
3767 assert (!SvNOKp(sstr));
3768
3769 if (SvIsCOW(sstr)) {
3770
3771 if (SvLEN(sstr) == 0) {
3772 /* source is a COW shared hash key. */
ed252734
NC
3773 DEBUG_C(PerlIO_printf(Perl_debug_log,
3774 "Fast copy on write: Sharing hash\n"));
d1db91c6 3775 new_pv = HEK_KEY(share_hek_hek(SvSHARED_HEK_FROM_PV(SvPVX_const(sstr))));
ed252734
NC
3776 goto common_exit;
3777 }
3778 SV_COW_NEXT_SV_SET(dstr, SV_COW_NEXT_SV(sstr));
3779 } else {
3780 assert ((SvFLAGS(sstr) & CAN_COW_MASK) == CAN_COW_FLAGS);
862a34c6 3781 SvUPGRADE(sstr, SVt_PVIV);
ed252734
NC
3782 SvREADONLY_on(sstr);
3783 SvFAKE_on(sstr);
3784 DEBUG_C(PerlIO_printf(Perl_debug_log,
3785 "Fast copy on write: Converting sstr to COW\n"));
3786 SV_COW_NEXT_SV_SET(dstr, sstr);
3787 }
3788 SV_COW_NEXT_SV_SET(sstr, dstr);
940132f3 3789 new_pv = SvPVX_mutable(sstr);
ed252734
NC
3790
3791 common_exit:
3792 SvPV_set(dstr, new_pv);
3793 SvFLAGS(dstr) = (SVt_PVIV|SVf_POK|SVp_POK|SVf_FAKE|SVf_READONLY);
3794 if (SvUTF8(sstr))
3795 SvUTF8_on(dstr);
87a1ef3d
SP
3796 SvLEN_set(dstr, len);
3797 SvCUR_set(dstr, cur);
ed252734
NC
3798 if (DEBUG_C_TEST) {
3799 sv_dump(dstr);
3800 }
3801 return dstr;
3802}
3803#endif
3804
954c1994
GS
3805/*
3806=for apidoc sv_setpvn
3807
3808Copies a string into an SV. The C<len> parameter indicates the number of
9e09f5f2
MHM
3809bytes to be copied. If the C<ptr> argument is NULL the SV will become
3810undefined. Does not handle 'set' magic. See C<sv_setpvn_mg>.
954c1994
GS
3811
3812=cut
3813*/
3814
ef50df4b 3815void
864dbfa3 3816Perl_sv_setpvn(pTHX_ register SV *sv, register const char *ptr, register STRLEN len)
79072805 3817{
97aff369 3818 dVAR;
c6f8c383 3819 register char *dptr;
22c522df 3820
765f542d 3821 SV_CHECK_THINKFIRST_COW_DROP(sv);
463ee0b2 3822 if (!ptr) {
a0d0e21e 3823 (void)SvOK_off(sv);
463ee0b2
LW
3824 return;
3825 }
22c522df
JH
3826 else {
3827 /* len is STRLEN which is unsigned, need to copy to signed */
a3b680e6 3828 const IV iv = len;
9c5ffd7c
JH
3829 if (iv < 0)
3830 Perl_croak(aTHX_ "panic: sv_setpvn called with negative strlen");
22c522df 3831 }
862a34c6 3832 SvUPGRADE(sv, SVt_PV);
c6f8c383 3833
5902b6a9 3834 dptr = SvGROW(sv, len + 1);
c6f8c383
GA
3835 Move(ptr,dptr,len,char);
3836 dptr[len] = '\0';
79072805 3837 SvCUR_set(sv, len);
1aa99e6b 3838 (void)SvPOK_only_UTF8(sv); /* validate pointer */
463ee0b2 3839 SvTAINT(sv);
79072805
LW
3840}
3841
954c1994
GS
3842/*
3843=for apidoc sv_setpvn_mg
3844
3845Like C<sv_setpvn>, but also handles 'set' magic.
3846
3847=cut
3848*/
3849
79072805 3850void
864dbfa3 3851Perl_sv_setpvn_mg(pTHX_ register SV *sv, register const char *ptr, register STRLEN len)
ef50df4b
GS
3852{
3853 sv_setpvn(sv,ptr,len);
3854 SvSETMAGIC(sv);
3855}
3856
954c1994
GS
3857/*
3858=for apidoc sv_setpv
3859
3860Copies a string into an SV. The string must be null-terminated. Does not
3861handle 'set' magic. See C<sv_setpv_mg>.
3862
3863=cut
3864*/
3865
ef50df4b 3866void
864dbfa3 3867Perl_sv_setpv(pTHX_ register SV *sv, register const char *ptr)
79072805 3868{
97aff369 3869 dVAR;
79072805
LW
3870 register STRLEN len;
3871
765f542d 3872 SV_CHECK_THINKFIRST_COW_DROP(sv);
463ee0b2 3873 if (!ptr) {
a0d0e21e 3874 (void)SvOK_off(sv);
463ee0b2
LW
3875 return;
3876 }
79072805 3877 len = strlen(ptr);
862a34c6 3878 SvUPGRADE(sv, SVt_PV);
c6f8c383 3879
79072805 3880 SvGROW(sv, len + 1);
463ee0b2 3881 Move(ptr,SvPVX(sv),len+1,char);
79072805 3882 SvCUR_set(sv, len);
1aa99e6b 3883 (void)SvPOK_only_UTF8(sv); /* validate pointer */
463ee0b2
LW
3884 SvTAINT(sv);
3885}
3886
954c1994
GS
3887/*
3888=for apidoc sv_setpv_mg
3889
3890Like C<sv_setpv>, but also handles 'set' magic.
3891
3892=cut
3893*/
3894
463ee0b2 3895void
864dbfa3 3896Perl_sv_setpv_mg(pTHX_ register SV *sv, register const char *ptr)
ef50df4b
GS
3897{
3898 sv_setpv(sv,ptr);
3899 SvSETMAGIC(sv);
3900}
3901
954c1994 3902/*
47518d95 3903=for apidoc sv_usepvn_flags
954c1994 3904
794a0d33
JH
3905Tells an SV to use C<ptr> to find its string value. Normally the
3906string is stored inside the SV but sv_usepvn allows the SV to use an
3907outside string. The C<ptr> should point to memory that was allocated
c1c21316
NC
3908by C<malloc>. The string length, C<len>, must be supplied. By default
3909this function will realloc (i.e. move) the memory pointed to by C<ptr>,
794a0d33
JH
3910so that pointer should not be freed or used by the programmer after
3911giving it to sv_usepvn, and neither should any pointers from "behind"
c1c21316
NC
3912that pointer (e.g. ptr + 1) be used.
3913
3914If C<flags> & SV_SMAGIC is true, will call SvSETMAGIC. If C<flags> &
3915SV_HAS_TRAILING_NUL is true, then C<ptr[len]> must be NUL, and the realloc
cbf82dd0 3916will be skipped. (i.e. the buffer is actually at least 1 byte longer than
c1c21316 3917C<len>, and already meets the requirements for storing in C<SvPVX>)
954c1994
GS
3918
3919=cut
3920*/
3921
ef50df4b 3922void
47518d95 3923Perl_sv_usepvn_flags(pTHX_ SV *sv, char *ptr, STRLEN len, U32 flags)
463ee0b2 3924{
97aff369 3925 dVAR;
1936d2a7 3926 STRLEN allocate;
765f542d 3927 SV_CHECK_THINKFIRST_COW_DROP(sv);
862a34c6 3928 SvUPGRADE(sv, SVt_PV);
463ee0b2 3929 if (!ptr) {
a0d0e21e 3930 (void)SvOK_off(sv);
47518d95
NC
3931 if (flags & SV_SMAGIC)
3932 SvSETMAGIC(sv);
463ee0b2
LW
3933 return;
3934 }
3f7c398e 3935 if (SvPVX_const(sv))
8bd4d4c5 3936 SvPV_free(sv);
1936d2a7 3937
0b7042f9 3938#ifdef DEBUGGING
2e90b4cd
NC
3939 if (flags & SV_HAS_TRAILING_NUL)
3940 assert(ptr[len] == '\0');
0b7042f9 3941#endif
2e90b4cd 3942
c1c21316 3943 allocate = (flags & SV_HAS_TRAILING_NUL)
8f01dc65 3944 ? len + 1: PERL_STRLEN_ROUNDUP(len + 1);
cbf82dd0
NC
3945 if (flags & SV_HAS_TRAILING_NUL) {
3946 /* It's long enough - do nothing.
3947 Specfically Perl_newCONSTSUB is relying on this. */
3948 } else {
69d25b4f 3949#ifdef DEBUGGING
69d25b4f
NC
3950 /* Force a move to shake out bugs in callers. */
3951 char *new_ptr = safemalloc(allocate);
3952 Copy(ptr, new_ptr, len, char);
3953 PoisonFree(ptr,len,char);
3954 Safefree(ptr);
3955 ptr = new_ptr;
69d25b4f 3956#else
c1c21316 3957 ptr = saferealloc (ptr, allocate);
69d25b4f 3958#endif
cbf82dd0 3959 }
f880fe2f 3960 SvPV_set(sv, ptr);
463ee0b2 3961 SvCUR_set(sv, len);
1936d2a7 3962 SvLEN_set(sv, allocate);
c1c21316
NC
3963 if (!(flags & SV_HAS_TRAILING_NUL)) {
3964 *SvEND(sv) = '\0';
3965 }
1aa99e6b 3966 (void)SvPOK_only_UTF8(sv); /* validate pointer */
463ee0b2 3967 SvTAINT(sv);
47518d95
NC
3968 if (flags & SV_SMAGIC)
3969 SvSETMAGIC(sv);
ef50df4b
GS
3970}
3971
f8c7b90f 3972#ifdef PERL_OLD_COPY_ON_WRITE
765f542d
NC
3973/* Need to do this *after* making the SV normal, as we need the buffer
3974 pointer to remain valid until after we've copied it. If we let go too early,
3975 another thread could invalidate it by unsharing last of the same hash key
3976 (which it can do by means other than releasing copy-on-write SVs)
3977 or by changing the other copy-on-write SVs in the loop. */
3978STATIC void
bdd68bc3 3979S_sv_release_COW(pTHX_ register SV *sv, const char *pvx, STRLEN len, SV *after)
765f542d
NC
3980{
3981 if (len) { /* this SV was SvIsCOW_normal(sv) */
3982 /* we need to find the SV pointing to us. */
cf5629ad 3983 SV *current = SV_COW_NEXT_SV(after);
7a5fa8a2 3984
765f542d
NC
3985 if (current == sv) {
3986 /* The SV we point to points back to us (there were only two of us
3987 in the loop.)
3988 Hence other SV is no longer copy on write either. */
3989 SvFAKE_off(after);
3990 SvREADONLY_off(after);
3991 } else {
3992 /* We need to follow the pointers around the loop. */
3993 SV *next;
3994 while ((next = SV_COW_NEXT_SV(current)) != sv) {
3995 assert (next);
3996 current = next;
3997 /* don't loop forever if the structure is bust, and we have
3998 a pointer into a closed loop. */
3999 assert (current != after);
3f7c398e 4000 assert (SvPVX_const(current) == pvx);
765f542d
NC
4001 }
4002 /* Make the SV before us point to the SV after us. */
a29f6d03 4003 SV_COW_NEXT_SV_SET(current, after);
765f542d
NC
4004 }
4005 } else {
bdd68bc3 4006 unshare_hek(SvSHARED_HEK_FROM_PV(pvx));
765f542d
NC
4007 }
4008}
4009
4010int
4011Perl_sv_release_IVX(pTHX_ register SV *sv)
4012{
4013 if (SvIsCOW(sv))
4014 sv_force_normal_flags(sv, 0);
0c34ef67
MHM
4015 SvOOK_off(sv);
4016 return 0;
765f542d
NC
4017}
4018#endif
645c22ef
DM
4019/*
4020=for apidoc sv_force_normal_flags
4021
4022Undo various types of fakery on an SV: if the PV is a shared string, make
4023a private copy; if we're a ref, stop refing; if we're a glob, downgrade to
765f542d
NC
4024an xpvmg; if we're a copy-on-write scalar, this is the on-write time when
4025we do the copy, and is also used locally. If C<SV_COW_DROP_PV> is set
4026then a copy-on-write scalar drops its PV buffer (if any) and becomes
4027SvPOK_off rather than making a copy. (Used where this scalar is about to be
d3050d9d 4028set to some other value.) In addition, the C<flags> parameter gets passed to
765f542d
NC
4029C<sv_unref_flags()> when unrefing. C<sv_force_normal> calls this function
4030with flags set to 0.
645c22ef
DM
4031
4032=cut
4033*/
4034
6fc92669 4035void
840a7b70 4036Perl_sv_force_normal_flags(pTHX_ register SV *sv, U32 flags)
0f15f207 4037{
97aff369 4038 dVAR;
f8c7b90f 4039#ifdef PERL_OLD_COPY_ON_WRITE
765f542d
NC
4040 if (SvREADONLY(sv)) {
4041 /* At this point I believe I should acquire a global SV mutex. */
4042 if (SvFAKE(sv)) {
b64e5050 4043 const char * const pvx = SvPVX_const(sv);
a28509cc
AL
4044 const STRLEN len = SvLEN(sv);
4045 const STRLEN cur = SvCUR(sv);
a28509cc 4046 SV * const next = SV_COW_NEXT_SV(sv); /* next COW sv in the loop. */
46187eeb
NC
4047 if (DEBUG_C_TEST) {
4048 PerlIO_printf(Perl_debug_log,
4049 "Copy on write: Force normal %ld\n",
4050 (long) flags);
e419cbc5 4051 sv_dump(sv);
46187eeb 4052 }
765f542d
NC
4053 SvFAKE_off(sv);
4054 SvREADONLY_off(sv);
9f653bb5 4055 /* This SV doesn't own the buffer, so need to Newx() a new one: */
6136c704 4056 SvPV_set(sv, NULL);
87a1ef3d 4057 SvLEN_set(sv, 0);
765f542d
NC
4058 if (flags & SV_COW_DROP_PV) {
4059 /* OK, so we don't need to copy our buffer. */
4060 SvPOK_off(sv);
4061 } else {
4062 SvGROW(sv, cur + 1);
4063 Move(pvx,SvPVX(sv),cur,char);
87a1ef3d 4064 SvCUR_set(sv, cur);
765f542d
NC
4065 *SvEND(sv) = '\0';
4066 }
bdd68bc3 4067 sv_release_COW(sv, pvx, len, next);
46187eeb 4068 if (DEBUG_C_TEST) {
e419cbc5 4069 sv_dump(sv);
46187eeb 4070 }
765f542d 4071 }
923e4eb5 4072 else if (IN_PERL_RUNTIME)
765f542d
NC
4073 Perl_croak(aTHX_ PL_no_modify);
4074 /* At this point I believe that I can drop the global SV mutex. */
4075 }
4076#else
2213622d 4077 if (SvREADONLY(sv)) {
1c846c1f 4078 if (SvFAKE(sv)) {
b64e5050 4079 const char * const pvx = SvPVX_const(sv);
66a1b24b 4080 const STRLEN len = SvCUR(sv);
10bcdfd6
NC
4081 SvFAKE_off(sv);
4082 SvREADONLY_off(sv);
bd61b366 4083 SvPV_set(sv, NULL);
66a1b24b 4084 SvLEN_set(sv, 0);
1c846c1f 4085 SvGROW(sv, len + 1);
706aa1c9 4086 Move(pvx,SvPVX(sv),len,char);
1c846c1f 4087 *SvEND(sv) = '\0';
bdd68bc3 4088 unshare_hek(SvSHARED_HEK_FROM_PV(pvx));
1c846c1f 4089 }
923e4eb5 4090 else if (IN_PERL_RUNTIME)
cea2e8a9 4091 Perl_croak(aTHX_ PL_no_modify);
0f15f207 4092 }
765f542d 4093#endif
2213622d 4094 if (SvROK(sv))
840a7b70 4095 sv_unref_flags(sv, flags);
6fc92669
GS
4096 else if (SvFAKE(sv) && SvTYPE(sv) == SVt_PVGV)
4097 sv_unglob(sv);
0f15f207 4098}
1c846c1f 4099
645c22ef 4100/*
954c1994
GS
4101=for apidoc sv_chop
4102
1c846c1f 4103Efficient removal of characters from the beginning of the string buffer.
954c1994
GS
4104SvPOK(sv) must be true and the C<ptr> must be a pointer to somewhere inside
4105the string buffer. The C<ptr> becomes the first character of the adjusted
645c22ef 4106string. Uses the "OOK hack".
3f7c398e 4107Beware: after this function returns, C<ptr> and SvPVX_const(sv) may no longer
31869a79 4108refer to the same chunk of data.
954c1994
GS
4109
4110=cut
4111*/
4112
79072805 4113void
f54cb97a 4114Perl_sv_chop(pTHX_ register SV *sv, register const char *ptr)
79072805
LW
4115{
4116 register STRLEN delta;
a0d0e21e 4117 if (!ptr || !SvPOKp(sv))
79072805 4118 return;
3f7c398e 4119 delta = ptr - SvPVX_const(sv);
2213622d 4120 SV_CHECK_THINKFIRST(sv);
79072805
LW
4121 if (SvTYPE(sv) < SVt_PVIV)
4122 sv_upgrade(sv,SVt_PVIV);
4123
4124 if (!SvOOK(sv)) {
50483b2c 4125 if (!SvLEN(sv)) { /* make copy of shared string */
3f7c398e 4126 const char *pvx = SvPVX_const(sv);
a28509cc 4127 const STRLEN len = SvCUR(sv);
50483b2c 4128 SvGROW(sv, len + 1);
706aa1c9 4129 Move(pvx,SvPVX(sv),len,char);
50483b2c
JD
4130 *SvEND(sv) = '\0';
4131 }
45977657 4132 SvIV_set(sv, 0);
a4bfb290
AB
4133 /* Same SvOOK_on but SvOOK_on does a SvIOK_off
4134 and we do that anyway inside the SvNIOK_off
4135 */
7a5fa8a2 4136 SvFLAGS(sv) |= SVf_OOK;
79072805 4137 }
a4bfb290 4138 SvNIOK_off(sv);
b162af07
SP
4139 SvLEN_set(sv, SvLEN(sv) - delta);
4140 SvCUR_set(sv, SvCUR(sv) - delta);
f880fe2f 4141 SvPV_set(sv, SvPVX(sv) + delta);
45977657 4142 SvIV_set(sv, SvIVX(sv) + delta);
79072805
LW
4143}
4144
954c1994
GS
4145/*
4146=for apidoc sv_catpvn
4147
4148Concatenates the string onto the end of the string which is in the SV. The
1e54db1a
JH
4149C<len> indicates number of bytes to copy. If the SV has the UTF-8
4150status set, then the bytes appended should be valid UTF-8.
d5ce4a7c 4151Handles 'get' magic, but not 'set' magic. See C<sv_catpvn_mg>.
954c1994 4152
8d6d96c1
HS
4153=for apidoc sv_catpvn_flags
4154
4155Concatenates the string onto the end of the string which is in the SV. The
1e54db1a
JH
4156C<len> indicates number of bytes to copy. If the SV has the UTF-8
4157status set, then the bytes appended should be valid UTF-8.
8d6d96c1
HS
4158If C<flags> has C<SV_GMAGIC> bit set, will C<mg_get> on C<dsv> if
4159appropriate, else not. C<sv_catpvn> and C<sv_catpvn_nomg> are implemented
4160in terms of this function.
4161
4162=cut
4163*/
4164
4165void
4166Perl_sv_catpvn_flags(pTHX_ register SV *dsv, register const char *sstr, register STRLEN slen, I32 flags)
4167{
97aff369 4168 dVAR;
8d6d96c1 4169 STRLEN dlen;
fabdb6c0 4170 const char * const dstr = SvPV_force_flags(dsv, dlen, flags);
8d6d96c1 4171
8d6d96c1
HS
4172 SvGROW(dsv, dlen + slen + 1);
4173 if (sstr == dstr)
3f7c398e 4174 sstr = SvPVX_const(dsv);
8d6d96c1 4175 Move(sstr, SvPVX(dsv) + dlen, slen, char);
b162af07 4176 SvCUR_set(dsv, SvCUR(dsv) + slen);
8d6d96c1
HS
4177 *SvEND(dsv) = '\0';
4178 (void)SvPOK_only_UTF8(dsv); /* validate pointer */
4179 SvTAINT(dsv);
bddd5118
NC
4180 if (flags & SV_SMAGIC)
4181 SvSETMAGIC(dsv);
79072805
LW
4182}
4183
954c1994 4184/*
954c1994
GS
4185=for apidoc sv_catsv
4186
13e8c8e3
JH
4187Concatenates the string from SV C<ssv> onto the end of the string in
4188SV C<dsv>. Modifies C<dsv> but not C<ssv>. Handles 'get' magic, but
4189not 'set' magic. See C<sv_catsv_mg>.
954c1994 4190
8d6d96c1
HS
4191=for apidoc sv_catsv_flags
4192
4193Concatenates the string from SV C<ssv> onto the end of the string in
4194SV C<dsv>. Modifies C<dsv> but not C<ssv>. If C<flags> has C<SV_GMAGIC>
4195bit set, will C<mg_get> on the SVs if appropriate, else not. C<sv_catsv>
4196and C<sv_catsv_nomg> are implemented in terms of this function.
4197
4198=cut */
4199
ef50df4b 4200void
8d6d96c1 4201Perl_sv_catsv_flags(pTHX_ SV *dsv, register SV *ssv, I32 flags)
79072805 4202{
97aff369 4203 dVAR;
bddd5118 4204 if (ssv) {
00b6aa41
AL
4205 STRLEN slen;
4206 const char *spv = SvPV_const(ssv, slen);
4207 if (spv) {
bddd5118
NC
4208 /* sutf8 and dutf8 were type bool, but under USE_ITHREADS,
4209 gcc version 2.95.2 20000220 (Debian GNU/Linux) for
4210 Linux xxx 2.2.17 on sparc64 with gcc -O2, we erroneously
4211 get dutf8 = 0x20000000, (i.e. SVf_UTF8) even though
4212 dsv->sv_flags doesn't have that bit set.
4fd84b44 4213 Andy Dougherty 12 Oct 2001
bddd5118
NC
4214 */
4215 const I32 sutf8 = DO_UTF8(ssv);
4216 I32 dutf8;
13e8c8e3 4217
bddd5118
NC
4218 if (SvGMAGICAL(dsv) && (flags & SV_GMAGIC))
4219 mg_get(dsv);
4220 dutf8 = DO_UTF8(dsv);
8d6d96c1 4221
bddd5118
NC
4222 if (dutf8 != sutf8) {
4223 if (dutf8) {
4224 /* Not modifying source SV, so taking a temporary copy. */
00b6aa41 4225 SV* const csv = sv_2mortal(newSVpvn(spv, slen));
13e8c8e3 4226
bddd5118
NC
4227 sv_utf8_upgrade(csv);
4228 spv = SvPV_const(csv, slen);
4229 }
4230 else
4231 sv_utf8_upgrade_nomg(dsv);
13e8c8e3 4232 }
bddd5118 4233 sv_catpvn_nomg(dsv, spv, slen);
e84ff256 4234 }
560a288e 4235 }
bddd5118
NC
4236 if (flags & SV_SMAGIC)
4237 SvSETMAGIC(dsv);
79072805
LW
4238}
4239
954c1994 4240/*
954c1994
GS
4241=for apidoc sv_catpv
4242
4243Concatenates the string onto the end of the string which is in the SV.
1e54db1a
JH
4244If the SV has the UTF-8 status set, then the bytes appended should be
4245valid UTF-8. Handles 'get' magic, but not 'set' magic. See C<sv_catpv_mg>.
954c1994 4246
d5ce4a7c 4247=cut */
954c1994 4248
ef50df4b 4249void
0c981600 4250Perl_sv_catpv(pTHX_ register SV *sv, register const char *ptr)
79072805 4251{
97aff369 4252 dVAR;
79072805 4253 register STRLEN len;
463ee0b2 4254 STRLEN tlen;
748a9306 4255 char *junk;
79072805 4256
0c981600 4257 if (!ptr)
79072805 4258 return;
748a9306 4259 junk = SvPV_force(sv, tlen);
0c981600 4260 len = strlen(ptr);
463ee0b2 4261 SvGROW(sv, tlen + len + 1);
0c981600 4262 if (ptr == junk)
3f7c398e 4263 ptr = SvPVX_const(sv);
0c981600 4264 Move(ptr,SvPVX(sv)+tlen,len+1,char);
b162af07 4265 SvCUR_set(sv, SvCUR(sv) + len);
d41ff1b8 4266 (void)SvPOK_only_UTF8(sv); /* validate pointer */
463ee0b2 4267 SvTAINT(sv);
79072805
LW
4268}
4269
954c1994
GS
4270/*
4271=for apidoc sv_catpv_mg
4272
4273Like C<sv_catpv>, but also handles 'set' magic.
4274
4275=cut
4276*/
4277
ef50df4b 4278void
0c981600 4279Perl_sv_catpv_mg(pTHX_ register SV *sv, register const char *ptr)
ef50df4b 4280{
0c981600 4281 sv_catpv(sv,ptr);
ef50df4b
GS
4282 SvSETMAGIC(sv);
4283}
4284
645c22ef
DM
4285/*
4286=for apidoc newSV
4287
561b68a9
SH
4288Creates a new SV. A non-zero C<len> parameter indicates the number of
4289bytes of preallocated string space the SV should have. An extra byte for a
4290trailing NUL is also reserved. (SvPOK is not set for the SV even if string
4291space is allocated.) The reference count for the new SV is set to 1.
4292
4293In 5.9.3, newSV() replaces the older NEWSV() API, and drops the first
4294parameter, I<x>, a debug aid which allowed callers to identify themselves.
4295This aid has been superseded by a new build option, PERL_MEM_LOG (see
4296L<perlhack/PERL_MEM_LOG>). The older API is still there for use in XS
4297modules supporting older perls.
645c22ef
DM
4298
4299=cut
4300*/
4301
79072805 4302SV *
864dbfa3 4303Perl_newSV(pTHX_ STRLEN len)
79072805 4304{
97aff369 4305 dVAR;
79072805 4306 register SV *sv;
1c846c1f 4307
4561caa4 4308 new_SV(sv);
79072805
LW
4309 if (len) {
4310 sv_upgrade(sv, SVt_PV);
4311 SvGROW(sv, len + 1);
4312 }
4313 return sv;
4314}
954c1994 4315/*
92110913 4316=for apidoc sv_magicext
954c1994 4317
68795e93 4318Adds magic to an SV, upgrading it if necessary. Applies the
2d8d5d5a 4319supplied vtable and returns a pointer to the magic added.
92110913 4320
2d8d5d5a
SH
4321Note that C<sv_magicext> will allow things that C<sv_magic> will not.
4322In particular, you can add magic to SvREADONLY SVs, and add more than
4323one instance of the same 'how'.
645c22ef 4324
2d8d5d5a
SH
4325If C<namlen> is greater than zero then a C<savepvn> I<copy> of C<name> is
4326stored, if C<namlen> is zero then C<name> is stored as-is and - as another
4327special case - if C<(name && namlen == HEf_SVKEY)> then C<name> is assumed
4328to contain an C<SV*> and is stored as-is with its REFCNT incremented.
92110913 4329
2d8d5d5a 4330(This is now used as a subroutine by C<sv_magic>.)
954c1994
GS
4331
4332=cut
4333*/
92110913 4334MAGIC *
92e67595 4335Perl_sv_magicext(pTHX_ SV* sv, SV* obj, int how, MGVTBL *vtable,
92110913 4336 const char* name, I32 namlen)
79072805 4337{
97aff369 4338 dVAR;
79072805 4339 MAGIC* mg;
68795e93 4340
92110913 4341 if (SvTYPE(sv) < SVt_PVMG) {
862a34c6 4342 SvUPGRADE(sv, SVt_PVMG);
463ee0b2 4343 }
a02a5408 4344 Newxz(mg, 1, MAGIC);
79072805 4345 mg->mg_moremagic = SvMAGIC(sv);
b162af07 4346 SvMAGIC_set(sv, mg);
75f9d97a 4347
05f95b08
SB
4348 /* Sometimes a magic contains a reference loop, where the sv and
4349 object refer to each other. To prevent a reference loop that
4350 would prevent such objects being freed, we look for such loops
4351 and if we find one we avoid incrementing the object refcount.
87f0b213
JH
4352
4353 Note we cannot do this to avoid self-tie loops as intervening RV must
b5ccf5f2 4354 have its REFCNT incremented to keep it in existence.
87f0b213
JH
4355
4356 */
14befaf4
DM
4357 if (!obj || obj == sv ||
4358 how == PERL_MAGIC_arylen ||
4359 how == PERL_MAGIC_qr ||
8d2f4536 4360 how == PERL_MAGIC_symtab ||
75f9d97a
JH
4361 (SvTYPE(obj) == SVt_PVGV &&
4362 (GvSV(obj) == sv || GvHV(obj) == (HV*)sv || GvAV(obj) == (AV*)sv ||
4363 GvCV(obj) == (CV*)sv || GvIOp(obj) == (IO*)sv ||
2628be26 4364 GvFORM(obj) == (CV*)sv)))
75f9d97a 4365 {
8990e307 4366 mg->mg_obj = obj;
75f9d97a 4367 }
85e6fe83 4368 else {
b37c2d43 4369 mg->mg_obj = SvREFCNT_inc_simple(obj);
85e6fe83
LW
4370 mg->mg_flags |= MGf_REFCOUNTED;
4371 }
b5ccf5f2
YST
4372
4373 /* Normal self-ties simply pass a null object, and instead of
4374 using mg_obj directly, use the SvTIED_obj macro to produce a
4375 new RV as needed. For glob "self-ties", we are tieing the PVIO
4376 with an RV obj pointing to the glob containing the PVIO. In
4377 this case, to avoid a reference loop, we need to weaken the
4378 reference.
4379 */
4380
4381 if (how == PERL_MAGIC_tiedscalar && SvTYPE(sv) == SVt_PVIO &&
4382 obj && SvROK(obj) && GvIO(SvRV(obj)) == (IO*)sv)
4383 {
4384 sv_rvweaken(obj);
4385 }
4386
79072805 4387 mg->mg_type = how;
565764a8 4388 mg->mg_len = namlen;
9cbac4c7 4389 if (name) {
92110913 4390 if (namlen > 0)
1edc1566 4391 mg->mg_ptr = savepvn(name, namlen);
c6ee37c5 4392 else if (namlen == HEf_SVKEY)
b37c2d43 4393 mg->mg_ptr = (char*)SvREFCNT_inc_simple_NN((SV*)name);
68795e93 4394 else
92110913 4395 mg->mg_ptr = (char *) name;
9cbac4c7 4396 }
92110913 4397 mg->mg_virtual = vtable;
68795e93 4398
92110913
NIS
4399 mg_magical(sv);
4400 if (SvGMAGICAL(sv))
4401 SvFLAGS(sv) &= ~(SVf_IOK|SVf_NOK|SVf_POK);
4402 return mg;
4403}
4404
4405/*
4406=for apidoc sv_magic
1c846c1f 4407
92110913
NIS
4408Adds magic to an SV. First upgrades C<sv> to type C<SVt_PVMG> if necessary,
4409then adds a new magic item of type C<how> to the head of the magic list.
4410
2d8d5d5a
SH
4411See C<sv_magicext> (which C<sv_magic> now calls) for a description of the
4412handling of the C<name> and C<namlen> arguments.
4413
4509d3fb
SB
4414You need to use C<sv_magicext> to add magic to SvREADONLY SVs and also
4415to add more than one instance of the same 'how'.
4416
92110913
NIS
4417=cut
4418*/
4419
4420void
4421Perl_sv_magic(pTHX_ register SV *sv, SV *obj, int how, const char *name, I32 namlen)
68795e93 4422{
97aff369 4423 dVAR;
92e67595 4424 MGVTBL *vtable;
92110913 4425 MAGIC* mg;
92110913 4426
f8c7b90f 4427#ifdef PERL_OLD_COPY_ON_WRITE
765f542d
NC
4428 if (SvIsCOW(sv))
4429 sv_force_normal_flags(sv, 0);
4430#endif
92110913 4431 if (SvREADONLY(sv)) {
d8084ca5
DM
4432 if (
4433 /* its okay to attach magic to shared strings; the subsequent
4434 * upgrade to PVMG will unshare the string */
4435 !(SvFAKE(sv) && SvTYPE(sv) < SVt_PVMG)
4436
4437 && IN_PERL_RUNTIME
92110913
NIS
4438 && how != PERL_MAGIC_regex_global
4439 && how != PERL_MAGIC_bm
4440 && how != PERL_MAGIC_fm
4441 && how != PERL_MAGIC_sv
e6469971 4442 && how != PERL_MAGIC_backref
92110913
NIS
4443 )
4444 {
4445 Perl_croak(aTHX_ PL_no_modify);
4446 }
4447 }
4448 if (SvMAGICAL(sv) || (how == PERL_MAGIC_taint && SvTYPE(sv) >= SVt_PVMG)) {
4449 if (SvMAGIC(sv) && (mg = mg_find(sv, how))) {
68795e93
NIS
4450 /* sv_magic() refuses to add a magic of the same 'how' as an
4451 existing one
92110913 4452 */
2a509ed3 4453 if (how == PERL_MAGIC_taint) {
92110913 4454 mg->mg_len |= 1;
2a509ed3
NC
4455 /* Any scalar which already had taint magic on which someone
4456 (erroneously?) did SvIOK_on() or similar will now be
4457 incorrectly sporting public "OK" flags. */
4458 SvFLAGS(sv) &= ~(SVf_IOK|SVf_NOK|SVf_POK);
4459 }
92110913
NIS
4460 return;
4461 }
4462 }
68795e93 4463
79072805 4464 switch (how) {
14befaf4 4465 case PERL_MAGIC_sv:
92110913 4466 vtable = &PL_vtbl_sv;
79072805 4467 break;
14befaf4 4468 case PERL_MAGIC_overload:
92110913 4469 vtable = &PL_vtbl_amagic;
a0d0e21e 4470 break;
14befaf4 4471 case PERL_MAGIC_overload_elem:
92110913 4472 vtable = &PL_vtbl_amagicelem;
a0d0e21e 4473 break;
14befaf4 4474 case PERL_MAGIC_overload_table:
92110913 4475 vtable = &PL_vtbl_ovrld;
a0d0e21e 4476 break;
14befaf4 4477 case PERL_MAGIC_bm:
92110913 4478 vtable = &PL_vtbl_bm;
79072805 4479 break;
14befaf4 4480 case PERL_MAGIC_regdata:
92110913 4481 vtable = &PL_vtbl_regdata;
6cef1e77 4482 break;
14befaf4 4483 case PERL_MAGIC_regdatum:
92110913 4484 vtable = &PL_vtbl_regdatum;
6cef1e77 4485 break;
14befaf4 4486 case PERL_MAGIC_env:
92110913 4487 vtable = &PL_vtbl_env;
79072805 4488 break;
14befaf4 4489 case PERL_MAGIC_fm:
92110913 4490 vtable = &PL_vtbl_fm;
55497cff 4491 break;
14befaf4 4492 case PERL_MAGIC_envelem:
92110913 4493 vtable = &PL_vtbl_envelem;
79072805 4494 break;
14befaf4 4495 case PERL_MAGIC_regex_global:
92110913 4496 vtable = &PL_vtbl_mglob;
93a17b20 4497 break;
14befaf4 4498 case PERL_MAGIC_isa:
92110913 4499 vtable = &PL_vtbl_isa;
463ee0b2 4500 break;
14befaf4 4501 case PERL_MAGIC_isaelem:
92110913 4502 vtable = &PL_vtbl_isaelem;
463ee0b2 4503 break;
14befaf4 4504 case PERL_MAGIC_nkeys:
92110913 4505 vtable = &PL_vtbl_nkeys;
16660edb 4506 break;
14befaf4 4507 case PERL_MAGIC_dbfile:
aec46f14 4508 vtable = NULL;
93a17b20 4509 break;
14befaf4 4510 case PERL_MAGIC_dbline:
92110913 4511 vtable = &PL_vtbl_dbline;
79072805 4512 break;
36477c24 4513#ifdef USE_LOCALE_COLLATE
14befaf4 4514 case PERL_MAGIC_collxfrm:
92110913 4515 vtable = &PL_vtbl_collxfrm;
bbce6d69 4516 break;
36477c24 4517#endif /* USE_LOCALE_COLLATE */
14befaf4 4518 case PERL_MAGIC_tied:
92110913 4519 vtable = &PL_vtbl_pack;
463ee0b2 4520 break;
14befaf4
DM
4521 case PERL_MAGIC_tiedelem:
4522 case PERL_MAGIC_tiedscalar:
92110913 4523 vtable = &PL_vtbl_packelem;
463ee0b2 4524 break;
14befaf4 4525 case PERL_MAGIC_qr:
92110913 4526 vtable = &PL_vtbl_regexp;
c277df42 4527 break;
b3ca2e83
NC
4528 case PERL_MAGIC_hints:
4529 /* As this vtable is all NULL, we can reuse it. */
14befaf4 4530 case PERL_MAGIC_sig:
92110913 4531 vtable = &PL_vtbl_sig;
79072805 4532 break;
14befaf4 4533 case PERL_MAGIC_sigelem:
92110913 4534 vtable = &PL_vtbl_sigelem;
79072805 4535 break;
14befaf4 4536 case PERL_MAGIC_taint:
92110913 4537 vtable = &PL_vtbl_taint;
463ee0b2 4538 break;
14befaf4 4539 case PERL_MAGIC_uvar:
92110913 4540 vtable = &PL_vtbl_uvar;
79072805 4541 break;
14befaf4 4542 case PERL_MAGIC_vec:
92110913 4543 vtable = &PL_vtbl_vec;
79072805 4544 break;
a3874608 4545 case PERL_MAGIC_arylen_p:
bfcb3514 4546 case PERL_MAGIC_rhash:
8d2f4536 4547 case PERL_MAGIC_symtab:
ece467f9 4548 case PERL_MAGIC_vstring:
aec46f14 4549 vtable = NULL;
ece467f9 4550 break;
7e8c5dac
HS
4551 case PERL_MAGIC_utf8:
4552 vtable = &PL_vtbl_utf8;
4553 break;
14befaf4 4554 case PERL_MAGIC_substr:
92110913 4555 vtable = &PL_vtbl_substr;
79072805 4556 break;
14befaf4 4557 case PERL_MAGIC_defelem:
92110913 4558 vtable = &PL_vtbl_defelem;
5f05dabc 4559 break;
14befaf4 4560 case PERL_MAGIC_arylen:
92110913 4561 vtable = &PL_vtbl_arylen;
79072805 4562 break;
14befaf4 4563 case PERL_MAGIC_pos:
92110913 4564 vtable = &PL_vtbl_pos;
a0d0e21e 4565 break;
14befaf4 4566 case PERL_MAGIC_backref:
92110913 4567 vtable = &PL_vtbl_backref;
810b8aa5 4568 break;
b3ca2e83
NC
4569 case PERL_MAGIC_hintselem:
4570 vtable = &PL_vtbl_hintselem;
4571 break;
14befaf4
DM
4572 case PERL_MAGIC_ext:
4573 /* Reserved for use by extensions not perl internals. */
4633a7c4
LW
4574 /* Useful for attaching extension internal data to perl vars. */
4575 /* Note that multiple extensions may clash if magical scalars */
4576 /* etc holding private data from one are passed to another. */
aec46f14 4577 vtable = NULL;
a0d0e21e 4578 break;
79072805 4579 default:
14befaf4 4580 Perl_croak(aTHX_ "Don't know how to handle magic of type \\%o", how);
463ee0b2 4581 }
68795e93 4582
92110913 4583 /* Rest of work is done else where */
aec46f14 4584 mg = sv_magicext(sv,obj,how,vtable,name,namlen);
68795e93 4585
92110913
NIS
4586 switch (how) {
4587 case PERL_MAGIC_taint:
4588 mg->mg_len = 1;
4589 break;
4590 case PERL_MAGIC_ext:
4591 case PERL_MAGIC_dbfile:
4592 SvRMAGICAL_on(sv);
4593 break;
4594 }
463ee0b2
LW
4595}
4596
c461cf8f
JH
4597/*
4598=for apidoc sv_unmagic
4599
645c22ef 4600Removes all magic of type C<type> from an SV.
c461cf8f
JH
4601
4602=cut
4603*/
4604
463ee0b2 4605int
864dbfa3 4606Perl_sv_unmagic(pTHX_ SV *sv, int type)
463ee0b2
LW
4607{
4608 MAGIC* mg;
4609 MAGIC** mgp;
91bba347 4610 if (SvTYPE(sv) < SVt_PVMG || !SvMAGIC(sv))
463ee0b2 4611 return 0;
064cf529 4612 mgp = &(((XPVMG*) SvANY(sv))->xmg_u.xmg_magic);
463ee0b2
LW
4613 for (mg = *mgp; mg; mg = *mgp) {
4614 if (mg->mg_type == type) {
e1ec3a88 4615 const MGVTBL* const vtbl = mg->mg_virtual;
463ee0b2 4616 *mgp = mg->mg_moremagic;
1d7c1841 4617 if (vtbl && vtbl->svt_free)
fc0dc3b3 4618 CALL_FPTR(vtbl->svt_free)(aTHX_ sv, mg);
14befaf4 4619 if (mg->mg_ptr && mg->mg_type != PERL_MAGIC_regex_global) {
92110913 4620 if (mg->mg_len > 0)
1edc1566 4621 Safefree(mg->mg_ptr);
565764a8 4622 else if (mg->mg_len == HEf_SVKEY)
1edc1566 4623 SvREFCNT_dec((SV*)mg->mg_ptr);
d2923cdd 4624 else if (mg->mg_type == PERL_MAGIC_utf8)
7e8c5dac 4625 Safefree(mg->mg_ptr);
9cbac4c7 4626 }
a0d0e21e
LW
4627 if (mg->mg_flags & MGf_REFCOUNTED)
4628 SvREFCNT_dec(mg->mg_obj);
463ee0b2
LW
4629 Safefree(mg);
4630 }
4631 else
4632 mgp = &mg->mg_moremagic;
79072805 4633 }
91bba347 4634 if (!SvMAGIC(sv)) {
463ee0b2 4635 SvMAGICAL_off(sv);
c268c2a6 4636 SvFLAGS(sv) |= (SvFLAGS(sv) & (SVp_IOK|SVp_NOK|SVp_POK)) >> PRIVSHIFT;
86f55936 4637 SvMAGIC_set(sv, NULL);
463ee0b2
LW
4638 }
4639
4640 return 0;
79072805
LW
4641}
4642
c461cf8f
JH
4643/*
4644=for apidoc sv_rvweaken
4645
645c22ef
DM
4646Weaken a reference: set the C<SvWEAKREF> flag on this RV; give the
4647referred-to SV C<PERL_MAGIC_backref> magic if it hasn't already; and
4648push a back-reference to this RV onto the array of backreferences
1e73acc8
AS
4649associated with that magic. If the RV is magical, set magic will be
4650called after the RV is cleared.
c461cf8f
JH
4651
4652=cut
4653*/
4654
810b8aa5 4655SV *
864dbfa3 4656Perl_sv_rvweaken(pTHX_ SV *sv)
810b8aa5
GS
4657{
4658 SV *tsv;
4659 if (!SvOK(sv)) /* let undefs pass */
4660 return sv;
4661 if (!SvROK(sv))
cea2e8a9 4662 Perl_croak(aTHX_ "Can't weaken a nonreference");
810b8aa5 4663 else if (SvWEAKREF(sv)) {
810b8aa5 4664 if (ckWARN(WARN_MISC))
9014280d 4665 Perl_warner(aTHX_ packWARN(WARN_MISC), "Reference is already weak");
810b8aa5
GS
4666 return sv;
4667 }
4668 tsv = SvRV(sv);
e15faf7d 4669 Perl_sv_add_backref(aTHX_ tsv, sv);
810b8aa5 4670 SvWEAKREF_on(sv);
1c846c1f 4671 SvREFCNT_dec(tsv);
810b8aa5
GS
4672 return sv;
4673}
4674
645c22ef
DM
4675/* Give tsv backref magic if it hasn't already got it, then push a
4676 * back-reference to sv onto the array associated with the backref magic.
4677 */
4678
e15faf7d
NC
4679void
4680Perl_sv_add_backref(pTHX_ SV *tsv, SV *sv)
810b8aa5 4681{
97aff369 4682 dVAR;
810b8aa5 4683 AV *av;
86f55936
NC
4684
4685 if (SvTYPE(tsv) == SVt_PVHV) {
4686 AV **const avp = Perl_hv_backreferences_p(aTHX_ (HV*)tsv);
4687
4688 av = *avp;
4689 if (!av) {
4690 /* There is no AV in the offical place - try a fixup. */
4691 MAGIC *const mg = mg_find(tsv, PERL_MAGIC_backref);
4692
4693 if (mg) {
4694 /* Aha. They've got it stowed in magic. Bring it back. */
4695 av = (AV*)mg->mg_obj;
4696 /* Stop mg_free decreasing the refernce count. */
4697 mg->mg_obj = NULL;
4698 /* Stop mg_free even calling the destructor, given that
4699 there's no AV to free up. */
4700 mg->mg_virtual = 0;
4701 sv_unmagic(tsv, PERL_MAGIC_backref);
4702 } else {
4703 av = newAV();
4704 AvREAL_off(av);
b37c2d43 4705 SvREFCNT_inc_simple_void(av);
86f55936
NC
4706 }
4707 *avp = av;
4708 }
4709 } else {
4710 const MAGIC *const mg
4711 = SvMAGICAL(tsv) ? mg_find(tsv, PERL_MAGIC_backref) : NULL;
4712 if (mg)
4713 av = (AV*)mg->mg_obj;
4714 else {
4715 av = newAV();
4716 AvREAL_off(av);
4717 sv_magic(tsv, (SV*)av, PERL_MAGIC_backref, NULL, 0);
4718 /* av now has a refcnt of 2, which avoids it getting freed
4719 * before us during global cleanup. The extra ref is removed
4720 * by magic_killbackrefs() when tsv is being freed */
4721 }
810b8aa5 4722 }
d91d49e8 4723 if (AvFILLp(av) >= AvMAX(av)) {
d91d49e8
MM
4724 av_extend(av, AvFILLp(av)+1);
4725 }
4726 AvARRAY(av)[++AvFILLp(av)] = sv; /* av_push() */
810b8aa5
GS
4727}
4728
645c22ef
DM
4729/* delete a back-reference to ourselves from the backref magic associated
4730 * with the SV we point to.
4731 */
4732
1c846c1f 4733STATIC void
e15faf7d 4734S_sv_del_backref(pTHX_ SV *tsv, SV *sv)
810b8aa5 4735{
97aff369 4736 dVAR;
86f55936 4737 AV *av = NULL;
810b8aa5
GS
4738 SV **svp;
4739 I32 i;
86f55936
NC
4740
4741 if (SvTYPE(tsv) == SVt_PVHV && SvOOK(tsv)) {
4742 av = *Perl_hv_backreferences_p(aTHX_ (HV*)tsv);
5b285ea4
NC
4743 /* We mustn't attempt to "fix up" the hash here by moving the
4744 backreference array back to the hv_aux structure, as that is stored
4745 in the main HvARRAY(), and hfreentries assumes that no-one
4746 reallocates HvARRAY() while it is running. */
86f55936
NC
4747 }
4748 if (!av) {
4749 const MAGIC *const mg
4750 = SvMAGICAL(tsv) ? mg_find(tsv, PERL_MAGIC_backref) : NULL;
4751 if (mg)
4752 av = (AV *)mg->mg_obj;
4753 }
4754 if (!av) {
e15faf7d
NC
4755 if (PL_in_clean_all)
4756 return;
cea2e8a9 4757 Perl_croak(aTHX_ "panic: del_backref");
86f55936
NC
4758 }
4759
4760 if (SvIS_FREED(av))
4761 return;
4762
810b8aa5 4763 svp = AvARRAY(av);
6a76db8b
NC
4764 /* We shouldn't be in here more than once, but for paranoia reasons lets
4765 not assume this. */
4766 for (i = AvFILLp(av); i >= 0; i--) {
4767 if (svp[i] == sv) {
4768 const SSize_t fill = AvFILLp(av);
4769 if (i != fill) {
4770 /* We weren't the last entry.
4771 An unordered list has this property that you can take the
4772 last element off the end to fill the hole, and it's still
4773 an unordered list :-)
4774 */
4775 svp[i] = svp[fill];
4776 }
a0714e2c 4777 svp[fill] = NULL;
6a76db8b
NC
4778 AvFILLp(av) = fill - 1;
4779 }
4780 }
810b8aa5
GS
4781}
4782
86f55936
NC
4783int
4784Perl_sv_kill_backrefs(pTHX_ SV *sv, AV *av)
4785{
4786 SV **svp = AvARRAY(av);
4787
4788 PERL_UNUSED_ARG(sv);
4789
4790 /* Not sure why the av can get freed ahead of its sv, but somehow it does
4791 in ext/B/t/bytecode.t test 15 (involving print <DATA>) */
4792 if (svp && !SvIS_FREED(av)) {
4793 SV *const *const last = svp + AvFILLp(av);
4794
4795 while (svp <= last) {
4796 if (*svp) {
4797 SV *const referrer = *svp;
4798 if (SvWEAKREF(referrer)) {
4799 /* XXX Should we check that it hasn't changed? */
4800 SvRV_set(referrer, 0);
4801 SvOK_off(referrer);
4802 SvWEAKREF_off(referrer);
1e73acc8 4803 SvSETMAGIC(referrer);
86f55936
NC
4804 } else if (SvTYPE(referrer) == SVt_PVGV ||
4805 SvTYPE(referrer) == SVt_PVLV) {
4806 /* You lookin' at me? */
4807 assert(GvSTASH(referrer));
4808 assert(GvSTASH(referrer) == (HV*)sv);
4809 GvSTASH(referrer) = 0;
4810 } else {
4811 Perl_croak(aTHX_
4812 "panic: magic_killbackrefs (flags=%"UVxf")",
4813 (UV)SvFLAGS(referrer));
4814 }
4815
a0714e2c 4816 *svp = NULL;
86f55936
NC
4817 }
4818 svp++;
4819 }
4820 }
4821 SvREFCNT_dec(av); /* remove extra count added by sv_add_backref() */
4822 return 0;
4823}
4824
954c1994
GS
4825/*
4826=for apidoc sv_insert
4827
4828Inserts a string at the specified offset/length within the SV. Similar to
4829the Perl substr() function.
4830
4831=cut
4832*/
4833
79072805 4834void
e1ec3a88 4835Perl_sv_insert(pTHX_ SV *bigstr, STRLEN offset, STRLEN len, const char *little, STRLEN littlelen)
79072805 4836{
97aff369 4837 dVAR;
79072805
LW
4838 register char *big;
4839 register char *mid;
4840 register char *midend;
4841 register char *bigend;
4842 register I32 i;
6ff81951 4843 STRLEN curlen;
1c846c1f 4844
79072805 4845
8990e307 4846 if (!bigstr)
cea2e8a9 4847 Perl_croak(aTHX_ "Can't modify non-existent substring");
6ff81951 4848 SvPV_force(bigstr, curlen);
60fa28ff 4849 (void)SvPOK_only_UTF8(bigstr);
6ff81951
GS
4850 if (offset + len > curlen) {
4851 SvGROW(bigstr, offset+len+1);
93524f2b 4852 Zero(SvPVX(bigstr)+curlen, offset+len-curlen, char);
6ff81951
GS
4853 SvCUR_set(bigstr, offset+len);
4854 }
79072805 4855
69b47968 4856 SvTAINT(bigstr);
79072805
LW
4857 i = littlelen - len;
4858 if (i > 0) { /* string might grow */
a0d0e21e 4859 big = SvGROW(bigstr, SvCUR(bigstr) + i + 1);
79072805
LW
4860 mid = big + offset + len;
4861 midend = bigend = big + SvCUR(bigstr);
4862 bigend += i;
4863 *bigend = '\0';
4864 while (midend > mid) /* shove everything down */
4865 *--bigend = *--midend;
4866 Move(little,big+offset,littlelen,char);
b162af07 4867 SvCUR_set(bigstr, SvCUR(bigstr) + i);
79072805
LW
4868 SvSETMAGIC(bigstr);
4869 return;
4870 }
4871 else if (i == 0) {
463ee0b2 4872 Move(little,SvPVX(bigstr)+offset,len,char);
79072805
LW
4873 SvSETMAGIC(bigstr);
4874 return;
4875 }
4876
463ee0b2 4877 big = SvPVX(bigstr);
79072805
LW
4878 mid = big + offset;
4879 midend = mid + len;
4880 bigend = big + SvCUR(bigstr);
4881
4882 if (midend > bigend)
cea2e8a9 4883 Perl_croak(aTHX_ "panic: sv_insert");
79072805
LW
4884
4885 if (mid - big > bigend - midend) { /* faster to shorten from end */
4886 if (littlelen) {
4887 Move(little, mid, littlelen,char);
4888 mid += littlelen;
4889 }
4890 i = bigend - midend;
4891 if (i > 0) {
4892 Move(midend, mid, i,char);
4893 mid += i;
4894 }
4895 *mid = '\0';
4896 SvCUR_set(bigstr, mid - big);
4897 }
155aba94 4898 else if ((i = mid - big)) { /* faster from front */
79072805
LW
4899 midend -= littlelen;
4900 mid = midend;
4901 sv_chop(bigstr,midend-i);
4902 big += i;
4903 while (i--)
4904 *--midend = *--big;
4905 if (littlelen)
4906 Move(little, mid, littlelen,char);
4907 }
4908 else if (littlelen) {
4909 midend -= littlelen;
4910 sv_chop(bigstr,midend);
4911 Move(little,midend,littlelen,char);
4912 }
4913 else {
4914 sv_chop(bigstr,midend);
4915 }
4916 SvSETMAGIC(bigstr);
4917}
4918
c461cf8f
JH
4919/*
4920=for apidoc sv_replace
4921
4922Make the first argument a copy of the second, then delete the original.
645c22ef
DM
4923The target SV physically takes over ownership of the body of the source SV
4924and inherits its flags; however, the target keeps any magic it owns,
4925and any magic in the source is discarded.
ff276b08 4926Note that this is a rather specialist SV copying operation; most of the
645c22ef 4927time you'll want to use C<sv_setsv> or one of its many macro front-ends.
c461cf8f
JH
4928
4929=cut
4930*/
79072805
LW
4931
4932void
864dbfa3 4933Perl_sv_replace(pTHX_ register SV *sv, register SV *nsv)
79072805 4934{
97aff369 4935 dVAR;
a3b680e6 4936 const U32 refcnt = SvREFCNT(sv);
765f542d 4937 SV_CHECK_THINKFIRST_COW_DROP(sv);
30e5c352 4938 if (SvREFCNT(nsv) != 1) {
7437becc 4939 Perl_croak(aTHX_ "panic: reference miscount on nsv in sv_replace() (%"
30e5c352
NC
4940 UVuf " != 1)", (UV) SvREFCNT(nsv));
4941 }
93a17b20 4942 if (SvMAGICAL(sv)) {
a0d0e21e
LW
4943 if (SvMAGICAL(nsv))
4944 mg_free(nsv);
4945 else
4946 sv_upgrade(nsv, SVt_PVMG);
b162af07 4947 SvMAGIC_set(nsv, SvMAGIC(sv));
a0d0e21e 4948 SvFLAGS(nsv) |= SvMAGICAL(sv);
93a17b20 4949 SvMAGICAL_off(sv);
b162af07 4950 SvMAGIC_set(sv, NULL);
93a17b20 4951 }
79072805
LW
4952 SvREFCNT(sv) = 0;
4953 sv_clear(sv);
477f5d66 4954 assert(!SvREFCNT(sv));
fd0854ff
DM
4955#ifdef DEBUG_LEAKING_SCALARS
4956 sv->sv_flags = nsv->sv_flags;
4957 sv->sv_any = nsv->sv_any;
4958 sv->sv_refcnt = nsv->sv_refcnt;
f34d0642 4959 sv->sv_u = nsv->sv_u;
fd0854ff 4960#else
79072805 4961 StructCopy(nsv,sv,SV);
fd0854ff 4962#endif
7b2c381c
NC
4963 /* Currently could join these into one piece of pointer arithmetic, but
4964 it would be unclear. */
4965 if(SvTYPE(sv) == SVt_IV)
4966 SvANY(sv)
339049b0 4967 = (XPVIV*)((char*)&(sv->sv_u.svu_iv) - STRUCT_OFFSET(XPVIV, xiv_iv));
7b2c381c 4968 else if (SvTYPE(sv) == SVt_RV) {
339049b0 4969 SvANY(sv) = &sv->sv_u.svu_rv;
7b2c381c
NC
4970 }
4971
fd0854ff 4972
f8c7b90f 4973#ifdef PERL_OLD_COPY_ON_WRITE
d3d0e6f1
NC
4974 if (SvIsCOW_normal(nsv)) {
4975 /* We need to follow the pointers around the loop to make the
4976 previous SV point to sv, rather than nsv. */
4977 SV *next;
4978 SV *current = nsv;
4979 while ((next = SV_COW_NEXT_SV(current)) != nsv) {
4980 assert(next);
4981 current = next;
3f7c398e 4982 assert(SvPVX_const(current) == SvPVX_const(nsv));
d3d0e6f1
NC
4983 }
4984 /* Make the SV before us point to the SV after us. */
4985 if (DEBUG_C_TEST) {
4986 PerlIO_printf(Perl_debug_log, "previous is\n");
4987 sv_dump(current);
a29f6d03
NC
4988 PerlIO_printf(Perl_debug_log,
4989 "move it from 0x%"UVxf" to 0x%"UVxf"\n",
d3d0e6f1
NC
4990 (UV) SV_COW_NEXT_SV(current), (UV) sv);
4991 }
a29f6d03 4992 SV_COW_NEXT_SV_SET(current, sv);
d3d0e6f1
NC
4993 }
4994#endif
79072805 4995 SvREFCNT(sv) = refcnt;
1edc1566 4996 SvFLAGS(nsv) |= SVTYPEMASK; /* Mark as freed */
39cf41c2 4997 SvREFCNT(nsv) = 0;
463ee0b2 4998 del_SV(nsv);
79072805
LW
4999}
5000
c461cf8f
JH
5001/*
5002=for apidoc sv_clear
5003
645c22ef
DM
5004Clear an SV: call any destructors, free up any memory used by the body,
5005and free the body itself. The SV's head is I<not> freed, although
5006its type is set to all 1's so that it won't inadvertently be assumed
5007to be live during global destruction etc.
5008This function should only be called when REFCNT is zero. Most of the time
5009you'll want to call C<sv_free()> (or its macro wrapper C<SvREFCNT_dec>)
5010instead.
c461cf8f
JH
5011
5012=cut
5013*/
5014
79072805 5015void
864dbfa3 5016Perl_sv_clear(pTHX_ register SV *sv)
79072805 5017{
/* Outline of the steps below:
 *   1. types up to SVt_IV return immediately;
 *   2. for objects, run DESTROY (possibly repeatedly) and then drop the
 *      stash reference;
 *   3. for SVt_PVMG and above, release magic / 'our' stash / typed-pad stash;
 *   4. per-type cleanup in the switch, much of it funnelling through the
 *      shared "freescalar" path;
 *   5. mark the head as freed and release the body.
 */
27da23d5 5018 dVAR;
82bb6deb 5019 const U32 type = SvTYPE(sv);
8edfc514
NC
5020 const struct body_details *const sv_type_details
5021 = bodies_by_type + type;
82bb6deb 5022
79072805
LW
/* NOTE(review): sv has already been dereferenced by SvTYPE(sv) in the
   initialiser above, so assert(sv) cannot catch a NULL argument. */
5023 assert(sv);
5024 assert(SvREFCNT(sv) == 0);
5025
d2a0f284
JC
5026 if (type <= SVt_IV) {
5027 /* See the comment in sv.h about the collusion between this early
5028 return and the overloading of the NULL and IV slots in the size
5029 table. */
82bb6deb 5030 return;
d2a0f284 5031 }
82bb6deb 5032
ed6116ce 5033 if (SvOBJECT(sv)) {
3280af22 5034 if (PL_defstash) { /* Still have a symbol table? */
39644a26 5035 dSP;
893645bd 5036 HV* stash;
/* The loop repeats while sv is still an object but its stash differs from
   the one whose DESTROY handler was just looked up. */
d460ef45 5037 do {
b464bac0 5038 CV* destructor;
4e8e7886 5039 stash = SvSTASH(sv);
32251b26 5040 destructor = StashHANDLER(stash,DESTROY);
4e8e7886 5041 if (destructor) {
/* DESTROY is called with a temporary, read-only reference to sv as its
   only argument, on its own PERLSI_DESTROY stack. */
1b6737cc 5042 SV* const tmpref = newRV(sv);
5cc433a6 5043 SvREADONLY_on(tmpref); /* DESTROY() could be naughty */
4e8e7886 5044 ENTER;
e788e7d3 5045 PUSHSTACKi(PERLSI_DESTROY);
4e8e7886
GS
5046 EXTEND(SP, 2);
5047 PUSHMARK(SP);
5cc433a6 5048 PUSHs(tmpref);
4e8e7886 5049 PUTBACK;
44389ee9 5050 call_sv((SV*)destructor, G_DISCARD|G_EVAL|G_KEEPERR|G_VOID);
7a5fa8a2
NIS
5051
5052
d3acc0f7 5053 POPSTACK;
3095d977 5054 SPAGAIN;
4e8e7886 5055 LEAVE;
5cc433a6
AB
/* If tmpref's count is below 2, detach it from sv by hand: decrement sv's
   count (presumably the one newRV() added - TODO confirm) and clear the RV
   before tmpref itself is released. */
5056 if(SvREFCNT(tmpref) < 2) {
5057 /* tmpref is not kept alive! */
5058 SvREFCNT(sv)--;
b162af07 5059 SvRV_set(tmpref, NULL);
5cc433a6
AB
5060 SvROK_off(tmpref);
5061 }
5062 SvREFCNT_dec(tmpref);
4e8e7886
GS
5063 }
5064 } while (SvOBJECT(sv) && SvSTASH(sv) != stash);
8ebc5c01 5065
6f44e0a4
JP
5066
/* A non-zero count here means something took a new reference to sv while
   DESTROY ran: croak if PL_in_clean_objs is set, otherwise leave sv alone. */
5067 if (SvREFCNT(sv)) {
5068 if (PL_in_clean_objs)
cea2e8a9 5069 Perl_croak(aTHX_ "DESTROY created new reference to dead object '%s'",
bfcb3514 5070 HvNAME_get(stash));
6f44e0a4
JP
5071 /* DESTROY gave object new lease on life */
5072 return;
5073 }
a0d0e21e 5074 }
4e8e7886 5075
a0d0e21e 5076 if (SvOBJECT(sv)) {
4e8e7886 5077 SvREFCNT_dec(SvSTASH(sv)); /* possibly of changed persuasion */
a0d0e21e 5078 SvOBJECT_off(sv); /* Curse the object. */
82bb6deb 5079 if (type != SVt_PVIO)
3280af22 5080 --PL_sv_objcount; /* XXX Might want something more general */
a0d0e21e 5081 }
463ee0b2 5082 }
82bb6deb 5083 if (type >= SVt_PVMG) {
885ffcb3
NC
/* Either the 'our' stash reference is dropped or magic is freed, never
   both: the two are arms of the same if/else. */
5084 if ((type == SVt_PVMG || type == SVt_PVGV) && SvPAD_OUR(sv)) {
5085 SvREFCNT_dec(OURSTASH(sv));
e736a858 5086 } else if (SvMAGIC(sv))
524189f1 5087 mg_free(sv);
00b1698f 5088 if (type == SVt_PVMG && SvPAD_TYPED(sv))
524189f1
JH
5089 SvREFCNT_dec(SvSTASH(sv));
5090 }
82bb6deb 5091 switch (type) {
8990e307 5092 case SVt_PVIO:
/* Close the file handle unless it is one of the three standard streams,
   close a real (non-fake) directory handle, then free the format names. */
df0bd2f4
GS
5093 if (IoIFP(sv) &&
5094 IoIFP(sv) != PerlIO_stdin() &&
5f05dabc 5095 IoIFP(sv) != PerlIO_stdout() &&
5096 IoIFP(sv) != PerlIO_stderr())
93578b34 5097 {
f2b5be74 5098 io_close((IO*)sv, FALSE);
93578b34 5099 }
1d7c1841 5100 if (IoDIRP(sv) && !(IoFLAGS(sv) & IOf_FAKE_DIRP))
1236053a 5101 PerlDir_close(IoDIRP(sv));
1d7c1841 5102 IoDIRP(sv) = (DIR*)NULL;
8990e307
LW
5103 Safefree(IoTOP_NAME(sv));
5104 Safefree(IoFMT_NAME(sv));
5105 Safefree(IoBOTTOM_NAME(sv));
82bb6deb 5106 goto freescalar;
79072805 5107 case SVt_PVBM:
a0d0e21e 5108 goto freescalar;
79072805 5109 case SVt_PVCV:
748a9306 5110 case SVt_PVFM:
85e6fe83 5111 cv_undef((CV*)sv);
a0d0e21e 5112 goto freescalar;
79072805 5113 case SVt_PVHV:
86f55936 5114 Perl_hv_kill_backrefs(aTHX_ (HV*)sv);
85e6fe83 5115 hv_undef((HV*)sv);
a0d0e21e 5116 break;
79072805 5117 case SVt_PVAV:
85e6fe83 5118 av_undef((AV*)sv);
a0d0e21e 5119 break;
02270b4e 5120 case SVt_PVLV:
dd28f7bb
DM
5121 if (LvTYPE(sv) == 'T') { /* for tie: return HE to pool */
5122 SvREFCNT_dec(HeKEY_sv((HE*)LvTARG(sv)));
5123 HeNEXT((HE*)LvTARG(sv)) = PL_hv_fetch_ent_mh;
5124 PL_hv_fetch_ent_mh = (HE*)LvTARG(sv);
5125 }
5126 else if (LvTYPE(sv) != 't') /* unless tie: unrefcnted fake SV** */
5127 SvREFCNT_dec(LvTARG(sv));
02270b4e 5128 goto freescalar;
a0d0e21e 5129 case SVt_PVGV:
1edc1566 5130 gp_free((GV*)sv);
acda4c6a
NC
5131 if (GvNAME_HEK(sv)) {
5132 unshare_hek(GvNAME_HEK(sv));
5133 }
893645bd
NC
5134 /* If we're in a stash, we don't own a reference to it. However it does
5135 have a back reference to us, which needs to be cleared. */
5136 if (GvSTASH(sv))
5137 sv_del_backref((SV*)GvSTASH(sv), sv);
/* FALLTHROUGH - no break: a glob continues into the scalar cleanup below */
79072805 5138 case SVt_PVMG:
79072805
LW
5139 case SVt_PVNV:
5140 case SVt_PVIV:
a0d0e21e 5141 freescalar:
5228ca4e
NC
5142 /* Don't bother with SvOOK_off(sv); as we're only going to free it. */
5143 if (SvOOK(sv)) {
/* Move the PV pointer back by SvIVX(sv) bytes. */
93524f2b 5144 SvPV_set(sv, SvPVX_mutable(sv) - SvIVX(sv));
5228ca4e
NC
5145 /* Don't even bother with turning off the OOK flag. */
5146 }
/* FALLTHROUGH - no break: continue with the reference / string-buffer
   release shared with SVt_PV and SVt_RV */
79072805 5147 case SVt_PV:
a0d0e21e 5148 case SVt_RV:
810b8aa5 5149 if (SvROK(sv)) {
/* A weak reference only unregisters itself from the target's backref
   list; any other reference drops the target's reference count. */
b37c2d43 5150 SV * const target = SvRV(sv);
810b8aa5 5151 if (SvWEAKREF(sv))
e15faf7d 5152 sv_del_backref(target, sv);
810b8aa5 5153 else
e15faf7d 5154 SvREFCNT_dec(target);
810b8aa5 5155 }
f8c7b90f 5156#ifdef PERL_OLD_COPY_ON_WRITE
3f7c398e 5157 else if (SvPVX_const(sv)) {
765f542d
NC
5158 if (SvIsCOW(sv)) {
5159 /* I believe I need to grab the global SV mutex here and
5160 then recheck the COW status. */
46187eeb
NC
5161 if (DEBUG_C_TEST) {
5162 PerlIO_printf(Perl_debug_log, "Copy on write: clear\n");
e419cbc5 5163 sv_dump(sv);
46187eeb 5164 }
bdd68bc3
NC
5165 sv_release_COW(sv, SvPVX_const(sv), SvLEN(sv),
5166 SV_COW_NEXT_SV(sv));
765f542d
NC
5167 /* And drop it here. */
5168 SvFAKE_off(sv);
5169 } else if (SvLEN(sv)) {
3f7c398e 5170 Safefree(SvPVX_const(sv));
765f542d
NC
5171 }
5172 }
5173#else
/* A buffer with non-zero SvLEN is freed; a READONLY+FAKE string with zero
   SvLEN is instead released through unshare_hek(). */
3f7c398e 5174 else if (SvPVX_const(sv) && SvLEN(sv))
94010e71 5175 Safefree(SvPVX_mutable(sv));
3f7c398e 5176 else if (SvPVX_const(sv) && SvREADONLY(sv) && SvFAKE(sv)) {
bdd68bc3 5177 unshare_hek(SvSHARED_HEK_FROM_PV(SvPVX_const(sv)));
1c846c1f
NIS
5178 SvFAKE_off(sv);
5179 }
765f542d 5180#endif
79072805
LW
5181 break;
5182 case SVt_NV:
79072805
LW
5183 break;
5184 }
5185
893645bd
NC
/* Clear every flag except SVf_BREAK, then set all the type bits. */
5186 SvFLAGS(sv) &= SVf_BREAK;
5187 SvFLAGS(sv) |= SVTYPEMASK;
5188
/* Release the body: via del_body() when the type's body_details has its
   arena field set, via my_safefree() when it only has a non-zero body_size,
   and not at all otherwise. */
8edfc514 5189 if (sv_type_details->arena) {
b9502f15 5190 del_body(((char *)SvANY(sv) + sv_type_details->offset),
8edfc514
NC
5191 &PL_body_roots[type]);
5192 }
d2a0f284 5193 else if (sv_type_details->body_size) {
8edfc514
NC
5194 my_safefree(SvANY(sv));
5195 }
79072805
LW
5196}
5197
645c22ef
DM
5198/*
5199=for apidoc sv_newref
5200
5201Increment an SV's reference count. Use the C<SvREFCNT_inc()> wrapper
5202instead.
5203
5204=cut
5205*/
5206
79072805 5207SV *
864dbfa3 5208Perl_sv_newref(pTHX_ SV *sv)
79072805 5209{
96a5add6 5210 PERL_UNUSED_CONTEXT;
463ee0b2 5211 if (sv)
4db098f4 5212 (SvREFCNT(sv))++;
79072805
LW
5213 return sv;
5214}
5215
c461cf8f
JH
5216/*
5217=for apidoc sv_free
5218
645c22ef
DM
5219Decrement an SV's reference count, and if it drops to zero, call
5220C<sv_clear> to invoke destructors and free up any memory used by
5221the body; finally, deallocate the SV's head itself.
5222Normally called via a wrapper macro C<SvREFCNT_dec>.
c461cf8f
JH
5223
5224=cut
5225*/
5226
79072805 5227void
864dbfa3 5228Perl_sv_free(pTHX_ SV *sv)
79072805 5229{
27da23d5 5230 dVAR;
79072805
LW
5231 if (!sv)
5232 return;
a0d0e21e
LW
5233 if (SvREFCNT(sv) == 0) {
5234 if (SvFLAGS(sv) & SVf_BREAK)
645c22ef
DM
5235 /* this SV's refcnt has been artificially decremented to
5236 * trigger cleanup */
a0d0e21e 5237 return;
3280af22 5238 if (PL_in_clean_all) /* All is fair */
1edc1566 5239 return;
d689ffdd
JP
5240 if (SvREADONLY(sv) && SvIMMORTAL(sv)) {
5241 /* make sure SvREFCNT(sv)==0 happens very seldom */
5242 SvREFCNT(sv) = (~(U32)0)/2;
5243 return;
5244 }
41e4abd8 5245 if (ckWARN_d(WARN_INTERNAL)) {
d5dede04 5246 Perl_warner(aTHX_ packWARN(WARN_INTERNAL),
472d47bc
SB
5247 "Attempt to free unreferenced scalar: SV 0x%"UVxf
5248 pTHX__FORMAT, PTR2UV(sv) pTHX__VALUE);
41e4abd8
NC
5249#ifdef DEBUG_LEAKING_SCALARS_FORK_DUMP
5250 Perl_dump_sv_child(aTHX_ sv);
5251#endif
5252 }
79072805
LW
5253 return;
5254 }
4db098f4 5255 if (--(SvREFCNT(sv)) > 0)
8990e307 5256 return;
8c4d3c90
NC
5257 Perl_sv_free2(aTHX_ sv);
5258}
5259
5260void
5261Perl_sv_free2(pTHX_ SV *sv)
5262{
27da23d5 5263 dVAR;
463ee0b2
LW
5264#ifdef DEBUGGING
5265 if (SvTEMP(sv)) {
0453d815 5266 if (ckWARN_d(WARN_DEBUGGING))
9014280d 5267 Perl_warner(aTHX_ packWARN(WARN_DEBUGGING),
472d47bc
SB
5268 "Attempt to free temp prematurely: SV 0x%"UVxf
5269 pTHX__FORMAT, PTR2UV(sv) pTHX__VALUE);
79072805 5270 return;
79072805 5271 }
463ee0b2 5272#endif
d689ffdd
JP
5273 if (SvREADONLY(sv) && SvIMMORTAL(sv)) {
5274 /* make sure SvREFCNT(sv)==0 happens very seldom */
5275 SvREFCNT(sv) = (~(U32)0)/2;
5276 return;
5277 }
79072805 5278 sv_clear(sv);
477f5d66
CS
5279 if (! SvREFCNT(sv))
5280 del_SV(sv);
79072805
LW
5281}
5282
954c1994
GS
5283/*
5284=for apidoc sv_len
5285
645c22ef
DM
5286Returns the length of the string in the SV. Handles magic and type
5287coercion. See also C<SvCUR>, which gives raw access to the xpv_cur slot.
954c1994
GS
5288
5289=cut
5290*/
5291
79072805 5292STRLEN
864dbfa3 5293Perl_sv_len(pTHX_ register SV *sv)
79072805 5294{
463ee0b2 5295 STRLEN len;
79072805
LW
5296
5297 if (!sv)
5298 return 0;
5299
8990e307 5300 if (SvGMAGICAL(sv))
565764a8 5301 len = mg_length(sv);
8990e307 5302 else
4d84ee25 5303 (void)SvPV_const(sv, len);
463ee0b2 5304 return len;
79072805
LW
5305}
5306
c461cf8f
JH
5307/*
5308=for apidoc sv_len_utf8
5309
5310Returns the number of characters in the string in an SV, counting wide
1e54db1a 5311UTF-8 bytes as a single character. Handles magic and type coercion.
c461cf8f
JH
5312
5313=cut
5314*/
5315
7e8c5dac
HS
5316/*
5317 * The length is cached in PERL_UTF8_magic, in the mg_len field. Also the
9564a3bd
NC
5318 * mg_ptr is used, by sv_pos_u2b() and sv_pos_b2u() - see the comments below.
5319 * (Note that the mg_len is not the length of the mg_ptr field.
5320 * This allows the cache to store the character length of the string without
5321 * needing to malloc() extra storage to attach to the mg_ptr.)
7a5fa8a2 5322 *
7e8c5dac
HS
5323 */
5324
a0ed51b3 5325STRLEN
864dbfa3 5326Perl_sv_len_utf8(pTHX_ register SV *sv)
a0ed51b3 5327{
a0ed51b3
LW
5328 if (!sv)
5329 return 0;
5330
a0ed51b3 5331 if (SvGMAGICAL(sv))
b76347f2 5332 return mg_length(sv);
a0ed51b3 5333 else
b76347f2 5334 {
26346457 5335 STRLEN len;
e62f0680 5336 const U8 *s = (U8*)SvPV_const(sv, len);
7e8c5dac 5337
26346457
NC
5338 if (PL_utf8cache) {
5339 STRLEN ulen;
5340 MAGIC *mg = SvMAGICAL(sv) ? mg_find(sv, PERL_MAGIC_utf8) : 0;
5341
5342 if (mg && mg->mg_len != -1) {
5343 ulen = mg->mg_len;
5344 if (PL_utf8cache < 0) {
5345 const STRLEN real = Perl_utf8_length(aTHX_ s, s + len);
5346 if (real != ulen) {
5347 /* Need to turn the assertions off otherwise we may
5348 recurse infinitely while printing error messages.
5349 */
5350 SAVEI8(PL_utf8cache);
5351 PL_utf8cache = 0;
5352 Perl_croak(aTHX_ "panic: sv_len_utf8 cache %"UVf
ec07b5e0 5353 " real %"UVf" for %"SVf,
95b63a38 5354 (UV) ulen, (UV) real, (void*)sv);
26346457
NC
5355 }
5356 }
5357 }
5358 else {
5359 ulen = Perl_utf8_length(aTHX_ s, s + len);
5360 if (!SvREADONLY(sv)) {
5361 if (!mg) {
5362 mg = sv_magicext(sv, 0, PERL_MAGIC_utf8,
5363 &PL_vtbl_utf8, 0, 0);
5364 }
cb9e20bb 5365 assert(mg);
26346457 5366 mg->mg_len = ulen;
cb9e20bb 5367 }
cb9e20bb 5368 }
26346457 5369 return ulen;
7e8c5dac 5370 }
26346457 5371 return Perl_utf8_length(aTHX_ s, s + len);
7e8c5dac
HS
5372 }
5373}
5374
9564a3bd
NC
5375/* Walk forwards to find the byte corresponding to the passed in UTF-8
5376 offset. */
bdf30dd6 5377static STRLEN
721e86b6 5378S_sv_pos_u2b_forwards(const U8 *const start, const U8 *const send,
bdf30dd6
NC
5379 STRLEN uoffset)
5380{
5381 const U8 *s = start;
5382
5383 while (s < send && uoffset--)
5384 s += UTF8SKIP(s);
5385 if (s > send) {
5386 /* This is the existing behaviour. Possibly it should be a croak, as
5387 it's actually a bounds error */
5388 s = send;
5389 }
5390 return s - start;
5391}
5392
9564a3bd
NC
5393/* Given the length of the string in both bytes and UTF-8 characters, decide
5394 whether to walk forwards or backwards to find the byte corresponding to
5395 the passed in UTF-8 offset. */
c336ad0b 5396static STRLEN
721e86b6 5397S_sv_pos_u2b_midway(const U8 *const start, const U8 *send,
c336ad0b
NC
5398 STRLEN uoffset, STRLEN uend)
5399{
5400 STRLEN backw = uend - uoffset;
5401 if (uoffset < 2 * backw) {
25a8a4ef 5402 /* The assumption is that going forwards is twice the speed of going
c336ad0b
NC
5403 forward (that's where the 2 * backw comes from).
5404 (The real figure of course depends on the UTF-8 data.) */
721e86b6 5405 return sv_pos_u2b_forwards(start, send, uoffset);
c336ad0b
NC
5406 }
5407
5408 while (backw--) {
5409 send--;
5410 while (UTF8_IS_CONTINUATION(*send))
5411 send--;
5412 }
5413 return send - start;
5414}
5415
9564a3bd
NC
5416/* For the string representation of the given scalar, find the byte
5417 corresponding to the passed in UTF-8 offset. uoffset0 and boffset0
5418 give another position in the string, *before* the sought offset
5419 (such a position always exists, as 0, 0 is a valid pair of positions),
5420 which should help reduce the amount of linear searching.
5421 If *mgp is non-NULL, it should point to the UTF-8 cache magic, which
5422 will be used to reduce the amount of linear searching. The cache will be
5423 created if necessary, and the found value offered to it for update. */
28ccbf94
NC
5424static STRLEN
5425S_sv_pos_u2b_cached(pTHX_ SV *sv, MAGIC **mgp, const U8 *const start,
5426 const U8 *const send, STRLEN uoffset,
5427 STRLEN uoffset0, STRLEN boffset0) {
7087a21c 5428 STRLEN boffset = 0; /* Actually always set, but let's keep gcc happy. */
c336ad0b
NC
5429 bool found = FALSE;
5430
75c33c12
NC
5431 assert (uoffset >= uoffset0);
5432
c336ad0b 5433 if (SvMAGICAL(sv) && !SvREADONLY(sv) && PL_utf8cache
0905937d 5434 && (*mgp || (*mgp = mg_find(sv, PERL_MAGIC_utf8)))) {
d8b2e1f9
NC
5435 if ((*mgp)->mg_ptr) {
5436 STRLEN *cache = (STRLEN *) (*mgp)->mg_ptr;
5437 if (cache[0] == uoffset) {
5438 /* An exact match. */
5439 return cache[1];
5440 }
ab455f60
NC
5441 if (cache[2] == uoffset) {
5442 /* An exact match. */
5443 return cache[3];
5444 }
668af93f
NC
5445
5446 if (cache[0] < uoffset) {
d8b2e1f9
NC
5447 /* The cache already knows part of the way. */
5448 if (cache[0] > uoffset0) {
5449 /* The cache knows more than the passed in pair */
5450 uoffset0 = cache[0];
5451 boffset0 = cache[1];
5452 }
5453 if ((*mgp)->mg_len != -1) {
5454 /* And we know the end too. */
5455 boffset = boffset0
721e86b6 5456 + sv_pos_u2b_midway(start + boffset0, send,
d8b2e1f9
NC
5457 uoffset - uoffset0,
5458 (*mgp)->mg_len - uoffset0);
5459 } else {
5460 boffset = boffset0
721e86b6 5461 + sv_pos_u2b_forwards(start + boffset0,
d8b2e1f9
NC
5462 send, uoffset - uoffset0);
5463 }
dd7c5fd3
NC
5464 }
5465 else if (cache[2] < uoffset) {
5466 /* We're between the two cache entries. */
5467 if (cache[2] > uoffset0) {
5468 /* and the cache knows more than the passed in pair */
5469 uoffset0 = cache[2];
5470 boffset0 = cache[3];
5471 }
5472
668af93f 5473 boffset = boffset0
721e86b6 5474 + sv_pos_u2b_midway(start + boffset0,
668af93f
NC
5475 start + cache[1],
5476 uoffset - uoffset0,
5477 cache[0] - uoffset0);
dd7c5fd3
NC
5478 } else {
5479 boffset = boffset0
721e86b6 5480 + sv_pos_u2b_midway(start + boffset0,
dd7c5fd3
NC
5481 start + cache[3],
5482 uoffset - uoffset0,
5483 cache[2] - uoffset0);
d8b2e1f9 5484 }
668af93f 5485 found = TRUE;
d8b2e1f9
NC
5486 }
5487 else if ((*mgp)->mg_len != -1) {
75c33c12
NC
5488 /* If we can take advantage of a passed in offset, do so. */
5489 /* In fact, offset0 is either 0, or less than offset, so don't
5490 need to worry about the other possibility. */
5491 boffset = boffset0
721e86b6 5492 + sv_pos_u2b_midway(start + boffset0, send,
75c33c12
NC
5493 uoffset - uoffset0,
5494 (*mgp)->mg_len - uoffset0);
c336ad0b
NC
5495 found = TRUE;
5496 }
28ccbf94 5497 }
c336ad0b
NC
5498
5499 if (!found || PL_utf8cache < 0) {
75c33c12 5500 const STRLEN real_boffset
721e86b6 5501 = boffset0 + sv_pos_u2b_forwards(start + boffset0,
75c33c12
NC
5502 send, uoffset - uoffset0);
5503
c336ad0b
NC
5504 if (found && PL_utf8cache < 0) {
5505 if (real_boffset != boffset) {
5506 /* Need to turn the assertions off otherwise we may recurse
5507 infinitely while printing error messages. */
5508 SAVEI8(PL_utf8cache);
5509 PL_utf8cache = 0;
5510 Perl_croak(aTHX_ "panic: sv_pos_u2b_cache cache %"UVf
5511 " real %"UVf" for %"SVf,
95b63a38 5512 (UV) boffset, (UV) real_boffset, (void*)sv);
c336ad0b
NC
5513 }
5514 }
5515 boffset = real_boffset;
28ccbf94 5516 }
0905937d 5517
ab455f60 5518 S_utf8_mg_pos_cache_update(aTHX_ sv, mgp, boffset, uoffset, send - start);
28ccbf94
NC
5519 return boffset;
5520}
5521
9564a3bd
NC
5522
5523/*
5524=for apidoc sv_pos_u2b
5525
5526Converts the value pointed to by offsetp from a count of UTF-8 chars from
5527the start of the string, to a count of the equivalent number of bytes; if
5528lenp is non-zero, it does the same to lenp, but this time starting from
5529the offset, rather than from the start of the string. Handles magic and
5530type coercion.
5531
5532=cut
5533*/
5534
5535/*
5536 * sv_pos_u2b() uses, like sv_pos_b2u(), the mg_ptr of the potential
5537 * PERL_UTF8_magic of the sv to store the mapping between UTF-8 and
5538 * byte offsets. See also the comments of S_utf8_mg_pos_cache_update().
5539 *
5540 */
5541
a0ed51b3 5542void
864dbfa3 5543Perl_sv_pos_u2b(pTHX_ register SV *sv, I32* offsetp, I32* lenp)
a0ed51b3 5544{
245d4a47 5545 const U8 *start;
a0ed51b3
LW
5546 STRLEN len;
5547
5548 if (!sv)
5549 return;
5550
245d4a47 5551 start = (U8*)SvPV_const(sv, len);
7e8c5dac 5552 if (len) {
bdf30dd6
NC
5553 STRLEN uoffset = (STRLEN) *offsetp;
5554 const U8 * const send = start + len;
0905937d 5555 MAGIC *mg = NULL;
721e86b6 5556 const STRLEN boffset = sv_pos_u2b_cached(sv, &mg, start, send,
28ccbf94 5557 uoffset, 0, 0);
bdf30dd6
NC
5558
5559 *offsetp = (I32) boffset;
5560
5561 if (lenp) {
28ccbf94 5562 /* Convert the relative offset to absolute. */
721e86b6
AL
5563 const STRLEN uoffset2 = uoffset + (STRLEN) *lenp;
5564 const STRLEN boffset2
5565 = sv_pos_u2b_cached(sv, &mg, start, send, uoffset2,
28ccbf94 5566 uoffset, boffset) - boffset;
bdf30dd6 5567
28ccbf94 5568 *lenp = boffset2;
bdf30dd6 5569 }
7e8c5dac
HS
5570 }
5571 else {
5572 *offsetp = 0;
5573 if (lenp)
5574 *lenp = 0;
a0ed51b3 5575 }
e23c8137 5576
a0ed51b3
LW
5577 return;
5578}
5579
9564a3bd
NC
5580/* Create and update the UTF8 magic offset cache, with the proffered utf8/
5581 byte length pairing. The (byte) length of the total SV is passed in too,
5582 as blen, because for some (more esoteric) SVs, the call to SvPV_const()
5583 may not have updated SvCUR, so we can't rely on reading it directly.
5584
5585 The proffered utf8/byte length pairing isn't used if the cache already has
5586 two pairs, and swapping either for the proffered pair would increase the
5587 RMS of the intervals between known byte offsets.
5588
5589 The cache itself consists of 4 STRLEN values
5590 0: larger UTF-8 offset
5591 1: corresponding byte offset
5592 2: smaller UTF-8 offset
5593 3: corresponding byte offset
5594
5595 Unused cache pairs have the value 0, 0.
5596 Keeping the cache "backwards" means that the invariant of
5597 cache[0] >= cache[2] is maintained even with empty slots, which means that
5598 the code that uses it doesn't need to worry if only 1 entry has actually
5599 been set to non-zero. It also makes the "position beyond the end of the
5600 cache" logic much simpler, as the first slot is always the one to start
5601 from.
645c22ef 5602*/
ec07b5e0 5603static void
ab455f60
NC
5604S_utf8_mg_pos_cache_update(pTHX_ SV *sv, MAGIC **mgp, STRLEN byte, STRLEN utf8,
5605 STRLEN blen)
ec07b5e0
NC
5606{
5607 STRLEN *cache;
5608 if (SvREADONLY(sv))
5609 return;
5610
5611 if (!*mgp) {
5612 *mgp = sv_magicext(sv, 0, PERL_MAGIC_utf8, (MGVTBL*)&PL_vtbl_utf8, 0,
5613 0);
5614 (*mgp)->mg_len = -1;
5615 }
5616 assert(*mgp);
5617
5618 if (!(cache = (STRLEN *)(*mgp)->mg_ptr)) {
5619 Newxz(cache, PERL_MAGIC_UTF8_CACHESIZE * 2, STRLEN);
5620 (*mgp)->mg_ptr = (char *) cache;
5621 }
5622 assert(cache);
5623
5624 if (PL_utf8cache < 0) {
ef816a78 5625 const U8 *start = (const U8 *) SvPVX_const(sv);
0905937d
NC
5626 const U8 *const end = start + byte;
5627 STRLEN realutf8 = 0;
5628
5629 while (start < end) {
5630 start += UTF8SKIP(start);
5631 realutf8++;
5632 }
5633
5634 /* Can't use S_sv_pos_b2u_forwards as it will scream warnings on
5635 surrogates. FIXME - is it inconsistent that b2u warns, but u2b
5636 doesn't? I don't know whether this difference was introduced with
5637 the caching code in 5.8.1. */
ec07b5e0
NC
5638
5639 if (realutf8 != utf8) {
5640 /* Need to turn the assertions off otherwise we may recurse
5641 infinitely while printing error messages. */
5642 SAVEI8(PL_utf8cache);
5643 PL_utf8cache = 0;
5644 Perl_croak(aTHX_ "panic: utf8_mg_pos_cache_update cache %"UVf
95b63a38 5645 " real %"UVf" for %"SVf, (UV) utf8, (UV) realutf8, (void*)sv);
ec07b5e0
NC
5646 }
5647 }
ab455f60
NC
5648
5649 /* Cache is held with the later position first, to simplify the code
5650 that deals with unbounded ends. */
5651
5652 ASSERT_UTF8_CACHE(cache);
5653 if (cache[1] == 0) {
5654 /* Cache is totally empty */
5655 cache[0] = utf8;
5656 cache[1] = byte;
5657 } else if (cache[3] == 0) {
5658 if (byte > cache[1]) {
5659 /* New one is larger, so goes first. */
5660 cache[2] = cache[0];
5661 cache[3] = cache[1];
5662 cache[0] = utf8;
5663 cache[1] = byte;
5664 } else {
5665 cache[2] = utf8;
5666 cache[3] = byte;
5667 }
5668 } else {
5669#define THREEWAY_SQUARE(a,b,c,d) \
5670 ((float)((d) - (c))) * ((float)((d) - (c))) \
5671 + ((float)((c) - (b))) * ((float)((c) - (b))) \
5672 + ((float)((b) - (a))) * ((float)((b) - (a)))
5673
5674 /* Cache has 2 slots in use, and we know three potential pairs.
5675 Keep the two that give the lowest RMS distance. Do the
5676 calcualation in bytes simply because we always know the byte
5677 length. squareroot has the same ordering as the positive value,
5678 so don't bother with the actual square root. */
5679 const float existing = THREEWAY_SQUARE(0, cache[3], cache[1], blen);
5680 if (byte > cache[1]) {
5681 /* New position is after the existing pair of pairs. */
5682 const float keep_earlier
5683 = THREEWAY_SQUARE(0, cache[3], byte, blen);
5684 const float keep_later
5685 = THREEWAY_SQUARE(0, cache[1], byte, blen);
5686
5687 if (keep_later < keep_earlier) {
5688 if (keep_later < existing) {
5689 cache[2] = cache[0];
5690 cache[3] = cache[1];
5691 cache[0] = utf8;
5692 cache[1] = byte;
5693 }
5694 }
5695 else {
5696 if (keep_earlier < existing) {
5697 cache[0] = utf8;
5698 cache[1] = byte;
5699 }
5700 }
5701 }
57d7fbf1
NC
5702 else if (byte > cache[3]) {
5703 /* New position is between the existing pair of pairs. */
5704 const float keep_earlier
5705 = THREEWAY_SQUARE(0, cache[3], byte, blen);
5706 const float keep_later
5707 = THREEWAY_SQUARE(0, byte, cache[1], blen);
5708
5709 if (keep_later < keep_earlier) {
5710 if (keep_later < existing) {
5711 cache[2] = utf8;
5712 cache[3] = byte;
5713 }
5714 }
5715 else {
5716 if (keep_earlier < existing) {
5717 cache[0] = utf8;
5718 cache[1] = byte;
5719 }
5720 }
5721 }
5722 else {
5723 /* New position is before the existing pair of pairs. */
5724 const float keep_earlier
5725 = THREEWAY_SQUARE(0, byte, cache[3], blen);
5726 const float keep_later
5727 = THREEWAY_SQUARE(0, byte, cache[1], blen);
5728
5729 if (keep_later < keep_earlier) {
5730 if (keep_later < existing) {
5731 cache[2] = utf8;
5732 cache[3] = byte;
5733 }
5734 }
5735 else {
5736 if (keep_earlier < existing) {
5737 cache[0] = cache[2];
5738 cache[1] = cache[3];
5739 cache[2] = utf8;
5740 cache[3] = byte;
5741 }
5742 }
5743 }
ab455f60 5744 }
0905937d 5745 ASSERT_UTF8_CACHE(cache);
ec07b5e0
NC
5746}
5747
5748/* If we don't know the character offset of the end of a region, our only
5749 option is to walk forwards to the target byte offset. */
5750static STRLEN
5751S_sv_pos_b2u_forwards(pTHX_ const U8 *s, const U8 *const target)
5752{
5753 STRLEN len = 0;
5754 while (s < target) {
5755 STRLEN n = 1;
5756
5757 /* Call utf8n_to_uvchr() to validate the sequence
5758 * (unless a simple non-UTF character) */
5759 if (!UTF8_IS_INVARIANT(*s))
5760 utf8n_to_uvchr(s, UTF8SKIP(s), &n, 0);
5761 if (n > 0) {
5762 s += n;
5763 len++;
5764 }
5765 else
5766 break;
5767 }
5768 return len;
5769}
5770
5771/* We already know all of the way, now we may be able to walk back. The same
25a8a4ef
NC
5772 assumption is made as in S_sv_pos_u2b_midway(), namely that walking
5773 backward is half the speed of walking forward. */
ec07b5e0
NC
5774static STRLEN
5775S_sv_pos_b2u_midway(pTHX_ const U8 *s, const U8 *const target, const U8 *end,
5776 STRLEN endu)
5777{
5778 const STRLEN forw = target - s;
5779 STRLEN backw = end - target;
5780
5781 if (forw < 2 * backw) {
5782 return S_sv_pos_b2u_forwards(aTHX_ s, target);
5783 }
5784
5785 while (end > target) {
5786 end--;
5787 while (UTF8_IS_CONTINUATION(*end)) {
5788 end--;
5789 }
5790 endu--;
5791 }
5792 return endu;
5793}
5794
9564a3bd
NC
5795/*
5796=for apidoc sv_pos_b2u
5797
5798Converts the value pointed to by offsetp from a count of bytes from the
5799start of the string, to a count of the equivalent number of UTF-8 chars.
5800Handles magic and type coercion.
5801
5802=cut
5803*/
5804
5805/*
5806 * sv_pos_b2u() uses, like sv_pos_u2b(), the mg_ptr of the potential
5807 * PERL_UTF8_magic of the sv to store the mapping between UTF-8 and
5808 * byte offsets.
5809 *
5810 */
a0ed51b3 5811void
7e8c5dac 5812Perl_sv_pos_b2u(pTHX_ register SV* sv, I32* offsetp)
a0ed51b3 5813{
83003860 5814 const U8* s;
ec07b5e0 5815 const STRLEN byte = *offsetp;
7087a21c 5816 STRLEN len = 0; /* Actually always set, but let's keep gcc happy. */
ab455f60 5817 STRLEN blen;
ec07b5e0
NC
5818 MAGIC* mg = NULL;
5819 const U8* send;
a922f900 5820 bool found = FALSE;
a0ed51b3
LW
5821
5822 if (!sv)
5823 return;
5824
ab455f60 5825 s = (const U8*)SvPV_const(sv, blen);
7e8c5dac 5826
ab455f60 5827 if (blen < byte)
ec07b5e0 5828 Perl_croak(aTHX_ "panic: sv_pos_b2u: bad byte offset");
7e8c5dac 5829
ec07b5e0 5830 send = s + byte;
a67d7df9 5831
ffca234a
NC
5832 if (SvMAGICAL(sv) && !SvREADONLY(sv) && PL_utf8cache
5833 && (mg = mg_find(sv, PERL_MAGIC_utf8))) {
5834 if (mg->mg_ptr) {
d4c19fe8 5835 STRLEN * const cache = (STRLEN *) mg->mg_ptr;
b9f984a5 5836 if (cache[1] == byte) {
ec07b5e0
NC
5837 /* An exact match. */
5838 *offsetp = cache[0];
ec07b5e0 5839 return;
7e8c5dac 5840 }
ab455f60
NC
5841 if (cache[3] == byte) {
5842 /* An exact match. */
5843 *offsetp = cache[2];
5844 return;
5845 }
668af93f
NC
5846
5847 if (cache[1] < byte) {
ec07b5e0 5848 /* We already know part of the way. */
b9f984a5
NC
5849 if (mg->mg_len != -1) {
5850 /* Actually, we know the end too. */
5851 len = cache[0]
5852 + S_sv_pos_b2u_midway(aTHX_ s + cache[1], send,
ab455f60 5853 s + blen, mg->mg_len - cache[0]);
b9f984a5
NC
5854 } else {
5855 len = cache[0]
5856 + S_sv_pos_b2u_forwards(aTHX_ s + cache[1], send);
5857 }
7e8c5dac 5858 }
9f985e4c
NC
5859 else if (cache[3] < byte) {
5860 /* We're between the two cached pairs, so we do the calculation
5861 offset by the byte/utf-8 positions for the earlier pair,
5862 then add the utf-8 characters from the string start to
5863 there. */
5864 len = S_sv_pos_b2u_midway(aTHX_ s + cache[3], send,
5865 s + cache[1], cache[0] - cache[2])
5866 + cache[2];
5867
5868 }
5869 else { /* cache[3] > byte */
5870 len = S_sv_pos_b2u_midway(aTHX_ s, send, s + cache[3],
5871 cache[2]);
7e8c5dac 5872
7e8c5dac 5873 }
ec07b5e0 5874 ASSERT_UTF8_CACHE(cache);
a922f900 5875 found = TRUE;
ffca234a 5876 } else if (mg->mg_len != -1) {
ab455f60 5877 len = S_sv_pos_b2u_midway(aTHX_ s, send, s + blen, mg->mg_len);
a922f900 5878 found = TRUE;
7e8c5dac 5879 }
a0ed51b3 5880 }
a922f900
NC
5881 if (!found || PL_utf8cache < 0) {
5882 const STRLEN real_len = S_sv_pos_b2u_forwards(aTHX_ s, send);
5883
5884 if (found && PL_utf8cache < 0) {
5885 if (len != real_len) {
5886 /* Need to turn the assertions off otherwise we may recurse
5887 infinitely while printing error messages. */
5888 SAVEI8(PL_utf8cache);
5889 PL_utf8cache = 0;
5890 Perl_croak(aTHX_ "panic: sv_pos_b2u cache %"UVf
5891 " real %"UVf" for %"SVf,
95b63a38 5892 (UV) len, (UV) real_len, (void*)sv);
a922f900
NC
5893 }
5894 }
5895 len = real_len;
ec07b5e0
NC
5896 }
5897 *offsetp = len;
5898
ab455f60 5899 S_utf8_mg_pos_cache_update(aTHX_ sv, &mg, byte, len, blen);
a0ed51b3
LW
5900}
5901
954c1994
GS
5902/*
5903=for apidoc sv_eq
5904
5905Returns a boolean indicating whether the strings in the two SVs are
645c22ef
DM
5906identical. Is UTF-8 and 'use bytes' aware, handles get magic, and will
5907coerce its args to strings if necessary.
954c1994
GS
5908
5909=cut
5910*/
5911
79072805 5912I32
e01b9e88 5913Perl_sv_eq(pTHX_ register SV *sv1, register SV *sv2)
79072805 5914{
97aff369 5915 dVAR;
e1ec3a88 5916 const char *pv1;
463ee0b2 5917 STRLEN cur1;
e1ec3a88 5918 const char *pv2;
463ee0b2 5919 STRLEN cur2;
e01b9e88 5920 I32 eq = 0;
bd61b366 5921 char *tpv = NULL;
a0714e2c 5922 SV* svrecode = NULL;
79072805 5923
e01b9e88 5924 if (!sv1) {
79072805
LW
5925 pv1 = "";
5926 cur1 = 0;
5927 }
463ee0b2 5928 else
4d84ee25 5929 pv1 = SvPV_const(sv1, cur1);
79072805 5930
e01b9e88
SC
5931 if (!sv2){
5932 pv2 = "";
5933 cur2 = 0;
92d29cee 5934 }
e01b9e88 5935 else
4d84ee25 5936 pv2 = SvPV_const(sv2, cur2);
79072805 5937
cf48d248 5938 if (cur1 && cur2 && SvUTF8(sv1) != SvUTF8(sv2) && !IN_BYTES) {
799ef3cb
JH
5939 /* Differing utf8ness.
5940 * Do not UTF8size the comparands as a side-effect. */
5941 if (PL_encoding) {
5942 if (SvUTF8(sv1)) {
553e1bcc
AT
5943 svrecode = newSVpvn(pv2, cur2);
5944 sv_recode_to_utf8(svrecode, PL_encoding);
93524f2b 5945 pv2 = SvPV_const(svrecode, cur2);
799ef3cb
JH
5946 }
5947 else {
553e1bcc
AT
5948 svrecode = newSVpvn(pv1, cur1);
5949 sv_recode_to_utf8(svrecode, PL_encoding);
93524f2b 5950 pv1 = SvPV_const(svrecode, cur1);
799ef3cb
JH
5951 }
5952 /* Now both are in UTF-8. */
0a1bd7ac
DM
5953 if (cur1 != cur2) {
5954 SvREFCNT_dec(svrecode);
799ef3cb 5955 return FALSE;
0a1bd7ac 5956 }
799ef3cb
JH
5957 }
5958 else {
5959 bool is_utf8 = TRUE;
5960
5961 if (SvUTF8(sv1)) {
5962 /* sv1 is the UTF-8 one,
5963 * if is equal it must be downgrade-able */
9d4ba2ae 5964 char * const pv = (char*)bytes_from_utf8((const U8*)pv1,
799ef3cb
JH
5965 &cur1, &is_utf8);
5966 if (pv != pv1)
553e1bcc 5967 pv1 = tpv = pv;
799ef3cb
JH
5968 }
5969 else {
5970 /* sv2 is the UTF-8 one,
5971 * if is equal it must be downgrade-able */
9d4ba2ae 5972 char * const pv = (char *)bytes_from_utf8((const U8*)pv2,
799ef3cb
JH
5973 &cur2, &is_utf8);
5974 if (pv != pv2)
553e1bcc 5975 pv2 = tpv = pv;
799ef3cb
JH
5976 }
5977 if (is_utf8) {
5978 /* Downgrade not possible - cannot be eq */
bf694877 5979 assert (tpv == 0);
799ef3cb
JH
5980 return FALSE;
5981 }
5982 }
cf48d248
JH
5983 }
5984
5985 if (cur1 == cur2)
765f542d 5986 eq = (pv1 == pv2) || memEQ(pv1, pv2, cur1);
e01b9e88 5987
b37c2d43 5988 SvREFCNT_dec(svrecode);
553e1bcc
AT
5989 if (tpv)
5990 Safefree(tpv);
cf48d248 5991
e01b9e88 5992 return eq;
79072805
LW
5993}
5994
954c1994
GS
5995/*
5996=for apidoc sv_cmp
5997
5998Compares the strings in two SVs. Returns -1, 0, or 1 indicating whether the
5999string in C<sv1> is less than, equal to, or greater than the string in
645c22ef
DM
6000C<sv2>. Is UTF-8 and 'use bytes' aware, handles get magic, and will
6001coerce its args to strings if necessary. See also C<sv_cmp_locale>.
954c1994
GS
6002
6003=cut
6004*/
6005
79072805 6006I32
e01b9e88 6007Perl_sv_cmp(pTHX_ register SV *sv1, register SV *sv2)
79072805 6008{
97aff369 6009 dVAR;
560a288e 6010 STRLEN cur1, cur2;
e1ec3a88 6011 const char *pv1, *pv2;
bd61b366 6012 char *tpv = NULL;
cf48d248 6013 I32 cmp;
a0714e2c 6014 SV *svrecode = NULL;
560a288e 6015
e01b9e88
SC
6016 if (!sv1) {
6017 pv1 = "";
560a288e
GS
6018 cur1 = 0;
6019 }
e01b9e88 6020 else
4d84ee25 6021 pv1 = SvPV_const(sv1, cur1);
560a288e 6022
553e1bcc 6023 if (!sv2) {
e01b9e88 6024 pv2 = "";
560a288e
GS
6025 cur2 = 0;
6026 }
e01b9e88 6027 else
4d84ee25 6028 pv2 = SvPV_const(sv2, cur2);
79072805 6029
cf48d248 6030 if (cur1 && cur2 && SvUTF8(sv1) != SvUTF8(sv2) && !IN_BYTES) {
799ef3cb
JH
6031 /* Differing utf8ness.
6032 * Do not UTF8size the comparands as a side-effect. */
cf48d248 6033 if (SvUTF8(sv1)) {
799ef3cb 6034 if (PL_encoding) {
553e1bcc
AT
6035 svrecode = newSVpvn(pv2, cur2);
6036 sv_recode_to_utf8(svrecode, PL_encoding);
93524f2b 6037 pv2 = SvPV_const(svrecode, cur2);
799ef3cb
JH
6038 }
6039 else {
e1ec3a88 6040 pv2 = tpv = (char*)bytes_to_utf8((const U8*)pv2, &cur2);
799ef3cb 6041 }
cf48d248
JH
6042 }
6043 else {
799ef3cb 6044 if (PL_encoding) {
553e1bcc
AT
6045 svrecode = newSVpvn(pv1, cur1);
6046 sv_recode_to_utf8(svrecode, PL_encoding);
93524f2b 6047 pv1 = SvPV_const(svrecode, cur1);
799ef3cb
JH
6048 }
6049 else {
e1ec3a88 6050 pv1 = tpv = (char*)bytes_to_utf8((const U8*)pv1, &cur1);
799ef3cb 6051 }
cf48d248
JH
6052 }
6053 }
6054
e01b9e88 6055 if (!cur1) {
cf48d248 6056 cmp = cur2 ? -1 : 0;
e01b9e88 6057 } else if (!cur2) {
cf48d248
JH
6058 cmp = 1;
6059 } else {
e1ec3a88 6060 const I32 retval = memcmp((const void*)pv1, (const void*)pv2, cur1 < cur2 ? cur1 : cur2);
e01b9e88
SC
6061
6062 if (retval) {
cf48d248 6063 cmp = retval < 0 ? -1 : 1;
e01b9e88 6064 } else if (cur1 == cur2) {
cf48d248
JH
6065 cmp = 0;
6066 } else {
6067 cmp = cur1 < cur2 ? -1 : 1;
e01b9e88 6068 }
cf48d248 6069 }
16660edb 6070
b37c2d43 6071 SvREFCNT_dec(svrecode);
553e1bcc
AT
6072 if (tpv)
6073 Safefree(tpv);
cf48d248
JH
6074
6075 return cmp;
bbce6d69 6076}
16660edb 6077
c461cf8f
JH
6078/*
6079=for apidoc sv_cmp_locale
6080
645c22ef
DM
6081Compares the strings in two SVs in a locale-aware manner. Is UTF-8 and
6082'use bytes' aware, handles get magic, and will coerce its args to strings
6083if necessary. See also C<sv_cmp>.
c461cf8f
JH
6084
6085=cut
6086*/
6087
bbce6d69 6088I32
864dbfa3 6089Perl_sv_cmp_locale(pTHX_ register SV *sv1, register SV *sv2)
bbce6d69 6090{
97aff369 6091 dVAR;
36477c24 6092#ifdef USE_LOCALE_COLLATE
16660edb 6093
bbce6d69 6094 char *pv1, *pv2;
6095 STRLEN len1, len2;
6096 I32 retval;
16660edb 6097
3280af22 6098 if (PL_collation_standard)
bbce6d69 6099 goto raw_compare;
16660edb 6100
bbce6d69 6101 len1 = 0;
8ac85365 6102 pv1 = sv1 ? sv_collxfrm(sv1, &len1) : (char *) NULL;
bbce6d69 6103 len2 = 0;
8ac85365 6104 pv2 = sv2 ? sv_collxfrm(sv2, &len2) : (char *) NULL;
16660edb 6105
bbce6d69 6106 if (!pv1 || !len1) {
6107 if (pv2 && len2)
6108 return -1;
6109 else
6110 goto raw_compare;
6111 }
6112 else {
6113 if (!pv2 || !len2)
6114 return 1;
6115 }
16660edb 6116
bbce6d69 6117 retval = memcmp((void*)pv1, (void*)pv2, len1 < len2 ? len1 : len2);
16660edb 6118
bbce6d69 6119 if (retval)
16660edb 6120 return retval < 0 ? -1 : 1;
6121
bbce6d69 6122 /*
6123 * When the result of collation is equality, that doesn't mean
6124 * that there are no differences -- some locales exclude some
6125 * characters from consideration. So to avoid false equalities,
6126 * we use the raw string as a tiebreaker.
6127 */
16660edb 6128
bbce6d69 6129 raw_compare:
5f66b61c 6130 /*FALLTHROUGH*/
16660edb 6131
36477c24 6132#endif /* USE_LOCALE_COLLATE */
16660edb 6133
bbce6d69 6134 return sv_cmp(sv1, sv2);
6135}
79072805 6136
645c22ef 6137
36477c24 6138#ifdef USE_LOCALE_COLLATE
645c22ef 6139
7a4c00b4 6140/*
645c22ef
DM
6141=for apidoc sv_collxfrm
6142
6143Add Collate Transform magic to an SV if it doesn't already have it.
6144
6145Any scalar variable may carry PERL_MAGIC_collxfrm magic that contains the
6146scalar data of the variable, but transformed to such a format that a normal
6147memory comparison can be used to compare the data according to the locale
6148settings.
6149
6150=cut
6151*/
6152
bbce6d69 6153char *
864dbfa3 6154Perl_sv_collxfrm(pTHX_ SV *sv, STRLEN *nxp)
bbce6d69 6155{
97aff369 6156 dVAR;
7a4c00b4 6157 MAGIC *mg;
16660edb 6158
14befaf4 6159 mg = SvMAGICAL(sv) ? mg_find(sv, PERL_MAGIC_collxfrm) : (MAGIC *) NULL;
3280af22 6160 if (!mg || !mg->mg_ptr || *(U32*)mg->mg_ptr != PL_collation_ix) {
93524f2b
NC
6161 const char *s;
6162 char *xf;
bbce6d69 6163 STRLEN len, xlen;
6164
7a4c00b4 6165 if (mg)
6166 Safefree(mg->mg_ptr);
93524f2b 6167 s = SvPV_const(sv, len);
bbce6d69 6168 if ((xf = mem_collxfrm(s, len, &xlen))) {
ff0cee69 6169 if (SvREADONLY(sv)) {
6170 SAVEFREEPV(xf);
6171 *nxp = xlen;
3280af22 6172 return xf + sizeof(PL_collation_ix);
ff0cee69 6173 }
7a4c00b4 6174 if (! mg) {
d83f0a82
NC
6175#ifdef PERL_OLD_COPY_ON_WRITE
6176 if (SvIsCOW(sv))
6177 sv_force_normal_flags(sv, 0);
6178#endif
6179 mg = sv_magicext(sv, 0, PERL_MAGIC_collxfrm, &PL_vtbl_collxfrm,
6180 0, 0);
7a4c00b4 6181 assert(mg);
bbce6d69 6182 }
7a4c00b4 6183 mg->mg_ptr = xf;
565764a8 6184 mg->mg_len = xlen;
7a4c00b4 6185 }
6186 else {
ff0cee69 6187 if (mg) {
6188 mg->mg_ptr = NULL;
565764a8 6189 mg->mg_len = -1;
ff0cee69 6190 }
bbce6d69 6191 }
6192 }
7a4c00b4 6193 if (mg && mg->mg_ptr) {
565764a8 6194 *nxp = mg->mg_len;
3280af22 6195 return mg->mg_ptr + sizeof(PL_collation_ix);
bbce6d69 6196 }
6197 else {
6198 *nxp = 0;
6199 return NULL;
16660edb 6200 }
79072805
LW
6201}
6202
36477c24 6203#endif /* USE_LOCALE_COLLATE */
bbce6d69 6204
c461cf8f
JH
6205/*
6206=for apidoc sv_gets
6207
6208Get a line from the filehandle and store it into the SV, optionally
6209appending to the currently-stored string.
6210
6211=cut
6212*/
6213
79072805 6214char *
864dbfa3 6215Perl_sv_gets(pTHX_ register SV *sv, register PerlIO *fp, I32 append)
79072805 6216{
97aff369 6217 dVAR;
e1ec3a88 6218 const char *rsptr;
c07a80fd 6219 STRLEN rslen;
6220 register STDCHAR rslast;
6221 register STDCHAR *bp;
6222 register I32 cnt;
9c5ffd7c 6223 I32 i = 0;
8bfdd7d9 6224 I32 rspara = 0;
c07a80fd 6225
bc44a8a2
NC
6226 if (SvTHINKFIRST(sv))
6227 sv_force_normal_flags(sv, append ? 0 : SV_COW_DROP_PV);
765f542d
NC
6228 /* XXX. If you make this PVIV, then copy on write can copy scalars read
6229 from <>.
6230 However, perlbench says it's slower, because the existing swipe code
6231 is faster than copy on write.
6232 Swings and roundabouts. */
862a34c6 6233 SvUPGRADE(sv, SVt_PV);
99491443 6234
ff68c719 6235 SvSCREAM_off(sv);
efd8b2ba
AE
6236
6237 if (append) {
6238 if (PerlIO_isutf8(fp)) {
6239 if (!SvUTF8(sv)) {
6240 sv_utf8_upgrade_nomg(sv);
6241 sv_pos_u2b(sv,&append,0);
6242 }
6243 } else if (SvUTF8(sv)) {
561b68a9 6244 SV * const tsv = newSV(0);
efd8b2ba
AE
6245 sv_gets(tsv, fp, 0);
6246 sv_utf8_upgrade_nomg(tsv);
6247 SvCUR_set(sv,append);
6248 sv_catsv(sv,tsv);
6249 sv_free(tsv);
6250 goto return_string_or_null;
6251 }
6252 }
6253
6254 SvPOK_only(sv);
6255 if (PerlIO_isutf8(fp))
6256 SvUTF8_on(sv);
c07a80fd 6257
923e4eb5 6258 if (IN_PERL_COMPILETIME) {
8bfdd7d9
HS
6259 /* we always read code in line mode */
6260 rsptr = "\n";
6261 rslen = 1;
6262 }
6263 else if (RsSNARF(PL_rs)) {
7a5fa8a2 6264 /* If it is a regular disk file use size from stat() as estimate
acbd132f
JH
6265 of amount we are going to read -- may result in mallocing
6266 more memory than we really need if the layers below reduce
6267 the size we read (e.g. CRLF or a gzip layer).
e468d35b 6268 */
e311fd51 6269 Stat_t st;
e468d35b 6270 if (!PerlLIO_fstat(PerlIO_fileno(fp), &st) && S_ISREG(st.st_mode)) {
f54cb97a 6271 const Off_t offset = PerlIO_tell(fp);
58f1856e 6272 if (offset != (Off_t) -1 && st.st_size + append > offset) {
e468d35b
NIS
6273 (void) SvGROW(sv, (STRLEN)((st.st_size - offset) + append + 1));
6274 }
6275 }
c07a80fd 6276 rsptr = NULL;
6277 rslen = 0;
6278 }
3280af22 6279 else if (RsRECORD(PL_rs)) {
e311fd51 6280 I32 bytesread;
5b2b9c68 6281 char *buffer;
acbd132f 6282 U32 recsize;
5b2b9c68
HM
6283
6284 /* Grab the size of the record we're getting */
acbd132f 6285 recsize = SvUV(SvRV(PL_rs)); /* RsRECORD() guarantees > 0. */
e311fd51 6286 buffer = SvGROW(sv, (STRLEN)(recsize + append + 1)) + append;
5b2b9c68
HM
6287 /* Go yank in */
6288#ifdef VMS
6289 /* VMS wants read instead of fread, because fread doesn't respect */
6290 /* RMS record boundaries. This is not necessarily a good thing to be */
e468d35b
NIS
6291 /* doing, but we've got no other real choice - except avoid stdio
6292 as implementation - perhaps write a :vms layer ?
6293 */
5b2b9c68
HM
6294 bytesread = PerlLIO_read(PerlIO_fileno(fp), buffer, recsize);
6295#else
6296 bytesread = PerlIO_read(fp, buffer, recsize);
6297#endif
27e6ca2d
AE
6298 if (bytesread < 0)
6299 bytesread = 0;
e311fd51 6300 SvCUR_set(sv, bytesread += append);
e670df4e 6301 buffer[bytesread] = '\0';
efd8b2ba 6302 goto return_string_or_null;
5b2b9c68 6303 }
3280af22 6304 else if (RsPARA(PL_rs)) {
c07a80fd 6305 rsptr = "\n\n";
6306 rslen = 2;
8bfdd7d9 6307 rspara = 1;
c07a80fd 6308 }
7d59b7e4
NIS
6309 else {
6310 /* Get $/ i.e. PL_rs into same encoding as stream wants */
6311 if (PerlIO_isutf8(fp)) {
6312 rsptr = SvPVutf8(PL_rs, rslen);
6313 }
6314 else {
6315 if (SvUTF8(PL_rs)) {
6316 if (!sv_utf8_downgrade(PL_rs, TRUE)) {
6317 Perl_croak(aTHX_ "Wide character in $/");
6318 }
6319 }
93524f2b 6320 rsptr = SvPV_const(PL_rs, rslen);
7d59b7e4
NIS
6321 }
6322 }
6323
c07a80fd 6324 rslast = rslen ? rsptr[rslen - 1] : '\0';
6325
8bfdd7d9 6326 if (rspara) { /* have to do this both before and after */
79072805 6327 do { /* to make sure file boundaries work right */
760ac839 6328 if (PerlIO_eof(fp))
a0d0e21e 6329 return 0;
760ac839 6330 i = PerlIO_getc(fp);
79072805 6331 if (i != '\n') {
a0d0e21e
LW
6332 if (i == -1)
6333 return 0;
760ac839 6334 PerlIO_ungetc(fp,i);
79072805
LW
6335 break;
6336 }
6337 } while (i != EOF);
6338 }
c07a80fd 6339
760ac839
LW
6340 /* See if we know enough about I/O mechanism to cheat it ! */
6341
6342 /* This used to be #ifdef test - it is made run-time test for ease
1c846c1f 6343 of abstracting out stdio interface. One call should be cheap
760ac839
LW
6344 enough here - and may even be a macro allowing compile
6345 time optimization.
6346 */
6347
6348 if (PerlIO_fast_gets(fp)) {
6349
6350 /*
6351 * We're going to steal some values from the stdio struct
6352 * and put EVERYTHING in the innermost loop into registers.
6353 */
6354 register STDCHAR *ptr;
6355 STRLEN bpx;
6356 I32 shortbuffered;
6357
16660edb 6358#if defined(VMS) && defined(PERLIO_IS_STDIO)
6359 /* An ungetc()d char is handled separately from the regular
6360 * buffer, so we getc() it back out and stuff it in the buffer.
6361 */
6362 i = PerlIO_getc(fp);
6363 if (i == EOF) return 0;
6364 *(--((*fp)->_ptr)) = (unsigned char) i;
6365 (*fp)->_cnt++;
6366#endif
c07a80fd 6367
c2960299 6368 /* Here is some breathtakingly efficient cheating */
c07a80fd 6369
a20bf0c3 6370 cnt = PerlIO_get_cnt(fp); /* get count into register */
e468d35b 6371 /* make sure we have the room */
7a5fa8a2 6372 if ((I32)(SvLEN(sv) - append) <= cnt + 1) {
e468d35b 6373 /* Not room for all of it
7a5fa8a2 6374 if we are looking for a separator and room for some
e468d35b
NIS
6375 */
6376 if (rslen && cnt > 80 && (I32)SvLEN(sv) > append) {
7a5fa8a2 6377 /* just process what we have room for */
79072805
LW
6378 shortbuffered = cnt - SvLEN(sv) + append + 1;
6379 cnt -= shortbuffered;
6380 }
6381 else {
6382 shortbuffered = 0;
bbce6d69 6383 /* remember that cnt can be negative */
eb160463 6384 SvGROW(sv, (STRLEN)(append + (cnt <= 0 ? 2 : (cnt + 1))));
79072805
LW
6385 }
6386 }
7a5fa8a2 6387 else
79072805 6388 shortbuffered = 0;
3f7c398e 6389 bp = (STDCHAR*)SvPVX_const(sv) + append; /* move these two too to registers */
a20bf0c3 6390 ptr = (STDCHAR*)PerlIO_get_ptr(fp);
16660edb 6391 DEBUG_P(PerlIO_printf(Perl_debug_log,
1d7c1841 6392 "Screamer: entering, ptr=%"UVuf", cnt=%ld\n",PTR2UV(ptr),(long)cnt));
16660edb 6393 DEBUG_P(PerlIO_printf(Perl_debug_log,
ba7abf9d 6394 "Screamer: entering: PerlIO * thinks ptr=%"UVuf", cnt=%ld, base=%"UVuf"\n",
1c846c1f 6395 PTR2UV(PerlIO_get_ptr(fp)), (long)PerlIO_get_cnt(fp),
1d7c1841 6396 PTR2UV(PerlIO_has_base(fp) ? PerlIO_get_base(fp) : 0)));
79072805
LW
6397 for (;;) {
6398 screamer:
93a17b20 6399 if (cnt > 0) {
c07a80fd 6400 if (rslen) {
760ac839
LW
6401 while (cnt > 0) { /* this | eat */
6402 cnt--;
c07a80fd 6403 if ((*bp++ = *ptr++) == rslast) /* really | dust */
6404 goto thats_all_folks; /* screams | sed :-) */
6405 }
6406 }
6407 else {
1c846c1f
NIS
6408 Copy(ptr, bp, cnt, char); /* this | eat */
6409 bp += cnt; /* screams | dust */
c07a80fd 6410 ptr += cnt; /* louder | sed :-) */
a5f75d66 6411 cnt = 0;
93a17b20 6412 }
79072805
LW
6413 }
6414
748a9306 6415 if (shortbuffered) { /* oh well, must extend */
79072805
LW
6416 cnt = shortbuffered;
6417 shortbuffered = 0;
3f7c398e 6418 bpx = bp - (STDCHAR*)SvPVX_const(sv); /* box up before relocation */
79072805
LW
6419 SvCUR_set(sv, bpx);
6420 SvGROW(sv, SvLEN(sv) + append + cnt + 2);
3f7c398e 6421 bp = (STDCHAR*)SvPVX_const(sv) + bpx; /* unbox after relocation */
79072805
LW
6422 continue;
6423 }
6424
16660edb 6425 DEBUG_P(PerlIO_printf(Perl_debug_log,
1d7c1841
GS
6426 "Screamer: going to getc, ptr=%"UVuf", cnt=%ld\n",
6427 PTR2UV(ptr),(long)cnt));
cc00df79 6428 PerlIO_set_ptrcnt(fp, (STDCHAR*)ptr, cnt); /* deregisterize cnt and ptr */
ba7abf9d 6429#if 0
16660edb 6430 DEBUG_P(PerlIO_printf(Perl_debug_log,
1d7c1841 6431 "Screamer: pre: FILE * thinks ptr=%"UVuf", cnt=%ld, base=%"UVuf"\n",
1c846c1f 6432 PTR2UV(PerlIO_get_ptr(fp)), (long)PerlIO_get_cnt(fp),
1d7c1841 6433 PTR2UV(PerlIO_has_base (fp) ? PerlIO_get_base(fp) : 0)));
ba7abf9d 6434#endif
1c846c1f 6435 /* This used to call 'filbuf' in stdio form, but as that behaves like
774d564b 6436 getc when cnt <= 0 we use PerlIO_getc here to avoid introducing
6437 another abstraction. */
760ac839 6438 i = PerlIO_getc(fp); /* get more characters */
ba7abf9d 6439#if 0
16660edb 6440 DEBUG_P(PerlIO_printf(Perl_debug_log,
1d7c1841 6441 "Screamer: post: FILE * thinks ptr=%"UVuf", cnt=%ld, base=%"UVuf"\n",
1c846c1f 6442 PTR2UV(PerlIO_get_ptr(fp)), (long)PerlIO_get_cnt(fp),
1d7c1841 6443 PTR2UV(PerlIO_has_base (fp) ? PerlIO_get_base(fp) : 0)));
ba7abf9d 6444#endif
a20bf0c3
JH
6445 cnt = PerlIO_get_cnt(fp);
6446 ptr = (STDCHAR*)PerlIO_get_ptr(fp); /* reregisterize cnt and ptr */
16660edb 6447 DEBUG_P(PerlIO_printf(Perl_debug_log,
1d7c1841 6448 "Screamer: after getc, ptr=%"UVuf", cnt=%ld\n",PTR2UV(ptr),(long)cnt));
79072805 6449
748a9306
LW
6450 if (i == EOF) /* all done for ever? */
6451 goto thats_really_all_folks;
6452
3f7c398e 6453 bpx = bp - (STDCHAR*)SvPVX_const(sv); /* box up before relocation */
79072805
LW
6454 SvCUR_set(sv, bpx);
6455 SvGROW(sv, bpx + cnt + 2);
3f7c398e 6456 bp = (STDCHAR*)SvPVX_const(sv) + bpx; /* unbox after relocation */
c07a80fd 6457
eb160463 6458 *bp++ = (STDCHAR)i; /* store character from PerlIO_getc */
79072805 6459
c07a80fd 6460 if (rslen && (STDCHAR)i == rslast) /* all done for now? */
79072805 6461 goto thats_all_folks;
79072805
LW
6462 }
6463
6464thats_all_folks:
3f7c398e 6465 if ((rslen > 1 && (STRLEN)(bp - (STDCHAR*)SvPVX_const(sv)) < rslen) ||
36477c24 6466 memNE((char*)bp - rslen, rsptr, rslen))
760ac839 6467 goto screamer; /* go back to the fray */
79072805
LW
6468thats_really_all_folks:
6469 if (shortbuffered)
6470 cnt += shortbuffered;
16660edb 6471 DEBUG_P(PerlIO_printf(Perl_debug_log,
1d7c1841 6472 "Screamer: quitting, ptr=%"UVuf", cnt=%ld\n",PTR2UV(ptr),(long)cnt));
cc00df79 6473 PerlIO_set_ptrcnt(fp, (STDCHAR*)ptr, cnt); /* put these back or we're in trouble */
16660edb 6474 DEBUG_P(PerlIO_printf(Perl_debug_log,
1d7c1841 6475 "Screamer: end: FILE * thinks ptr=%"UVuf", cnt=%ld, base=%"UVuf"\n",
1c846c1f 6476 PTR2UV(PerlIO_get_ptr(fp)), (long)PerlIO_get_cnt(fp),
1d7c1841 6477 PTR2UV(PerlIO_has_base (fp) ? PerlIO_get_base(fp) : 0)));
79072805 6478 *bp = '\0';
3f7c398e 6479 SvCUR_set(sv, bp - (STDCHAR*)SvPVX_const(sv)); /* set length */
16660edb 6480 DEBUG_P(PerlIO_printf(Perl_debug_log,
fb73857a 6481 "Screamer: done, len=%ld, string=|%.*s|\n",
3f7c398e 6482 (long)SvCUR(sv),(int)SvCUR(sv),SvPVX_const(sv)));
760ac839
LW
6483 }
6484 else
79072805 6485 {
6edd2cd5 6486 /*The big, slow, and stupid way. */
27da23d5 6487#ifdef USE_HEAP_INSTEAD_OF_STACK /* Even slower way. */
cbbf8932 6488 STDCHAR *buf = NULL;
a02a5408 6489 Newx(buf, 8192, STDCHAR);
6edd2cd5 6490 assert(buf);
4d2c4e07 6491#else
6edd2cd5 6492 STDCHAR buf[8192];
4d2c4e07 6493#endif
79072805 6494
760ac839 6495screamer2:
c07a80fd 6496 if (rslen) {
00b6aa41 6497 register const STDCHAR * const bpe = buf + sizeof(buf);
760ac839 6498 bp = buf;
eb160463 6499 while ((i = PerlIO_getc(fp)) != EOF && (*bp++ = (STDCHAR)i) != rslast && bp < bpe)
760ac839
LW
6500 ; /* keep reading */
6501 cnt = bp - buf;
c07a80fd 6502 }
6503 else {
760ac839 6504 cnt = PerlIO_read(fp,(char*)buf, sizeof(buf));
16660edb 6505 /* Accomodate broken VAXC compiler, which applies U8 cast to
6506 * both args of ?: operator, causing EOF to change into 255
6507 */
37be0adf 6508 if (cnt > 0)
cbe9e203
JH
6509 i = (U8)buf[cnt - 1];
6510 else
37be0adf 6511 i = EOF;
c07a80fd 6512 }
79072805 6513
cbe9e203
JH
6514 if (cnt < 0)
6515 cnt = 0; /* we do need to re-set the sv even when cnt <= 0 */
6516 if (append)
6517 sv_catpvn(sv, (char *) buf, cnt);
6518 else
6519 sv_setpvn(sv, (char *) buf, cnt);
c07a80fd 6520
6521 if (i != EOF && /* joy */
6522 (!rslen ||
6523 SvCUR(sv) < rslen ||
3f7c398e 6524 memNE(SvPVX_const(sv) + SvCUR(sv) - rslen, rsptr, rslen)))
79072805
LW
6525 {
6526 append = -1;
63e4d877
CS
6527 /*
6528 * If we're reading from a TTY and we get a short read,
6529 * indicating that the user hit his EOF character, we need
6530 * to notice it now, because if we try to read from the TTY
6531 * again, the EOF condition will disappear.
6532 *
6533 * The comparison of cnt to sizeof(buf) is an optimization
6534 * that prevents unnecessary calls to feof().
6535 *
6536 * - jik 9/25/96
6537 */
bb7a0f54 6538 if (!(cnt < (I32)sizeof(buf) && PerlIO_eof(fp)))
63e4d877 6539 goto screamer2;
79072805 6540 }
6edd2cd5 6541
27da23d5 6542#ifdef USE_HEAP_INSTEAD_OF_STACK
6edd2cd5
JH
6543 Safefree(buf);
6544#endif
79072805
LW
6545 }
6546
8bfdd7d9 6547 if (rspara) { /* have to do this both before and after */
c07a80fd 6548 while (i != EOF) { /* to make sure file boundaries work right */
760ac839 6549 i = PerlIO_getc(fp);
79072805 6550 if (i != '\n') {
760ac839 6551 PerlIO_ungetc(fp,i);
79072805
LW
6552 break;
6553 }
6554 }
6555 }
c07a80fd 6556
efd8b2ba 6557return_string_or_null:
bd61b366 6558 return (SvCUR(sv) - append) ? SvPVX(sv) : NULL;
79072805
LW
6559}
6560
954c1994
GS
6561/*
6562=for apidoc sv_inc
6563
645c22ef
DM
6564Auto-increment of the value in the SV, doing string to numeric conversion
6565if necessary. Handles 'get' magic.
954c1994
GS
6566
6567=cut
6568*/
6569
79072805 6570void
864dbfa3 6571Perl_sv_inc(pTHX_ register SV *sv)
79072805 6572{
97aff369 6573 dVAR;
79072805 6574 register char *d;
463ee0b2 6575 int flags;
79072805
LW
6576
6577 if (!sv)
6578 return;
5b295bef 6579 SvGETMAGIC(sv);
ed6116ce 6580 if (SvTHINKFIRST(sv)) {
765f542d
NC
6581 if (SvIsCOW(sv))
6582 sv_force_normal_flags(sv, 0);
0f15f207 6583 if (SvREADONLY(sv)) {
923e4eb5 6584 if (IN_PERL_RUNTIME)
cea2e8a9 6585 Perl_croak(aTHX_ PL_no_modify);
0f15f207 6586 }
a0d0e21e 6587 if (SvROK(sv)) {
b5be31e9 6588 IV i;
9e7bc3e8
JD
6589 if (SvAMAGIC(sv) && AMG_CALLun(sv,inc))
6590 return;
56431972 6591 i = PTR2IV(SvRV(sv));
b5be31e9
SM
6592 sv_unref(sv);
6593 sv_setiv(sv, i);
a0d0e21e 6594 }
ed6116ce 6595 }
8990e307 6596 flags = SvFLAGS(sv);
28e5dec8
JH
6597 if ((flags & (SVp_NOK|SVp_IOK)) == SVp_NOK) {
6598 /* It's (privately or publicly) a float, but not tested as an
6599 integer, so test it to see. */
d460ef45 6600 (void) SvIV(sv);
28e5dec8
JH
6601 flags = SvFLAGS(sv);
6602 }
6603 if ((flags & SVf_IOK) || ((flags & (SVp_IOK | SVp_NOK)) == SVp_IOK)) {
6604 /* It's publicly an integer, or privately an integer-not-float */
59d8ce62 6605#ifdef PERL_PRESERVE_IVUV
28e5dec8 6606 oops_its_int:
59d8ce62 6607#endif
25da4f38
IZ
6608 if (SvIsUV(sv)) {
6609 if (SvUVX(sv) == UV_MAX)
a1e868e7 6610 sv_setnv(sv, UV_MAX_P1);
25da4f38
IZ
6611 else
6612 (void)SvIOK_only_UV(sv);
607fa7f2 6613 SvUV_set(sv, SvUVX(sv) + 1);
25da4f38
IZ
6614 } else {
6615 if (SvIVX(sv) == IV_MAX)
28e5dec8 6616 sv_setuv(sv, (UV)IV_MAX + 1);
25da4f38
IZ
6617 else {
6618 (void)SvIOK_only(sv);
45977657 6619 SvIV_set(sv, SvIVX(sv) + 1);
1c846c1f 6620 }
55497cff 6621 }
79072805
LW
6622 return;
6623 }
28e5dec8
JH
6624 if (flags & SVp_NOK) {
6625 (void)SvNOK_only(sv);
9d6ce603 6626 SvNV_set(sv, SvNVX(sv) + 1.0);
28e5dec8
JH
6627 return;
6628 }
6629
3f7c398e 6630 if (!(flags & SVp_POK) || !*SvPVX_const(sv)) {
28e5dec8 6631 if ((flags & SVTYPEMASK) < SVt_PVIV)
f5282e15 6632 sv_upgrade(sv, ((flags & SVTYPEMASK) > SVt_IV ? SVt_PVIV : SVt_IV));
28e5dec8 6633 (void)SvIOK_only(sv);
45977657 6634 SvIV_set(sv, 1);
79072805
LW
6635 return;
6636 }
463ee0b2 6637 d = SvPVX(sv);
79072805
LW
6638 while (isALPHA(*d)) d++;
6639 while (isDIGIT(*d)) d++;
6640 if (*d) {
28e5dec8 6641#ifdef PERL_PRESERVE_IVUV
d1be9408 6642 /* Got to punt this as an integer if needs be, but we don't issue
28e5dec8
JH
6643 warnings. Probably ought to make the sv_iv_please() that does
6644 the conversion if possible, and silently. */
504618e9 6645 const int numtype = grok_number(SvPVX_const(sv), SvCUR(sv), NULL);
28e5dec8
JH
6646 if (numtype && !(numtype & IS_NUMBER_INFINITY)) {
6647 /* Need to try really hard to see if it's an integer.
6648 9.22337203685478e+18 is an integer.
6649 but "9.22337203685478e+18" + 0 is UV=9223372036854779904
6650 so $a="9.22337203685478e+18"; $a+0; $a++
6651 needs to be the same as $a="9.22337203685478e+18"; $a++
6652 or we go insane. */
d460ef45 6653
28e5dec8
JH
6654 (void) sv_2iv(sv);
6655 if (SvIOK(sv))
6656 goto oops_its_int;
6657
6658 /* sv_2iv *should* have made this an NV */
6659 if (flags & SVp_NOK) {
6660 (void)SvNOK_only(sv);
9d6ce603 6661 SvNV_set(sv, SvNVX(sv) + 1.0);
28e5dec8
JH
6662 return;
6663 }
6664 /* I don't think we can get here. Maybe I should assert this
6665 And if we do get here I suspect that sv_setnv will croak. NWC
6666 Fall through. */
6667#if defined(USE_LONG_DOUBLE)
6668 DEBUG_c(PerlIO_printf(Perl_debug_log,"sv_inc punt failed to convert '%s' to IOK or NOKp, UV=0x%"UVxf" NV=%"PERL_PRIgldbl"\n",
3f7c398e 6669 SvPVX_const(sv), SvIVX(sv), SvNVX(sv)));
28e5dec8 6670#else
1779d84d 6671 DEBUG_c(PerlIO_printf(Perl_debug_log,"sv_inc punt failed to convert '%s' to IOK or NOKp, UV=0x%"UVxf" NV=%"NVgf"\n",
3f7c398e 6672 SvPVX_const(sv), SvIVX(sv), SvNVX(sv)));
28e5dec8
JH
6673#endif
6674 }
6675#endif /* PERL_PRESERVE_IVUV */
3f7c398e 6676 sv_setnv(sv,Atof(SvPVX_const(sv)) + 1.0);
79072805
LW
6677 return;
6678 }
6679 d--;
3f7c398e 6680 while (d >= SvPVX_const(sv)) {
79072805
LW
6681 if (isDIGIT(*d)) {
6682 if (++*d <= '9')
6683 return;
6684 *(d--) = '0';
6685 }
6686 else {
9d116dd7
JH
6687#ifdef EBCDIC
6688 /* MKS: The original code here died if letters weren't consecutive.
6689 * at least it didn't have to worry about non-C locales. The
6690 * new code assumes that ('z'-'a')==('Z'-'A'), letters are
1c846c1f 6691 * arranged in order (although not consecutively) and that only
9d116dd7
JH
6692 * [A-Za-z] are accepted by isALPHA in the C locale.
6693 */
6694 if (*d != 'z' && *d != 'Z') {
6695 do { ++*d; } while (!isALPHA(*d));
6696 return;
6697 }
6698 *(d--) -= 'z' - 'a';
6699#else
79072805
LW
6700 ++*d;
6701 if (isALPHA(*d))
6702 return;
6703 *(d--) -= 'z' - 'a' + 1;
9d116dd7 6704#endif
79072805
LW
6705 }
6706 }
6707 /* oh,oh, the number grew */
6708 SvGROW(sv, SvCUR(sv) + 2);
b162af07 6709 SvCUR_set(sv, SvCUR(sv) + 1);
3f7c398e 6710 for (d = SvPVX(sv) + SvCUR(sv); d > SvPVX_const(sv); d--)
79072805
LW
6711 *d = d[-1];
6712 if (isDIGIT(d[1]))
6713 *d = '1';
6714 else
6715 *d = d[1];
6716}
6717
954c1994
GS
6718/*
6719=for apidoc sv_dec
6720
645c22ef
DM
6721Auto-decrement of the value in the SV, doing string to numeric conversion
6722if necessary. Handles 'get' magic.
954c1994
GS
6723
6724=cut
6725*/
6726
79072805 6727void
864dbfa3 6728Perl_sv_dec(pTHX_ register SV *sv)
79072805 6729{
97aff369 6730 dVAR;
463ee0b2
LW
6731 int flags;
6732
79072805
LW
6733 if (!sv)
6734 return;
5b295bef 6735 SvGETMAGIC(sv);
ed6116ce 6736 if (SvTHINKFIRST(sv)) {
765f542d
NC
6737 if (SvIsCOW(sv))
6738 sv_force_normal_flags(sv, 0);
0f15f207 6739 if (SvREADONLY(sv)) {
923e4eb5 6740 if (IN_PERL_RUNTIME)
cea2e8a9 6741 Perl_croak(aTHX_ PL_no_modify);
0f15f207 6742 }
a0d0e21e 6743 if (SvROK(sv)) {
b5be31e9 6744 IV i;
9e7bc3e8
JD
6745 if (SvAMAGIC(sv) && AMG_CALLun(sv,dec))
6746 return;
56431972 6747 i = PTR2IV(SvRV(sv));
b5be31e9
SM
6748 sv_unref(sv);
6749 sv_setiv(sv, i);
a0d0e21e 6750 }
ed6116ce 6751 }
28e5dec8
JH
6752 /* Unlike sv_inc we don't have to worry about string-never-numbers
6753 and keeping them magic. But we mustn't warn on punting */
8990e307 6754 flags = SvFLAGS(sv);
28e5dec8
JH
6755 if ((flags & SVf_IOK) || ((flags & (SVp_IOK | SVp_NOK)) == SVp_IOK)) {
6756 /* It's publicly an integer, or privately an integer-not-float */
59d8ce62 6757#ifdef PERL_PRESERVE_IVUV
28e5dec8 6758 oops_its_int:
59d8ce62 6759#endif
25da4f38
IZ
6760 if (SvIsUV(sv)) {
6761 if (SvUVX(sv) == 0) {
6762 (void)SvIOK_only(sv);
45977657 6763 SvIV_set(sv, -1);
25da4f38
IZ
6764 }
6765 else {
6766 (void)SvIOK_only_UV(sv);
f4eee32f 6767 SvUV_set(sv, SvUVX(sv) - 1);
1c846c1f 6768 }
25da4f38
IZ
6769 } else {
6770 if (SvIVX(sv) == IV_MIN)
65202027 6771 sv_setnv(sv, (NV)IV_MIN - 1.0);
25da4f38
IZ
6772 else {
6773 (void)SvIOK_only(sv);
45977657 6774 SvIV_set(sv, SvIVX(sv) - 1);
1c846c1f 6775 }
55497cff 6776 }
6777 return;
6778 }
28e5dec8 6779 if (flags & SVp_NOK) {
9d6ce603 6780 SvNV_set(sv, SvNVX(sv) - 1.0);
28e5dec8
JH
6781 (void)SvNOK_only(sv);
6782 return;
6783 }
8990e307 6784 if (!(flags & SVp_POK)) {
ef088171
NC
6785 if ((flags & SVTYPEMASK) < SVt_PVIV)
6786 sv_upgrade(sv, ((flags & SVTYPEMASK) > SVt_IV) ? SVt_PVIV : SVt_IV);
6787 SvIV_set(sv, -1);
6788 (void)SvIOK_only(sv);
79072805
LW
6789 return;
6790 }
28e5dec8
JH
6791#ifdef PERL_PRESERVE_IVUV
6792 {
504618e9 6793 const int numtype = grok_number(SvPVX_const(sv), SvCUR(sv), NULL);
28e5dec8
JH
6794 if (numtype && !(numtype & IS_NUMBER_INFINITY)) {
6795 /* Need to try really hard to see if it's an integer.
6796 9.22337203685478e+18 is an integer.
6797 but "9.22337203685478e+18" + 0 is UV=9223372036854779904
6798 so $a="9.22337203685478e+18"; $a+0; $a--
6799 needs to be the same as $a="9.22337203685478e+18"; $a--
6800 or we go insane. */
d460ef45 6801
28e5dec8
JH
6802 (void) sv_2iv(sv);
6803 if (SvIOK(sv))
6804 goto oops_its_int;
6805
6806 /* sv_2iv *should* have made this an NV */
6807 if (flags & SVp_NOK) {
6808 (void)SvNOK_only(sv);
9d6ce603 6809 SvNV_set(sv, SvNVX(sv) - 1.0);
28e5dec8
JH
6810 return;
6811 }
6812 /* I don't think we can get here. Maybe I should assert this
6813 And if we do get here I suspect that sv_setnv will croak. NWC
6814 Fall through. */
6815#if defined(USE_LONG_DOUBLE)
6816 DEBUG_c(PerlIO_printf(Perl_debug_log,"sv_dec punt failed to convert '%s' to IOK or NOKp, UV=0x%"UVxf" NV=%"PERL_PRIgldbl"\n",
3f7c398e 6817 SvPVX_const(sv), SvIVX(sv), SvNVX(sv)));
28e5dec8 6818#else
1779d84d 6819 DEBUG_c(PerlIO_printf(Perl_debug_log,"sv_dec punt failed to convert '%s' to IOK or NOKp, UV=0x%"UVxf" NV=%"NVgf"\n",
3f7c398e 6820 SvPVX_const(sv), SvIVX(sv), SvNVX(sv)));
28e5dec8
JH
6821#endif
6822 }
6823 }
6824#endif /* PERL_PRESERVE_IVUV */
3f7c398e 6825 sv_setnv(sv,Atof(SvPVX_const(sv)) - 1.0); /* punt */
79072805
LW
6826}
6827
954c1994
GS
6828/*
6829=for apidoc sv_mortalcopy
6830
645c22ef 6831Creates a new SV which is a copy of the original SV (using C<sv_setsv>).
d4236ebc
DM
6832The new SV is marked as mortal. It will be destroyed "soon", either by an
6833explicit call to FREETMPS, or by an implicit call at places such as
6834statement boundaries. See also C<sv_newmortal> and C<sv_2mortal>.
954c1994
GS
6835
6836=cut
6837*/
6838
79072805
LW
6839/* Make a string that will exist for the duration of the expression
6840 * evaluation. Actually, it may have to last longer than that, but
6841 * hopefully we won't free it until it has been assigned to a
6842 * permanent location. */
6843
6844SV *
864dbfa3 6845Perl_sv_mortalcopy(pTHX_ SV *oldstr)
79072805 6846{
97aff369 6847 dVAR;
463ee0b2 6848 register SV *sv;
b881518d 6849
4561caa4 6850 new_SV(sv);
79072805 6851 sv_setsv(sv,oldstr);
677b06e3
GS
6852 EXTEND_MORTAL(1);
6853 PL_tmps_stack[++PL_tmps_ix] = sv;
8990e307
LW
6854 SvTEMP_on(sv);
6855 return sv;
6856}
6857
954c1994
GS
6858/*
6859=for apidoc sv_newmortal
6860
645c22ef 6861Creates a new null SV which is mortal. The reference count of the SV is
d4236ebc
DM
6862set to 1. It will be destroyed "soon", either by an explicit call to
6863FREETMPS, or by an implicit call at places such as statement boundaries.
6864See also C<sv_mortalcopy> and C<sv_2mortal>.
954c1994
GS
6865
6866=cut
6867*/
6868
8990e307 6869SV *
864dbfa3 6870Perl_sv_newmortal(pTHX)
8990e307 6871{
97aff369 6872 dVAR;
8990e307
LW
6873 register SV *sv;
6874
4561caa4 6875 new_SV(sv);
8990e307 6876 SvFLAGS(sv) = SVs_TEMP;
677b06e3
GS
6877 EXTEND_MORTAL(1);
6878 PL_tmps_stack[++PL_tmps_ix] = sv;
79072805
LW
6879 return sv;
6880}
6881
954c1994
GS
6882/*
6883=for apidoc sv_2mortal
6884
d4236ebc
DM
6885Marks an existing SV as mortal. The SV will be destroyed "soon", either
6886by an explicit call to FREETMPS, or by an implicit call at places such as
37d2ac18
NC
6887statement boundaries. SvTEMP() is turned on which means that the SV's
6888string buffer can be "stolen" if this SV is copied. See also C<sv_newmortal>
6889and C<sv_mortalcopy>.
954c1994
GS
6890
6891=cut
6892*/
6893
79072805 6894SV *
864dbfa3 6895Perl_sv_2mortal(pTHX_ register SV *sv)
79072805 6896{
27da23d5 6897 dVAR;
79072805 6898 if (!sv)
7a5b473e 6899 return NULL;
d689ffdd 6900 if (SvREADONLY(sv) && SvIMMORTAL(sv))
11162842 6901 return sv;
677b06e3
GS
6902 EXTEND_MORTAL(1);
6903 PL_tmps_stack[++PL_tmps_ix] = sv;
8990e307 6904 SvTEMP_on(sv);
79072805
LW
6905 return sv;
6906}
6907
954c1994
GS
6908/*
6909=for apidoc newSVpv
6910
6911Creates a new SV and copies a string into it. The reference count for the
6912SV is set to 1. If C<len> is zero, Perl will compute the length using
6913strlen(). For efficiency, consider using C<newSVpvn> instead.
6914
6915=cut
6916*/
6917
79072805 6918SV *
864dbfa3 6919Perl_newSVpv(pTHX_ const char *s, STRLEN len)
79072805 6920{
97aff369 6921 dVAR;
463ee0b2 6922 register SV *sv;
79072805 6923
4561caa4 6924 new_SV(sv);
616d8c9c 6925 sv_setpvn(sv,s,len ? len : strlen(s));
79072805
LW
6926 return sv;
6927}
6928
954c1994
GS
6929/*
6930=for apidoc newSVpvn
6931
6932Creates a new SV and copies a string into it. The reference count for the
1c846c1f 6933SV is set to 1. Note that if C<len> is zero, Perl will create a zero length
954c1994 6934string. You are responsible for ensuring that the source string is at least
9e09f5f2 6935C<len> bytes long. If the C<s> argument is NULL the new SV will be undefined.
954c1994
GS
6936
6937=cut
6938*/
6939
9da1e3b5 6940SV *
864dbfa3 6941Perl_newSVpvn(pTHX_ const char *s, STRLEN len)
9da1e3b5 6942{
97aff369 6943 dVAR;
9da1e3b5
MUN
6944 register SV *sv;
6945
6946 new_SV(sv);
9da1e3b5
MUN
6947 sv_setpvn(sv,s,len);
6948 return sv;
6949}
6950
bd08039b
NC
6951
6952/*
926f8064 6953=for apidoc newSVhek
bd08039b
NC
6954
6955Creates a new SV from the hash key structure. It will generate scalars that
5aaec2b4
NC
6956point to the shared string table where possible. Returns a new (undefined)
6957SV if the hek is NULL.
bd08039b
NC
6958
6959=cut
6960*/
6961
6962SV *
c1b02ed8 6963Perl_newSVhek(pTHX_ const HEK *hek)
bd08039b 6964{
97aff369 6965 dVAR;
5aaec2b4
NC
6966 if (!hek) {
6967 SV *sv;
6968
6969 new_SV(sv);
6970 return sv;
6971 }
6972
bd08039b
NC
6973 if (HEK_LEN(hek) == HEf_SVKEY) {
6974 return newSVsv(*(SV**)HEK_KEY(hek));
6975 } else {
6976 const int flags = HEK_FLAGS(hek);
6977 if (flags & HVhek_WASUTF8) {
6978 /* Trouble :-)
6979 Andreas would like keys he put in as utf8 to come back as utf8
6980 */
6981 STRLEN utf8_len = HEK_LEN(hek);
b64e5050
AL
6982 const U8 *as_utf8 = bytes_to_utf8 ((U8*)HEK_KEY(hek), &utf8_len);
6983 SV * const sv = newSVpvn ((const char*)as_utf8, utf8_len);
bd08039b
NC
6984
6985 SvUTF8_on (sv);
6986 Safefree (as_utf8); /* bytes_to_utf8() allocates a new string */
6987 return sv;
45e34800 6988 } else if (flags & (HVhek_REHASH|HVhek_UNSHARED)) {
bd08039b
NC
6989 /* We don't have a pointer to the hv, so we have to replicate the
6990 flag into every HEK. This hv is using custom a hasing
6991 algorithm. Hence we can't return a shared string scalar, as
6992 that would contain the (wrong) hash value, and might get passed
45e34800
NC
6993 into an hv routine with a regular hash.
6994 Similarly, a hash that isn't using shared hash keys has to have
6995 the flag in every key so that we know not to try to call
6996 share_hek_kek on it. */
bd08039b 6997
b64e5050 6998 SV * const sv = newSVpvn (HEK_KEY(hek), HEK_LEN(hek));
bd08039b
NC
6999 if (HEK_UTF8(hek))
7000 SvUTF8_on (sv);
7001 return sv;
7002 }
7003 /* This will be overwhelminly the most common case. */
409dfe77
NC
7004 {
7005 /* Inline most of newSVpvn_share(), because share_hek_hek() is far
7006 more efficient than sharepvn(). */
7007 SV *sv;
7008
7009 new_SV(sv);
7010 sv_upgrade(sv, SVt_PV);
7011 SvPV_set(sv, (char *)HEK_KEY(share_hek_hek(hek)));
7012 SvCUR_set(sv, HEK_LEN(hek));
7013 SvLEN_set(sv, 0);
7014 SvREADONLY_on(sv);
7015 SvFAKE_on(sv);
7016 SvPOK_on(sv);
7017 if (HEK_UTF8(hek))
7018 SvUTF8_on(sv);
7019 return sv;
7020 }
bd08039b
NC
7021 }
7022}
7023
1c846c1f
NIS
7024/*
7025=for apidoc newSVpvn_share
7026
3f7c398e 7027Creates a new SV with its SvPVX_const pointing to a shared string in the string
645c22ef
DM
7028table. If the string does not already exist in the table, it is created
7029first. Turns on READONLY and FAKE. The string's hash is stored in the UV
7030slot of the SV; if the C<hash> parameter is non-zero, that value is used;
7031otherwise the hash is computed. The idea here is that as the string table
3f7c398e 7032is used for shared hash keys these strings will have SvPVX_const == HeKEY and
645c22ef 7033hash lookup will avoid string compare.
1c846c1f
NIS
7034
7035=cut
7036*/
7037
7038SV *
c3654f1a 7039Perl_newSVpvn_share(pTHX_ const char *src, I32 len, U32 hash)
1c846c1f 7040{
97aff369 7041 dVAR;
1c846c1f 7042 register SV *sv;
c3654f1a 7043 bool is_utf8 = FALSE;
a51caccf
NC
7044 const char *const orig_src = src;
7045
c3654f1a 7046 if (len < 0) {
77caf834 7047 STRLEN tmplen = -len;
c3654f1a 7048 is_utf8 = TRUE;
75a54232 7049 /* See the note in hv.c:hv_fetch() --jhi */
e1ec3a88 7050 src = (char*)bytes_from_utf8((const U8*)src, &tmplen, &is_utf8);
75a54232
JH
7051 len = tmplen;
7052 }
1c846c1f 7053 if (!hash)
5afd6d42 7054 PERL_HASH(hash, src, len);
1c846c1f 7055 new_SV(sv);
bdd68bc3 7056 sv_upgrade(sv, SVt_PV);
f880fe2f 7057 SvPV_set(sv, sharepvn(src, is_utf8?-len:len, hash));
b162af07 7058 SvCUR_set(sv, len);
b162af07 7059 SvLEN_set(sv, 0);
1c846c1f
NIS
7060 SvREADONLY_on(sv);
7061 SvFAKE_on(sv);
7062 SvPOK_on(sv);
c3654f1a
IH
7063 if (is_utf8)
7064 SvUTF8_on(sv);
a51caccf
NC
7065 if (src != orig_src)
7066 Safefree(src);
1c846c1f
NIS
7067 return sv;
7068}
7069
645c22ef 7070
#if defined(PERL_IMPLICIT_CONTEXT)

/* pTHX_ magic can't cope with varargs, so this is a no-context
 * version of the main function, (which may itself be aliased to us).
 * Don't access this version directly.
 */

SV *
Perl_newSVpvf_nocontext(const char* pat, ...)
{
    dTHX;
    register SV *formatted;
    va_list ap;

    /* Forward the variadic arguments to the va_list backend. */
    va_start(ap, pat);
    formatted = vnewSVpvf(pat, &ap);
    va_end(ap);

    return formatted;
}
#endif
46fc3d4c 7090
954c1994
GS
7091/*
7092=for apidoc newSVpvf
7093
645c22ef 7094Creates a new SV and initializes it with the string formatted like
954c1994
GS
7095C<sprintf>.
7096
7097=cut
7098*/
7099
cea2e8a9
GS
7100SV *
7101Perl_newSVpvf(pTHX_ const char* pat, ...)
7102{
7103 register SV *sv;
7104 va_list args;
cea2e8a9 7105 va_start(args, pat);
c5be433b 7106 sv = vnewSVpvf(pat, &args);
cea2e8a9
GS
7107 va_end(args);
7108 return sv;
7109}
46fc3d4c 7110
645c22ef
DM
7111/* backend for newSVpvf() and newSVpvf_nocontext() */
7112
79072805 7113SV *
c5be433b
GS
7114Perl_vnewSVpvf(pTHX_ const char* pat, va_list* args)
7115{
97aff369 7116 dVAR;
c5be433b
GS
7117 register SV *sv;
7118 new_SV(sv);
4608196e 7119 sv_vsetpvfn(sv, pat, strlen(pat), args, NULL, 0, NULL);
c5be433b
GS
7120 return sv;
7121}
7122
954c1994
GS
7123/*
7124=for apidoc newSVnv
7125
7126Creates a new SV and copies a floating point value into it.
7127The reference count for the SV is set to 1.
7128
7129=cut
7130*/
7131
c5be433b 7132SV *
65202027 7133Perl_newSVnv(pTHX_ NV n)
79072805 7134{
97aff369 7135 dVAR;
463ee0b2 7136 register SV *sv;
79072805 7137
4561caa4 7138 new_SV(sv);
79072805
LW
7139 sv_setnv(sv,n);
7140 return sv;
7141}
7142
954c1994
GS
7143/*
7144=for apidoc newSViv
7145
7146Creates a new SV and copies an integer into it. The reference count for the
7147SV is set to 1.
7148
7149=cut
7150*/
7151
79072805 7152SV *
864dbfa3 7153Perl_newSViv(pTHX_ IV i)
79072805 7154{
97aff369 7155 dVAR;
463ee0b2 7156 register SV *sv;
79072805 7157
4561caa4 7158 new_SV(sv);
79072805
LW
7159 sv_setiv(sv,i);
7160 return sv;
7161}
7162
954c1994 7163/*
1a3327fb
JH
7164=for apidoc newSVuv
7165
7166Creates a new SV and copies an unsigned integer into it.
7167The reference count for the SV is set to 1.
7168
7169=cut
7170*/
7171
7172SV *
7173Perl_newSVuv(pTHX_ UV u)
7174{
97aff369 7175 dVAR;
1a3327fb
JH
7176 register SV *sv;
7177
7178 new_SV(sv);
7179 sv_setuv(sv,u);
7180 return sv;
7181}
7182
7183/*
954c1994
GS
7184=for apidoc newRV_noinc
7185
7186Creates an RV wrapper for an SV. The reference count for the original
7187SV is B<not> incremented.
7188
7189=cut
7190*/
7191
2304df62 7192SV *
864dbfa3 7193Perl_newRV_noinc(pTHX_ SV *tmpRef)
2304df62 7194{
97aff369 7195 dVAR;
2304df62
AD
7196 register SV *sv;
7197
4561caa4 7198 new_SV(sv);
2304df62 7199 sv_upgrade(sv, SVt_RV);
76e3520e 7200 SvTEMP_off(tmpRef);
b162af07 7201 SvRV_set(sv, tmpRef);
2304df62 7202 SvROK_on(sv);
2304df62
AD
7203 return sv;
7204}
7205
ff276b08 7206/* newRV_inc is the official function name to use now.
645c22ef
DM
7207 * newRV_inc is in fact #defined to newRV in sv.h
7208 */
7209
5f05dabc 7210SV *
7f466ec7 7211Perl_newRV(pTHX_ SV *sv)
5f05dabc 7212{
97aff369 7213 dVAR;
7f466ec7 7214 return newRV_noinc(SvREFCNT_inc_simple_NN(sv));
5f05dabc 7215}
5f05dabc 7216
954c1994
GS
7217/*
7218=for apidoc newSVsv
7219
7220Creates a new SV which is an exact duplicate of the original SV.
645c22ef 7221(Uses C<sv_setsv>).
954c1994
GS
7222
7223=cut
7224*/
7225
79072805 7226SV *
864dbfa3 7227Perl_newSVsv(pTHX_ register SV *old)
79072805 7228{
97aff369 7229 dVAR;
463ee0b2 7230 register SV *sv;
79072805
LW
7231
7232 if (!old)
7a5b473e 7233 return NULL;
8990e307 7234 if (SvTYPE(old) == SVTYPEMASK) {
0453d815 7235 if (ckWARN_d(WARN_INTERNAL))
9014280d 7236 Perl_warner(aTHX_ packWARN(WARN_INTERNAL), "semi-panic: attempt to dup freed string");
a0714e2c 7237 return NULL;
79072805 7238 }
4561caa4 7239 new_SV(sv);
e90aabeb
NC
7240 /* SV_GMAGIC is the default for sv_setv()
7241 SV_NOSTEAL prevents TEMP buffers being, well, stolen, and saves games
7242 with SvTEMP_off and SvTEMP_on round a call to sv_setsv. */
7243 sv_setsv_flags(sv, old, SV_GMAGIC | SV_NOSTEAL);
463ee0b2 7244 return sv;
79072805
LW
7245}
7246
645c22ef
DM
7247/*
7248=for apidoc sv_reset
7249
7250Underlying implementation for the C<reset> Perl function.
7251Note that the perl-level function is vaguely deprecated.
7252
7253=cut
7254*/
7255
79072805 7256void
e1ec3a88 7257Perl_sv_reset(pTHX_ register const char *s, HV *stash)
79072805 7258{
27da23d5 7259 dVAR;
4802d5d7 7260 char todo[PERL_UCHAR_MAX+1];
79072805 7261
49d8d3a1
MB
7262 if (!stash)
7263 return;
7264
79072805 7265 if (!*s) { /* reset ?? searches */
aec46f14 7266 MAGIC * const mg = mg_find((SV *)stash, PERL_MAGIC_symtab);
8d2f4536
NC
7267 if (mg) {
7268 PMOP *pm = (PMOP *) mg->mg_obj;
7269 while (pm) {
7270 pm->op_pmdynflags &= ~PMdf_USED;
7271 pm = pm->op_pmnext;
7272 }
79072805
LW
7273 }
7274 return;
7275 }
7276
7277 /* reset variables */
7278
7279 if (!HvARRAY(stash))
7280 return;
463ee0b2
LW
7281
7282 Zero(todo, 256, char);
79072805 7283 while (*s) {
b464bac0
AL
7284 I32 max;
7285 I32 i = (unsigned char)*s;
79072805
LW
7286 if (s[1] == '-') {
7287 s += 2;
7288 }
4802d5d7 7289 max = (unsigned char)*s++;
79072805 7290 for ( ; i <= max; i++) {
463ee0b2
LW
7291 todo[i] = 1;
7292 }
a0d0e21e 7293 for (i = 0; i <= (I32) HvMAX(stash); i++) {
b464bac0 7294 HE *entry;
79072805 7295 for (entry = HvARRAY(stash)[i];
9e35f4b3
GS
7296 entry;
7297 entry = HeNEXT(entry))
7298 {
b464bac0
AL
7299 register GV *gv;
7300 register SV *sv;
7301
1edc1566 7302 if (!todo[(U8)*HeKEY(entry)])
463ee0b2 7303 continue;
1edc1566 7304 gv = (GV*)HeVAL(entry);
79072805 7305 sv = GvSV(gv);
e203899d
NC
7306 if (sv) {
7307 if (SvTHINKFIRST(sv)) {
7308 if (!SvREADONLY(sv) && SvROK(sv))
7309 sv_unref(sv);
7310 /* XXX Is this continue a bug? Why should THINKFIRST
7311 exempt us from resetting arrays and hashes? */
7312 continue;
7313 }
7314 SvOK_off(sv);
7315 if (SvTYPE(sv) >= SVt_PV) {
7316 SvCUR_set(sv, 0);
bd61b366 7317 if (SvPVX_const(sv) != NULL)
e203899d
NC
7318 *SvPVX(sv) = '\0';
7319 SvTAINT(sv);
7320 }
79072805
LW
7321 }
7322 if (GvAV(gv)) {
7323 av_clear(GvAV(gv));
7324 }
bfcb3514 7325 if (GvHV(gv) && !HvNAME_get(GvHV(gv))) {
b0269e46
AB
7326#if defined(VMS)
7327 Perl_die(aTHX_ "Can't reset %%ENV on this system");
7328#else /* ! VMS */
463ee0b2 7329 hv_clear(GvHV(gv));
b0269e46
AB
7330# if defined(USE_ENVIRON_ARRAY)
7331 if (gv == PL_envgv)
7332 my_clearenv();
7333# endif /* USE_ENVIRON_ARRAY */
7334#endif /* VMS */
79072805
LW
7335 }
7336 }
7337 }
7338 }
7339}
7340
645c22ef
DM
7341/*
7342=for apidoc sv_2io
7343
7344Using various gambits, try to get an IO from an SV: the IO slot if its a
7345GV; or the recursive result if we're an RV; or the IO slot of the symbol
7346named after the PV if we're a string.
7347
7348=cut
7349*/
7350
46fc3d4c 7351IO*
864dbfa3 7352Perl_sv_2io(pTHX_ SV *sv)
46fc3d4c 7353{
7354 IO* io;
7355 GV* gv;
7356
7357 switch (SvTYPE(sv)) {
7358 case SVt_PVIO:
7359 io = (IO*)sv;
7360 break;
7361 case SVt_PVGV:
7362 gv = (GV*)sv;
7363 io = GvIO(gv);
7364 if (!io)
cea2e8a9 7365 Perl_croak(aTHX_ "Bad filehandle: %s", GvNAME(gv));
46fc3d4c 7366 break;
7367 default:
7368 if (!SvOK(sv))
cea2e8a9 7369 Perl_croak(aTHX_ PL_no_usym, "filehandle");
46fc3d4c 7370 if (SvROK(sv))
7371 return sv_2io(SvRV(sv));
f776e3cd 7372 gv = gv_fetchsv(sv, 0, SVt_PVIO);
46fc3d4c 7373 if (gv)
7374 io = GvIO(gv);
7375 else
7376 io = 0;
7377 if (!io)
95b63a38 7378 Perl_croak(aTHX_ "Bad filehandle: %"SVf, (void*)sv);
46fc3d4c 7379 break;
7380 }
7381 return io;
7382}
7383
645c22ef
DM
7384/*
7385=for apidoc sv_2cv
7386
7387Using various gambits, try to get a CV from an SV; in addition, try if
7388possible to set C<*st> and C<*gvp> to the stash and GV associated with it.
f2c0649b 7389The flags in C<lref> are passed to sv_fetchsv.
645c22ef
DM
7390
7391=cut
7392*/
7393
79072805 7394CV *
864dbfa3 7395Perl_sv_2cv(pTHX_ SV *sv, HV **st, GV **gvp, I32 lref)
79072805 7396{
27da23d5 7397 dVAR;
a0714e2c 7398 GV *gv = NULL;
601f1833 7399 CV *cv = NULL;
79072805 7400
85dec29a
NC
7401 if (!sv) {
7402 *st = NULL;
7403 *gvp = NULL;
7404 return NULL;
7405 }
79072805 7406 switch (SvTYPE(sv)) {
79072805
LW
7407 case SVt_PVCV:
7408 *st = CvSTASH(sv);
a0714e2c 7409 *gvp = NULL;
79072805
LW
7410 return (CV*)sv;
7411 case SVt_PVHV:
7412 case SVt_PVAV:
ef58ba18 7413 *st = NULL;
a0714e2c 7414 *gvp = NULL;
601f1833 7415 return NULL;
8990e307
LW
7416 case SVt_PVGV:
7417 gv = (GV*)sv;
a0d0e21e 7418 *gvp = gv;
8990e307
LW
7419 *st = GvESTASH(gv);
7420 goto fix_gv;
7421
79072805 7422 default:
5b295bef 7423 SvGETMAGIC(sv);
a0d0e21e 7424 if (SvROK(sv)) {
823a54a3 7425 SV * const *sp = &sv; /* Used in tryAMAGICunDEREF macro. */
f5284f61
IZ
7426 tryAMAGICunDEREF(to_cv);
7427
62f274bf
GS
7428 sv = SvRV(sv);
7429 if (SvTYPE(sv) == SVt_PVCV) {
7430 cv = (CV*)sv;
a0714e2c 7431 *gvp = NULL;
62f274bf
GS
7432 *st = CvSTASH(cv);
7433 return cv;
7434 }
7435 else if(isGV(sv))
7436 gv = (GV*)sv;
7437 else
cea2e8a9 7438 Perl_croak(aTHX_ "Not a subroutine reference");
a0d0e21e 7439 }
62f274bf 7440 else if (isGV(sv))
79072805
LW
7441 gv = (GV*)sv;
7442 else
7a5fd60d 7443 gv = gv_fetchsv(sv, lref, SVt_PVCV);
79072805 7444 *gvp = gv;
ef58ba18
NC
7445 if (!gv) {
7446 *st = NULL;
601f1833 7447 return NULL;
ef58ba18 7448 }
e26df76a
NC
7449 /* Some flags to gv_fetchsv mean don't really create the GV */
7450 if (SvTYPE(gv) != SVt_PVGV) {
7451 *st = NULL;
7452 return NULL;
7453 }
79072805 7454 *st = GvESTASH(gv);
8990e307 7455 fix_gv:
8ebc5c01 7456 if (lref && !GvCVu(gv)) {
4633a7c4 7457 SV *tmpsv;
748a9306 7458 ENTER;
561b68a9 7459 tmpsv = newSV(0);
bd61b366 7460 gv_efullname3(tmpsv, gv, NULL);
f6ec51f7
GS
7461 /* XXX this is probably not what they think they're getting.
7462 * It has the same effect as "sub name;", i.e. just a forward
7463 * declaration! */
774d564b 7464 newSUB(start_subparse(FALSE, 0),
4633a7c4 7465 newSVOP(OP_CONST, 0, tmpsv),
5f66b61c 7466 NULL, NULL);
748a9306 7467 LEAVE;
8ebc5c01 7468 if (!GvCVu(gv))
35c1215d 7469 Perl_croak(aTHX_ "Unable to create sub named \"%"SVf"\"",
95b63a38 7470 (void*)sv);
8990e307 7471 }
8ebc5c01 7472 return GvCVu(gv);
79072805
LW
7473 }
7474}
7475
c461cf8f
JH
7476/*
7477=for apidoc sv_true
7478
7479Returns true if the SV has a true value by Perl's rules.
645c22ef
DM
7480Use the C<SvTRUE> macro instead, which may call C<sv_true()> or may
7481instead use an in-line version.
c461cf8f
JH
7482
7483=cut
7484*/
7485
79072805 7486I32
864dbfa3 7487Perl_sv_true(pTHX_ register SV *sv)
79072805 7488{
8990e307
LW
7489 if (!sv)
7490 return 0;
79072805 7491 if (SvPOK(sv)) {
823a54a3
AL
7492 register const XPV* const tXpv = (XPV*)SvANY(sv);
7493 if (tXpv &&
c2f1de04 7494 (tXpv->xpv_cur > 1 ||
339049b0 7495 (tXpv->xpv_cur && *sv->sv_u.svu_pv != '0')))
79072805
LW
7496 return 1;
7497 else
7498 return 0;
7499 }
7500 else {
7501 if (SvIOK(sv))
463ee0b2 7502 return SvIVX(sv) != 0;
79072805
LW
7503 else {
7504 if (SvNOK(sv))
463ee0b2 7505 return SvNVX(sv) != 0.0;
79072805 7506 else
463ee0b2 7507 return sv_2bool(sv);
79072805
LW
7508 }
7509 }
7510}
79072805 7511
645c22ef 7512/*
c461cf8f
JH
7513=for apidoc sv_pvn_force
7514
7515Get a sensible string out of the SV somehow.
645c22ef
DM
7516A private implementation of the C<SvPV_force> macro for compilers which
7517can't cope with complex macro expressions. Always use the macro instead.
c461cf8f 7518
8d6d96c1
HS
7519=for apidoc sv_pvn_force_flags
7520
7521Get a sensible string out of the SV somehow.
7522If C<flags> has C<SV_GMAGIC> bit set, will C<mg_get> on C<sv> if
7523appropriate, else not. C<sv_pvn_force> and C<sv_pvn_force_nomg> are
7524implemented in terms of this function.
645c22ef
DM
7525You normally want to use the various wrapper macros instead: see
7526C<SvPV_force> and C<SvPV_force_nomg>
8d6d96c1
HS
7527
7528=cut
7529*/
7530
7531char *
7532Perl_sv_pvn_force_flags(pTHX_ SV *sv, STRLEN *lp, I32 flags)
7533{
97aff369 7534 dVAR;
6fc92669 7535 if (SvTHINKFIRST(sv) && !SvROK(sv))
765f542d 7536 sv_force_normal_flags(sv, 0);
1c846c1f 7537
a0d0e21e 7538 if (SvPOK(sv)) {
13c5b33c
NC
7539 if (lp)
7540 *lp = SvCUR(sv);
a0d0e21e
LW
7541 }
7542 else {
a3b680e6 7543 char *s;
13c5b33c
NC
7544 STRLEN len;
7545
4d84ee25 7546 if (SvREADONLY(sv) && !(flags & SV_MUTABLE_RETURN)) {
b64e5050 7547 const char * const ref = sv_reftype(sv,0);
4d84ee25
NC
7548 if (PL_op)
7549 Perl_croak(aTHX_ "Can't coerce readonly %s to string in %s",
b64e5050 7550 ref, OP_NAME(PL_op));
4d84ee25 7551 else
b64e5050 7552 Perl_croak(aTHX_ "Can't coerce readonly %s to string", ref);
4d84ee25 7553 }
b64e5050 7554 if (SvTYPE(sv) > SVt_PVLV && SvTYPE(sv) != SVt_PVFM)
cea2e8a9 7555 Perl_croak(aTHX_ "Can't coerce %s to string in %s", sv_reftype(sv,0),
53e06cf0 7556 OP_NAME(PL_op));
b64e5050 7557 s = sv_2pv_flags(sv, &len, flags);
13c5b33c
NC
7558 if (lp)
7559 *lp = len;
7560
3f7c398e 7561 if (s != SvPVX_const(sv)) { /* Almost, but not quite, sv_setpvn() */
a0d0e21e
LW
7562 if (SvROK(sv))
7563 sv_unref(sv);
862a34c6 7564 SvUPGRADE(sv, SVt_PV); /* Never FALSE */
a0d0e21e 7565 SvGROW(sv, len + 1);
706aa1c9 7566 Move(s,SvPVX(sv),len,char);
a0d0e21e
LW
7567 SvCUR_set(sv, len);
7568 *SvEND(sv) = '\0';
7569 }
7570 if (!SvPOK(sv)) {
7571 SvPOK_on(sv); /* validate pointer */
7572 SvTAINT(sv);
1d7c1841 7573 DEBUG_c(PerlIO_printf(Perl_debug_log, "0x%"UVxf" 2pv(%s)\n",
3f7c398e 7574 PTR2UV(sv),SvPVX_const(sv)));
a0d0e21e
LW
7575 }
7576 }
4d84ee25 7577 return SvPVX_mutable(sv);
a0d0e21e
LW
7578}
7579
645c22ef 7580/*
645c22ef
DM
7581=for apidoc sv_pvbyten_force
7582
0feed65a 7583The backend for the C<SvPVbytex_force> macro. Always use the macro instead.
645c22ef
DM
7584
7585=cut
7586*/
7587
7340a771
GS
7588char *
7589Perl_sv_pvbyten_force(pTHX_ SV *sv, STRLEN *lp)
7590{
46ec2f14 7591 sv_pvn_force(sv,lp);
ffebcc3e 7592 sv_utf8_downgrade(sv,0);
46ec2f14
TS
7593 *lp = SvCUR(sv);
7594 return SvPVX(sv);
7340a771
GS
7595}
7596
645c22ef 7597/*
c461cf8f
JH
7598=for apidoc sv_pvutf8n_force
7599
0feed65a 7600The backend for the C<SvPVutf8x_force> macro. Always use the macro instead.
c461cf8f
JH
7601
7602=cut
7603*/
7604
7340a771
GS
7605char *
7606Perl_sv_pvutf8n_force(pTHX_ SV *sv, STRLEN *lp)
7607{
46ec2f14 7608 sv_pvn_force(sv,lp);
560a288e 7609 sv_utf8_upgrade(sv);
46ec2f14
TS
7610 *lp = SvCUR(sv);
7611 return SvPVX(sv);
7340a771
GS
7612}
7613
c461cf8f
JH
7614/*
7615=for apidoc sv_reftype
7616
7617Returns a string describing what the SV is a reference to.
7618
7619=cut
7620*/
7621
1cb0ed9b 7622char *
bfed75c6 7623Perl_sv_reftype(pTHX_ const SV *sv, int ob)
a0d0e21e 7624{
07409e01
NC
7625 /* The fact that I don't need to downcast to char * everywhere, only in ?:
7626 inside return suggests a const propagation bug in g++. */
c86bf373 7627 if (ob && SvOBJECT(sv)) {
1b6737cc 7628 char * const name = HvNAME_get(SvSTASH(sv));
07409e01 7629 return name ? name : (char *) "__ANON__";
c86bf373 7630 }
a0d0e21e
LW
7631 else {
7632 switch (SvTYPE(sv)) {
7633 case SVt_NULL:
7634 case SVt_IV:
7635 case SVt_NV:
7636 case SVt_RV:
7637 case SVt_PV:
7638 case SVt_PVIV:
7639 case SVt_PVNV:
7640 case SVt_PVMG:
7641 case SVt_PVBM:
1cb0ed9b 7642 if (SvVOK(sv))
439cb1c4 7643 return "VSTRING";
a0d0e21e
LW
7644 if (SvROK(sv))
7645 return "REF";
7646 else
7647 return "SCALAR";
1cb0ed9b 7648
07409e01 7649 case SVt_PVLV: return (char *) (SvROK(sv) ? "REF"
be65207d
DM
7650 /* tied lvalues should appear to be
7651 * scalars for backwards compatitbility */
7652 : (LvTYPE(sv) == 't' || LvTYPE(sv) == 'T')
07409e01 7653 ? "SCALAR" : "LVALUE");
a0d0e21e
LW
7654 case SVt_PVAV: return "ARRAY";
7655 case SVt_PVHV: return "HASH";
7656 case SVt_PVCV: return "CODE";
7657 case SVt_PVGV: return "GLOB";
1d2dff63 7658 case SVt_PVFM: return "FORMAT";
27f9d8f3 7659 case SVt_PVIO: return "IO";
a0d0e21e
LW
7660 default: return "UNKNOWN";
7661 }
7662 }
7663}
7664
954c1994
GS
7665/*
7666=for apidoc sv_isobject
7667
7668Returns a boolean indicating whether the SV is an RV pointing to a blessed
7669object. If the SV is not an RV, or if the object is not blessed, then this
7670will return false.
7671
7672=cut
7673*/
7674
463ee0b2 7675int
864dbfa3 7676Perl_sv_isobject(pTHX_ SV *sv)
85e6fe83 7677{
68dc0745 7678 if (!sv)
7679 return 0;
5b295bef 7680 SvGETMAGIC(sv);
85e6fe83
LW
7681 if (!SvROK(sv))
7682 return 0;
7683 sv = (SV*)SvRV(sv);
7684 if (!SvOBJECT(sv))
7685 return 0;
7686 return 1;
7687}
7688
954c1994
GS
7689/*
7690=for apidoc sv_isa
7691
7692Returns a boolean indicating whether the SV is blessed into the specified
7693class. This does not check for subtypes; use C<sv_derived_from> to verify
7694an inheritance relationship.
7695
7696=cut
7697*/
7698
85e6fe83 7699int
864dbfa3 7700Perl_sv_isa(pTHX_ SV *sv, const char *name)
463ee0b2 7701{
bfcb3514 7702 const char *hvname;
68dc0745 7703 if (!sv)
7704 return 0;
5b295bef 7705 SvGETMAGIC(sv);
ed6116ce 7706 if (!SvROK(sv))
463ee0b2 7707 return 0;
ed6116ce
LW
7708 sv = (SV*)SvRV(sv);
7709 if (!SvOBJECT(sv))
463ee0b2 7710 return 0;
bfcb3514
NC
7711 hvname = HvNAME_get(SvSTASH(sv));
7712 if (!hvname)
e27ad1f2 7713 return 0;
463ee0b2 7714
bfcb3514 7715 return strEQ(hvname, name);
463ee0b2
LW
7716}
7717
954c1994
GS
7718/*
7719=for apidoc newSVrv
7720
7721Creates a new SV for the RV, C<rv>, to point to. If C<rv> is not an RV then
7722it will be upgraded to one. If C<classname> is non-null then the new SV will
7723be blessed in the specified package. The new SV is returned and its
7724reference count is 1.
7725
7726=cut
7727*/
7728
463ee0b2 7729SV*
864dbfa3 7730Perl_newSVrv(pTHX_ SV *rv, const char *classname)
463ee0b2 7731{
97aff369 7732 dVAR;
463ee0b2
LW
7733 SV *sv;
7734
4561caa4 7735 new_SV(sv);
51cf62d8 7736
765f542d 7737 SV_CHECK_THINKFIRST_COW_DROP(rv);
51cf62d8 7738 SvAMAGIC_off(rv);
51cf62d8 7739
0199fce9 7740 if (SvTYPE(rv) >= SVt_PVMG) {
a3b680e6 7741 const U32 refcnt = SvREFCNT(rv);
0199fce9
JD
7742 SvREFCNT(rv) = 0;
7743 sv_clear(rv);
7744 SvFLAGS(rv) = 0;
7745 SvREFCNT(rv) = refcnt;
0199fce9 7746
dc5494d2
NC
7747 sv_upgrade(rv, SVt_RV);
7748 } else if (SvROK(rv)) {
7749 SvREFCNT_dec(SvRV(rv));
7750 } else if (SvTYPE(rv) < SVt_RV)
0199fce9
JD
7751 sv_upgrade(rv, SVt_RV);
7752 else if (SvTYPE(rv) > SVt_RV) {
8bd4d4c5 7753 SvPV_free(rv);
0199fce9
JD
7754 SvCUR_set(rv, 0);
7755 SvLEN_set(rv, 0);
7756 }
51cf62d8 7757
0c34ef67 7758 SvOK_off(rv);
b162af07 7759 SvRV_set(rv, sv);
ed6116ce 7760 SvROK_on(rv);
463ee0b2 7761
a0d0e21e 7762 if (classname) {
1b6737cc 7763 HV* const stash = gv_stashpv(classname, TRUE);
a0d0e21e
LW
7764 (void)sv_bless(rv, stash);
7765 }
7766 return sv;
7767}
7768
954c1994
GS
7769/*
7770=for apidoc sv_setref_pv
7771
7772Copies a pointer into a new SV, optionally blessing the SV. The C<rv>
7773argument will be upgraded to an RV. That RV will be modified to point to
7774the new SV. If the C<pv> argument is NULL then C<PL_sv_undef> will be placed
7775into the SV. The C<classname> argument indicates the package for the
bd61b366 7776blessing. Set C<classname> to C<NULL> to avoid the blessing. The new SV
d34c2299 7777will have a reference count of 1, and the RV will be returned.
954c1994
GS
7778
7779Do not use with other Perl types such as HV, AV, SV, CV, because those
7780objects will become corrupted by the pointer copy process.
7781
7782Note that C<sv_setref_pvn> copies the string while this copies the pointer.
7783
7784=cut
7785*/
7786
a0d0e21e 7787SV*
864dbfa3 7788Perl_sv_setref_pv(pTHX_ SV *rv, const char *classname, void *pv)
a0d0e21e 7789{
97aff369 7790 dVAR;
189b2af5 7791 if (!pv) {
3280af22 7792 sv_setsv(rv, &PL_sv_undef);
189b2af5
GS
7793 SvSETMAGIC(rv);
7794 }
a0d0e21e 7795 else
56431972 7796 sv_setiv(newSVrv(rv,classname), PTR2IV(pv));
a0d0e21e
LW
7797 return rv;
7798}
7799
954c1994
GS
7800/*
7801=for apidoc sv_setref_iv
7802
7803Copies an integer into a new SV, optionally blessing the SV. The C<rv>
7804argument will be upgraded to an RV. That RV will be modified to point to
7805the new SV. The C<classname> argument indicates the package for the
bd61b366 7806blessing. Set C<classname> to C<NULL> to avoid the blessing. The new SV
d34c2299 7807will have a reference count of 1, and the RV will be returned.
954c1994
GS
7808
7809=cut
7810*/
7811
a0d0e21e 7812SV*
864dbfa3 7813Perl_sv_setref_iv(pTHX_ SV *rv, const char *classname, IV iv)
a0d0e21e
LW
7814{
7815 sv_setiv(newSVrv(rv,classname), iv);
7816 return rv;
7817}
7818
954c1994 7819/*
e1c57cef
JH
7820=for apidoc sv_setref_uv
7821
7822Copies an unsigned integer into a new SV, optionally blessing the SV. The C<rv>
7823argument will be upgraded to an RV. That RV will be modified to point to
7824the new SV. The C<classname> argument indicates the package for the
bd61b366 7825blessing. Set C<classname> to C<NULL> to avoid the blessing. The new SV
d34c2299 7826will have a reference count of 1, and the RV will be returned.
e1c57cef
JH
7827
7828=cut
7829*/
7830
7831SV*
7832Perl_sv_setref_uv(pTHX_ SV *rv, const char *classname, UV uv)
7833{
7834 sv_setuv(newSVrv(rv,classname), uv);
7835 return rv;
7836}
7837
7838/*
954c1994
GS
7839=for apidoc sv_setref_nv
7840
7841Copies a double into a new SV, optionally blessing the SV. The C<rv>
7842argument will be upgraded to an RV. That RV will be modified to point to
7843the new SV. The C<classname> argument indicates the package for the
bd61b366 7844blessing. Set C<classname> to C<NULL> to avoid the blessing. The new SV
d34c2299 7845will have a reference count of 1, and the RV will be returned.
954c1994
GS
7846
7847=cut
7848*/
7849
a0d0e21e 7850SV*
65202027 7851Perl_sv_setref_nv(pTHX_ SV *rv, const char *classname, NV nv)
a0d0e21e
LW
7852{
7853 sv_setnv(newSVrv(rv,classname), nv);
7854 return rv;
7855}
463ee0b2 7856
954c1994
GS
7857/*
7858=for apidoc sv_setref_pvn
7859
7860Copies a string into a new SV, optionally blessing the SV. The length of the
7861string must be specified with C<n>. The C<rv> argument will be upgraded to
7862an RV. That RV will be modified to point to the new SV. The C<classname>
7863argument indicates the package for the blessing. Set C<classname> to
bd61b366 7864C<NULL> to avoid the blessing. The new SV will have a reference count
d34c2299 7865of 1, and the RV will be returned.
954c1994
GS
7866
7867Note that C<sv_setref_pv> copies the pointer while this copies the string.
7868
7869=cut
7870*/
7871
a0d0e21e 7872SV*
1b6737cc 7873Perl_sv_setref_pvn(pTHX_ SV *rv, const char *classname, const char *pv, STRLEN n)
a0d0e21e
LW
7874{
7875 sv_setpvn(newSVrv(rv,classname), pv, n);
463ee0b2
LW
7876 return rv;
7877}
7878
954c1994
GS
7879/*
7880=for apidoc sv_bless
7881
7882Blesses an SV into a specified package. The SV must be an RV. The package
7883must be designated by its stash (see C<gv_stashpv()>). The reference count
7884of the SV is unaffected.
7885
7886=cut
7887*/
7888
a0d0e21e 7889SV*
864dbfa3 7890Perl_sv_bless(pTHX_ SV *sv, HV *stash)
a0d0e21e 7891{
97aff369 7892 dVAR;
76e3520e 7893 SV *tmpRef;
a0d0e21e 7894 if (!SvROK(sv))
cea2e8a9 7895 Perl_croak(aTHX_ "Can't bless non-reference value");
76e3520e
GS
7896 tmpRef = SvRV(sv);
7897 if (SvFLAGS(tmpRef) & (SVs_OBJECT|SVf_READONLY)) {
7898 if (SvREADONLY(tmpRef))
cea2e8a9 7899 Perl_croak(aTHX_ PL_no_modify);
76e3520e
GS
7900 if (SvOBJECT(tmpRef)) {
7901 if (SvTYPE(tmpRef) != SVt_PVIO)
3280af22 7902 --PL_sv_objcount;
76e3520e 7903 SvREFCNT_dec(SvSTASH(tmpRef));
2e3febc6 7904 }
a0d0e21e 7905 }
76e3520e
GS
7906 SvOBJECT_on(tmpRef);
7907 if (SvTYPE(tmpRef) != SVt_PVIO)
3280af22 7908 ++PL_sv_objcount;
862a34c6 7909 SvUPGRADE(tmpRef, SVt_PVMG);
b37c2d43 7910 SvSTASH_set(tmpRef, (HV*)SvREFCNT_inc_simple(stash));
a0d0e21e 7911
2e3febc6
CS
7912 if (Gv_AMG(stash))
7913 SvAMAGIC_on(sv);
7914 else
7915 SvAMAGIC_off(sv);
a0d0e21e 7916
1edbfb88
AB
7917 if(SvSMAGICAL(tmpRef))
7918 if(mg_find(tmpRef, PERL_MAGIC_ext) || mg_find(tmpRef, PERL_MAGIC_uvar))
7919 mg_set(tmpRef);
7920
7921
ecdeb87c 7922
a0d0e21e
LW
7923 return sv;
7924}
7925
645c22ef 7926/* Downgrades a PVGV to a PVMG.
645c22ef
DM
7927 */
7928
76e3520e 7929STATIC void
cea2e8a9 7930S_sv_unglob(pTHX_ SV *sv)
a0d0e21e 7931{
97aff369 7932 dVAR;
850fabdf 7933 void *xpvmg;
b37c2d43 7934 SV * const temp = sv_newmortal();
850fabdf 7935
a0d0e21e
LW
7936 assert(SvTYPE(sv) == SVt_PVGV);
7937 SvFAKE_off(sv);
180488f8
NC
7938 gv_efullname3(temp, (GV *) sv, "*");
7939
f7877b28 7940 if (GvGP(sv)) {
1edc1566 7941 gp_free((GV*)sv);
f7877b28 7942 }
e826b3c7 7943 if (GvSTASH(sv)) {
e15faf7d 7944 sv_del_backref((SV*)GvSTASH(sv), sv);
5c284bb0 7945 GvSTASH(sv) = NULL;
e826b3c7 7946 }
a5f75d66 7947 GvMULTI_off(sv);
acda4c6a
NC
7948 if (GvNAME_HEK(sv)) {
7949 unshare_hek(GvNAME_HEK(sv));
7950 }
dedf8e73 7951 SvSCREAM_off(sv);
850fabdf
GS
7952
7953 /* need to keep SvANY(sv) in the right arena */
7954 xpvmg = new_XPVMG();
7955 StructCopy(SvANY(sv), xpvmg, XPVMG);
7956 del_XPVGV(SvANY(sv));
7957 SvANY(sv) = xpvmg;
7958
a0d0e21e
LW
7959 SvFLAGS(sv) &= ~SVTYPEMASK;
7960 SvFLAGS(sv) |= SVt_PVMG;
180488f8
NC
7961
7962 /* Intentionally not calling any local SET magic, as this isn't so much a
7963 set operation as merely an internal storage change. */
7964 sv_setsv_flags(sv, temp, 0);
a0d0e21e
LW
7965}
7966
954c1994 7967/*
840a7b70 7968=for apidoc sv_unref_flags
954c1994
GS
7969
7970Unsets the RV status of the SV, and decrements the reference count of
7971whatever was being referenced by the RV. This can almost be thought of
840a7b70
IZ
7972as a reversal of C<newSVrv>.  The C<flags> argument can contain
7973C<SV_IMMEDIATE_UNREF> to force the reference count to be decremented
7974immediately (otherwise, when the reference count is exactly one, the
7975referent is made mortal so that it is freed later instead).
7889fe52 7976See C<SvROK_off>.
954c1994
GS
7977
7978=cut
7979*/
7980
ed6116ce 7981void
e15faf7d 7982Perl_sv_unref_flags(pTHX_ SV *ref, U32 flags)
ed6116ce 7983{
b64e5050 7984 SV* const target = SvRV(ref);
810b8aa5 7985
e15faf7d
NC
7986 if (SvWEAKREF(ref)) {
7987 sv_del_backref(target, ref);
7988 SvWEAKREF_off(ref);
7989 SvRV_set(ref, NULL);
810b8aa5
GS
7990 return;
7991 }
e15faf7d
NC
7992 SvRV_set(ref, NULL);
7993 SvROK_off(ref);
7994 /* You can't have a || SvREADONLY(target) here, as $a = $$a, where $a was
04ca4930 7995 assigned to as BEGIN {$a = \"Foo"} will fail. */
e15faf7d
NC
7996 if (SvREFCNT(target) != 1 || (flags & SV_IMMEDIATE_UNREF))
7997 SvREFCNT_dec(target);
840a7b70 7998 else /* XXX Hack, but hard to make $a=$a->[1] work otherwise */
e15faf7d 7999 sv_2mortal(target); /* Schedule for freeing later */
ed6116ce 8000}
8990e307 8001
840a7b70 8002/*
645c22ef
DM
8003=for apidoc sv_untaint
8004
8005Untaint an SV. Use C<SvTAINTED_off> instead.
8006=cut
8007*/
8008
bbce6d69 8009void
864dbfa3 8010Perl_sv_untaint(pTHX_ SV *sv)
bbce6d69 8011{
13f57bf8 8012 if (SvTYPE(sv) >= SVt_PVMG && SvMAGIC(sv)) {
b64e5050 8013 MAGIC * const mg = mg_find(sv, PERL_MAGIC_taint);
36477c24 8014 if (mg)
565764a8 8015 mg->mg_len &= ~1;
36477c24 8016 }
bbce6d69 8017}
8018
645c22ef
DM
8019/*
8020=for apidoc sv_tainted
8021
8022Test an SV for taintedness. Use C<SvTAINTED> instead.
8023=cut
8024*/
8025
bbce6d69 8026bool
864dbfa3 8027Perl_sv_tainted(pTHX_ SV *sv)
bbce6d69 8028{
13f57bf8 8029 if (SvTYPE(sv) >= SVt_PVMG && SvMAGIC(sv)) {
823a54a3 8030 const MAGIC * const mg = mg_find(sv, PERL_MAGIC_taint);
2ddb8a4f 8031 if (mg && (mg->mg_len & 1) )
36477c24 8032 return TRUE;
8033 }
8034 return FALSE;
bbce6d69 8035}
8036
09540bc3
JH
8037/*
8038=for apidoc sv_setpviv
8039
8040Copies an integer into the given SV, also updating its string value.
8041Does not handle 'set' magic. See C<sv_setpviv_mg>.
8042
8043=cut
8044*/
8045
8046void
8047Perl_sv_setpviv(pTHX_ SV *sv, IV iv)
8048{
8049 char buf[TYPE_CHARS(UV)];
8050 char *ebuf;
b64e5050 8051 char * const ptr = uiv_2buf(buf, iv, 0, 0, &ebuf);
09540bc3
JH
8052
8053 sv_setpvn(sv, ptr, ebuf - ptr);
8054}
8055
8056/*
8057=for apidoc sv_setpviv_mg
8058
8059Like C<sv_setpviv>, but also handles 'set' magic.
8060
8061=cut
8062*/
8063
8064void
8065Perl_sv_setpviv_mg(pTHX_ SV *sv, IV iv)
8066{
df7eb254 8067 sv_setpviv(sv, iv);
09540bc3
JH
8068 SvSETMAGIC(sv);
8069}
8070
cea2e8a9 8071#if defined(PERL_IMPLICIT_CONTEXT)
645c22ef
DM
8072
8073/* pTHX_ magic can't cope with varargs, so this is a no-context
8074 * version of the main function, (which may itself be aliased to us).
8075 * Don't access this version directly.
8076 */
8077
cea2e8a9
GS
8078void
8079Perl_sv_setpvf_nocontext(SV *sv, const char* pat, ...)
8080{
8081 dTHX;
8082 va_list args;
8083 va_start(args, pat);
c5be433b 8084 sv_vsetpvf(sv, pat, &args);
cea2e8a9
GS
8085 va_end(args);
8086}
8087
645c22ef
DM
8088/* pTHX_ magic can't cope with varargs, so this is a no-context
8089 * version of the main function, (which may itself be aliased to us).
8090 * Don't access this version directly.
8091 */
cea2e8a9
GS
8092
8093void
8094Perl_sv_setpvf_mg_nocontext(SV *sv, const char* pat, ...)
8095{
8096 dTHX;
8097 va_list args;
8098 va_start(args, pat);
c5be433b 8099 sv_vsetpvf_mg(sv, pat, &args);
cea2e8a9 8100 va_end(args);
cea2e8a9
GS
8101}
8102#endif
8103
954c1994
GS
8104/*
8105=for apidoc sv_setpvf
8106
bffc3d17
SH
8107Works like C<sv_catpvf> but copies the text into the SV instead of
8108appending it. Does not handle 'set' magic. See C<sv_setpvf_mg>.
954c1994
GS
8109
8110=cut
8111*/
8112
46fc3d4c 8113void
864dbfa3 8114Perl_sv_setpvf(pTHX_ SV *sv, const char* pat, ...)
46fc3d4c 8115{
8116 va_list args;
46fc3d4c 8117 va_start(args, pat);
c5be433b 8118 sv_vsetpvf(sv, pat, &args);
46fc3d4c 8119 va_end(args);
8120}
8121
bffc3d17
SH
8122/*
8123=for apidoc sv_vsetpvf
8124
8125Works like C<sv_vcatpvf> but copies the text into the SV instead of
8126appending it. Does not handle 'set' magic. See C<sv_vsetpvf_mg>.
8127
8128Usually used via its frontend C<sv_setpvf>.
8129
8130=cut
8131*/
645c22ef 8132
c5be433b
GS
8133void
8134Perl_sv_vsetpvf(pTHX_ SV *sv, const char* pat, va_list* args)
8135{
4608196e 8136 sv_vsetpvfn(sv, pat, strlen(pat), args, NULL, 0, NULL);
c5be433b 8137}
ef50df4b 8138
954c1994
GS
8139/*
8140=for apidoc sv_setpvf_mg
8141
8142Like C<sv_setpvf>, but also handles 'set' magic.
8143
8144=cut
8145*/
8146
ef50df4b 8147void
864dbfa3 8148Perl_sv_setpvf_mg(pTHX_ SV *sv, const char* pat, ...)
ef50df4b
GS
8149{
8150 va_list args;
ef50df4b 8151 va_start(args, pat);
c5be433b 8152 sv_vsetpvf_mg(sv, pat, &args);
ef50df4b 8153 va_end(args);
c5be433b
GS
8154}
8155
bffc3d17
SH
8156/*
8157=for apidoc sv_vsetpvf_mg
8158
8159Like C<sv_vsetpvf>, but also handles 'set' magic.
8160
8161Usually used via its frontend C<sv_setpvf_mg>.
8162
8163=cut
8164*/
645c22ef 8165
c5be433b
GS
8166void
8167Perl_sv_vsetpvf_mg(pTHX_ SV *sv, const char* pat, va_list* args)
8168{
4608196e 8169 sv_vsetpvfn(sv, pat, strlen(pat), args, NULL, 0, NULL);
ef50df4b
GS
8170 SvSETMAGIC(sv);
8171}
8172
cea2e8a9 8173#if defined(PERL_IMPLICIT_CONTEXT)
645c22ef
DM
8174
8175/* pTHX_ magic can't cope with varargs, so this is a no-context
8176 * version of the main function, (which may itself be aliased to us).
8177 * Don't access this version directly.
8178 */
8179
cea2e8a9
GS
8180void
8181Perl_sv_catpvf_nocontext(SV *sv, const char* pat, ...)
8182{
8183 dTHX;
8184 va_list args;
8185 va_start(args, pat);
c5be433b 8186 sv_vcatpvf(sv, pat, &args);
cea2e8a9
GS
8187 va_end(args);
8188}
8189
645c22ef
DM
8190/* pTHX_ magic can't cope with varargs, so this is a no-context
8191 * version of the main function, (which may itself be aliased to us).
8192 * Don't access this version directly.
8193 */
8194
cea2e8a9
GS
8195void
8196Perl_sv_catpvf_mg_nocontext(SV *sv, const char* pat, ...)
8197{
8198 dTHX;
8199 va_list args;
8200 va_start(args, pat);
c5be433b 8201 sv_vcatpvf_mg(sv, pat, &args);
cea2e8a9 8202 va_end(args);
cea2e8a9
GS
8203}
8204#endif
8205
954c1994
GS
8206/*
8207=for apidoc sv_catpvf
8208
d5ce4a7c
GA
8209Processes its arguments like C<sprintf> and appends the formatted
8210output to an SV. If the appended data contains "wide" characters
8211(including, but not limited to, SVs with a UTF-8 PV formatted with %s,
8212and characters >255 formatted with %c), the original SV might get
bffc3d17 8213upgraded to UTF-8. Handles 'get' magic, but not 'set' magic. See
cdd94ca7
NC
8214C<sv_catpvf_mg>. If the original SV was UTF-8, the pattern should be
8215valid UTF-8; if the original SV was bytes, the pattern should be too.
954c1994 8216
d5ce4a7c 8217=cut */
954c1994 8218
46fc3d4c 8219void
864dbfa3 8220Perl_sv_catpvf(pTHX_ SV *sv, const char* pat, ...)
46fc3d4c 8221{
8222 va_list args;
46fc3d4c 8223 va_start(args, pat);
c5be433b 8224 sv_vcatpvf(sv, pat, &args);
46fc3d4c 8225 va_end(args);
8226}
8227
bffc3d17
SH
8228/*
8229=for apidoc sv_vcatpvf
8230
8231Processes its arguments like C<vsprintf> and appends the formatted output
8232to an SV. Does not handle 'set' magic. See C<sv_vcatpvf_mg>.
8233
8234Usually used via its frontend C<sv_catpvf>.
8235
8236=cut
8237*/
645c22ef 8238
ef50df4b 8239void
c5be433b
GS
8240Perl_sv_vcatpvf(pTHX_ SV *sv, const char* pat, va_list* args)
8241{
4608196e 8242 sv_vcatpvfn(sv, pat, strlen(pat), args, NULL, 0, NULL);
c5be433b
GS
8243}
8244
954c1994
GS
8245/*
8246=for apidoc sv_catpvf_mg
8247
8248Like C<sv_catpvf>, but also handles 'set' magic.
8249
8250=cut
8251*/
8252
c5be433b 8253void
864dbfa3 8254Perl_sv_catpvf_mg(pTHX_ SV *sv, const char* pat, ...)
ef50df4b
GS
8255{
8256 va_list args;
ef50df4b 8257 va_start(args, pat);
c5be433b 8258 sv_vcatpvf_mg(sv, pat, &args);
ef50df4b 8259 va_end(args);
c5be433b
GS
8260}
8261
bffc3d17
SH
8262/*
8263=for apidoc sv_vcatpvf_mg
8264
8265Like C<sv_vcatpvf>, but also handles 'set' magic.
8266
8267Usually used via its frontend C<sv_catpvf_mg>.
8268
8269=cut
8270*/
645c22ef 8271
c5be433b
GS
8272void
8273Perl_sv_vcatpvf_mg(pTHX_ SV *sv, const char* pat, va_list* args)
8274{
4608196e 8275 sv_vcatpvfn(sv, pat, strlen(pat), args, NULL, 0, NULL);
ef50df4b
GS
8276 SvSETMAGIC(sv);
8277}
8278
954c1994
GS
8279/*
8280=for apidoc sv_vsetpvfn
8281
bffc3d17 8282Works like C<sv_vcatpvfn> but copies the text into the SV instead of
954c1994
GS
8283appending it.
8284
bffc3d17 8285Usually used via one of its frontends C<sv_vsetpvf> and C<sv_vsetpvf_mg>.
645c22ef 8286
954c1994
GS
8287=cut
8288*/
8289
46fc3d4c 8290void
7d5ea4e7 8291Perl_sv_vsetpvfn(pTHX_ SV *sv, const char *pat, STRLEN patlen, va_list *args, SV **svargs, I32 svmax, bool *maybe_tainted)
46fc3d4c 8292{
8293 sv_setpvn(sv, "", 0);
7d5ea4e7 8294 sv_vcatpvfn(sv, pat, patlen, args, svargs, svmax, maybe_tainted);
46fc3d4c 8295}
8296
2d00ba3b 8297STATIC I32
9dd79c3f 8298S_expect_number(pTHX_ char** pattern)
211dfcf1 8299{
97aff369 8300 dVAR;
211dfcf1
HS
8301 I32 var = 0;
8302 switch (**pattern) {
8303 case '1': case '2': case '3':
8304 case '4': case '5': case '6':
8305 case '7': case '8': case '9':
2fba7546
GA
8306 var = *(*pattern)++ - '0';
8307 while (isDIGIT(**pattern)) {
5f66b61c 8308 const I32 tmp = var * 10 + (*(*pattern)++ - '0');
2fba7546
GA
8309 if (tmp < var)
8310 Perl_croak(aTHX_ "Integer overflow in format string for %s", (PL_op ? OP_NAME(PL_op) : "sv_vcatpvfn"));
8311 var = tmp;
8312 }
211dfcf1
HS
8313 }
8314 return var;
8315}
211dfcf1 8316
c445ea15
AL
8317STATIC char *
8318S_F0convert(NV nv, char *endbuf, STRLEN *len)
4151a5fe 8319{
a3b680e6 8320 const int neg = nv < 0;
4151a5fe 8321 UV uv;
4151a5fe
IZ
8322
8323 if (neg)
8324 nv = -nv;
8325 if (nv < UV_MAX) {
b464bac0 8326 char *p = endbuf;
4151a5fe 8327 nv += 0.5;
028f8eaa 8328 uv = (UV)nv;
4151a5fe
IZ
8329 if (uv & 1 && uv == nv)
8330 uv--; /* Round to even */
8331 do {
a3b680e6 8332 const unsigned dig = uv % 10;
4151a5fe
IZ
8333 *--p = '0' + dig;
8334 } while (uv /= 10);
8335 if (neg)
8336 *--p = '-';
8337 *len = endbuf - p;
8338 return p;
8339 }
bd61b366 8340 return NULL;
4151a5fe
IZ
8341}
8342
8343
954c1994
GS
8344/*
8345=for apidoc sv_vcatpvfn
8346
8347Processes its arguments like C<vsprintf> and appends the formatted output
8348to an SV. Uses an array of SVs if the C style variable argument list is
8349missing (NULL). When running with taint checks enabled, indicates via
8350C<maybe_tainted> if results are untrustworthy (often due to the use of
8351locales).
8352
bffc3d17 8353Usually used via one of its frontends C<sv_vcatpvf> and C<sv_vcatpvf_mg>.
645c22ef 8354
954c1994
GS
8355=cut
8356*/
8357
8896765a
RB
8358
8359#define VECTORIZE_ARGS vecsv = va_arg(*args, SV*);\
8360 vecstr = (U8*)SvPV_const(vecsv,veclen);\
8361 vec_utf8 = DO_UTF8(vecsv);
8362
1ef29b0e
RGS
8363/* XXX maybe_tainted is never assigned to, so the doc above is lying. */
8364
46fc3d4c 8365void
7d5ea4e7 8366Perl_sv_vcatpvfn(pTHX_ SV *sv, const char *pat, STRLEN patlen, va_list *args, SV **svargs, I32 svmax, bool *maybe_tainted)
46fc3d4c 8367{
97aff369 8368 dVAR;
46fc3d4c 8369 char *p;
8370 char *q;
a3b680e6 8371 const char *patend;
fc36a67e 8372 STRLEN origlen;
46fc3d4c 8373 I32 svix = 0;
27da23d5 8374 static const char nullstr[] = "(null)";
a0714e2c 8375 SV *argsv = NULL;
b464bac0
AL
8376 bool has_utf8 = DO_UTF8(sv); /* has the result utf8? */
8377 const bool pat_utf8 = has_utf8; /* the pattern is in utf8? */
a0714e2c 8378 SV *nsv = NULL;
4151a5fe
IZ
8379 /* Times 4: a decimal digit takes more than 3 binary digits.
8380 * NV_DIG: mantissa takes that many decimal digits.
8381 * Plus 32: Playing safe. */
8382 char ebuf[IV_DIG * 4 + NV_DIG + 32];
8383 /* large enough for "%#.#f" --chip */
8384 /* what about long double NVs? --jhi */
db79b45b 8385
53c1dcc0
AL
8386 PERL_UNUSED_ARG(maybe_tainted);
8387
46fc3d4c 8388 /* no matter what, this is a string now */
fc36a67e 8389 (void)SvPV_force(sv, origlen);
46fc3d4c 8390
8896765a 8391 /* special-case "", "%s", and "%-p" (SVf - see below) */
46fc3d4c 8392 if (patlen == 0)
8393 return;
0dbb1585 8394 if (patlen == 2 && pat[0] == '%' && pat[1] == 's') {
2d03de9c
AL
8395 if (args) {
8396 const char * const s = va_arg(*args, char*);
8397 sv_catpv(sv, s ? s : nullstr);
8398 }
8399 else if (svix < svmax) {
8400 sv_catsv(sv, *svargs);
2d03de9c
AL
8401 }
8402 return;
0dbb1585 8403 }
8896765a
RB
8404 if (args && patlen == 3 && pat[0] == '%' &&
8405 pat[1] == '-' && pat[2] == 'p') {
8406 argsv = va_arg(*args, SV*);
8407 sv_catsv(sv, argsv);
8896765a 8408 return;
46fc3d4c 8409 }
8410
1d917b39 8411#ifndef USE_LONG_DOUBLE
4151a5fe 8412 /* special-case "%.<number>[gf]" */
7af36d83 8413 if ( !args && patlen <= 5 && pat[0] == '%' && pat[1] == '.'
4151a5fe
IZ
8414 && (pat[patlen-1] == 'g' || pat[patlen-1] == 'f') ) {
8415 unsigned digits = 0;
8416 const char *pp;
8417
8418 pp = pat + 2;
8419 while (*pp >= '0' && *pp <= '9')
8420 digits = 10 * digits + (*pp++ - '0');
028f8eaa 8421 if (pp - pat == (int)patlen - 1) {
4151a5fe
IZ
8422 NV nv;
8423
7af36d83 8424 if (svix < svmax)
4151a5fe
IZ
8425 nv = SvNV(*svargs);
8426 else
8427 return;
8428 if (*pp == 'g') {
2873255c
NC
8429 /* Add check for digits != 0 because it seems that some
8430 gconverts are buggy in this case, and we don't yet have
8431 a Configure test for this. */
8432 if (digits && digits < sizeof(ebuf) - NV_DIG - 10) {
8433 /* 0, point, slack */
2e59c212 8434 Gconvert(nv, (int)digits, 0, ebuf);
4151a5fe
IZ
8435 sv_catpv(sv, ebuf);
8436 if (*ebuf) /* May return an empty string for digits==0 */
8437 return;
8438 }
8439 } else if (!digits) {
8440 STRLEN l;
8441
8442 if ((p = F0convert(nv, ebuf + sizeof ebuf, &l))) {
8443 sv_catpvn(sv, p, l);
8444 return;
8445 }
8446 }
8447 }
8448 }
1d917b39 8449#endif /* !USE_LONG_DOUBLE */
4151a5fe 8450
2cf2cfc6 8451 if (!args && svix < svmax && DO_UTF8(*svargs))
205f51d8 8452 has_utf8 = TRUE;
2cf2cfc6 8453
46fc3d4c 8454 patend = (char*)pat + patlen;
8455 for (p = (char*)pat; p < patend; p = q) {
8456 bool alt = FALSE;
8457 bool left = FALSE;
b22c7a20 8458 bool vectorize = FALSE;
211dfcf1 8459 bool vectorarg = FALSE;
2cf2cfc6 8460 bool vec_utf8 = FALSE;
46fc3d4c 8461 char fill = ' ';
8462 char plus = 0;
8463 char intsize = 0;
8464 STRLEN width = 0;
fc36a67e 8465 STRLEN zeros = 0;
46fc3d4c 8466 bool has_precis = FALSE;
8467 STRLEN precis = 0;
c445ea15 8468 const I32 osvix = svix;
2cf2cfc6 8469 bool is_utf8 = FALSE; /* is this item utf8? */
20f6aaab
AS
8470#ifdef HAS_LDBL_SPRINTF_BUG
8471 /* This is to try to fix a bug with irix/nonstop-ux/powerux and
205f51d8 8472 with sfio - Allen <allens@cpan.org> */
20f6aaab
AS
8473 bool fix_ldbl_sprintf_bug = FALSE;
8474#endif
205f51d8 8475
46fc3d4c 8476 char esignbuf[4];
89ebb4a3 8477 U8 utf8buf[UTF8_MAXBYTES+1];
46fc3d4c 8478 STRLEN esignlen = 0;
8479
bd61b366 8480 const char *eptr = NULL;
fc36a67e 8481 STRLEN elen = 0;
a0714e2c 8482 SV *vecsv = NULL;
4608196e 8483 const U8 *vecstr = NULL;
b22c7a20 8484 STRLEN veclen = 0;
934abaf1 8485 char c = 0;
46fc3d4c 8486 int i;
9c5ffd7c 8487 unsigned base = 0;
8c8eb53c
RB
8488 IV iv = 0;
8489 UV uv = 0;
9e5b023a
JH
8490 /* we need a long double target in case HAS_LONG_DOUBLE but
8491 not USE_LONG_DOUBLE
8492 */
35fff930 8493#if defined(HAS_LONG_DOUBLE) && LONG_DOUBLESIZE > DOUBLESIZE
9e5b023a
JH
8494 long double nv;
8495#else
65202027 8496 NV nv;
9e5b023a 8497#endif
46fc3d4c 8498 STRLEN have;
8499 STRLEN need;
8500 STRLEN gap;
7af36d83 8501 const char *dotstr = ".";
b22c7a20 8502 STRLEN dotstrlen = 1;
211dfcf1 8503 I32 efix = 0; /* explicit format parameter index */
eb3fce90 8504 I32 ewix = 0; /* explicit width index */
211dfcf1
HS
8505 I32 epix = 0; /* explicit precision index */
8506 I32 evix = 0; /* explicit vector index */
eb3fce90 8507 bool asterisk = FALSE;
46fc3d4c 8508
211dfcf1 8509 /* echo everything up to the next format specification */
46fc3d4c 8510 for (q = p; q < patend && *q != '%'; ++q) ;
8511 if (q > p) {
db79b45b
JH
8512 if (has_utf8 && !pat_utf8)
8513 sv_catpvn_utf8_upgrade(sv, p, q - p, nsv);
8514 else
8515 sv_catpvn(sv, p, q - p);
46fc3d4c 8516 p = q;
8517 }
8518 if (q++ >= patend)
8519 break;
8520
211dfcf1
HS
8521/*
8522 We allow format specification elements in this order:
8523 \d+\$ explicit format parameter index
8524 [-+ 0#]+ flags
a472f209 8525 v|\*(\d+\$)?v vector with optional (optionally specified) arg
f3583277 8526 0 flag (as above): repeated to allow "v02"
211dfcf1
HS
8527 \d+|\*(\d+\$)? width using optional (optionally specified) arg
8528 \.(\d*|\*(\d+\$)?) precision using optional (optionally specified) arg
8529 [hlqLV] size
8896765a
RB
8530 [%bcdefginopsuxDFOUX] format (mandatory)
8531*/
8532
8533 if (args) {
8534/*
8535 As of perl5.9.3, printf format checking is on by default.
8536 Internally, perl uses %p formats to provide an escape to
8537 some extended formatting. This block deals with those
8538 extensions: if it does not match, (char*)q is reset and
8539 the normal format processing code is used.
8540
8541 Currently defined extensions are:
8542 %p include pointer address (standard)
8543 %-p (SVf) include an SV (previously %_)
8544 %-<num>p include an SV with precision <num>
8545 %1p (VDf) include a v-string (as %vd)
8546 %<num>p reserved for future extensions
8547
8548 Robin Barker 2005-07-14
211dfcf1 8549*/
8896765a
RB
8550 char* r = q;
8551 bool sv = FALSE;
8552 STRLEN n = 0;
8553 if (*q == '-')
8554 sv = *q++;
c445ea15 8555 n = expect_number(&q);
8896765a
RB
8556 if (*q++ == 'p') {
8557 if (sv) { /* SVf */
8558 if (n) {
8559 precis = n;
8560 has_precis = TRUE;
8561 }
8562 argsv = va_arg(*args, SV*);
8563 eptr = SvPVx_const(argsv, elen);
8564 if (DO_UTF8(argsv))
8565 is_utf8 = TRUE;
8566 goto string;
8567 }
8568#if vdNUMBER
8569 else if (n == vdNUMBER) { /* VDf */
8570 vectorize = TRUE;
8571 VECTORIZE_ARGS
8572 goto format_vd;
8573 }
8574#endif
8575 else if (n) {
8576 if (ckWARN_d(WARN_INTERNAL))
8577 Perl_warner(aTHX_ packWARN(WARN_INTERNAL),
8578 "internal %%<num>p might conflict with future printf extensions");
8579 }
8580 }
8581 q = r;
8582 }
8583
c445ea15 8584 if ( (width = expect_number(&q)) ) {
211dfcf1
HS
8585 if (*q == '$') {
8586 ++q;
8587 efix = width;
8588 } else {
8589 goto gotwidth;
8590 }
8591 }
8592
fc36a67e 8593 /* FLAGS */
8594
46fc3d4c 8595 while (*q) {
8596 switch (*q) {
8597 case ' ':
8598 case '+':
8599 plus = *q++;
8600 continue;
8601
8602 case '-':
8603 left = TRUE;
8604 q++;
8605 continue;
8606
8607 case '0':
8608 fill = *q++;
8609 continue;
8610
8611 case '#':
8612 alt = TRUE;
8613 q++;
8614 continue;
8615
fc36a67e 8616 default:
8617 break;
8618 }
8619 break;
8620 }
46fc3d4c 8621
211dfcf1 8622 tryasterisk:
eb3fce90 8623 if (*q == '*') {
211dfcf1 8624 q++;
c445ea15 8625 if ( (ewix = expect_number(&q)) )
211dfcf1
HS
8626 if (*q++ != '$')
8627 goto unknown;
eb3fce90 8628 asterisk = TRUE;
211dfcf1
HS
8629 }
8630 if (*q == 'v') {
eb3fce90 8631 q++;
211dfcf1
HS
8632 if (vectorize)
8633 goto unknown;
9cbac4c7 8634 if ((vectorarg = asterisk)) {
211dfcf1
HS
8635 evix = ewix;
8636 ewix = 0;
8637 asterisk = FALSE;
8638 }
8639 vectorize = TRUE;
8640 goto tryasterisk;
eb3fce90
JH
8641 }
8642
211dfcf1 8643 if (!asterisk)
858a90f9 8644 {
7a5fa8a2 8645 if( *q == '0' )
f3583277 8646 fill = *q++;
c445ea15 8647 width = expect_number(&q);
858a90f9 8648 }
211dfcf1
HS
8649
8650 if (vectorize) {
8651 if (vectorarg) {
8652 if (args)
8653 vecsv = va_arg(*args, SV*);
7ad96abb
NC
8654 else if (evix) {
8655 vecsv = (evix > 0 && evix <= svmax)
8656 ? svargs[evix-1] : &PL_sv_undef;
8657 } else {
8658 vecsv = svix < svmax ? svargs[svix++] : &PL_sv_undef;
8659 }
245d4a47 8660 dotstr = SvPV_const(vecsv, dotstrlen);
640283f5
NC
8661 /* Keep the DO_UTF8 test *after* the SvPV call, else things go
8662 bad with tied or overloaded values that return UTF8. */
211dfcf1 8663 if (DO_UTF8(vecsv))
2cf2cfc6 8664 is_utf8 = TRUE;
640283f5
NC
8665 else if (has_utf8) {
8666 vecsv = sv_mortalcopy(vecsv);
8667 sv_utf8_upgrade(vecsv);
8668 dotstr = SvPV_const(vecsv, dotstrlen);
8669 is_utf8 = TRUE;
8670 }
211dfcf1
HS
8671 }
8672 if (args) {
8896765a 8673 VECTORIZE_ARGS
eb3fce90 8674 }
7ad96abb 8675 else if (efix ? (efix > 0 && efix <= svmax) : svix < svmax) {
211dfcf1 8676 vecsv = svargs[efix ? efix-1 : svix++];
245d4a47 8677 vecstr = (U8*)SvPV_const(vecsv,veclen);
2cf2cfc6 8678 vec_utf8 = DO_UTF8(vecsv);
96b8f7ce
JP
8679
8680 /* if this is a version object, we need to convert
8681 * back into v-string notation and then let the
8682 * vectorize happen normally
d7aa5382 8683 */
96b8f7ce
JP
8684 if (sv_derived_from(vecsv, "version")) {
8685 char *version = savesvpv(vecsv);
34ba6322
SP
8686 if ( hv_exists((HV*)SvRV(vecsv), "alpha", 5 ) ) {
8687 Perl_warner(aTHX_ packWARN(WARN_INTERNAL),
8688 "vector argument not supported with alpha versions");
8689 goto unknown;
8690 }
96b8f7ce
JP
8691 vecsv = sv_newmortal();
8692 /* scan_vstring is expected to be called during
8693 * tokenization, so we need to fake up the end
8694 * of the buffer for it
8695 */
8696 PL_bufend = version + veclen;
8697 scan_vstring(version, vecsv);
8698 vecstr = (U8*)SvPV_const(vecsv, veclen);
8699 vec_utf8 = DO_UTF8(vecsv);
8700 Safefree(version);
d7aa5382 8701 }
211dfcf1
HS
8702 }
8703 else {
8704 vecstr = (U8*)"";
8705 veclen = 0;
8706 }
eb3fce90 8707 }
fc36a67e 8708
eb3fce90 8709 if (asterisk) {
fc36a67e 8710 if (args)
8711 i = va_arg(*args, int);
8712 else
eb3fce90
JH
8713 i = (ewix ? ewix <= svmax : svix < svmax) ?
8714 SvIVx(svargs[ewix ? ewix-1 : svix++]) : 0;
fc36a67e 8715 left |= (i < 0);
8716 width = (i < 0) ? -i : i;
fc36a67e 8717 }
211dfcf1 8718 gotwidth:
fc36a67e 8719
8720 /* PRECISION */
46fc3d4c 8721
fc36a67e 8722 if (*q == '.') {
8723 q++;
8724 if (*q == '*') {
211dfcf1 8725 q++;
c445ea15 8726 if ( ((epix = expect_number(&q))) && (*q++ != '$') )
7b8dd722
HS
8727 goto unknown;
8728 /* XXX: todo, support specified precision parameter */
8729 if (epix)
211dfcf1 8730 goto unknown;
46fc3d4c 8731 if (args)
8732 i = va_arg(*args, int);
8733 else
eb3fce90
JH
8734 i = (ewix ? ewix <= svmax : svix < svmax)
8735 ? SvIVx(svargs[ewix ? ewix-1 : svix++]) : 0;
fc36a67e 8736 precis = (i < 0) ? 0 : i;
fc36a67e 8737 }
8738 else {
8739 precis = 0;
8740 while (isDIGIT(*q))
8741 precis = precis * 10 + (*q++ - '0');
8742 }
8743 has_precis = TRUE;
8744 }
46fc3d4c 8745
fc36a67e 8746 /* SIZE */
46fc3d4c 8747
fc36a67e 8748 switch (*q) {
c623ac67
GS
8749#ifdef WIN32
8750 case 'I': /* Ix, I32x, and I64x */
8751# ifdef WIN64
8752 if (q[1] == '6' && q[2] == '4') {
8753 q += 3;
8754 intsize = 'q';
8755 break;
8756 }
8757# endif
8758 if (q[1] == '3' && q[2] == '2') {
8759 q += 3;
8760 break;
8761 }
8762# ifdef WIN64
8763 intsize = 'q';
8764# endif
8765 q++;
8766 break;
8767#endif
9e5b023a 8768#if defined(HAS_QUAD) || defined(HAS_LONG_DOUBLE)
6f9bb7fd 8769 case 'L': /* Ld */
5f66b61c 8770 /*FALLTHROUGH*/
e5c81feb 8771#ifdef HAS_QUAD
6f9bb7fd 8772 case 'q': /* qd */
9e5b023a 8773#endif
6f9bb7fd
GS
8774 intsize = 'q';
8775 q++;
8776 break;
8777#endif
fc36a67e 8778 case 'l':
9e5b023a 8779#if defined(HAS_QUAD) || defined(HAS_LONG_DOUBLE)
205f51d8 8780 if (*(q + 1) == 'l') { /* lld, llf */
fc36a67e 8781 intsize = 'q';
8782 q += 2;
46fc3d4c 8783 break;
cf2093f6 8784 }
fc36a67e 8785#endif
5f66b61c 8786 /*FALLTHROUGH*/
fc36a67e 8787 case 'h':
5f66b61c 8788 /*FALLTHROUGH*/
fc36a67e 8789 case 'V':
8790 intsize = *q++;
46fc3d4c 8791 break;
8792 }
8793
fc36a67e 8794 /* CONVERSION */
8795
211dfcf1
HS
8796 if (*q == '%') {
8797 eptr = q++;
8798 elen = 1;
26372e71
GA
8799 if (vectorize) {
8800 c = '%';
8801 goto unknown;
8802 }
211dfcf1
HS
8803 goto string;
8804 }
8805
26372e71 8806 if (!vectorize && !args) {
86c51f8b
NC
8807 if (efix) {
8808 const I32 i = efix-1;
8809 argsv = (i >= 0 && i < svmax) ? svargs[i] : &PL_sv_undef;
8810 } else {
8811 argsv = (svix >= 0 && svix < svmax)
8812 ? svargs[svix++] : &PL_sv_undef;
8813 }
863811b2 8814 }
211dfcf1 8815
46fc3d4c 8816 switch (c = *q++) {
8817
8818 /* STRINGS */
8819
46fc3d4c 8820 case 'c':
26372e71
GA
8821 if (vectorize)
8822 goto unknown;
8823 uv = (args) ? va_arg(*args, int) : SvIVx(argsv);
1bd104fb
JH
8824 if ((uv > 255 ||
8825 (!UNI_IS_INVARIANT(uv) && SvUTF8(sv)))
0064a8a9 8826 && !IN_BYTES) {
dfe13c55 8827 eptr = (char*)utf8buf;
9041c2e3 8828 elen = uvchr_to_utf8((U8*)eptr, uv) - utf8buf;
2cf2cfc6 8829 is_utf8 = TRUE;
7e2040f0
GS
8830 }
8831 else {
8832 c = (char)uv;
8833 eptr = &c;
8834 elen = 1;
a0ed51b3 8835 }
46fc3d4c 8836 goto string;
8837
46fc3d4c 8838 case 's':
26372e71
GA
8839 if (vectorize)
8840 goto unknown;
8841 if (args) {
fc36a67e 8842 eptr = va_arg(*args, char*);
c635e13b 8843 if (eptr)
1d7c1841
GS
8844#ifdef MACOS_TRADITIONAL
8845 /* On MacOS, %#s format is used for Pascal strings */
8846 if (alt)
8847 elen = *eptr++;
8848 else
8849#endif
c635e13b 8850 elen = strlen(eptr);
8851 else {
27da23d5 8852 eptr = (char *)nullstr;
c635e13b 8853 elen = sizeof nullstr - 1;
8854 }
46fc3d4c 8855 }
211dfcf1 8856 else {
4d84ee25 8857 eptr = SvPVx_const(argsv, elen);
7e2040f0 8858 if (DO_UTF8(argsv)) {
a0ed51b3
LW
8859 if (has_precis && precis < elen) {
8860 I32 p = precis;
7e2040f0 8861 sv_pos_u2b(argsv, &p, 0); /* sticks at end */
a0ed51b3
LW
8862 precis = p;
8863 }
8864 if (width) { /* fudge width (can't fudge elen) */
7e2040f0 8865 width += elen - sv_len_utf8(argsv);
a0ed51b3 8866 }
2cf2cfc6 8867 is_utf8 = TRUE;
a0ed51b3
LW
8868 }
8869 }
fc36a67e 8870
46fc3d4c 8871 string:
8872 if (has_precis && elen > precis)
8873 elen = precis;
8874 break;
8875
8876 /* INTEGERS */
8877
fc36a67e 8878 case 'p':
be75b157 8879 if (alt || vectorize)
c2e66d9e 8880 goto unknown;
211dfcf1 8881 uv = PTR2UV(args ? va_arg(*args, void*) : argsv);
fc36a67e 8882 base = 16;
8883 goto integer;
8884
46fc3d4c 8885 case 'D':
29fe7a80 8886#ifdef IV_IS_QUAD
22f3ae8c 8887 intsize = 'q';
29fe7a80 8888#else
46fc3d4c 8889 intsize = 'l';
29fe7a80 8890#endif
5f66b61c 8891 /*FALLTHROUGH*/
46fc3d4c 8892 case 'd':
8893 case 'i':
8896765a
RB
8894#if vdNUMBER
8895 format_vd:
8896#endif
b22c7a20 8897 if (vectorize) {
ba210ebe 8898 STRLEN ulen;
211dfcf1
HS
8899 if (!veclen)
8900 continue;
2cf2cfc6
A
8901 if (vec_utf8)
8902 uv = utf8n_to_uvchr(vecstr, veclen, &ulen,
8903 UTF8_ALLOW_ANYUV);
b22c7a20 8904 else {
e83d50c9 8905 uv = *vecstr;
b22c7a20
GS
8906 ulen = 1;
8907 }
8908 vecstr += ulen;
8909 veclen -= ulen;
e83d50c9
JP
8910 if (plus)
8911 esignbuf[esignlen++] = plus;
b22c7a20
GS
8912 }
8913 else if (args) {
46fc3d4c 8914 switch (intsize) {
8915 case 'h': iv = (short)va_arg(*args, int); break;
46fc3d4c 8916 case 'l': iv = va_arg(*args, long); break;
fc36a67e 8917 case 'V': iv = va_arg(*args, IV); break;
b10c0dba 8918 default: iv = va_arg(*args, int); break;
cf2093f6
JH
8919#ifdef HAS_QUAD
8920 case 'q': iv = va_arg(*args, Quad_t); break;
8921#endif
46fc3d4c 8922 }
8923 }
8924 else {
b10c0dba 8925 IV tiv = SvIVx(argsv); /* work around GCC bug #13488 */
46fc3d4c 8926 switch (intsize) {
b10c0dba
MHM
8927 case 'h': iv = (short)tiv; break;
8928 case 'l': iv = (long)tiv; break;
8929 case 'V':
8930 default: iv = tiv; break;
cf2093f6 8931#ifdef HAS_QUAD
b10c0dba 8932 case 'q': iv = (Quad_t)tiv; break;
cf2093f6 8933#endif
46fc3d4c 8934 }
8935 }
e83d50c9
JP
8936 if ( !vectorize ) /* we already set uv above */
8937 {
8938 if (iv >= 0) {
8939 uv = iv;
8940 if (plus)
8941 esignbuf[esignlen++] = plus;
8942 }
8943 else {
8944 uv = -iv;
8945 esignbuf[esignlen++] = '-';
8946 }
46fc3d4c 8947 }
8948 base = 10;
8949 goto integer;
8950
fc36a67e 8951 case 'U':
29fe7a80 8952#ifdef IV_IS_QUAD
22f3ae8c 8953 intsize = 'q';
29fe7a80 8954#else
fc36a67e 8955 intsize = 'l';
29fe7a80 8956#endif
5f66b61c 8957 /*FALLTHROUGH*/
fc36a67e 8958 case 'u':
8959 base = 10;
8960 goto uns_integer;
8961
4f19785b
WSI
8962 case 'b':
8963 base = 2;
8964 goto uns_integer;
8965
46fc3d4c 8966 case 'O':
29fe7a80 8967#ifdef IV_IS_QUAD
22f3ae8c 8968 intsize = 'q';
29fe7a80 8969#else
46fc3d4c 8970 intsize = 'l';
29fe7a80 8971#endif
5f66b61c 8972 /*FALLTHROUGH*/
46fc3d4c 8973 case 'o':
8974 base = 8;
8975 goto uns_integer;
8976
8977 case 'X':
46fc3d4c 8978 case 'x':
8979 base = 16;
46fc3d4c 8980
8981 uns_integer:
b22c7a20 8982 if (vectorize) {
ba210ebe 8983 STRLEN ulen;
b22c7a20 8984 vector:
211dfcf1
HS
8985 if (!veclen)
8986 continue;
2cf2cfc6
A
8987 if (vec_utf8)
8988 uv = utf8n_to_uvchr(vecstr, veclen, &ulen,
8989 UTF8_ALLOW_ANYUV);
b22c7a20 8990 else {
a05b299f 8991 uv = *vecstr;
b22c7a20
GS
8992 ulen = 1;
8993 }
8994 vecstr += ulen;
8995 veclen -= ulen;
8996 }
8997 else if (args) {
46fc3d4c 8998 switch (intsize) {
8999 case 'h': uv = (unsigned short)va_arg(*args, unsigned); break;
46fc3d4c 9000 case 'l': uv = va_arg(*args, unsigned long); break;
fc36a67e 9001 case 'V': uv = va_arg(*args, UV); break;
b10c0dba 9002 default: uv = va_arg(*args, unsigned); break;
cf2093f6 9003#ifdef HAS_QUAD
9e3321a5 9004 case 'q': uv = va_arg(*args, Uquad_t); break;
cf2093f6 9005#endif
46fc3d4c 9006 }
9007 }
9008 else {
b10c0dba 9009 UV tuv = SvUVx(argsv); /* work around GCC bug #13488 */
46fc3d4c 9010 switch (intsize) {
b10c0dba
MHM
9011 case 'h': uv = (unsigned short)tuv; break;
9012 case 'l': uv = (unsigned long)tuv; break;
9013 case 'V':
9014 default: uv = tuv; break;
cf2093f6 9015#ifdef HAS_QUAD
b10c0dba 9016 case 'q': uv = (Uquad_t)tuv; break;
cf2093f6 9017#endif
46fc3d4c 9018 }
9019 }
9020
9021 integer:
4d84ee25
NC
9022 {
9023 char *ptr = ebuf + sizeof ebuf;
1387f30c
DD
9024 bool tempalt = uv ? alt : FALSE; /* Vectors can't change alt */
9025 zeros = 0;
9026
4d84ee25
NC
9027 switch (base) {
9028 unsigned dig;
9029 case 16:
4d84ee25
NC
9030 p = (char*)((c == 'X')
9031 ? "0123456789ABCDEF" : "0123456789abcdef");
9032 do {
9033 dig = uv & 15;
9034 *--ptr = p[dig];
9035 } while (uv >>= 4);
1387f30c 9036 if (tempalt) {
4d84ee25
NC
9037 esignbuf[esignlen++] = '0';
9038 esignbuf[esignlen++] = c; /* 'x' or 'X' */
9039 }
9040 break;
9041 case 8:
9042 do {
9043 dig = uv & 7;
9044 *--ptr = '0' + dig;
9045 } while (uv >>= 3);
9046 if (alt && *ptr != '0')
9047 *--ptr = '0';
9048 break;
9049 case 2:
9050 do {
9051 dig = uv & 1;
9052 *--ptr = '0' + dig;
9053 } while (uv >>= 1);
1387f30c 9054 if (tempalt) {
4d84ee25
NC
9055 esignbuf[esignlen++] = '0';
9056 esignbuf[esignlen++] = 'b';
9057 }
9058 break;
9059 default: /* it had better be ten or less */
9060 do {
9061 dig = uv % base;
9062 *--ptr = '0' + dig;
9063 } while (uv /= base);
9064 break;
46fc3d4c 9065 }
4d84ee25
NC
9066 elen = (ebuf + sizeof ebuf) - ptr;
9067 eptr = ptr;
9068 if (has_precis) {
9069 if (precis > elen)
9070 zeros = precis - elen;
9071 else if (precis == 0 && elen == 1 && *eptr == '0')
9072 elen = 0;
eda88b6d 9073 }
c10ed8b9 9074 }
46fc3d4c 9075 break;
9076
9077 /* FLOATING POINT */
9078
fc36a67e 9079 case 'F':
9080 c = 'f'; /* maybe %F isn't supported here */
5f66b61c 9081 /*FALLTHROUGH*/
46fc3d4c 9082 case 'e': case 'E':
fc36a67e 9083 case 'f':
46fc3d4c 9084 case 'g': case 'G':
26372e71
GA
9085 if (vectorize)
9086 goto unknown;
46fc3d4c 9087
9088 /* This is evil, but floating point is even more evil */
9089
9e5b023a
JH
9090 /* for SV-style calling, we can only get NV
9091 for C-style calling, we assume %f is double;
9092 for simplicity we allow any of %Lf, %llf, %qf for long double
9093 */
9094 switch (intsize) {
9095 case 'V':
9096#if defined(USE_LONG_DOUBLE)
9097 intsize = 'q';
9098#endif
9099 break;
8a2e3f14 9100/* [perl #20339] - we should accept and ignore %lf rather than die */
00e17364 9101 case 'l':
5f66b61c 9102 /*FALLTHROUGH*/
9e5b023a
JH
9103 default:
9104#if defined(USE_LONG_DOUBLE)
9105 intsize = args ? 0 : 'q';
9106#endif
9107 break;
9108 case 'q':
9109#if defined(HAS_LONG_DOUBLE)
9110 break;
9111#else
5f66b61c 9112 /*FALLTHROUGH*/
9e5b023a
JH
9113#endif
9114 case 'h':
9e5b023a
JH
9115 goto unknown;
9116 }
9117
9118 /* now we need (long double) if intsize == 'q', else (double) */
26372e71 9119 nv = (args) ?
35fff930
JH
9120#if LONG_DOUBLESIZE > DOUBLESIZE
9121 intsize == 'q' ?
205f51d8
AS
9122 va_arg(*args, long double) :
9123 va_arg(*args, double)
35fff930 9124#else
205f51d8 9125 va_arg(*args, double)
35fff930 9126#endif
9e5b023a 9127 : SvNVx(argsv);
fc36a67e 9128
9129 need = 0;
9130 if (c != 'e' && c != 'E') {
9131 i = PERL_INT_MIN;
9e5b023a
JH
9132 /* FIXME: if HAS_LONG_DOUBLE but not USE_LONG_DOUBLE this
9133 will cast our (long double) to (double) */
73b309ea 9134 (void)Perl_frexp(nv, &i);
fc36a67e 9135 if (i == PERL_INT_MIN)
cea2e8a9 9136 Perl_die(aTHX_ "panic: frexp");
c635e13b 9137 if (i > 0)
fc36a67e 9138 need = BIT_DIGITS(i);
9139 }
9140 need += has_precis ? precis : 6; /* known default */
20f6aaab 9141
fc36a67e 9142 if (need < width)
9143 need = width;
9144
20f6aaab
AS
9145#ifdef HAS_LDBL_SPRINTF_BUG
9146 /* This is to try to fix a bug with irix/nonstop-ux/powerux and
205f51d8
AS
9147 with sfio - Allen <allens@cpan.org> */
9148
9149# ifdef DBL_MAX
9150# define MY_DBL_MAX DBL_MAX
9151# else /* XXX guessing! HUGE_VAL may be defined as infinity, so not using */
9152# if DOUBLESIZE >= 8
9153# define MY_DBL_MAX 1.7976931348623157E+308L
9154# else
9155# define MY_DBL_MAX 3.40282347E+38L
9156# endif
9157# endif
9158
9159# ifdef HAS_LDBL_SPRINTF_BUG_LESS1 /* only between -1L & 1L - Allen */
9160# define MY_DBL_MAX_BUG 1L
20f6aaab 9161# else
205f51d8 9162# define MY_DBL_MAX_BUG MY_DBL_MAX
20f6aaab 9163# endif
20f6aaab 9164
205f51d8
AS
9165# ifdef DBL_MIN
9166# define MY_DBL_MIN DBL_MIN
9167# else /* XXX guessing! -Allen */
9168# if DOUBLESIZE >= 8
9169# define MY_DBL_MIN 2.2250738585072014E-308L
9170# else
9171# define MY_DBL_MIN 1.17549435E-38L
9172# endif
9173# endif
20f6aaab 9174
205f51d8
AS
9175 if ((intsize == 'q') && (c == 'f') &&
9176 ((nv < MY_DBL_MAX_BUG) && (nv > -MY_DBL_MAX_BUG)) &&
9177 (need < DBL_DIG)) {
9178 /* it's going to be short enough that
9179 * long double precision is not needed */
9180
9181 if ((nv <= 0L) && (nv >= -0L))
9182 fix_ldbl_sprintf_bug = TRUE; /* 0 is 0 - easiest */
9183 else {
9184 /* would use Perl_fp_class as a double-check but not
9185 * functional on IRIX - see perl.h comments */
9186
9187 if ((nv >= MY_DBL_MIN) || (nv <= -MY_DBL_MIN)) {
9188 /* It's within the range that a double can represent */
9189#if defined(DBL_MAX) && !defined(DBL_MIN)
9190 if ((nv >= ((long double)1/DBL_MAX)) ||
9191 (nv <= (-(long double)1/DBL_MAX)))
20f6aaab 9192#endif
205f51d8 9193 fix_ldbl_sprintf_bug = TRUE;
20f6aaab 9194 }
205f51d8
AS
9195 }
9196 if (fix_ldbl_sprintf_bug == TRUE) {
9197 double temp;
9198
9199 intsize = 0;
9200 temp = (double)nv;
9201 nv = (NV)temp;
9202 }
20f6aaab 9203 }
205f51d8
AS
9204
9205# undef MY_DBL_MAX
9206# undef MY_DBL_MAX_BUG
9207# undef MY_DBL_MIN
9208
20f6aaab
AS
9209#endif /* HAS_LDBL_SPRINTF_BUG */
9210
46fc3d4c 9211 need += 20; /* fudge factor */
80252599
GS
9212 if (PL_efloatsize < need) {
9213 Safefree(PL_efloatbuf);
9214 PL_efloatsize = need + 20; /* more fudge */
a02a5408 9215 Newx(PL_efloatbuf, PL_efloatsize, char);
7d5ea4e7 9216 PL_efloatbuf[0] = '\0';
46fc3d4c 9217 }
9218
4151a5fe
IZ
9219 if ( !(width || left || plus || alt) && fill != '0'
9220 && has_precis && intsize != 'q' ) { /* Shortcuts */
2873255c
NC
9221 /* See earlier comment about buggy Gconvert when digits,
9222 aka precis is 0 */
9223 if ( c == 'g' && precis) {
2e59c212 9224 Gconvert((NV)nv, (int)precis, 0, PL_efloatbuf);
4150c189
NC
9225 /* May return an empty string for digits==0 */
9226 if (*PL_efloatbuf) {
9227 elen = strlen(PL_efloatbuf);
4151a5fe 9228 goto float_converted;
4150c189 9229 }
4151a5fe
IZ
9230 } else if ( c == 'f' && !precis) {
9231 if ((eptr = F0convert(nv, ebuf + sizeof ebuf, &elen)))
9232 break;
9233 }
9234 }
4d84ee25
NC
9235 {
9236 char *ptr = ebuf + sizeof ebuf;
9237 *--ptr = '\0';
9238 *--ptr = c;
9239 /* FIXME: what to do if HAS_LONG_DOUBLE but not PERL_PRIfldbl? */
9e5b023a 9240#if defined(HAS_LONG_DOUBLE) && defined(PERL_PRIfldbl)
4d84ee25
NC
9241 if (intsize == 'q') {
9242 /* Copy the one or more characters in a long double
9243 * format before the 'base' ([efgEFG]) character to
9244 * the format string. */
9245 static char const prifldbl[] = PERL_PRIfldbl;
9246 char const *p = prifldbl + sizeof(prifldbl) - 3;
9247 while (p >= prifldbl) { *--ptr = *p--; }
9248 }
65202027 9249#endif
4d84ee25
NC
9250 if (has_precis) {
9251 base = precis;
9252 do { *--ptr = '0' + (base % 10); } while (base /= 10);
9253 *--ptr = '.';
9254 }
9255 if (width) {
9256 base = width;
9257 do { *--ptr = '0' + (base % 10); } while (base /= 10);
9258 }
9259 if (fill == '0')
9260 *--ptr = fill;
9261 if (left)
9262 *--ptr = '-';
9263 if (plus)
9264 *--ptr = plus;
9265 if (alt)
9266 *--ptr = '#';
9267 *--ptr = '%';
9268
9269 /* No taint. Otherwise we are in the strange situation
9270 * where printf() taints but print($float) doesn't.
9271 * --jhi */
9e5b023a 9272#if defined(HAS_LONG_DOUBLE)
4150c189 9273 elen = ((intsize == 'q')
d9fad198
JH
9274 ? my_snprintf(PL_efloatbuf, PL_efloatsize, ptr, nv)
9275 : my_snprintf(PL_efloatbuf, PL_efloatsize, ptr, (double)nv));
9e5b023a 9276#else
4150c189 9277 elen = my_sprintf(PL_efloatbuf, ptr, nv);
9e5b023a 9278#endif
4d84ee25 9279 }
4151a5fe 9280 float_converted:
80252599 9281 eptr = PL_efloatbuf;
46fc3d4c 9282 break;
9283
fc36a67e 9284 /* SPECIAL */
9285
9286 case 'n':
26372e71
GA
9287 if (vectorize)
9288 goto unknown;
fc36a67e 9289 i = SvCUR(sv) - origlen;
26372e71 9290 if (args) {
c635e13b 9291 switch (intsize) {
9292 case 'h': *(va_arg(*args, short*)) = i; break;
9293 default: *(va_arg(*args, int*)) = i; break;
9294 case 'l': *(va_arg(*args, long*)) = i; break;
9295 case 'V': *(va_arg(*args, IV*)) = i; break;
cf2093f6
JH
9296#ifdef HAS_QUAD
9297 case 'q': *(va_arg(*args, Quad_t*)) = i; break;
9298#endif
c635e13b 9299 }
fc36a67e 9300 }
9dd79c3f 9301 else
211dfcf1 9302 sv_setuv_mg(argsv, (UV)i);
fc36a67e 9303 continue; /* not "break" */
9304
9305 /* UNKNOWN */
9306
46fc3d4c 9307 default:
fc36a67e 9308 unknown:
041457d9
DM
9309 if (!args
9310 && (PL_op->op_type == OP_PRTF || PL_op->op_type == OP_SPRINTF)
9311 && ckWARN(WARN_PRINTF))
9312 {
c4420975 9313 SV * const msg = sv_newmortal();
35c1215d
NC
9314 Perl_sv_setpvf(aTHX_ msg, "Invalid conversion in %sprintf: ",
9315 (PL_op->op_type == OP_PRTF) ? "" : "s");
0f4b6630 9316 if (c) {
0f4b6630 9317 if (isPRINT(c))
1c846c1f 9318 Perl_sv_catpvf(aTHX_ msg,
0f4b6630
JH
9319 "\"%%%c\"", c & 0xFF);
9320 else
9321 Perl_sv_catpvf(aTHX_ msg,
57def98f 9322 "\"%%\\%03"UVof"\"",
0f4b6630 9323 (UV)c & 0xFF);
0f4b6630 9324 } else
396482e1 9325 sv_catpvs(msg, "end of string");
95b63a38 9326 Perl_warner(aTHX_ packWARN(WARN_PRINTF), "%"SVf, (void*)msg); /* yes, this is reentrant */
c635e13b 9327 }
fb73857a 9328
9329 /* output mangled stuff ... */
9330 if (c == '\0')
9331 --q;
46fc3d4c 9332 eptr = p;
9333 elen = q - p;
fb73857a 9334
9335 /* ... right here, because formatting flags should not apply */
9336 SvGROW(sv, SvCUR(sv) + elen + 1);
9337 p = SvEND(sv);
4459522c 9338 Copy(eptr, p, elen, char);
fb73857a 9339 p += elen;
9340 *p = '\0';
3f7c398e 9341 SvCUR_set(sv, p - SvPVX_const(sv));
58e33a90 9342 svix = osvix;
fb73857a 9343 continue; /* not "break" */
46fc3d4c 9344 }
9345
cc61b222
TS
9346 if (is_utf8 != has_utf8) {
9347 if (is_utf8) {
9348 if (SvCUR(sv))
9349 sv_utf8_upgrade(sv);
9350 }
9351 else {
9352 const STRLEN old_elen = elen;
9353 SV * const nsv = sv_2mortal(newSVpvn(eptr, elen));
9354 sv_utf8_upgrade(nsv);
9355 eptr = SvPVX_const(nsv);
9356 elen = SvCUR(nsv);
9357
9358 if (width) { /* fudge width (can't fudge elen) */
9359 width += elen - old_elen;
9360 }
9361 is_utf8 = TRUE;
9362 }
9363 }
9364
6c94ec8b 9365 have = esignlen + zeros + elen;
ed2b91d2
GA
9366 if (have < zeros)
9367 Perl_croak_nocontext(PL_memory_wrap);
6c94ec8b 9368
46fc3d4c 9369 need = (have > width ? have : width);
9370 gap = need - have;
9371
d2641cbd
PC
9372 if (need >= (((STRLEN)~0) - SvCUR(sv) - dotstrlen - 1))
9373 Perl_croak_nocontext(PL_memory_wrap);
b22c7a20 9374 SvGROW(sv, SvCUR(sv) + need + dotstrlen + 1);
46fc3d4c 9375 p = SvEND(sv);
9376 if (esignlen && fill == '0') {
53c1dcc0 9377 int i;
eb160463 9378 for (i = 0; i < (int)esignlen; i++)
46fc3d4c 9379 *p++ = esignbuf[i];
9380 }
9381 if (gap && !left) {
9382 memset(p, fill, gap);
9383 p += gap;
9384 }
9385 if (esignlen && fill != '0') {
53c1dcc0 9386 int i;
eb160463 9387 for (i = 0; i < (int)esignlen; i++)
46fc3d4c 9388 *p++ = esignbuf[i];
9389 }
fc36a67e 9390 if (zeros) {
53c1dcc0 9391 int i;
fc36a67e 9392 for (i = zeros; i; i--)
9393 *p++ = '0';
9394 }
46fc3d4c 9395 if (elen) {
4459522c 9396 Copy(eptr, p, elen, char);
46fc3d4c 9397 p += elen;
9398 }
9399 if (gap && left) {
9400 memset(p, ' ', gap);
9401 p += gap;
9402 }
b22c7a20
GS
9403 if (vectorize) {
9404 if (veclen) {
4459522c 9405 Copy(dotstr, p, dotstrlen, char);
b22c7a20
GS
9406 p += dotstrlen;
9407 }
9408 else
9409 vectorize = FALSE; /* done iterating over vecstr */
9410 }
2cf2cfc6
A
9411 if (is_utf8)
9412 has_utf8 = TRUE;
9413 if (has_utf8)
7e2040f0 9414 SvUTF8_on(sv);
46fc3d4c 9415 *p = '\0';
3f7c398e 9416 SvCUR_set(sv, p - SvPVX_const(sv));
b22c7a20
GS
9417 if (vectorize) {
9418 esignlen = 0;
9419 goto vector;
9420 }
46fc3d4c 9421 }
9422}
51371543 9423
645c22ef
DM
9424/* =========================================================================
9425
9426=head1 Cloning an interpreter
9427
9428All the macros and functions in this section are for the private use of
9429the main function, perl_clone().
9430
9431The foo_dup() functions make an exact copy of an existing foo thingy.
9432During the course of a cloning, a hash table is used to map old addresses
9433to new addresses. The table is created and manipulated with the
9434ptr_table_* functions.
9435
9436=cut
9437
9438============================================================================*/
9439
9440
1d7c1841
GS
9441#if defined(USE_ITHREADS)
9442
d4c19fe8 9443/* XXX Remove this so it doesn't have to go thru the macro and return for nothing */
1d7c1841
GS
/* Fallback, used only when GpREFCNT_inc is not already defined: for a
 * non-NULL gp it increments gp->gp_refcnt and evaluates to gp; for a NULL
 * gp it evaluates to (GP*)NULL.  Note that the argument is evaluated more
 * than once. */
9444#ifndef GpREFCNT_inc
9445# define GpREFCNT_inc(gp) ((gp) ? (++(gp)->gp_refcnt, (gp)) : (GP*)NULL)
9446#endif
9447
9448
a41cc44e
NC
9449/* Certain cases in Perl_ss_dup have been merged, by relying on the fact
9450 that currently av_dup and hv_dup are the same as sv_dup. If this changes,
9451 please unmerge ss_dup. */
/* Convenience wrappers around sv_dup(s,t): s is the source value and t the
 * CLONE_PARAMS pointer.  The *_inc forms pass the result through
 * SvREFCNT_inc (SvREFCNT_inc_NN for sv_dup_inc_NN). */
d2d73c3e 9452#define sv_dup_inc(s,t) SvREFCNT_inc(sv_dup(s,t))
7f466ec7 9453#define sv_dup_inc_NN(s,t) SvREFCNT_inc_NN(sv_dup(s,t))
d2d73c3e
AB
/* Typed variants: each casts its argument to SV*, calls sv_dup, and casts
 * the result back to the named type.  The argument s is not parenthesised
 * inside the cast, so pass simple expressions only. */
9454#define av_dup(s,t) (AV*)sv_dup((SV*)s,t)
9455#define av_dup_inc(s,t) (AV*)SvREFCNT_inc(sv_dup((SV*)s,t))
9456#define hv_dup(s,t) (HV*)sv_dup((SV*)s,t)
9457#define hv_dup_inc(s,t) (HV*)SvREFCNT_inc(sv_dup((SV*)s,t))
9458#define cv_dup(s,t) (CV*)sv_dup((SV*)s,t)
9459#define cv_dup_inc(s,t) (CV*)SvREFCNT_inc(sv_dup((SV*)s,t))
9460#define io_dup(s,t) (IO*)sv_dup((SV*)s,t)
9461#define io_dup_inc(s,t) (IO*)SvREFCNT_inc(sv_dup((SV*)s,t))
9462#define gv_dup(s,t) (GV*)sv_dup((SV*)s,t)
9463#define gv_dup_inc(s,t) (GV*)SvREFCNT_inc(sv_dup((SV*)s,t))
6136c704
AL
/* NULL-tolerant string savers: a NULL p yields NULL instead of being passed
 * to savepv()/savepvn(). */
9464#define SAVEPV(p) ((p) ? savepv(p) : NULL)
9465#define SAVEPVN(p,n) ((p) ? savepvn(p,n) : NULL)
8cf8f3d1 9466
d2d73c3e 9467
d2f185dc
AMS
9468/* Duplicate a regexp. Required reading: pregcomp() and pregfree() in
9469 regcomp.c. AMS 20010712 */
645c22ef 9470
1d7c1841 9471REGEXP *
53c1dcc0 9472Perl_re_dup(pTHX_ const REGEXP *r, CLONE_PARAMS *param)
1d7c1841 9473{
27da23d5 9474 dVAR;
d2f185dc
AMS
9475 REGEXP *ret;
9476 int i, len, npar;
9477 struct reg_substr_datum *s;
9478
9479 if (!r)
9480 return (REGEXP *)NULL;
9481
9482 if ((ret = (REGEXP *)ptr_table_fetch(PL_ptr_table, r)))
9483 return ret;
9484
9485 len = r->offsets[0];
9486 npar = r->nparens+1;
9487
a02a5408 9488 Newxc(ret, sizeof(regexp) + (len+1)*sizeof(regnode), char, regexp);
d2f185dc
AMS
9489 Copy(r->program, ret->program, len+1, regnode);
9490
a02a5408 9491 Newx(ret->startp, npar, I32);
d2f185dc 9492 Copy(r->startp, ret->startp, npar, I32);
a02a5408 9493 Newx(ret->endp, npar, I32);
d2f185dc
AMS
9494 Copy(r->startp, ret->startp, npar, I32);
9495
a02a5408 9496 Newx(ret->substrs, 1, struct reg_substr_data);
d2f185dc
AMS
9497 for (s = ret->substrs->data, i = 0; i < 3; i++, s++) {
9498 s->min_offset = r->substrs->data[i].min_offset;
9499 s->max_offset = r->substrs->data[i].max_offset;
9500 s->substr = sv_dup_inc(r->substrs->data[i].substr, param);
33b8afdf 9501 s->utf8_substr = sv_dup_inc(r->substrs->data[i].utf8_substr, param);
d2f185dc
AMS
9502 }
9503
70612e96 9504 ret->regstclass = NULL;
d2f185dc
AMS
9505 if (r->data) {
9506 struct reg_data *d;
e1ec3a88 9507 const int count = r->data->count;
53c1dcc0 9508 int i;
d2f185dc 9509
a02a5408 9510 Newxc(d, sizeof(struct reg_data) + count*sizeof(void *),
d2f185dc 9511 char, struct reg_data);
a02a5408 9512 Newx(d->what, count, U8);
d2f185dc
AMS
9513
9514 d->count = count;
9515 for (i = 0; i < count; i++) {
9516 d->what[i] = r->data->what[i];
9517 switch (d->what[i]) {
a3621e74
YO
9518 /* legal options are one of: sfpont
9519 see also regcomp.h and pregfree() */
d2f185dc
AMS
9520 case 's':
9521 d->data[i] = sv_dup_inc((SV *)r->data->data[i], param);
9522 break;
9523 case 'p':
9524 d->data[i] = av_dup_inc((AV *)r->data->data[i], param);
9525 break;
9526 case 'f':
9527 /* This is cheating. */
a02a5408 9528 Newx(d->data[i], 1, struct regnode_charclass_class);
d2f185dc
AMS
9529 StructCopy(r->data->data[i], d->data[i],
9530 struct regnode_charclass_class);
70612e96 9531 ret->regstclass = (regnode*)d->data[i];
d2f185dc
AMS
9532 break;
9533 case 'o':
33773810
AMS
9534 /* Compiled op trees are readonly, and can thus be
9535 shared without duplication. */
b34c0dd4 9536 OP_REFCNT_LOCK;
9b978d73 9537 d->data[i] = (void*)OpREFCNT_inc((OP*)r->data->data[i]);
b34c0dd4 9538 OP_REFCNT_UNLOCK;
9b978d73 9539 break;
d2f185dc
AMS
9540 case 'n':
9541 d->data[i] = r->data->data[i];
9542 break;
a3621e74
YO
9543 case 't':
9544 d->data[i] = r->data->data[i];
9545 OP_REFCNT_LOCK;
9546 ((reg_trie_data*)d->data[i])->refcount++;
9547 OP_REFCNT_UNLOCK;
9548 break;
be8e71aa
YO
9549 case 'T':
9550 d->data[i] = r->data->data[i];
9551 OP_REFCNT_LOCK;
9552 ((reg_ac_data*)d->data[i])->refcount++;
9553 OP_REFCNT_UNLOCK;
9554 /* Trie stclasses are readonly and can thus be shared
9555 * without duplication. We free the stclass in pregfree
9556 * when the corresponding reg_ac_data struct is freed.
9557 */
9558 ret->regstclass= r->regstclass;
9559 break;
a3621e74
YO
9560 default:
9561 Perl_croak(aTHX_ "panic: re_dup unknown data code '%c'", r->data->what[i]);
d2f185dc
AMS
9562 }
9563 }
9564
9565 ret->data = d;
9566 }
9567 else
9568 ret->data = NULL;
9569
a02a5408 9570 Newx(ret->offsets, 2*len+1, U32);
d2f185dc
AMS
9571 Copy(r->offsets, ret->offsets, 2*len+1, U32);
9572
e01c5899 9573 ret->precomp = SAVEPVN(r->precomp, r->prelen);
d2f185dc
AMS
9574 ret->refcnt = r->refcnt;
9575 ret->minlen = r->minlen;
9576 ret->prelen = r->prelen;
9577 ret->nparens = r->nparens;
9578 ret->lastparen = r->lastparen;
9579 ret->lastcloseparen = r->lastcloseparen;
9580 ret->reganch = r->reganch;
9581
70612e96
RG
9582 ret->sublen = r->sublen;
9583
9584 if (RX_MATCH_COPIED(ret))
e01c5899 9585 ret->subbeg = SAVEPVN(r->subbeg, r->sublen);
70612e96 9586 else
bd61b366 9587 ret->subbeg = NULL;
f8c7b90f 9588#ifdef PERL_OLD_COPY_ON_WRITE
a0714e2c 9589 ret->saved_copy = NULL;
9a26048b 9590#endif
70612e96 9591
d2f185dc
AMS
9592 ptr_table_store(PL_ptr_table, r, ret);
9593 return ret;
1d7c1841
GS
9594}
9595
d2d73c3e 9596/* duplicate a file handle */
645c22ef 9597
1d7c1841 9598PerlIO *
a8fc9800 9599Perl_fp_dup(pTHX_ PerlIO *fp, char type, CLONE_PARAMS *param)
1d7c1841
GS
9600{
9601 PerlIO *ret;
53c1dcc0
AL
9602
9603 PERL_UNUSED_ARG(type);
73d840c0 9604
1d7c1841
GS
9605 if (!fp)
9606 return (PerlIO*)NULL;
9607
9608 /* look for it in the table first */
9609 ret = (PerlIO*)ptr_table_fetch(PL_ptr_table, fp);
9610 if (ret)
9611 return ret;
9612
9613 /* create anew and remember what it is */
ecdeb87c 9614 ret = PerlIO_fdupopen(aTHX_ fp, param, PERLIO_DUP_CLONE);
1d7c1841
GS
9615 ptr_table_store(PL_ptr_table, fp, ret);
9616 return ret;
9617}
9618
645c22ef
DM
9619/* duplicate a directory handle */
9620
1d7c1841
GS
9621DIR *
9622Perl_dirp_dup(pTHX_ DIR *dp)
9623{
96a5add6 9624 PERL_UNUSED_CONTEXT;
1d7c1841
GS
9625 if (!dp)
9626 return (DIR*)NULL;
9627 /* XXX TODO */
9628 return dp;
9629}
9630
ff276b08 9631/* duplicate a typeglob */
645c22ef 9632
1d7c1841 9633GP *
a8fc9800 9634Perl_gp_dup(pTHX_ GP *gp, CLONE_PARAMS* param)
1d7c1841
GS
9635{
9636 GP *ret;
b37c2d43 9637
1d7c1841
GS
9638 if (!gp)
9639 return (GP*)NULL;
9640 /* look for it in the table first */
9641 ret = (GP*)ptr_table_fetch(PL_ptr_table, gp);
9642 if (ret)
9643 return ret;
9644
9645 /* create anew and remember what it is */
a02a5408 9646 Newxz(ret, 1, GP);
1d7c1841
GS
9647 ptr_table_store(PL_ptr_table, gp, ret);
9648
9649 /* clone */
9650 ret->gp_refcnt = 0; /* must be before any other dups! */
d2d73c3e
AB
9651 ret->gp_sv = sv_dup_inc(gp->gp_sv, param);
9652 ret->gp_io = io_dup_inc(gp->gp_io, param);
9653 ret->gp_form = cv_dup_inc(gp->gp_form, param);
9654 ret->gp_av = av_dup_inc(gp->gp_av, param);
9655 ret->gp_hv = hv_dup_inc(gp->gp_hv, param);
9656 ret->gp_egv = gv_dup(gp->gp_egv, param);/* GvEGV is not refcounted */
9657 ret->gp_cv = cv_dup_inc(gp->gp_cv, param);
1d7c1841 9658 ret->gp_cvgen = gp->gp_cvgen;
1d7c1841 9659 ret->gp_line = gp->gp_line;
f4890806 9660 ret->gp_file_hek = hek_dup(gp->gp_file_hek, param);
1d7c1841
GS
9661 return ret;
9662}
9663
645c22ef
DM
9664/* duplicate a chain of magic */
9665
1d7c1841 9666MAGIC *
a8fc9800 9667Perl_mg_dup(pTHX_ MAGIC *mg, CLONE_PARAMS* param)
1d7c1841 9668{
cb359b41
JH
9669 MAGIC *mgprev = (MAGIC*)NULL;
9670 MAGIC *mgret;
1d7c1841
GS
9671 if (!mg)
9672 return (MAGIC*)NULL;
9673 /* look for it in the table first */
9674 mgret = (MAGIC*)ptr_table_fetch(PL_ptr_table, mg);
9675 if (mgret)
9676 return mgret;
9677
9678 for (; mg; mg = mg->mg_moremagic) {
9679 MAGIC *nmg;
a02a5408 9680 Newxz(nmg, 1, MAGIC);
cb359b41 9681 if (mgprev)
1d7c1841 9682 mgprev->mg_moremagic = nmg;
cb359b41
JH
9683 else
9684 mgret = nmg;
1d7c1841
GS
9685 nmg->mg_virtual = mg->mg_virtual; /* XXX copy dynamic vtable? */
9686 nmg->mg_private = mg->mg_private;
9687 nmg->mg_type = mg->mg_type;
9688 nmg->mg_flags = mg->mg_flags;
14befaf4 9689 if (mg->mg_type == PERL_MAGIC_qr) {
d2f185dc 9690 nmg->mg_obj = (SV*)re_dup((REGEXP*)mg->mg_obj, param);
1d7c1841 9691 }
05bd4103 9692 else if(mg->mg_type == PERL_MAGIC_backref) {
d7cbc7b5
NC
9693 /* The backref AV has its reference count deliberately bumped by
9694 1. */
9695 nmg->mg_obj = SvREFCNT_inc(av_dup_inc((AV*) mg->mg_obj, param));
05bd4103 9696 }
8d2f4536
NC
9697 else if (mg->mg_type == PERL_MAGIC_symtab) {
9698 nmg->mg_obj = mg->mg_obj;
9699 }
1d7c1841
GS
9700 else {
9701 nmg->mg_obj = (mg->mg_flags & MGf_REFCOUNTED)
d2d73c3e
AB
9702 ? sv_dup_inc(mg->mg_obj, param)
9703 : sv_dup(mg->mg_obj, param);
1d7c1841
GS
9704 }
9705 nmg->mg_len = mg->mg_len;
9706 nmg->mg_ptr = mg->mg_ptr; /* XXX random ptr? */
14befaf4 9707 if (mg->mg_ptr && mg->mg_type != PERL_MAGIC_regex_global) {
68795e93 9708 if (mg->mg_len > 0) {
1d7c1841 9709 nmg->mg_ptr = SAVEPVN(mg->mg_ptr, mg->mg_len);
14befaf4
DM
9710 if (mg->mg_type == PERL_MAGIC_overload_table &&
9711 AMT_AMAGIC((AMT*)mg->mg_ptr))
9712 {
c445ea15 9713 const AMT * const amtp = (AMT*)mg->mg_ptr;
0bcc34c2 9714 AMT * const namtp = (AMT*)nmg->mg_ptr;
1d7c1841
GS
9715 I32 i;
9716 for (i = 1; i < NofAMmeth; i++) {
d2d73c3e 9717 namtp->table[i] = cv_dup_inc(amtp->table[i], param);
1d7c1841
GS
9718 }
9719 }
9720 }
9721 else if (mg->mg_len == HEf_SVKEY)
d2d73c3e 9722 nmg->mg_ptr = (char*)sv_dup_inc((SV*)mg->mg_ptr, param);
1d7c1841 9723 }
68795e93
NIS
9724 if ((mg->mg_flags & MGf_DUP) && mg->mg_virtual && mg->mg_virtual->svt_dup) {
9725 CALL_FPTR(nmg->mg_virtual->svt_dup)(aTHX_ nmg, param);
9726 }
1d7c1841
GS
9727 mgprev = nmg;
9728 }
9729 return mgret;
9730}
9731
645c22ef
DM
9732/* create a new pointer-mapping table */
9733
1d7c1841
GS
9734PTR_TBL_t *
9735Perl_ptr_table_new(pTHX)
9736{
9737 PTR_TBL_t *tbl;
96a5add6
AL
9738 PERL_UNUSED_CONTEXT;
9739
a02a5408 9740 Newxz(tbl, 1, PTR_TBL_t);
1d7c1841
GS
9741 tbl->tbl_max = 511;
9742 tbl->tbl_items = 0;
a02a5408 9743 Newxz(tbl->tbl_ary, tbl->tbl_max + 1, PTR_TBL_ENT_t*);
1d7c1841
GS
9744 return tbl;
9745}
9746
7119fd33
NC
/* Hash a pointer: convert it to a UV with PTR2UV and XOR together the
 * value shifted right by 3, by 10 and by 20 bits.  Callers mask the result
 * with tbl_max to pick a bucket.  The argument is evaluated three times. */
9747#define PTR_TABLE_HASH(ptr) \
9748 ((PTR2UV(ptr) >> 3) ^ (PTR2UV(ptr) >> (3 + 7)) ^ (PTR2UV(ptr) >> (3 + 17)))
134ca3d6 9749
93e68bfb
JC
9750/*
9751 we use the PTE_SVSLOT 'reservation' made above, both here (in the
9752 following define) and at call to new_body_inline made below in
9753 Perl_ptr_table_store()
9754 */
9755
/* Release one table entry through del_body_type(), using the PTE_SVSLOT
 * body slot. */
9756#define del_pte(p) del_body_type(p, PTE_SVSLOT)
32e691d0 9757
645c22ef
DM
9758/* map an existing pointer using a table */
9759
7bf61b54 9760STATIC PTR_TBL_ENT_t *
b0e6ae5b 9761S_ptr_table_find(PTR_TBL_t *tbl, const void *sv) {
1d7c1841 9762 PTR_TBL_ENT_t *tblent;
4373e329 9763 const UV hash = PTR_TABLE_HASH(sv);
1d7c1841
GS
9764 assert(tbl);
9765 tblent = tbl->tbl_ary[hash & tbl->tbl_max];
9766 for (; tblent; tblent = tblent->next) {
9767 if (tblent->oldval == sv)
7bf61b54 9768 return tblent;
1d7c1841 9769 }
d4c19fe8 9770 return NULL;
7bf61b54
NC
9771}
9772
9773void *
9774Perl_ptr_table_fetch(pTHX_ PTR_TBL_t *tbl, const void *sv)
9775{
b0e6ae5b 9776 PTR_TBL_ENT_t const *const tblent = ptr_table_find(tbl, sv);
96a5add6 9777 PERL_UNUSED_CONTEXT;
d4c19fe8 9778 return tblent ? tblent->newval : NULL;
1d7c1841
GS
9779}
9780
645c22ef
DM
9781/* add a new entry to a pointer-mapping table */
9782
1d7c1841 9783void
44f8325f 9784Perl_ptr_table_store(pTHX_ PTR_TBL_t *tbl, const void *oldsv, void *newsv)
1d7c1841 9785{
0c9fdfe0 9786 PTR_TBL_ENT_t *tblent = ptr_table_find(tbl, oldsv);
96a5add6 9787 PERL_UNUSED_CONTEXT;
1d7c1841 9788
7bf61b54
NC
9789 if (tblent) {
9790 tblent->newval = newsv;
9791 } else {
9792 const UV entry = PTR_TABLE_HASH(oldsv) & tbl->tbl_max;
9793
d2a0f284
JC
9794 new_body_inline(tblent, PTE_SVSLOT);
9795
7bf61b54
NC
9796 tblent->oldval = oldsv;
9797 tblent->newval = newsv;
9798 tblent->next = tbl->tbl_ary[entry];
9799 tbl->tbl_ary[entry] = tblent;
9800 tbl->tbl_items++;
9801 if (tblent->next && tbl->tbl_items > tbl->tbl_max)
9802 ptr_table_split(tbl);
1d7c1841 9803 }
1d7c1841
GS
9804}
9805
645c22ef
DM
9806/* double the hash bucket size of an existing ptr table */
9807
1d7c1841
GS
9808void
9809Perl_ptr_table_split(pTHX_ PTR_TBL_t *tbl)
9810{
9811 PTR_TBL_ENT_t **ary = tbl->tbl_ary;
4373e329 9812 const UV oldsize = tbl->tbl_max + 1;
1d7c1841
GS
9813 UV newsize = oldsize * 2;
9814 UV i;
96a5add6 9815 PERL_UNUSED_CONTEXT;
1d7c1841
GS
9816
9817 Renew(ary, newsize, PTR_TBL_ENT_t*);
9818 Zero(&ary[oldsize], newsize-oldsize, PTR_TBL_ENT_t*);
9819 tbl->tbl_max = --newsize;
9820 tbl->tbl_ary = ary;
9821 for (i=0; i < oldsize; i++, ary++) {
9822 PTR_TBL_ENT_t **curentp, **entp, *ent;
9823 if (!*ary)
9824 continue;
9825 curentp = ary + oldsize;
9826 for (entp = ary, ent = *ary; ent; ent = *entp) {
134ca3d6 9827 if ((newsize & PTR_TABLE_HASH(ent->oldval)) != i) {
1d7c1841
GS
9828 *entp = ent->next;
9829 ent->next = *curentp;
9830 *curentp = ent;
9831 continue;
9832 }
9833 else
9834 entp = &ent->next;
9835 }
9836 }
9837}
9838
645c22ef
DM
9839/* remove all the entries from a ptr table */
9840
a0739874
DM
9841void
9842Perl_ptr_table_clear(pTHX_ PTR_TBL_t *tbl)
9843{
d5cefff9 9844 if (tbl && tbl->tbl_items) {
c445ea15 9845 register PTR_TBL_ENT_t * const * const array = tbl->tbl_ary;
d5cefff9 9846 UV riter = tbl->tbl_max;
a0739874 9847
d5cefff9
NC
9848 do {
9849 PTR_TBL_ENT_t *entry = array[riter];
ab1e7f95 9850
d5cefff9 9851 while (entry) {
00b6aa41 9852 PTR_TBL_ENT_t * const oentry = entry;
d5cefff9
NC
9853 entry = entry->next;
9854 del_pte(oentry);
9855 }
9856 } while (riter--);
a0739874 9857
d5cefff9
NC
9858 tbl->tbl_items = 0;
9859 }
a0739874
DM
9860}
9861
645c22ef
DM
9862/* clear and free a ptr table */
9863
a0739874
DM
9864void
9865Perl_ptr_table_free(pTHX_ PTR_TBL_t *tbl)
9866{
9867 if (!tbl) {
9868 return;
9869 }
9870 ptr_table_clear(tbl);
9871 Safefree(tbl->tbl_ary);
9872 Safefree(tbl);
9873}
9874
5bd07a3d 9875
83841fad 9876void
eb86f8b3 9877Perl_rvpv_dup(pTHX_ SV *dstr, const SV *sstr, CLONE_PARAMS* param)
83841fad
NIS
9878{
9879 if (SvROK(sstr)) {
b162af07
SP
9880 SvRV_set(dstr, SvWEAKREF(sstr)
9881 ? sv_dup(SvRV(sstr), param)
9882 : sv_dup_inc(SvRV(sstr), param));
f880fe2f 9883
83841fad 9884 }
3f7c398e 9885 else if (SvPVX_const(sstr)) {
83841fad
NIS
9886 /* Has something there */
9887 if (SvLEN(sstr)) {
68795e93 9888 /* Normal PV - clone whole allocated space */
3f7c398e 9889 SvPV_set(dstr, SAVEPVN(SvPVX_const(sstr), SvLEN(sstr)-1));
d3d0e6f1
NC
9890 if (SvREADONLY(sstr) && SvFAKE(sstr)) {
9891 /* Not that normal - actually sstr is copy on write.
9892 But we are a true, independant SV, so: */
9893 SvREADONLY_off(dstr);
9894 SvFAKE_off(dstr);
9895 }
68795e93 9896 }
83841fad
NIS
9897 else {
9898 /* Special case - not normally malloced for some reason */
f7877b28
NC
9899 if (isGV_with_GP(sstr)) {
9900 /* Don't need to do anything here. */
9901 }
9902 else if ((SvREADONLY(sstr) && SvFAKE(sstr))) {
ef10be65
NC
9903 /* A "shared" PV - clone it as "shared" PV */
9904 SvPV_set(dstr,
9905 HEK_KEY(hek_dup(SvSHARED_HEK_FROM_PV(SvPVX_const(sstr)),
9906 param)));
83841fad
NIS
9907 }
9908 else {
9909 /* Some other special case - random pointer */
f880fe2f 9910 SvPV_set(dstr, SvPVX(sstr));
d3d0e6f1 9911 }
83841fad
NIS
9912 }
9913 }
9914 else {
4608196e 9915 /* Copy the NULL */
f880fe2f 9916 if (SvTYPE(dstr) == SVt_RV)
b162af07 9917 SvRV_set(dstr, NULL);
f880fe2f 9918 else
6136c704 9919 SvPV_set(dstr, NULL);
83841fad
NIS
9920 }
9921}
9922
662fb8b2
NC
9923/* duplicate an SV of any type (including AV, HV etc) */
/*
 * Perl_sv_dup(sstr, param)
 *
 * Returns NULL when sstr is NULL or its type is SVTYPEMASK.  If sstr is
 * already present in PL_ptr_table the previously made duplicate is
 * returned.  With CLONEf_JOIN_IN set, a named hash (a stash) is not
 * copied; the result of gv_stashpv() on its name is returned instead.
 *
 * Otherwise a new SV head is allocated, the sstr => dstr mapping is
 * stored in PL_ptr_table, the flags are copied (minus SVf_OOK), the
 * reference count is set to 0 and the body is duplicated according to
 * SvTYPE(sstr).  An unknown type croaks with "Bizarre SvTYPE".
 */
9924
1d7c1841 9925SV *
eb86f8b3 9926Perl_sv_dup(pTHX_ const SV *sstr, CLONE_PARAMS* param)
1d7c1841 9927{
27da23d5 9928 dVAR;
1d7c1841
GS
9929 SV *dstr;
9930
9931 if (!sstr || SvTYPE(sstr) == SVTYPEMASK)
6136c704 9932 return NULL;
1d7c1841
GS
9933 /* look for it in the table first */
9934 dstr = (SV*)ptr_table_fetch(PL_ptr_table, sstr);
9935 if (dstr)
9936 return dstr;
9937
0405e91e
AB
9938 if(param->flags & CLONEf_JOIN_IN) {
9939 /** We are joining here so we don't want to clone
9940 something that is bad **/
eb86f8b3
AL
9941 if (SvTYPE(sstr) == SVt_PVHV) {
9942 const char * const hvname = HvNAME_get(sstr);
9943 if (hvname)
9944 /** don't clone stashes if they already exist **/
9945 return (SV*)gv_stashpv(hvname,0);
0405e91e
AB
9946 }
9947 }
9948
1d7c1841
GS
9949 /* create anew and remember what it is */
9950 new_SV(dstr);
fd0854ff
DM
9951
9952#ifdef DEBUG_LEAKING_SCALARS
 /* carry the source's debugging provenance over and mark dstr as cloned */
9953 dstr->sv_debug_optype = sstr->sv_debug_optype;
9954 dstr->sv_debug_line = sstr->sv_debug_line;
9955 dstr->sv_debug_inpad = sstr->sv_debug_inpad;
9956 dstr->sv_debug_cloned = 1;
fd0854ff 9957 dstr->sv_debug_file = savepv(sstr->sv_debug_file);
fd0854ff
DM
9958#endif
9959
1d7c1841
GS
 /* The mapping is stored before anything reachable from sstr is
    duplicated, so a nested sv_dup() that reaches sstr again gets dstr
    back from the table lookup at the top of this function. */
9960 ptr_table_store(PL_ptr_table, sstr, dstr);
9961
9962 /* clone */
9963 SvFLAGS(dstr) = SvFLAGS(sstr);
9964 SvFLAGS(dstr) &= ~SVf_OOK; /* don't propagate OOK hack */
9965 SvREFCNT(dstr) = 0; /* must be before any other dups! */
9966
9967#ifdef DEBUGGING
3f7c398e 9968 if (SvANY(sstr) && PL_watch_pvx && SvPVX_const(sstr) == PL_watch_pvx)
1d7c1841 9969 PerlIO_printf(Perl_debug_log, "watch at %p hit, found string \"%s\"\n",
3f7c398e 9970 PL_watch_pvx, SvPVX_const(sstr));
1d7c1841
GS
9971#endif
9972
9660f481
DM
9973 /* don't clone objects whose class has asked us not to */
 /* In that case dstr is returned as it stands, with its type bits
    cleared and its OBJECT flag turned off; no body is duplicated. */
9974 if (SvOBJECT(sstr) && ! (SvFLAGS(SvSTASH(sstr)) & SVphv_CLONEABLE)) {
9975 SvFLAGS(dstr) &= ~SVTYPEMASK;
9976 SvOBJECT_off(dstr);
9977 return dstr;
9978 }
9979
1d7c1841
GS
9980 switch (SvTYPE(sstr)) {
9981 case SVt_NULL:
9982 SvANY(dstr) = NULL;
9983 break;
9984 case SVt_IV:
 /* No body is allocated here: SvANY(dstr) is computed from the address
    of dstr's own sv_u.svu_iv, moved back by the offset of xiv_iv
    within an XPVIV. */
339049b0 9985 SvANY(dstr) = (XPVIV*)((char*)&(dstr->sv_u.svu_iv) - STRUCT_OFFSET(XPVIV, xiv_iv));
45977657 9986 SvIV_set(dstr, SvIVX(sstr));
1d7c1841
GS
9987 break;
9988 case SVt_NV:
9989 SvANY(dstr) = new_XNV();
9d6ce603 9990 SvNV_set(dstr, SvNVX(sstr));
1d7c1841
GS
9991 break;
9992 case SVt_RV:
 /* As for SVt_IV, SvANY(dstr) is pointed at a slot inside dstr itself */
339049b0 9993 SvANY(dstr) = &(dstr->sv_u.svu_rv);
83841fad 9994 Perl_rvpv_dup(aTHX_ dstr, sstr, param);
1d7c1841 9995 break;
662fb8b2
NC
9996 default:
9997 {
9998 /* These are all the types that need complex bodies allocating. */
662fb8b2 9999 void *new_body;
2bcc16b3
NC
10000 const svtype sv_type = SvTYPE(sstr);
10001 const struct body_details *const sv_type_details
10002 = bodies_by_type + sv_type;
662fb8b2 10003
 /* First switch: allocate a body of the right size for the type */
93e68bfb 10004 switch (sv_type) {
662fb8b2 10005 default:
bb263b4e 10006 Perl_croak(aTHX_ "Bizarre SvTYPE [%" IVdf "]", (IV)SvTYPE(sstr));
662fb8b2
NC
10007 break;
10008
662fb8b2
NC
10009 case SVt_PVGV:
10010 if (GvUNIQUE((GV*)sstr)) {
6f207bd3 10011 NOOP; /* Do sharing here, and fall through */
662fb8b2 10012 }
c22188b4
NC
10013 case SVt_PVIO:
10014 case SVt_PVFM:
10015 case SVt_PVHV:
10016 case SVt_PVAV:
93e68bfb 10017 case SVt_PVBM:
662fb8b2 10018 case SVt_PVCV:
662fb8b2 10019 case SVt_PVLV:
662fb8b2 10020 case SVt_PVMG:
662fb8b2 10021 case SVt_PVNV:
662fb8b2 10022 case SVt_PVIV:
662fb8b2 10023 case SVt_PV:
d2a0f284 10024 assert(sv_type_details->body_size);
c22188b4 10025 if (sv_type_details->arena) {
d2a0f284 10026 new_body_inline(new_body, sv_type);
 /* step the pointer back by the type's offset; the Copy below
    (non-PURIFY form) adds the same offset on again */
c22188b4 10027 new_body
b9502f15 10028 = (void*)((char*)new_body - sv_type_details->offset);
c22188b4
NC
10029 } else {
10030 new_body = new_NOARENA(sv_type_details);
10031 }
1d7c1841 10032 }
662fb8b2
NC
10033 assert(new_body);
10034 SvANY(dstr) = new_body;
10035
2bcc16b3 10036#ifndef PURIFY
b9502f15
NC
10037 Copy(((char*)SvANY(sstr)) + sv_type_details->offset,
10038 ((char*)SvANY(dstr)) + sv_type_details->offset,
f32993d6 10039 sv_type_details->copy, char);
2bcc16b3
NC
10040#else
10041 Copy(((char*)SvANY(sstr)),
10042 ((char*)SvANY(dstr)),
d2a0f284 10043 sv_type_details->body_size + sv_type_details->offset, char);
2bcc16b3 10044#endif
662fb8b2 10045
 /* Arrays, hashes and GVs with a GP are excluded here; their
    pointer slot is set in the per-type switch further down. */
f7877b28
NC
10046 if (sv_type != SVt_PVAV && sv_type != SVt_PVHV
10047 && !isGV_with_GP(dstr))
662fb8b2
NC
10048 Perl_rvpv_dup(aTHX_ dstr, sstr, param);
10049
10050 /* The Copy above means that all the source (unduplicated) pointers
10051 are now in the destination. We can check the flags and the
10052 pointers in either, but it's possible that there's less cache
10053 missing by always going for the destination.
10054 FIXME - instrument and check that assumption */
f32993d6 10055 if (sv_type >= SVt_PVMG) {
885ffcb3
NC
10056 if ((sv_type == SVt_PVMG) && SvPAD_OUR(dstr)) {
10057 OURSTASH_set(dstr, hv_dup_inc(OURSTASH(dstr), param));
e736a858 10058 } else if (SvMAGIC(dstr))
662fb8b2
NC
10059 SvMAGIC_set(dstr, mg_dup(SvMAGIC(dstr), param));
10060 if (SvSTASH(dstr))
10061 SvSTASH_set(dstr, hv_dup_inc(SvSTASH(dstr), param));
1d7c1841 10062 }
662fb8b2 10063
 /* Second switch: replace the type-specific pointers that the
    Copy above brought across from the source body. */
f32993d6
NC
10064 /* The cast silences a GCC warning about unhandled types. */
10065 switch ((int)sv_type) {
662fb8b2
NC
10066 case SVt_PV:
10067 break;
10068 case SVt_PVIV:
10069 break;
10070 case SVt_PVNV:
10071 break;
10072 case SVt_PVMG:
10073 break;
10074 case SVt_PVBM:
10075 break;
10076 case SVt_PVLV:
10077 /* XXX LvTARGOFF sometimes holds PMOP* when DEBUGGING */
10078 if (LvTYPE(dstr) == 't') /* for tie: unrefcnted fake (SV**) */
10079 LvTARG(dstr) = dstr;
10080 else if (LvTYPE(dstr) == 'T') /* for tie: fake HE */
10081 LvTARG(dstr) = (SV*)he_dup((HE*)LvTARG(dstr), 0, param);
10082 else
10083 LvTARG(dstr) = sv_dup_inc(LvTARG(dstr), param);
10084 break;
10085 case SVt_PVGV:
acda4c6a
NC
10086 if (GvNAME_HEK(dstr))
10087 GvNAME_HEK(dstr) = hek_dup(GvNAME_HEK(dstr), param);
f5c1e807 10088
e15faf7d
NC
10089 /* Don't call sv_add_backref here as it's going to be created
10090 as part of the magic cloning of the symbol table. */
f7877b28
NC
10091 GvSTASH(dstr) = hv_dup(GvSTASH(dstr), param);
10092 if(isGV_with_GP(sstr)) {
10093 /* Danger Will Robinson - GvGP(dstr) isn't initialised
10094 at the point of this comment. */
10095 GvGP(dstr) = gp_dup(GvGP(sstr), param);
10096 (void)GpREFCNT_inc(GvGP(dstr));
10097 } else
10098 Perl_rvpv_dup(aTHX_ dstr, sstr, param);
662fb8b2
NC
10099 break;
10100 case SVt_PVIO:
10101 IoIFP(dstr) = fp_dup(IoIFP(dstr), IoTYPE(dstr), param);
 /* IoOFP(dstr) still holds the source's pointer at this point; when
    the source used one handle for both directions, so does the copy */
10102 if (IoOFP(dstr) == IoIFP(sstr))
10103 IoOFP(dstr) = IoIFP(dstr);
10104 else
10105 IoOFP(dstr) = fp_dup(IoOFP(dstr), IoTYPE(dstr), param);
10106 /* PL_rsfp_filters entries have fake IoDIRP() */
662fb8b2
NC
10107 if(IoFLAGS(dstr) & IOf_FAKE_DIRP) {
10108 /* I have no idea why fake dirp (rsfps)
10109 should be treated differently but otherwise
10110 we end up with leaks -- sky*/
10111 IoTOP_GV(dstr) = gv_dup_inc(IoTOP_GV(dstr), param);
10112 IoFMT_GV(dstr) = gv_dup_inc(IoFMT_GV(dstr), param);
10113 IoBOTTOM_GV(dstr) = gv_dup_inc(IoBOTTOM_GV(dstr), param);
10114 } else {
10115 IoTOP_GV(dstr) = gv_dup(IoTOP_GV(dstr), param);
10116 IoFMT_GV(dstr) = gv_dup(IoFMT_GV(dstr), param);
10117 IoBOTTOM_GV(dstr) = gv_dup(IoBOTTOM_GV(dstr), param);
100ce7e1
NC
10118 if (IoDIRP(dstr)) {
10119 IoDIRP(dstr) = dirp_dup(IoDIRP(dstr));
10120 } else {
6f207bd3 10121 NOOP;
100ce7e1
NC
10122 /* IoDIRP(dstr) is already a copy of IoDIRP(sstr) */
10123 }
662fb8b2
NC
10124 }
10125 IoTOP_NAME(dstr) = SAVEPV(IoTOP_NAME(dstr));
10126 IoFMT_NAME(dstr) = SAVEPV(IoFMT_NAME(dstr));
10127 IoBOTTOM_NAME(dstr) = SAVEPV(IoBOTTOM_NAME(dstr));
10128 break;
10129 case SVt_PVAV:
10130 if (AvARRAY((AV*)sstr)) {
10131 SV **dst_ary, **src_ary;
10132 SSize_t items = AvFILLp((AV*)sstr) + 1;
10133
10134 src_ary = AvARRAY((AV*)sstr);
a02a5408 10135 Newxz(dst_ary, AvMAX((AV*)sstr)+1, SV*);
662fb8b2
NC
10136 ptr_table_store(PL_ptr_table, src_ary, dst_ary);
10137 SvPV_set(dstr, (char*)dst_ary);
10138 AvALLOC((AV*)dstr) = dst_ary;
 /* elements 0..AvFILLp: the reference count is bumped (sv_dup_inc)
    only when the source array is AvREAL */
10139 if (AvREAL((AV*)sstr)) {
10140 while (items-- > 0)
10141 *dst_ary++ = sv_dup_inc(*src_ary++, param);
10142 }
10143 else {
10144 while (items-- > 0)
10145 *dst_ary++ = sv_dup(*src_ary++, param);
10146 }
 /* remaining slots, AvFILLp+1 .. AvMAX, are set to &PL_sv_undef */
10147 items = AvMAX((AV*)sstr) - AvFILLp((AV*)sstr);
10148 while (items-- > 0) {
10149 *dst_ary++ = &PL_sv_undef;
10150 }
bfcb3514 10151 }
662fb8b2 10152 else {
bd61b366 10153 SvPV_set(dstr, NULL);
662fb8b2 10154 AvALLOC((AV*)dstr) = (SV**)NULL;
b79f7545 10155 }
662fb8b2
NC
10156 break;
10157 case SVt_PVHV:
7e265ef3
AL
10158 if (HvARRAY((HV*)sstr)) {
10159 STRLEN i = 0;
10160 const bool sharekeys = !!HvSHAREKEYS(sstr);
10161 XPVHV * const dxhv = (XPVHV*)SvANY(dstr);
10162 XPVHV * const sxhv = (XPVHV*)SvANY(sstr);
10163 char *darray;
 /* one allocation holds the bucket array and, when the source has
    SvOOK set, room for a struct xpvhv_aux as well */
10164 Newx(darray, PERL_HV_ARRAY_ALLOC_BYTES(dxhv->xhv_max+1)
10165 + (SvOOK(sstr) ? sizeof(struct xpvhv_aux) : 0),
10166 char);
10167 HvARRAY(dstr) = (HE**)darray;
10168 while (i <= sxhv->xhv_max) {
10169 const HE * const source = HvARRAY(sstr)[i];
10170 HvARRAY(dstr)[i] = source
10171 ? he_dup(source, sharekeys, param) : 0;
10172 ++i;
10173 }
10174 if (SvOOK(sstr)) {
10175 HEK *hvname;
10176 const struct xpvhv_aux * const saux = HvAUX(sstr);
10177 struct xpvhv_aux * const daux = HvAUX(dstr);
10178 /* This flag isn't copied. */
10179 /* SvOOK_on(hv) attacks the IV flags. */
10180 SvFLAGS(dstr) |= SVf_OOK;
10181
10182 hvname = saux->xhv_name;
10183 daux->xhv_name = hvname ? hek_dup(hvname, param) : hvname;
10184
10185 daux->xhv_riter = saux->xhv_riter;
10186 daux->xhv_eiter = saux->xhv_eiter
10187 ? he_dup(saux->xhv_eiter,
10188 (bool)!!HvSHAREKEYS(sstr), param) : 0;
10189 daux->xhv_backreferences =
10190 saux->xhv_backreferences
86f55936 10191 ? (AV*) SvREFCNT_inc(
7e265ef3 10192 sv_dup((SV*)saux->xhv_backreferences, param))
86f55936 10193 : 0;
7e265ef3
AL
10194 /* Record stashes for possible cloning in Perl_clone(). */
10195 if (hvname)
10196 av_push(param->stashes, dstr);
662fb8b2 10197 }
662fb8b2 10198 }
7e265ef3
AL
10199 else
10200 SvPV_set(dstr, NULL);
662fb8b2 10201 break;
662fb8b2 10202 case SVt_PVCV:
bb172083
NC
10203 if (!(param->flags & CLONEf_COPY_STACKS)) {
10204 CvDEPTH(dstr) = 0;
10205 }
 /* no break: SVt_PVCV continues into the SVt_PVFM code below */
10206 case SVt_PVFM:
662fb8b2
NC
10207 /* NOTE: not refcounted */
10208 CvSTASH(dstr) = hv_dup(CvSTASH(dstr), param);
10209 OP_REFCNT_LOCK;
d04ba589
NC
10210 if (!CvISXSUB(dstr))
10211 CvROOT(dstr) = OpREFCNT_inc(CvROOT(dstr));
662fb8b2 10212 OP_REFCNT_UNLOCK;
cfae286e 10213 if (CvCONST(dstr) && CvISXSUB(dstr)) {
662fb8b2
NC
10214 CvXSUBANY(dstr).any_ptr = GvUNIQUE(CvGV(dstr)) ?
10215 SvREFCNT_inc(CvXSUBANY(dstr).any_ptr) :
10216 sv_dup_inc((SV *)CvXSUBANY(dstr).any_ptr, param);
10217 }
10218 /* don't dup if copying back - CvGV isn't refcounted, so the
10219 * duped GV may never be freed. A bit of a hack! DAPM */
10220 CvGV(dstr) = (param->flags & CLONEf_JOIN_IN) ?
a0714e2c 10221 NULL : gv_dup(CvGV(dstr), param) ;
662fb8b2
NC
10222 PAD_DUP(CvPADLIST(dstr), CvPADLIST(sstr), param);
 /* the outer CV's reference count is bumped only when the link is
    not flagged CvWEAKOUTSIDE in the source */
10223 CvOUTSIDE(dstr) =
10224 CvWEAKOUTSIDE(sstr)
10225 ? cv_dup( CvOUTSIDE(dstr), param)
10226 : cv_dup_inc(CvOUTSIDE(dstr), param);
aed2304a 10227 if (!CvISXSUB(dstr))
662fb8b2
NC
10228 CvFILE(dstr) = SAVEPV(CvFILE(dstr));
10229 break;
bfcb3514 10230 }
1d7c1841 10231 }
1d7c1841
GS
10232 }
10233
 /* count the new object in PL_sv_objcount, unless it is a PVIO */
10234 if (SvOBJECT(dstr) && SvTYPE(dstr) != SVt_PVIO)
10235 ++PL_sv_objcount;
10236
10237 return dstr;
d2d73c3e 10238 }
1d7c1841 10239
645c22ef
DM
10240/* duplicate a context */
10241
1d7c1841 10242PERL_CONTEXT *
a8fc9800 10243Perl_cx_dup(pTHX_ PERL_CONTEXT *cxs, I32 ix, I32 max, CLONE_PARAMS* param)
1d7c1841
GS
10244{
10245 PERL_CONTEXT *ncxs;
10246
10247 if (!cxs)
10248 return (PERL_CONTEXT*)NULL;
10249
10250 /* look for it in the table first */
10251 ncxs = (PERL_CONTEXT*)ptr_table_fetch(PL_ptr_table, cxs);
10252 if (ncxs)
10253 return ncxs;
10254
10255 /* create anew and remember what it is */
a02a5408 10256 Newxz(ncxs, max + 1, PERL_CONTEXT);
1d7c1841
GS
10257 ptr_table_store(PL_ptr_table, cxs, ncxs);
10258
10259 while (ix >= 0) {
c445ea15
AL
10260 PERL_CONTEXT * const cx = &cxs[ix];
10261 PERL_CONTEXT * const ncx = &ncxs[ix];
1d7c1841
GS
10262 ncx->cx_type = cx->cx_type;
10263 if (CxTYPE(cx) == CXt_SUBST) {
10264 Perl_croak(aTHX_ "Cloning substitution context is unimplemented");
10265 }
10266 else {
10267 ncx->blk_oldsp = cx->blk_oldsp;
10268 ncx->blk_oldcop = cx->blk_oldcop;
1d7c1841
GS
10269 ncx->blk_oldmarksp = cx->blk_oldmarksp;
10270 ncx->blk_oldscopesp = cx->blk_oldscopesp;
10271 ncx->blk_oldpm = cx->blk_oldpm;
10272 ncx->blk_gimme = cx->blk_gimme;
10273 switch (CxTYPE(cx)) {
10274 case CXt_SUB:
10275 ncx->blk_sub.cv = (cx->blk_sub.olddepth == 0
d2d73c3e
AB
10276 ? cv_dup_inc(cx->blk_sub.cv, param)
10277 : cv_dup(cx->blk_sub.cv,param));
1d7c1841 10278 ncx->blk_sub.argarray = (cx->blk_sub.hasargs
d2d73c3e 10279 ? av_dup_inc(cx->blk_sub.argarray, param)
7d49f689 10280 : NULL);
d2d73c3e 10281 ncx->blk_sub.savearray = av_dup_inc(cx->blk_sub.savearray, param);
1d7c1841
GS
10282 ncx->blk_sub.olddepth = cx->blk_sub.olddepth;
10283 ncx->blk_sub.hasargs = cx->blk_sub.hasargs;
10284 ncx->blk_sub.lval = cx->blk_sub.lval;
f39bc417 10285 ncx->blk_sub.retop = cx->blk_sub.retop;
d8d97e70
DM
10286 ncx->blk_sub.oldcomppad = (PAD*)ptr_table_fetch(PL_ptr_table,
10287 cx->blk_sub.oldcomppad);
1d7c1841
GS
10288 break;
10289 case CXt_EVAL:
10290 ncx->blk_eval.old_in_eval = cx->blk_eval.old_in_eval;
10291 ncx->blk_eval.old_op_type = cx->blk_eval.old_op_type;
b47cad08 10292 ncx->blk_eval.old_namesv = sv_dup_inc(cx->blk_eval.old_namesv, param);
1d7c1841 10293 ncx->blk_eval.old_eval_root = cx->blk_eval.old_eval_root;
d2d73c3e 10294 ncx->blk_eval.cur_text = sv_dup(cx->blk_eval.cur_text, param);
f39bc417 10295 ncx->blk_eval.retop = cx->blk_eval.retop;
1d7c1841
GS
10296 break;
10297 case CXt_LOOP:
10298 ncx->blk_loop.label = cx->blk_loop.label;
10299 ncx->blk_loop.resetsp = cx->blk_loop.resetsp;
10300 ncx->blk_loop.redo_op = cx->blk_loop.redo_op;
10301 ncx->blk_loop.next_op = cx->blk_loop.next_op;
10302 ncx->blk_loop.last_op = cx->blk_loop.last_op;
10303 ncx->blk_loop.iterdata = (CxPADLOOP(cx)
10304 ? cx->blk_loop.iterdata
d2d73c3e 10305 : gv_dup((GV*)cx->blk_loop.iterdata, param));
f3548bdc
DM
10306 ncx->blk_loop.oldcomppad
10307 = (PAD*)ptr_table_fetch(PL_ptr_table,
10308 cx->blk_loop.oldcomppad);
d2d73c3e
AB
10309 ncx->blk_loop.itersave = sv_dup_inc(cx->blk_loop.itersave, param);
10310 ncx->blk_loop.iterlval = sv_dup_inc(cx->blk_loop.iterlval, param);
10311 ncx->blk_loop.iterary = av_dup_inc(cx->blk_loop.iterary, param);
1d7c1841
GS
10312 ncx->blk_loop.iterix = cx->blk_loop.iterix;
10313 ncx->blk_loop.itermax = cx->blk_loop.itermax;
10314 break;
10315 case CXt_FORMAT:
d2d73c3e
AB
10316 ncx->blk_sub.cv = cv_dup(cx->blk_sub.cv, param);
10317 ncx->blk_sub.gv = gv_dup(cx->blk_sub.gv, param);
10318 ncx->blk_sub.dfoutgv = gv_dup_inc(cx->blk_sub.dfoutgv, param);
1d7c1841 10319 ncx->blk_sub.hasargs = cx->blk_sub.hasargs;
f39bc417 10320 ncx->blk_sub.retop = cx->blk_sub.retop;
1d7c1841
GS
10321 break;
10322 case CXt_BLOCK:
10323 case CXt_NULL:
10324 break;
10325 }
10326 }
10327 --ix;
10328 }
10329 return ncxs;
10330}
10331
645c22ef
DM
10332/* duplicate a stack info structure */
10333
1d7c1841 10334PERL_SI *
a8fc9800 10335Perl_si_dup(pTHX_ PERL_SI *si, CLONE_PARAMS* param)
1d7c1841
GS
10336{
10337 PERL_SI *nsi;
10338
10339 if (!si)
10340 return (PERL_SI*)NULL;
10341
10342 /* look for it in the table first */
10343 nsi = (PERL_SI*)ptr_table_fetch(PL_ptr_table, si);
10344 if (nsi)
10345 return nsi;
10346
10347 /* create anew and remember what it is */
a02a5408 10348 Newxz(nsi, 1, PERL_SI);
1d7c1841
GS
10349 ptr_table_store(PL_ptr_table, si, nsi);
10350
d2d73c3e 10351 nsi->si_stack = av_dup_inc(si->si_stack, param);
1d7c1841
GS
10352 nsi->si_cxix = si->si_cxix;
10353 nsi->si_cxmax = si->si_cxmax;
d2d73c3e 10354 nsi->si_cxstack = cx_dup(si->si_cxstack, si->si_cxix, si->si_cxmax, param);
1d7c1841 10355 nsi->si_type = si->si_type;
d2d73c3e
AB
10356 nsi->si_prev = si_dup(si->si_prev, param);
10357 nsi->si_next = si_dup(si->si_next, param);
1d7c1841
GS
10358 nsi->si_markoff = si->si_markoff;
10359
10360 return nsi;
10361}
10362
/* Accessors used by ss_dup() to walk a save stack held as an array of ANY.
 * POPxxx(ss,ix) pre-decrements ix and then yields slot ix of ss through the
 * named union member; TOPxxx(ss,ix) yields slot ix without changing ix.
 * A POP on the source stack followed by a TOP on the new stack with the
 * same ix therefore addresses the same slot in both arrays. */
10363#define POPINT(ss,ix) ((ss)[--(ix)].any_i32)
10364#define TOPINT(ss,ix) ((ss)[ix].any_i32)
10365#define POPLONG(ss,ix) ((ss)[--(ix)].any_long)
10366#define TOPLONG(ss,ix) ((ss)[ix].any_long)
10367#define POPIV(ss,ix) ((ss)[--(ix)].any_iv)
10368#define TOPIV(ss,ix) ((ss)[ix].any_iv)
38d8b13e
HS
10369#define POPBOOL(ss,ix) ((ss)[--(ix)].any_bool)
10370#define TOPBOOL(ss,ix) ((ss)[ix].any_bool)
1d7c1841
GS
10371#define POPPTR(ss,ix) ((ss)[--(ix)].any_ptr)
10372#define TOPPTR(ss,ix) ((ss)[ix].any_ptr)
10373#define POPDPTR(ss,ix) ((ss)[--(ix)].any_dptr)
10374#define TOPDPTR(ss,ix) ((ss)[ix].any_dptr)
10375#define POPDXPTR(ss,ix) ((ss)[--(ix)].any_dxptr)
10376#define TOPDXPTR(ss,ix) ((ss)[ix].any_dxptr)
10377
10378/* XXXXX todo */
/* pv_dup_inc and pv_dup are currently the same thing: both expand to
 * SAVEPV(p).  svp_dup_inc(p,pp) simply forwards to any_dup(p,pp). */
10379#define pv_dup_inc(p) SAVEPV(p)
10380#define pv_dup(p) SAVEPV(p)
10381#define svp_dup_inc(p,pp) any_dup(p,pp)
10382
645c22ef
DM
10383/* map any object to the new equivent - either something in the
10384 * ptr table, or something in the interpreter structure
10385 */
10386
1d7c1841 10387void *
53c1dcc0 10388Perl_any_dup(pTHX_ void *v, const PerlInterpreter *proto_perl)
1d7c1841
GS
10389{
10390 void *ret;
10391
10392 if (!v)
10393 return (void*)NULL;
10394
10395 /* look for it in the table first */
10396 ret = ptr_table_fetch(PL_ptr_table, v);
10397 if (ret)
10398 return ret;
10399
10400 /* see if it is part of the interpreter structure */
10401 if (v >= (void*)proto_perl && v < (void*)(proto_perl+1))
acfe0abc 10402 ret = (void*)(((char*)aTHX) + (((char*)v) - (char*)proto_perl));
05ec9bb3 10403 else {
1d7c1841 10404 ret = v;
05ec9bb3 10405 }
1d7c1841
GS
10406
10407 return ret;
10408}
10409
645c22ef
DM
10410/* duplicate the save stack */
/*
 * Perl_ss_dup(proto_perl, param)
 *
 * Allocates a new array of proto_perl->Tsavestack_max ANY slots and
 * fills it from proto_perl->Tsavestack.  The source is walked downwards
 * from Tsavestack_ix: the save type code is popped first, then the
 * operands belonging to that type, and each value is written to the
 * same index of the new array.  Depending on the operand it is copied
 * as-is, mapped with any_dup(), or duplicated with the matching
 * sv/av/hv/gv/gp/pv dup routine.  An unrecognised save type croaks.
 * Returns the new array.
 */
10411
1d7c1841 10412ANY *
a8fc9800 10413Perl_ss_dup(pTHX_ PerlInterpreter *proto_perl, CLONE_PARAMS* param)
1d7c1841 10414{
53c1dcc0
AL
10415 ANY * const ss = proto_perl->Tsavestack;
10416 const I32 max = proto_perl->Tsavestack_max;
10417 I32 ix = proto_perl->Tsavestack_ix;
1d7c1841
GS
10418 ANY *nss;
10419 SV *sv;
10420 GV *gv;
10421 AV *av;
10422 HV *hv;
10423 void* ptr;
10424 int intval;
10425 long longval;
10426 GP *gp;
10427 IV iv;
c4e33207 10428 char *c = NULL;
1d7c1841 10429 void (*dptr) (void*);
acfe0abc 10430 void (*dxptr) (pTHX_ void*);
1d7c1841 10431
a02a5408 10432 Newxz(nss, max, ANY);
1d7c1841
GS
10433
 /* Every POPxxx(ss,ix) below pre-decrements ix, so the TOPxxx(nss,ix)
    that follows it stores into the slot just read from ss. */
10434 while (ix > 0) {
b464bac0 10435 I32 i = POPINT(ss,ix);
1d7c1841
GS
10436 TOPINT(nss,ix) = i;
10437 switch (i) {
10438 case SAVEt_ITEM: /* normal string */
a41cc44e 10439 case SAVEt_SV: /* scalar reference */
1d7c1841 10440 sv = (SV*)POPPTR(ss,ix);
d2d73c3e 10441 TOPPTR(nss,ix) = sv_dup_inc(sv, param);
1d7c1841 10442 sv = (SV*)POPPTR(ss,ix);
d2d73c3e 10443 TOPPTR(nss,ix) = sv_dup_inc(sv, param);
1d7c1841 10444 break;
05ec9bb3
NIS
10445 case SAVEt_SHARED_PVREF: /* char* in shared space */
10446 c = (char*)POPPTR(ss,ix);
10447 TOPPTR(nss,ix) = savesharedpv(c);
10448 ptr = POPPTR(ss,ix);
10449 TOPPTR(nss,ix) = any_dup(ptr, proto_perl);
10450 break;
1d7c1841
GS
10451 case SAVEt_GENERIC_SVREF: /* generic sv */
10452 case SAVEt_SVREF: /* scalar reference */
10453 sv = (SV*)POPPTR(ss,ix);
d2d73c3e 10454 TOPPTR(nss,ix) = sv_dup_inc(sv, param);
1d7c1841
GS
10455 ptr = POPPTR(ss,ix);
10456 TOPPTR(nss,ix) = svp_dup_inc((SV**)ptr, proto_perl);/* XXXXX */
10457 break;
a41cc44e 10458 case SAVEt_HV: /* hash reference */
1d7c1841 10459 case SAVEt_AV: /* array reference */
337d28f5
NC
10460 sv = POPPTR(ss,ix);
10461 TOPPTR(nss,ix) = sv_dup_inc(sv, param);
1d7c1841 10462 gv = (GV*)POPPTR(ss,ix);
d2d73c3e 10463 TOPPTR(nss,ix) = gv_dup(gv, param);
1d7c1841
GS
10464 break;
10465 case SAVEt_INT: /* int reference */
10466 ptr = POPPTR(ss,ix);
10467 TOPPTR(nss,ix) = any_dup(ptr, proto_perl);
10468 intval = (int)POPINT(ss,ix);
10469 TOPINT(nss,ix) = intval;
10470 break;
10471 case SAVEt_LONG: /* long reference */
10472 ptr = POPPTR(ss,ix);
10473 TOPPTR(nss,ix) = any_dup(ptr, proto_perl);
10474 longval = (long)POPLONG(ss,ix);
10475 TOPLONG(nss,ix) = longval;
10476 break;
10477 case SAVEt_I32: /* I32 reference */
10478 case SAVEt_I16: /* I16 reference */
10479 case SAVEt_I8: /* I8 reference */
88effcc9 10480 case SAVEt_COP_ARYBASE: /* call CopARYBASE_set */
1d7c1841
GS
10481 ptr = POPPTR(ss,ix);
10482 TOPPTR(nss,ix) = any_dup(ptr, proto_perl);
10483 i = POPINT(ss,ix);
10484 TOPINT(nss,ix) = i;
10485 break;
10486 case SAVEt_IV: /* IV reference */
10487 ptr = POPPTR(ss,ix);
10488 TOPPTR(nss,ix) = any_dup(ptr, proto_perl);
10489 iv = POPIV(ss,ix);
10490 TOPIV(nss,ix) = iv;
10491 break;
a41cc44e
NC
10492 case SAVEt_HPTR: /* HV* reference */
10493 case SAVEt_APTR: /* AV* reference */
1d7c1841
GS
10494 case SAVEt_SPTR: /* SV* reference */
10495 ptr = POPPTR(ss,ix);
10496 TOPPTR(nss,ix) = any_dup(ptr, proto_perl);
10497 sv = (SV*)POPPTR(ss,ix);
d2d73c3e 10498 TOPPTR(nss,ix) = sv_dup(sv, param);
1d7c1841
GS
10499 break;
10500 case SAVEt_VPTR: /* random* reference */
10501 ptr = POPPTR(ss,ix);
10502 TOPPTR(nss,ix) = any_dup(ptr, proto_perl);
10503 ptr = POPPTR(ss,ix);
10504 TOPPTR(nss,ix) = any_dup(ptr, proto_perl);
10505 break;
b03d03b0 10506 case SAVEt_GENERIC_PVREF: /* generic char* */
1d7c1841
GS
10507 case SAVEt_PPTR: /* char* reference */
10508 ptr = POPPTR(ss,ix);
10509 TOPPTR(nss,ix) = any_dup(ptr, proto_perl);
10510 c = (char*)POPPTR(ss,ix);
10511 TOPPTR(nss,ix) = pv_dup(c);
10512 break;
1d7c1841
GS
10513 case SAVEt_NSTAB:
10514 gv = (GV*)POPPTR(ss,ix);
d2d73c3e 10515 TOPPTR(nss,ix) = gv_dup(gv, param);
1d7c1841
GS
10516 break;
10517 case SAVEt_GP: /* scalar reference */
10518 gp = (GP*)POPPTR(ss,ix);
d2d73c3e 10519 TOPPTR(nss,ix) = gp = gp_dup(gp, param);
1d7c1841
GS
10520 (void)GpREFCNT_inc(gp);
10521 gv = (GV*)POPPTR(ss,ix);
2ed3c8fc 10522 TOPPTR(nss,ix) = gv_dup_inc(gv, param);
1d7c1841
GS
10523 c = (char*)POPPTR(ss,ix);
10524 TOPPTR(nss,ix) = pv_dup(c);
10525 iv = POPIV(ss,ix);
10526 TOPIV(nss,ix) = iv;
10527 iv = POPIV(ss,ix);
10528 TOPIV(nss,ix) = iv;
10529 break;
10530 case SAVEt_FREESV:
26d9b02f 10531 case SAVEt_MORTALIZESV:
1d7c1841 10532 sv = (SV*)POPPTR(ss,ix);
d2d73c3e 10533 TOPPTR(nss,ix) = sv_dup_inc(sv, param);
1d7c1841
GS
10534 break;
10535 case SAVEt_FREEOP:
 /* The OP itself is never copied.  For the refcounted op types
    listed below the same pointer is stored and its refcount is
    bumped; in every other case NULL is stored in the new stack. */
10536 ptr = POPPTR(ss,ix);
10537 if (ptr && (((OP*)ptr)->op_private & OPpREFCOUNTED)) {
10538 /* these are assumed to be refcounted properly */
53c1dcc0 10539 OP *o;
1d7c1841
GS
10540 switch (((OP*)ptr)->op_type) {
10541 case OP_LEAVESUB:
10542 case OP_LEAVESUBLV:
10543 case OP_LEAVEEVAL:
10544 case OP_LEAVE:
10545 case OP_SCOPE:
10546 case OP_LEAVEWRITE:
e977893f
GS
10547 TOPPTR(nss,ix) = ptr;
10548 o = (OP*)ptr;
10549 OpREFCNT_inc(o);
1d7c1841
GS
10550 break;
10551 default:
5f66b61c 10552 TOPPTR(nss,ix) = NULL;
1d7c1841
GS
10553 break;
10554 }
10555 }
10556 else
5f66b61c 10557 TOPPTR(nss,ix) = NULL;
1d7c1841
GS
10558 break;
10559 case SAVEt_FREEPV:
10560 c = (char*)POPPTR(ss,ix);
10561 TOPPTR(nss,ix) = pv_dup_inc(c);
10562 break;
10563 case SAVEt_CLEARSV:
10564 longval = POPLONG(ss,ix);
10565 TOPLONG(nss,ix) = longval;
10566 break;
10567 case SAVEt_DELETE:
10568 hv = (HV*)POPPTR(ss,ix);
d2d73c3e 10569 TOPPTR(nss,ix) = hv_dup_inc(hv, param);
1d7c1841
GS
10570 c = (char*)POPPTR(ss,ix);
10571 TOPPTR(nss,ix) = pv_dup_inc(c);
10572 i = POPINT(ss,ix);
10573 TOPINT(nss,ix) = i;
10574 break;
10575 case SAVEt_DESTRUCTOR:
10576 ptr = POPPTR(ss,ix);
10577 TOPPTR(nss,ix) = any_dup(ptr, proto_perl); /* XXX quite arbitrary */
10578 dptr = POPDPTR(ss,ix);
8141890a
JH
 /* the function pointer is passed through any_dup() as a data pointer */
10579 TOPDPTR(nss,ix) = DPTR2FPTR(void (*)(void*),
10580 any_dup(FPTR2DPTR(void *, dptr),
10581 proto_perl));
1d7c1841
GS
10582 break;
10583 case SAVEt_DESTRUCTOR_X:
10584 ptr = POPPTR(ss,ix);
10585 TOPPTR(nss,ix) = any_dup(ptr, proto_perl); /* XXX quite arbitrary */
10586 dxptr = POPDXPTR(ss,ix);
8141890a
JH
10587 TOPDXPTR(nss,ix) = DPTR2FPTR(void (*)(pTHX_ void*),
10588 any_dup(FPTR2DPTR(void *, dxptr),
10589 proto_perl));
1d7c1841
GS
10590 break;
10591 case SAVEt_REGCONTEXT:
10592 case SAVEt_ALLOC:
 /* i is the popped count: ix is moved down by that many slots and
    those slots of nss are not written here */
10593 i = POPINT(ss,ix);
10594 TOPINT(nss,ix) = i;
10595 ix -= i;
10596 break;
10597 case SAVEt_STACK_POS: /* Position on Perl stack */
10598 i = POPINT(ss,ix);
10599 TOPINT(nss,ix) = i;
10600 break;
10601 case SAVEt_AELEM: /* array element */
10602 sv = (SV*)POPPTR(ss,ix);
d2d73c3e 10603 TOPPTR(nss,ix) = sv_dup_inc(sv, param);
1d7c1841
GS
10604 i = POPINT(ss,ix);
10605 TOPINT(nss,ix) = i;
10606 av = (AV*)POPPTR(ss,ix);
d2d73c3e 10607 TOPPTR(nss,ix) = av_dup_inc(av, param);
1d7c1841
GS
10608 break;
10609 case SAVEt_HELEM: /* hash element */
10610 sv = (SV*)POPPTR(ss,ix);
d2d73c3e 10611 TOPPTR(nss,ix) = sv_dup_inc(sv, param);
1d7c1841 10612 sv = (SV*)POPPTR(ss,ix);
d2d73c3e 10613 TOPPTR(nss,ix) = sv_dup_inc(sv, param);
1d7c1841 10614 hv = (HV*)POPPTR(ss,ix);
d2d73c3e 10615 TOPPTR(nss,ix) = hv_dup_inc(hv, param);
1d7c1841
GS
10616 break;
10617 case SAVEt_OP:
10618 ptr = POPPTR(ss,ix);
10619 TOPPTR(nss,ix) = ptr;
10620 break;
10621 case SAVEt_HINTS:
10622 i = POPINT(ss,ix);
10623 TOPINT(nss,ix) = i;
b3ca2e83 10624 ptr = POPPTR(ss,ix);
 /* the refcounted_he is not copied: the same pointer is stored and
    its reference count is incremented under the hints lock */
080ac856 10625 if (ptr) {
7b6dd8c3 10626 HINTS_REFCNT_LOCK;
080ac856 10627 ((struct refcounted_he *)ptr)->refcounted_he_refcnt++;
7b6dd8c3
NC
10628 HINTS_REFCNT_UNLOCK;
10629 }
cbb1fbea 10630 TOPPTR(nss,ix) = ptr;
a8f8b6a7
NC
 /* an extra HV operand is popped only when HINT_LOCALIZE_HH is set */
10631 if (i & HINT_LOCALIZE_HH) {
10632 hv = (HV*)POPPTR(ss,ix);
10633 TOPPTR(nss,ix) = hv_dup_inc(hv, param);
10634 }
1d7c1841 10635 break;
c4410b1b
GS
10636 case SAVEt_COMPPAD:
10637 av = (AV*)POPPTR(ss,ix);
58ed4fbe 10638 TOPPTR(nss,ix) = av_dup(av, param);
c4410b1b 10639 break;
c3564e5c
GS
10640 case SAVEt_PADSV:
10641 longval = (long)POPLONG(ss,ix);
10642 TOPLONG(nss,ix) = longval;
10643 ptr = POPPTR(ss,ix);
10644 TOPPTR(nss,ix) = any_dup(ptr, proto_perl);
10645 sv = (SV*)POPPTR(ss,ix);
d2d73c3e 10646 TOPPTR(nss,ix) = sv_dup(sv, param);
c3564e5c 10647 break;
a1bb4754 10648 case SAVEt_BOOL:
38d8b13e 10649 ptr = POPPTR(ss,ix);
b9609c01 10650 TOPPTR(nss,ix) = any_dup(ptr, proto_perl);
38d8b13e 10651 longval = (long)POPBOOL(ss,ix);
b9609c01 10652 TOPBOOL(nss,ix) = (bool)longval;
a1bb4754 10653 break;
8bd2680e
MHM
10654 case SAVEt_SET_SVFLAGS:
10655 i = POPINT(ss,ix);
10656 TOPINT(nss,ix) = i;
10657 i = POPINT(ss,ix);
10658 TOPINT(nss,ix) = i;
10659 sv = (SV*)POPPTR(ss,ix);
10660 TOPPTR(nss,ix) = sv_dup(sv, param);
10661 break;
5bfb7d0e
NC
10662 case SAVEt_RE_STATE:
10663 {
 /* The saved regex state occupies the
    SAVESTACK_ALLOC_FOR_RE_SAVE_STATE slots just below ix.  It is
    copied wholesale first and then its pointer members are fixed
    up one by one. */
10664 const struct re_save_state *const old_state
10665 = (struct re_save_state *)
10666 (ss + ix - SAVESTACK_ALLOC_FOR_RE_SAVE_STATE);
10667 struct re_save_state *const new_state
10668 = (struct re_save_state *)
10669 (nss + ix - SAVESTACK_ALLOC_FOR_RE_SAVE_STATE);
10670
10671 Copy(old_state, new_state, 1, struct re_save_state);
10672 ix -= SAVESTACK_ALLOC_FOR_RE_SAVE_STATE;
10673
10674 new_state->re_state_bostr
10675 = pv_dup(old_state->re_state_bostr);
10676 new_state->re_state_reginput
10677 = pv_dup(old_state->re_state_reginput);
5bfb7d0e
NC
10678 new_state->re_state_regeol
10679 = pv_dup(old_state->re_state_regeol);
10680 new_state->re_state_regstartp
10681 = any_dup(old_state->re_state_regstartp, proto_perl);
10682 new_state->re_state_regendp
10683 = any_dup(old_state->re_state_regendp, proto_perl);
10684 new_state->re_state_reglastparen
10685 = any_dup(old_state->re_state_reglastparen, proto_perl);
10686 new_state->re_state_reglastcloseparen
10687 = any_dup(old_state->re_state_reglastcloseparen,
10688 proto_perl);
5bfb7d0e
NC
10689 /* XXX This just has to be broken. The old save_re_context
10690 code did SAVEGENERICPV(PL_reg_start_tmp);
10691 PL_reg_start_tmp is char **.
10692 Look above to what the dup code does for
10693 SAVEt_GENERIC_PVREF
10694 It can never have worked.
10695 So this is merely a faithful copy of the existing bug: */
10696 new_state->re_state_reg_start_tmp
10697 = (char **) pv_dup((char *)
10698 old_state->re_state_reg_start_tmp);
10699 /* I assume that it only ever "worked" because no-one called
10700 (pseudo)fork while the regexp engine had re-entered itself.
10701 */
5bfb7d0e
NC
10702#ifdef PERL_OLD_COPY_ON_WRITE
10703 new_state->re_state_nrs
10704 = sv_dup(old_state->re_state_nrs, param);
10705#endif
10706 new_state->re_state_reg_magic
10707 = any_dup(old_state->re_state_reg_magic, proto_perl);
10708 new_state->re_state_reg_oldcurpm
10709 = any_dup(old_state->re_state_reg_oldcurpm, proto_perl);
10710 new_state->re_state_reg_curpm
10711 = any_dup(old_state->re_state_reg_curpm, proto_perl);
10712 new_state->re_state_reg_oldsaved
10713 = pv_dup(old_state->re_state_reg_oldsaved);
10714 new_state->re_state_reg_poscache
10715 = pv_dup(old_state->re_state_reg_poscache);
5bfb7d0e
NC
10716 new_state->re_state_reg_starttry
10717 = pv_dup(old_state->re_state_reg_starttry);
5bfb7d0e
NC
10718 break;
10719 }
68da3b2f
NC
10720 case SAVEt_COMPILE_WARNINGS:
10721 ptr = POPPTR(ss,ix);
10722 TOPPTR(nss,ix) = DUP_WARNINGS((STRLEN*)ptr);
7b6dd8c3 10723 break;
1d7c1841 10724 default:
 /* a save type this function does not know how to duplicate */
ca05af4a 10725 Perl_croak(aTHX_ "panic: ss_dup inconsistency (%"IVdf")", (IV) i);
1d7c1841
GS
10726 }
10727 }
10728
bd81e77b
NC
10729 return nss;
10730}
10731
10732
10733/* if sv is a stash, call $class->CLONE_SKIP(), and set the SVphv_CLONEABLE
10734 * flag to the result. This is done for each stash before cloning starts,
10735 * so we know which stashes want their objects cloned */
10736
10737static void
10738do_mark_cloneable_stash(pTHX_ SV *sv)
10739{
10740 const HEK * const hvname = HvNAME_HEK((HV*)sv);
10741 if (hvname) {
10742 GV* const cloner = gv_fetchmethod_autoload((HV*)sv, "CLONE_SKIP", 0);
10743 SvFLAGS(sv) |= SVphv_CLONEABLE; /* clone objects by default */
10744 if (cloner && GvCV(cloner)) {
10745 dSP;
10746 UV status;
10747
10748 ENTER;
10749 SAVETMPS;
10750 PUSHMARK(SP);
10751 XPUSHs(sv_2mortal(newSVhek(hvname)));
10752 PUTBACK;
10753 call_sv((SV*)GvCV(cloner), G_SCALAR);
10754 SPAGAIN;
10755 status = POPu;
10756 PUTBACK;
10757 FREETMPS;
10758 LEAVE;
10759 if (status)
10760 SvFLAGS(sv) &= ~SVphv_CLONEABLE;
10761 }
10762 }
10763}
10764
10765
10766
10767/*
10768=for apidoc perl_clone
10769
10770Create and return a new interpreter by cloning the current one.
10771
10772perl_clone takes these flags as parameters:
10773
10774CLONEf_COPY_STACKS - is used to, well, copy the stacks also,
10775without it we only clone the data and zero the stacks,
10776with it we copy the stacks and the new perl interpreter is
10777ready to run at the exact same point as the previous one.
10778The pseudo-fork code uses COPY_STACKS while the
10779threads->new doesn't.
10780
10781CLONEf_KEEP_PTR_TABLE
10782perl_clone keeps a ptr_table with the pointer of the old
10783variable as a key and the new variable as a value.
10784This allows it to check whether something has already been cloned
10785and, instead of cloning it again, just use the value and increase the
10786refcount. If KEEP_PTR_TABLE is not set then perl_clone will free
10787the ptr_table using
10788C<ptr_table_free(PL_ptr_table); PL_ptr_table = NULL;>.
10789A reason to keep it around is if you want to dup some of your own
10790variables that are outside the graph perl scans; an example of this
10791code is in threads.xs create.
10792
10793CLONEf_CLONE_HOST
10794This is a win32 thing; it is ignored on unix. It tells perl's
10795win32host code (which is C++) to clone itself. This is needed on
10796win32 if you want to run two threads at the same time.
10797If you just want to do some stuff in a separate perl interpreter
10798and then throw it away and return to the original one,
10799you don't need to do anything.
10800
10801=cut
10802*/
10803
10804/* XXX the above needs expanding by someone who actually understands it ! */
10805EXTERN_C PerlInterpreter *
10806perl_clone_host(PerlInterpreter* proto_perl, UV flags);
10807
10808PerlInterpreter *
10809perl_clone(PerlInterpreter *proto_perl, UV flags)
10810{
10811 dVAR;
10812#ifdef PERL_IMPLICIT_SYS
10813
10814 /* perlhost.h so we need to call into it
10815 to clone the host, CPerlHost should have a c interface, sky */
10816
10817 if (flags & CLONEf_CLONE_HOST) {
10818 return perl_clone_host(proto_perl,flags);
10819 }
10820 return perl_clone_using(proto_perl, flags,
10821 proto_perl->IMem,
10822 proto_perl->IMemShared,
10823 proto_perl->IMemParse,
10824 proto_perl->IEnv,
10825 proto_perl->IStdIO,
10826 proto_perl->ILIO,
10827 proto_perl->IDir,
10828 proto_perl->ISock,
10829 proto_perl->IProc);
10830}
10831
/*
 * perl_clone_using() -- allocate a new PerlInterpreter and fill it in from
 * proto_perl, using the supplied host interface tables.
 *
 * proto_perl: interpreter being copied.
 * flags:      CLONEf_* bits.  Tested in this function:
 *               CLONEf_COPY_STACKS    - duplicate the tmps/mark/scope/save
 *                                       stacks instead of init_stacks();
 *               CLONEf_KEEP_PTR_TABLE - do not free PL_ptr_table at the end.
 * ipM..ipP:   host interfaces stored into PL_Mem .. PL_Proc; ipM->pMalloc
 *             is also used to allocate the interpreter structure itself.
 *
 * Returns the new interpreter (my_perl).
 *
 * Preprocessor layout: this function header and the first part of its body
 * are inside the "#ifdef PERL_IMPLICIT_SYS" opened in perl_clone().  The
 * "#else" branch below provides the equivalent declarations/allocation
 * (via PerlMem_malloc) for the build without PERL_IMPLICIT_SYS, in which
 * case everything after the "#endif" is the body of perl_clone() instead.
 *
 * NOTE(review): the PL_* names assigned below are presumably resolved
 * against my_perl (the new interpreter) once it is declared -- confirm
 * against the interpreter-variable macros in the project headers.
 */
10832PerlInterpreter *
10833perl_clone_using(PerlInterpreter *proto_perl, UV flags,
10834 struct IPerlMem* ipM, struct IPerlMem* ipMS,
10835 struct IPerlMem* ipMP, struct IPerlEnv* ipE,
10836 struct IPerlStdIO* ipStd, struct IPerlLIO* ipLIO,
10837 struct IPerlDir* ipD, struct IPerlSock* ipS,
10838 struct IPerlProc* ipP)
10839{
10840 /* XXX many of the string copies here can be optimized if they're
10841 * constants; they need to be allocated as common memory and just
10842 * their pointers copied. */
10843
10844 IV i;
10845 CLONE_PARAMS clone_params;
5f66b61c 10846 CLONE_PARAMS* const param = &clone_params;
bd81e77b 10847
5f66b61c 10848 PerlInterpreter * const my_perl = (PerlInterpreter*)(*ipM->pMalloc)(ipM, sizeof(PerlInterpreter));
bd81e77b
NC
10849 /* for each stash, determine whether its objects should be cloned */
10850 S_visit(proto_perl, do_mark_cloneable_stash, SVt_PVHV, SVTYPEMASK);
10851 PERL_SET_THX(my_perl);
10852
 /* DEBUGGING builds poison the new structure and then set a handful of
  * fields explicitly; other builds simply zero the whole structure */
10853# ifdef DEBUGGING
7e337ee0 10854 PoisonNew(my_perl, 1, PerlInterpreter);
5f66b61c
AL
10855 PL_op = NULL;
10856 PL_curcop = NULL;
bd81e77b
NC
10857 PL_markstack = 0;
10858 PL_scopestack = 0;
10859 PL_savestack = 0;
10860 PL_savestack_ix = 0;
10861 PL_savestack_max = -1;
10862 PL_sig_pending = 0;
10863 Zero(&PL_debug_pad, 1, struct perl_debug_pad);
10864# else /* !DEBUGGING */
10865 Zero(my_perl, 1, PerlInterpreter);
10866# endif /* DEBUGGING */
10867
10868 /* host pointers */
10869 PL_Mem = ipM;
10870 PL_MemShared = ipMS;
10871 PL_MemParse = ipMP;
10872 PL_Env = ipE;
10873 PL_StdIO = ipStd;
10874 PL_LIO = ipLIO;
10875 PL_Dir = ipD;
10876 PL_Sock = ipS;
10877 PL_Proc = ipP;
10878#else /* !PERL_IMPLICIT_SYS */
 /* same set-up as above, but the structure comes from PerlMem_malloc()
  * and there are no host pointers to record */
10879 IV i;
10880 CLONE_PARAMS clone_params;
10881 CLONE_PARAMS* param = &clone_params;
5f66b61c 10882 PerlInterpreter * const my_perl = (PerlInterpreter*)PerlMem_malloc(sizeof(PerlInterpreter));
bd81e77b
NC
10883 /* for each stash, determine whether its objects should be cloned */
10884 S_visit(proto_perl, do_mark_cloneable_stash, SVt_PVHV, SVTYPEMASK);
10885 PERL_SET_THX(my_perl);
10886
10887# ifdef DEBUGGING
7e337ee0 10888 PoisonNew(my_perl, 1, PerlInterpreter);
5f66b61c
AL
10889 PL_op = NULL;
10890 PL_curcop = NULL;
bd81e77b
NC
10891 PL_markstack = 0;
10892 PL_scopestack = 0;
10893 PL_savestack = 0;
10894 PL_savestack_ix = 0;
10895 PL_savestack_max = -1;
10896 PL_sig_pending = 0;
10897 Zero(&PL_debug_pad, 1, struct perl_debug_pad);
10898# else /* !DEBUGGING */
10899 Zero(my_perl, 1, PerlInterpreter);
10900# endif /* DEBUGGING */
10901#endif /* PERL_IMPLICIT_SYS */
 /* param is handed to every *_dup() call below */
10902 param->flags = flags;
10903 param->proto_perl = proto_perl;
10904
7cb608b5
NC
10905 INIT_TRACK_MEMPOOL(my_perl->Imemory_debug_header, my_perl);
10906
 /* start with empty SV/body arenas and zero counts */
fdda85ca 10907 PL_body_arenas = NULL;
bd81e77b
NC
10908 Zero(&PL_body_roots, 1, PL_body_roots);
10909
10910 PL_nice_chunk = NULL;
10911 PL_nice_chunk_size = 0;
10912 PL_sv_count = 0;
10913 PL_sv_objcount = 0;
a0714e2c
SS
10914 PL_sv_root = NULL;
10915 PL_sv_arenaroot = NULL;
bd81e77b
NC
10916
10917 PL_debug = proto_perl->Idebug;
10918
10919 PL_hash_seed = proto_perl->Ihash_seed;
10920 PL_rehash_seed = proto_perl->Irehash_seed;
10921
10922#ifdef USE_REENTRANT_API
10923 /* XXX: things like -Dm will segfault here in perlio, but doing
10924 * PERL_SET_CONTEXT(proto_perl);
10925 * breaks too many other things
10926 */
10927 Perl_reentrant_init(aTHX);
10928#endif
10929
10930 /* create SV map for pointer relocation */
10931 PL_ptr_table = ptr_table_new();
10932
10933 /* initialize these special pointers as early as possible */
10934 SvANY(&PL_sv_undef) = NULL;
10935 SvREFCNT(&PL_sv_undef) = (~(U32)0)/2;
10936 SvFLAGS(&PL_sv_undef) = SVf_READONLY|SVt_NULL;
10937 ptr_table_store(PL_ptr_table, &proto_perl->Isv_undef, &PL_sv_undef);
10938
 /* PL_sv_no: empty string, IV 0, NV 0 */
10939 SvANY(&PL_sv_no) = new_XPVNV();
10940 SvREFCNT(&PL_sv_no) = (~(U32)0)/2;
10941 SvFLAGS(&PL_sv_no) = SVp_IOK|SVf_IOK|SVp_NOK|SVf_NOK
10942 |SVp_POK|SVf_POK|SVf_READONLY|SVt_PVNV;
bb7a0f54 10943 SvPV_set(&PL_sv_no, savepvn(PL_No, 0));
bd81e77b
NC
10944 SvCUR_set(&PL_sv_no, 0);
10945 SvLEN_set(&PL_sv_no, 1);
10946 SvIV_set(&PL_sv_no, 0);
10947 SvNV_set(&PL_sv_no, 0);
10948 ptr_table_store(PL_ptr_table, &proto_perl->Isv_no, &PL_sv_no);
10949
 /* PL_sv_yes: one-character string copied from PL_Yes, IV 1, NV 1 */
10950 SvANY(&PL_sv_yes) = new_XPVNV();
10951 SvREFCNT(&PL_sv_yes) = (~(U32)0)/2;
10952 SvFLAGS(&PL_sv_yes) = SVp_IOK|SVf_IOK|SVp_NOK|SVf_NOK
10953 |SVp_POK|SVf_POK|SVf_READONLY|SVt_PVNV;
bb7a0f54 10954 SvPV_set(&PL_sv_yes, savepvn(PL_Yes, 1));
bd81e77b
NC
10955 SvCUR_set(&PL_sv_yes, 1);
10956 SvLEN_set(&PL_sv_yes, 2);
10957 SvIV_set(&PL_sv_yes, 1);
10958 SvNV_set(&PL_sv_yes, 1);
10959 ptr_table_store(PL_ptr_table, &proto_perl->Isv_yes, &PL_sv_yes);
10960
10961 /* create (a non-shared!) shared string table */
10962 PL_strtab = newHV();
10963 HvSHAREKEYS_off(PL_strtab);
10964 hv_ksplit(PL_strtab, HvTOTALKEYS(proto_perl->Istrtab));
10965 ptr_table_store(PL_ptr_table, proto_perl->Istrtab, PL_strtab);
10966
10967 PL_compiling = proto_perl->Icompiling;
10968
10969 /* These two PVs will be freed in a special way, so they must be set the same way op.c does */
10970 PL_compiling.cop_stashpv = savesharedpv(PL_compiling.cop_stashpv);
10971 ptr_table_store(PL_ptr_table, proto_perl->Icompiling.cop_stashpv, PL_compiling.cop_stashpv);
10972
10973 PL_compiling.cop_file = savesharedpv(PL_compiling.cop_file);
10974 ptr_table_store(PL_ptr_table, proto_perl->Icompiling.cop_file, PL_compiling.cop_file);
10975
10976 ptr_table_store(PL_ptr_table, &proto_perl->Icompiling, &PL_compiling);
72dc9ed5 10977 PL_compiling.cop_warnings = DUP_WARNINGS(PL_compiling.cop_warnings);
 /* the hints hash pointer was copied by the struct assignment above, so
  * take an extra reference on it under the hints refcount lock */
c28fe1ec 10978 if (PL_compiling.cop_hints_hash) {
cbb1fbea 10979 HINTS_REFCNT_LOCK;
c28fe1ec 10980 PL_compiling.cop_hints_hash->refcounted_he_refcnt++;
cbb1fbea
NC
10981 HINTS_REFCNT_UNLOCK;
10982 }
bd81e77b
NC
10983 PL_curcop = (COP*)any_dup(proto_perl->Tcurcop, proto_perl);
10984
10985 /* pseudo environmental stuff */
10986 PL_origargc = proto_perl->Iorigargc;
10987 PL_origargv = proto_perl->Iorigargv;
10988
10989 param->stashes = newAV(); /* Setup array of objects to call clone on */
10990
10991 /* Set tainting stuff before PerlIO_debug can possibly get called */
10992 PL_tainting = proto_perl->Itainting;
10993 PL_taint_warn = proto_perl->Itaint_warn;
10994
10995#ifdef PERLIO_LAYERS
10996 /* Clone PerlIO tables as soon as we can handle general xx_dup() */
10997 PerlIO_clone(aTHX_ proto_perl, param);
10998#endif
10999
11000 PL_envgv = gv_dup(proto_perl->Ienvgv, param);
11001 PL_incgv = gv_dup(proto_perl->Iincgv, param);
11002 PL_hintgv = gv_dup(proto_perl->Ihintgv, param);
11003 PL_origfilename = SAVEPV(proto_perl->Iorigfilename);
11004 PL_diehook = sv_dup_inc(proto_perl->Idiehook, param);
11005 PL_warnhook = sv_dup_inc(proto_perl->Iwarnhook, param);
11006
11007 /* switches */
11008 PL_minus_c = proto_perl->Iminus_c;
11009 PL_patchlevel = sv_dup_inc(proto_perl->Ipatchlevel, param);
11010 PL_localpatches = proto_perl->Ilocalpatches;
11011 PL_splitstr = proto_perl->Isplitstr;
11012 PL_preprocess = proto_perl->Ipreprocess;
11013 PL_minus_n = proto_perl->Iminus_n;
11014 PL_minus_p = proto_perl->Iminus_p;
11015 PL_minus_l = proto_perl->Iminus_l;
11016 PL_minus_a = proto_perl->Iminus_a;
bc9b29db 11017 PL_minus_E = proto_perl->Iminus_E;
bd81e77b
NC
11018 PL_minus_F = proto_perl->Iminus_F;
11019 PL_doswitches = proto_perl->Idoswitches;
11020 PL_dowarn = proto_perl->Idowarn;
11021 PL_doextract = proto_perl->Idoextract;
11022 PL_sawampersand = proto_perl->Isawampersand;
11023 PL_unsafe = proto_perl->Iunsafe;
11024 PL_inplace = SAVEPV(proto_perl->Iinplace);
11025 PL_e_script = sv_dup_inc(proto_perl->Ie_script, param);
11026 PL_perldb = proto_perl->Iperldb;
11027 PL_perl_destruct_level = proto_perl->Iperl_destruct_level;
11028 PL_exit_flags = proto_perl->Iexit_flags;
11029
11030 /* magical thingies */
11031 /* XXX time(&PL_basetime) when asked for? */
11032 PL_basetime = proto_perl->Ibasetime;
11033 PL_formfeed = sv_dup(proto_perl->Iformfeed, param);
11034
11035 PL_maxsysfd = proto_perl->Imaxsysfd;
bd81e77b
NC
11036 PL_statusvalue = proto_perl->Istatusvalue;
11037#ifdef VMS
11038 PL_statusvalue_vms = proto_perl->Istatusvalue_vms;
11039#else
11040 PL_statusvalue_posix = proto_perl->Istatusvalue_posix;
11041#endif
11042 PL_encoding = sv_dup(proto_perl->Iencoding, param);
11043
11044 sv_setpvn(PERL_DEBUG_PAD(0), "", 0); /* For regex debugging. */
11045 sv_setpvn(PERL_DEBUG_PAD(1), "", 0); /* ext/re needs these */
11046 sv_setpvn(PERL_DEBUG_PAD(2), "", 0); /* even without DEBUGGING. */
11047
11048 /* Clone the regex array */
11049 PL_regex_padav = newAV();
11050 {
11051 const I32 len = av_len((AV*)proto_perl->Iregex_padav);
7a5b473e 11052 SV* const * const regexen = AvARRAY((AV*)proto_perl->Iregex_padav);
bd81e77b 11053 IV i;
 /* element 0 is duplicated as an ordinary SV; elements 1..len are
  * either duplicated as SVs (SvREPADTMP) or treated as an IV holding
  * a REGEXP pointer that is re_dup()ed into a fresh IV SV */
7f466ec7 11054 av_push(PL_regex_padav, sv_dup_inc_NN(regexen[0],param));
bd81e77b 11055 for(i = 1; i <= len; i++) {
7a5b473e
AL
11056 const SV * const regex = regexen[i];
11057 SV * const sv =
11058 SvREPADTMP(regex)
11059 ? sv_dup_inc(regex, param)
11060 : SvREFCNT_inc(
11061 newSViv(PTR2IV(re_dup(
11062 INT2PTR(REGEXP *, SvIVX(regex)), param))))
11063 ;
11064 av_push(PL_regex_padav, sv);
bd81e77b
NC
11065 }
11066 }
11067 PL_regex_pad = AvARRAY(PL_regex_padav);
11068
11069 /* shortcuts to various I/O objects */
11070 PL_stdingv = gv_dup(proto_perl->Istdingv, param);
11071 PL_stderrgv = gv_dup(proto_perl->Istderrgv, param);
11072 PL_defgv = gv_dup(proto_perl->Idefgv, param);
11073 PL_argvgv = gv_dup(proto_perl->Iargvgv, param);
11074 PL_argvoutgv = gv_dup(proto_perl->Iargvoutgv, param);
11075 PL_argvout_stack = av_dup_inc(proto_perl->Iargvout_stack, param);
1d7c1841 11076
bd81e77b
NC
11077 /* shortcuts to regexp stuff */
11078 PL_replgv = gv_dup(proto_perl->Ireplgv, param);
9660f481 11079
bd81e77b
NC
11080 /* shortcuts to misc objects */
11081 PL_errgv = gv_dup(proto_perl->Ierrgv, param);
9660f481 11082
bd81e77b
NC
11083 /* shortcuts to debugging objects */
11084 PL_DBgv = gv_dup(proto_perl->IDBgv, param);
11085 PL_DBline = gv_dup(proto_perl->IDBline, param);
11086 PL_DBsub = gv_dup(proto_perl->IDBsub, param);
11087 PL_DBsingle = sv_dup(proto_perl->IDBsingle, param);
11088 PL_DBtrace = sv_dup(proto_perl->IDBtrace, param);
11089 PL_DBsignal = sv_dup(proto_perl->IDBsignal, param);
11090 PL_DBassertion = sv_dup(proto_perl->IDBassertion, param);
11091 PL_lineary = av_dup(proto_perl->Ilineary, param);
11092 PL_dbargs = av_dup(proto_perl->Idbargs, param);
9660f481 11093
bd81e77b
NC
11094 /* symbol tables */
11095 PL_defstash = hv_dup_inc(proto_perl->Tdefstash, param);
11096 PL_curstash = hv_dup(proto_perl->Tcurstash, param);
11097 PL_debstash = hv_dup(proto_perl->Idebstash, param);
11098 PL_globalstash = hv_dup(proto_perl->Iglobalstash, param);
11099 PL_curstname = sv_dup_inc(proto_perl->Icurstname, param);
11100
11101 PL_beginav = av_dup_inc(proto_perl->Ibeginav, param);
11102 PL_beginav_save = av_dup_inc(proto_perl->Ibeginav_save, param);
11103 PL_checkav_save = av_dup_inc(proto_perl->Icheckav_save, param);
11104 PL_endav = av_dup_inc(proto_perl->Iendav, param);
11105 PL_checkav = av_dup_inc(proto_perl->Icheckav, param);
11106 PL_initav = av_dup_inc(proto_perl->Iinitav, param);
11107
11108 PL_sub_generation = proto_perl->Isub_generation;
11109
11110 /* funky return mechanisms */
11111 PL_forkprocess = proto_perl->Iforkprocess;
11112
11113 /* subprocess state */
11114 PL_fdpid = av_dup_inc(proto_perl->Ifdpid, param);
11115
11116 /* internal state */
11117 PL_maxo = proto_perl->Imaxo;
11118 if (proto_perl->Iop_mask)
11119 PL_op_mask = SAVEPVN(proto_perl->Iop_mask, PL_maxo);
11120 else
bd61b366 11121 PL_op_mask = NULL;
bd81e77b
NC
11122 /* PL_asserting = proto_perl->Iasserting; */
11123
11124 /* current interpreter roots */
11125 PL_main_cv = cv_dup_inc(proto_perl->Imain_cv, param);
11126 PL_main_root = OpREFCNT_inc(proto_perl->Imain_root);
11127 PL_main_start = proto_perl->Imain_start;
11128 PL_eval_root = proto_perl->Ieval_root;
11129 PL_eval_start = proto_perl->Ieval_start;
11130
11131 /* runtime control stuff */
11132 PL_curcopdb = (COP*)any_dup(proto_perl->Icurcopdb, proto_perl);
11133 PL_copline = proto_perl->Icopline;
11134
11135 PL_filemode = proto_perl->Ifilemode;
11136 PL_lastfd = proto_perl->Ilastfd;
11137 PL_oldname = proto_perl->Ioldname; /* XXX not quite right */
11138 PL_Argv = NULL;
bd61b366 11139 PL_Cmd = NULL;
bd81e77b
NC
11140 PL_gensym = proto_perl->Igensym;
11141 PL_preambled = proto_perl->Ipreambled;
11142 PL_preambleav = av_dup_inc(proto_perl->Ipreambleav, param);
11143 PL_laststatval = proto_perl->Ilaststatval;
11144 PL_laststype = proto_perl->Ilaststype;
a0714e2c 11145 PL_mess_sv = NULL;
bd81e77b
NC
11146
11147 PL_ors_sv = sv_dup_inc(proto_perl->Iors_sv, param);
11148
11149 /* interpreter atexit processing */
11150 PL_exitlistlen = proto_perl->Iexitlistlen;
11151 if (PL_exitlistlen) {
11152 Newx(PL_exitlist, PL_exitlistlen, PerlExitListEntry);
11153 Copy(proto_perl->Iexitlist, PL_exitlist, PL_exitlistlen, PerlExitListEntry);
9660f481 11154 }
bd81e77b
NC
11155 else
11156 PL_exitlist = (PerlExitListEntry*)NULL;
f16dd614
DM
11157
 /* the my_cxt pointer array is copied element-for-element (the pointers
  * themselves, not what they point at) */
11158 PL_my_cxt_size = proto_perl->Imy_cxt_size;
4c901e72 11159 if (PL_my_cxt_size) {
f16dd614
DM
11160 Newx(PL_my_cxt_list, PL_my_cxt_size, void *);
11161 Copy(proto_perl->Imy_cxt_list, PL_my_cxt_list, PL_my_cxt_size, void *);
11162 }
11163 else
11164 PL_my_cxt_list = (void**)NULL;
bd81e77b
NC
11165 PL_modglobal = hv_dup_inc(proto_perl->Imodglobal, param);
11166 PL_custom_op_names = hv_dup_inc(proto_perl->Icustom_op_names,param);
11167 PL_custom_op_descs = hv_dup_inc(proto_perl->Icustom_op_descs,param);
11168
11169 PL_profiledata = NULL;
11170 PL_rsfp = fp_dup(proto_perl->Irsfp, '<', param);
11171 /* PL_rsfp_filters entries have fake IoDIRP() */
11172 PL_rsfp_filters = av_dup_inc(proto_perl->Irsfp_filters, param);
9660f481 11173
bd81e77b 11174 PL_compcv = cv_dup(proto_perl->Icompcv, param);
9660f481 11175
bd81e77b 11176 PAD_CLONE_VARS(proto_perl, param);
9660f481 11177
bd81e77b
NC
11178#ifdef HAVE_INTERP_INTERN
11179 sys_intern_dup(&proto_perl->Isys_intern, &PL_sys_intern);
11180#endif
645c22ef 11181
bd81e77b
NC
11182 /* more statics moved here */
11183 PL_generation = proto_perl->Igeneration;
11184 PL_DBcv = cv_dup(proto_perl->IDBcv, param);
645c22ef 11185
bd81e77b
NC
11186 PL_in_clean_objs = proto_perl->Iin_clean_objs;
11187 PL_in_clean_all = proto_perl->Iin_clean_all;
6a78b4db 11188
bd81e77b
NC
11189 PL_uid = proto_perl->Iuid;
11190 PL_euid = proto_perl->Ieuid;
11191 PL_gid = proto_perl->Igid;
11192 PL_egid = proto_perl->Iegid;
11193 PL_nomemok = proto_perl->Inomemok;
11194 PL_an = proto_perl->Ian;
11195 PL_evalseq = proto_perl->Ievalseq;
11196 PL_origenviron = proto_perl->Iorigenviron; /* XXX not quite right */
11197 PL_origalen = proto_perl->Iorigalen;
11198#ifdef PERL_USES_PL_PIDSTATUS
11199 PL_pidstatus = newHV(); /* XXX flag for cloning? */
11200#endif
11201 PL_osname = SAVEPV(proto_perl->Iosname);
11202 PL_sighandlerp = proto_perl->Isighandlerp;
6a78b4db 11203
bd81e77b 11204 PL_runops = proto_perl->Irunops;
6a78b4db 11205
bd81e77b 11206 Copy(proto_perl->Itokenbuf, PL_tokenbuf, 256, char);
6a78b4db 11207
bd81e77b
NC
11208#ifdef CSH
11209 PL_cshlen = proto_perl->Icshlen;
11210 PL_cshname = proto_perl->Icshname; /* XXX never deallocated */
11211#endif
645c22ef 11212
 /* lexer state; the bracket and casemod stacks are copied with a minimum
  * length of 120 and 12 bytes respectively */
bd81e77b
NC
11213 PL_lex_state = proto_perl->Ilex_state;
11214 PL_lex_defer = proto_perl->Ilex_defer;
11215 PL_lex_expect = proto_perl->Ilex_expect;
11216 PL_lex_formbrack = proto_perl->Ilex_formbrack;
11217 PL_lex_dojoin = proto_perl->Ilex_dojoin;
11218 PL_lex_starts = proto_perl->Ilex_starts;
11219 PL_lex_stuff = sv_dup_inc(proto_perl->Ilex_stuff, param);
11220 PL_lex_repl = sv_dup_inc(proto_perl->Ilex_repl, param);
11221 PL_lex_op = proto_perl->Ilex_op;
11222 PL_lex_inpat = proto_perl->Ilex_inpat;
11223 PL_lex_inwhat = proto_perl->Ilex_inwhat;
11224 PL_lex_brackets = proto_perl->Ilex_brackets;
11225 i = (PL_lex_brackets < 120 ? 120 : PL_lex_brackets);
11226 PL_lex_brackstack = SAVEPVN(proto_perl->Ilex_brackstack,i);
11227 PL_lex_casemods = proto_perl->Ilex_casemods;
11228 i = (PL_lex_casemods < 12 ? 12 : PL_lex_casemods);
11229 PL_lex_casestack = SAVEPVN(proto_perl->Ilex_casestack,i);
645c22ef 11230
5db06880
NC
11231#ifdef PERL_MAD
11232 Copy(proto_perl->Inexttoke, PL_nexttoke, 5, NEXTTOKE);
11233 PL_lasttoke = proto_perl->Ilasttoke;
5336380d
NC
11234 PL_realtokenstart = proto_perl->Irealtokenstart;
11235 PL_faketokens = proto_perl->Ifaketokens;
11236 PL_thismad = proto_perl->Ithismad;
11237 PL_thistoken = proto_perl->Ithistoken;
11238 PL_thisopen = proto_perl->Ithisopen;
11239 PL_thisstuff = proto_perl->Ithisstuff;
11240 PL_thisclose = proto_perl->Ithisclose;
11241 PL_thiswhite = proto_perl->Ithiswhite;
11242 PL_nextwhite = proto_perl->Inextwhite;
11243 PL_skipwhite = proto_perl->Iskipwhite;
11244 PL_endwhite = proto_perl->Iendwhite;
11245 PL_curforce = proto_perl->Icurforce;
5db06880 11246#else
bd81e77b
NC
11247 Copy(proto_perl->Inextval, PL_nextval, 5, YYSTYPE);
11248 Copy(proto_perl->Inexttype, PL_nexttype, 5, I32);
11249 PL_nexttoke = proto_perl->Inexttoke;
5db06880 11250#endif
c43294b8 11251
bd81e77b
NC
11252 /* XXX This is probably masking the deeper issue of why
11253 * SvANY(proto_perl->Ilinestr) can be NULL at this point. For test case:
11254 * http://archive.develooper.com/perl5-porters%40perl.org/msg83298.html
11255 * (A little debugging with a watchpoint on it may help.)
11256 */
 /* buffer pointers are rebuilt as the same offsets into the cloned
  * PL_linestr; a negative offset is clamped to 0 */
11257 if (SvANY(proto_perl->Ilinestr)) {
11258 PL_linestr = sv_dup_inc(proto_perl->Ilinestr, param);
11259 i = proto_perl->Ibufptr - SvPVX_const(proto_perl->Ilinestr);
11260 PL_bufptr = SvPVX(PL_linestr) + (i < 0 ? 0 : i);
11261 i = proto_perl->Ioldbufptr - SvPVX_const(proto_perl->Ilinestr);
11262 PL_oldbufptr = SvPVX(PL_linestr) + (i < 0 ? 0 : i);
11263 i = proto_perl->Ioldoldbufptr - SvPVX_const(proto_perl->Ilinestr);
11264 PL_oldoldbufptr = SvPVX(PL_linestr) + (i < 0 ? 0 : i);
11265 i = proto_perl->Ilinestart - SvPVX_const(proto_perl->Ilinestr);
11266 PL_linestart = SvPVX(PL_linestr) + (i < 0 ? 0 : i);
11267 }
11268 else {
561b68a9 11269 PL_linestr = newSV(79);
bd81e77b
NC
11270 sv_upgrade(PL_linestr,SVt_PVIV);
11271 sv_setpvn(PL_linestr,"",0);
11272 PL_bufptr = PL_oldbufptr = PL_oldoldbufptr = PL_linestart = SvPVX(PL_linestr);
11273 }
11274 PL_bufend = SvPVX(PL_linestr) + SvCUR(PL_linestr);
11275 PL_pending_ident = proto_perl->Ipending_ident;
11276 PL_sublex_info = proto_perl->Isublex_info; /* XXX not quite right */
11277
11278 PL_expect = proto_perl->Iexpect;
11279
11280 PL_multi_start = proto_perl->Imulti_start;
11281 PL_multi_end = proto_perl->Imulti_end;
11282 PL_multi_open = proto_perl->Imulti_open;
11283 PL_multi_close = proto_perl->Imulti_close;
11284
11285 PL_error_count = proto_perl->Ierror_count;
11286 PL_subline = proto_perl->Isubline;
11287 PL_subname = sv_dup_inc(proto_perl->Isubname, param);
c43294b8 11288
bd81e77b
NC
11289 /* XXX See comment on SvANY(proto_perl->Ilinestr) above */
11290 if (SvANY(proto_perl->Ilinestr)) {
11291 i = proto_perl->Ilast_uni - SvPVX_const(proto_perl->Ilinestr);
11292 PL_last_uni = SvPVX(PL_linestr) + (i < 0 ? 0 : i);
11293 i = proto_perl->Ilast_lop - SvPVX_const(proto_perl->Ilinestr);
11294 PL_last_lop = SvPVX(PL_linestr) + (i < 0 ? 0 : i);
11295 PL_last_lop_op = proto_perl->Ilast_lop_op;
11296 }
11297 else {
11298 PL_last_uni = SvPVX(PL_linestr);
11299 PL_last_lop = SvPVX(PL_linestr);
11300 PL_last_lop_op = 0;
11301 }
11302 PL_in_my = proto_perl->Iin_my;
11303 PL_in_my_stash = hv_dup(proto_perl->Iin_my_stash, param);
11304#ifdef FCRYPT
11305 PL_cryptseen = proto_perl->Icryptseen;
11306#endif
1d7c1841 11307
bd81e77b 11308 PL_hints = proto_perl->Ihints;
1d7c1841 11309
bd81e77b 11310 PL_amagic_generation = proto_perl->Iamagic_generation;
d2d73c3e 11311
bd81e77b
NC
11312#ifdef USE_LOCALE_COLLATE
11313 PL_collation_ix = proto_perl->Icollation_ix;
11314 PL_collation_name = SAVEPV(proto_perl->Icollation_name);
11315 PL_collation_standard = proto_perl->Icollation_standard;
11316 PL_collxfrm_base = proto_perl->Icollxfrm_base;
11317 PL_collxfrm_mult = proto_perl->Icollxfrm_mult;
11318#endif /* USE_LOCALE_COLLATE */
1d7c1841 11319
bd81e77b
NC
11320#ifdef USE_LOCALE_NUMERIC
11321 PL_numeric_name = SAVEPV(proto_perl->Inumeric_name);
11322 PL_numeric_standard = proto_perl->Inumeric_standard;
11323 PL_numeric_local = proto_perl->Inumeric_local;
11324 PL_numeric_radix_sv = sv_dup_inc(proto_perl->Inumeric_radix_sv, param);
11325#endif /* USE_LOCALE_NUMERIC */
1d7c1841 11326
bd81e77b
NC
11327 /* utf8 character classes */
11328 PL_utf8_alnum = sv_dup_inc(proto_perl->Iutf8_alnum, param);
11329 PL_utf8_alnumc = sv_dup_inc(proto_perl->Iutf8_alnumc, param);
11330 PL_utf8_ascii = sv_dup_inc(proto_perl->Iutf8_ascii, param);
11331 PL_utf8_alpha = sv_dup_inc(proto_perl->Iutf8_alpha, param);
11332 PL_utf8_space = sv_dup_inc(proto_perl->Iutf8_space, param);
11333 PL_utf8_cntrl = sv_dup_inc(proto_perl->Iutf8_cntrl, param);
11334 PL_utf8_graph = sv_dup_inc(proto_perl->Iutf8_graph, param);
11335 PL_utf8_digit = sv_dup_inc(proto_perl->Iutf8_digit, param);
11336 PL_utf8_upper = sv_dup_inc(proto_perl->Iutf8_upper, param);
11337 PL_utf8_lower = sv_dup_inc(proto_perl->Iutf8_lower, param);
11338 PL_utf8_print = sv_dup_inc(proto_perl->Iutf8_print, param);
11339 PL_utf8_punct = sv_dup_inc(proto_perl->Iutf8_punct, param);
11340 PL_utf8_xdigit = sv_dup_inc(proto_perl->Iutf8_xdigit, param);
11341 PL_utf8_mark = sv_dup_inc(proto_perl->Iutf8_mark, param);
11342 PL_utf8_toupper = sv_dup_inc(proto_perl->Iutf8_toupper, param);
11343 PL_utf8_totitle = sv_dup_inc(proto_perl->Iutf8_totitle, param);
11344 PL_utf8_tolower = sv_dup_inc(proto_perl->Iutf8_tolower, param);
11345 PL_utf8_tofold = sv_dup_inc(proto_perl->Iutf8_tofold, param);
11346 PL_utf8_idstart = sv_dup_inc(proto_perl->Iutf8_idstart, param);
11347 PL_utf8_idcont = sv_dup_inc(proto_perl->Iutf8_idcont, param);
1d7c1841 11348
bd81e77b
NC
11349 /* Did the locale setup indicate UTF-8? */
11350 PL_utf8locale = proto_perl->Iutf8locale;
11351 /* Unicode features (see perlrun/-C) */
11352 PL_unicode = proto_perl->Iunicode;
1d7c1841 11353
bd81e77b
NC
11354 /* Pre-5.8 signals control */
11355 PL_signals = proto_perl->Isignals;
1d7c1841 11356
bd81e77b
NC
11357 /* times() ticks per second */
11358 PL_clocktick = proto_perl->Iclocktick;
1d7c1841 11359
bd81e77b
NC
11360 /* Recursion stopper for PerlIO_find_layer */
11361 PL_in_load_module = proto_perl->Iin_load_module;
8df990a8 11362
bd81e77b
NC
11363 /* sort() routine */
11364 PL_sort_RealCmp = proto_perl->Isort_RealCmp;
e5dd39fc 11365
bd81e77b
NC
11366 /* Not really needed/useful since the reentrant_retint is "volatile",
11367 * but do it for consistency's sake. */
11368 PL_reentrant_retint = proto_perl->Ireentrant_retint;
1d7c1841 11369
bd81e77b
NC
11370 /* Hooks to shared SVs and locks. */
11371 PL_sharehook = proto_perl->Isharehook;
11372 PL_lockhook = proto_perl->Ilockhook;
11373 PL_unlockhook = proto_perl->Iunlockhook;
11374 PL_threadhook = proto_perl->Ithreadhook;
1d7c1841 11375
bd81e77b
NC
11376 PL_runops_std = proto_perl->Irunops_std;
11377 PL_runops_dbg = proto_perl->Irunops_dbg;
1d7c1841 11378
bd81e77b
NC
11379#ifdef THREADS_HAVE_PIDS
11380 PL_ppid = proto_perl->Ippid;
11381#endif
1d7c1841 11382
bd81e77b 11383 /* swash cache */
5c284bb0 11384 PL_last_swash_hv = NULL; /* reinits on demand */
bd81e77b
NC
11385 PL_last_swash_klen = 0;
11386 PL_last_swash_key[0]= '\0';
11387 PL_last_swash_tmps = (U8*)NULL;
11388 PL_last_swash_slen = 0;
1d7c1841 11389
bd81e77b
NC
11390 PL_glob_index = proto_perl->Iglob_index;
11391 PL_srand_called = proto_perl->Isrand_called;
11392 PL_uudmap['M'] = 0; /* reinits on demand */
bd61b366 11393 PL_bitcount = NULL; /* reinits on demand */
05ec9bb3 11394
 /* pending-signal counters are allocated zeroed, not copied */
bd81e77b
NC
11395 if (proto_perl->Ipsig_pend) {
11396 Newxz(PL_psig_pend, SIG_SIZE, int);
11397 }
11398 else {
11399 PL_psig_pend = (int*)NULL;
11400 }
05ec9bb3 11401
 /* signal handler/name SVs are duplicated for indices 1..SIG_SIZE-1;
  * slot 0 stays zero from Newxz */
bd81e77b
NC
11402 if (proto_perl->Ipsig_ptr) {
11403 Newxz(PL_psig_ptr, SIG_SIZE, SV*);
11404 Newxz(PL_psig_name, SIG_SIZE, SV*);
11405 for (i = 1; i < SIG_SIZE; i++) {
11406 PL_psig_ptr[i] = sv_dup_inc(proto_perl->Ipsig_ptr[i], param);
11407 PL_psig_name[i] = sv_dup_inc(proto_perl->Ipsig_name[i], param);
11408 }
11409 }
11410 else {
11411 PL_psig_ptr = (SV**)NULL;
11412 PL_psig_name = (SV**)NULL;
11413 }
05ec9bb3 11414
bd81e77b 11415 /* thrdvar.h stuff */
1d7c1841 11416
bd81e77b
NC
11417 if (flags & CLONEf_COPY_STACKS) {
11418 /* next allocation will be PL_tmps_stack[PL_tmps_ix+1] */
11419 PL_tmps_ix = proto_perl->Ttmps_ix;
11420 PL_tmps_max = proto_perl->Ttmps_max;
11421 PL_tmps_floor = proto_perl->Ttmps_floor;
11422 Newxz(PL_tmps_stack, PL_tmps_max, SV*);
11423 i = 0;
11424 while (i <= PL_tmps_ix) {
11425 PL_tmps_stack[i] = sv_dup_inc(proto_perl->Ttmps_stack[i], param);
11426 ++i;
11427 }
d2d73c3e 11428
bd81e77b
NC
11429 /* next PUSHMARK() sets *(PL_markstack_ptr+1) */
11430 i = proto_perl->Tmarkstack_max - proto_perl->Tmarkstack;
11431 Newxz(PL_markstack, i, I32);
11432 PL_markstack_max = PL_markstack + (proto_perl->Tmarkstack_max
11433 - proto_perl->Tmarkstack);
11434 PL_markstack_ptr = PL_markstack + (proto_perl->Tmarkstack_ptr
11435 - proto_perl->Tmarkstack);
11436 Copy(proto_perl->Tmarkstack, PL_markstack,
11437 PL_markstack_ptr - PL_markstack + 1, I32);
d2d73c3e 11438
bd81e77b
NC
11439 /* next push_scope()/ENTER sets PL_scopestack[PL_scopestack_ix]
11440 * NOTE: unlike the others! */
11441 PL_scopestack_ix = proto_perl->Tscopestack_ix;
11442 PL_scopestack_max = proto_perl->Tscopestack_max;
11443 Newxz(PL_scopestack, PL_scopestack_max, I32);
11444 Copy(proto_perl->Tscopestack, PL_scopestack, PL_scopestack_ix, I32);
d419787a 11445
bd81e77b
NC
11446 /* NOTE: si_dup() looks at PL_markstack */
11447 PL_curstackinfo = si_dup(proto_perl->Tcurstackinfo, param);
d2d73c3e 11448
bd81e77b
NC
11449 /* PL_curstack = PL_curstackinfo->si_stack; */
11450 PL_curstack = av_dup(proto_perl->Tcurstack, param);
11451 PL_mainstack = av_dup(proto_perl->Tmainstack, param);
1d7c1841 11452
bd81e77b
NC
11453 /* next PUSHs() etc. set *(PL_stack_sp+1) */
11454 PL_stack_base = AvARRAY(PL_curstack);
11455 PL_stack_sp = PL_stack_base + (proto_perl->Tstack_sp
11456 - proto_perl->Tstack_base);
11457 PL_stack_max = PL_stack_base + AvMAX(PL_curstack);
1d7c1841 11458
bd81e77b
NC
11459 /* next SSPUSHFOO() sets PL_savestack[PL_savestack_ix]
11460 * NOTE: unlike the others! */
11461 PL_savestack_ix = proto_perl->Tsavestack_ix;
11462 PL_savestack_max = proto_perl->Tsavestack_max;
11463 /*Newxz(PL_savestack, PL_savestack_max, ANY);*/
11464 PL_savestack = ss_dup(proto_perl, param);
11465 }
11466 else {
11467 init_stacks();
11468 ENTER; /* perl_destruct() wants to LEAVE; */
34394ecd
DM
11469
11470 /* although we're not duplicating the tmps stack, we should still
11471 * add entries for any SVs on the tmps stack that got cloned by a
11472 * non-refcount means (eg a temp in @_); otherwise they will be
11473 * orphaned
11474 */
11475 for (i = 0; i<= proto_perl->Ttmps_ix; i++) {
6136c704 11476 SV * const nsv = (SV*)ptr_table_fetch(PL_ptr_table,
34394ecd
DM
11477 proto_perl->Ttmps_stack[i]);
11478 if (nsv && !SvREFCNT(nsv)) {
11479 EXTEND_MORTAL(1);
b37c2d43 11480 PL_tmps_stack[++PL_tmps_ix] = SvREFCNT_inc_simple(nsv);
34394ecd
DM
11481 }
11482 }
bd81e77b 11483 }
1d7c1841 11484
bd81e77b
NC
11485 PL_start_env = proto_perl->Tstart_env; /* XXXXXX */
11486 PL_top_env = &PL_start_env;
1d7c1841 11487
bd81e77b 11488 PL_op = proto_perl->Top;
4a4c6fe3 11489
a0714e2c 11490 PL_Sv = NULL;
bd81e77b
NC
11491 PL_Xpv = (XPV*)NULL;
11492 PL_na = proto_perl->Tna;
1fcf4c12 11493
bd81e77b
NC
11494 PL_statbuf = proto_perl->Tstatbuf;
11495 PL_statcache = proto_perl->Tstatcache;
11496 PL_statgv = gv_dup(proto_perl->Tstatgv, param);
11497 PL_statname = sv_dup_inc(proto_perl->Tstatname, param);
11498#ifdef HAS_TIMES
11499 PL_timesbuf = proto_perl->Ttimesbuf;
11500#endif
1d7c1841 11501
bd81e77b
NC
11502 PL_tainted = proto_perl->Ttainted;
11503 PL_curpm = proto_perl->Tcurpm; /* XXX No PMOP ref count */
11504 PL_rs = sv_dup_inc(proto_perl->Trs, param);
11505 PL_last_in_gv = gv_dup(proto_perl->Tlast_in_gv, param);
11506 PL_ofs_sv = sv_dup_inc(proto_perl->Tofs_sv, param);
11507 PL_defoutgv = gv_dup_inc(proto_perl->Tdefoutgv, param);
11508 PL_chopset = proto_perl->Tchopset; /* XXX never deallocated */
11509 PL_toptarget = sv_dup_inc(proto_perl->Ttoptarget, param);
11510 PL_bodytarget = sv_dup_inc(proto_perl->Tbodytarget, param);
11511 PL_formtarget = sv_dup(proto_perl->Tformtarget, param);
1d7c1841 11512
bd81e77b
NC
11513 PL_restartop = proto_perl->Trestartop;
11514 PL_in_eval = proto_perl->Tin_eval;
11515 PL_delaymagic = proto_perl->Tdelaymagic;
11516 PL_dirty = proto_perl->Tdirty;
11517 PL_localizing = proto_perl->Tlocalizing;
1d7c1841 11518
bd81e77b 11519 PL_errors = sv_dup_inc(proto_perl->Terrors, param);
4608196e 11520 PL_hv_fetch_ent_mh = NULL;
bd81e77b 11521 PL_modcount = proto_perl->Tmodcount;
5f66b61c 11522 PL_lastgotoprobe = NULL;
bd81e77b 11523 PL_dumpindent = proto_perl->Tdumpindent;
1d7c1841 11524
bd81e77b
NC
11525 PL_sortcop = (OP*)any_dup(proto_perl->Tsortcop, proto_perl);
11526 PL_sortstash = hv_dup(proto_perl->Tsortstash, param);
11527 PL_firstgv = gv_dup(proto_perl->Tfirstgv, param);
11528 PL_secondgv = gv_dup(proto_perl->Tsecondgv, param);
bd61b366 11529 PL_efloatbuf = NULL; /* reinits on demand */
bd81e77b 11530 PL_efloatsize = 0; /* reinits on demand */
d2d73c3e 11531
bd81e77b 11532 /* regex stuff */
1d7c1841 11533
bd81e77b
NC
11534 PL_screamfirst = NULL;
11535 PL_screamnext = NULL;
11536 PL_maxscream = -1; /* reinits on demand */
a0714e2c 11537 PL_lastscream = NULL;
1d7c1841 11538
bd81e77b 11539 PL_watchaddr = NULL;
bd61b366 11540 PL_watchok = NULL;
1d7c1841 11541
bd81e77b 11542 PL_regdummy = proto_perl->Tregdummy;
bd81e77b
NC
11543 PL_colorset = 0; /* reinits PL_colors[] */
11544 /*PL_colors[6] = {0,0,0,0,0,0};*/
1d7c1841 11545
bd81e77b
NC
11546 /* RE engine - function pointers */
11547 PL_regcompp = proto_perl->Tregcompp;
11548 PL_regexecp = proto_perl->Tregexecp;
11549 PL_regint_start = proto_perl->Tregint_start;
11550 PL_regint_string = proto_perl->Tregint_string;
11551 PL_regfree = proto_perl->Tregfree;
46ab3289 11552 Zero(&PL_reg_state, 1, struct re_save_state);
bd81e77b 11553 PL_reginterp_cnt = 0;
5d9a96ca 11554 PL_regmatch_slab = NULL;
1d7c1841 11555
bd81e77b
NC
11556 /* Pluggable optimizer */
11557 PL_peepp = proto_perl->Tpeepp;
1d7c1841 11558
bd81e77b 11559 PL_stashcache = newHV();
1d7c1841 11560
 /* the pointer relocation table is dropped unless the caller asked to
  * keep it */
bd81e77b
NC
11561 if (!(flags & CLONEf_KEEP_PTR_TABLE)) {
11562 ptr_table_free(PL_ptr_table);
11563 PL_ptr_table = NULL;
11564 }
1d7c1841 11565
bd81e77b
NC
11566 /* Call the ->CLONE method, if it exists, for each of the stashes
11567 identified by sv_dup() above.
11568 */
11569 while(av_len(param->stashes) != -1) {
11570 HV* const stash = (HV*) av_shift(param->stashes);
11571 GV* const cloner = gv_fetchmethod_autoload(stash, "CLONE", 0);
11572 if (cloner && GvCV(cloner)) {
 /* invoke CLONE with the stash name as its only argument,
  * discarding any return value */
11573 dSP;
11574 ENTER;
11575 SAVETMPS;
11576 PUSHMARK(SP);
11577 XPUSHs(sv_2mortal(newSVhek(HvNAME_HEK(stash))));
11578 PUTBACK;
11579 call_sv((SV*)GvCV(cloner), G_DISCARD);
11580 FREETMPS;
11581 LEAVE;
11582 }
1d7c1841 11583 }
1d7c1841 11584
bd81e77b 11585 SvREFCNT_dec(param->stashes);
1d7c1841 11586
bd81e77b
NC
11587 /* orphaned? eg threads->new inside BEGIN or use */
11588 if (PL_compcv && ! SvREFCNT(PL_compcv)) {
b37c2d43 11589 SvREFCNT_inc_simple_void(PL_compcv);
bd81e77b
NC
11590 SAVEFREESV(PL_compcv);
11591 }
dd2155a4 11592
bd81e77b
NC
11593 return my_perl;
11594}
1d7c1841 11595
bd81e77b 11596#endif /* USE_ITHREADS */
1d7c1841 11597
bd81e77b
NC
11598/*
11599=head1 Unicode Support
1d7c1841 11600
bd81e77b 11601=for apidoc sv_recode_to_utf8
1d7c1841 11602
bd81e77b
NC
11603The encoding is assumed to be an Encode object, on entry the PV
11604of the sv is assumed to be octets in that encoding, and the sv
11605will be converted into Unicode (and UTF-8).
1d7c1841 11606
bd81e77b
NC
11607If the sv already is UTF-8 (or if it is not POK), or if the encoding
11608is not a reference, nothing is done to the sv. If the encoding is not
11609an C<Encode::XS> Encoding object, bad things will happen.
11610(See F<lib/encoding.pm> and L<Encode>).
1d7c1841 11611
bd81e77b 11612The PV of the sv is returned.
1d7c1841 11613
bd81e77b 11614=cut */
1d7c1841 11615
bd81e77b
NC
/*
 * Perl_sv_recode_to_utf8() -- convert sv's PV to UTF-8 by calling the
 * "decode" method with (encoding, sv) on the Perl stack.
 *
 * The conversion is attempted only when sv is POK, is not already flagged
 * UTF-8, IN_BYTES is false, and encoding is a reference.  In that case the
 * result of decode is copied back into sv (unless it already is sv's own
 * buffer), SvUTF8 is turned on, and SvPVX(sv) is returned.
 *
 * Otherwise sv is left untouched and the return value is SvPVX(sv) if
 * SvPOKp(sv) is true, else NULL.
 */
11616char *
11617Perl_sv_recode_to_utf8(pTHX_ SV *sv, SV *encoding)
11618{
11619 dVAR;
11620 if (SvPOK(sv) && !SvUTF8(sv) && !IN_BYTES && SvROK(encoding)) {
11621 SV *uni;
11622 STRLEN len;
11623 const char *s;
11624 dSP;
11625 ENTER;
11626 SAVETMPS;
11627 save_re_context();
11628 PUSHMARK(sp);
11629 EXTEND(SP, 3);
 /* encoding is pushed first, then the SV to decode */
11630 XPUSHs(encoding);
11631 XPUSHs(sv);
11632/*
11633 NI-S 2002/07/09
11634 Passing sv_yes is wrong - it needs to be or'ed set of constants
11635 for Encode::XS, while UTf-8 decode (currently) assumes a true value means
11636 remove converted chars from source.
1d7c1841 11637
bd81e77b 11638 Both will default the value - let them.
1d7c1841 11639
bd81e77b
NC
11640 XPUSHs(&PL_sv_yes);
11641*/
11642 PUTBACK;
11643 call_method("decode", G_SCALAR);
11644 SPAGAIN;
 /* scalar context: take the single result off the stack */
11645 uni = POPs;
11646 PUTBACK;
11647 s = SvPV_const(uni, len);
 /* copy only if decode did not hand back sv's own buffer; len + 1
  * presumably carries the trailing NUL along -- TODO confirm */
11648 if (s != SvPVX_const(sv)) {
11649 SvGROW(sv, len + 1);
11650 Move(s, SvPVX(sv), len + 1, char);
11651 SvCUR_set(sv, len);
11652 }
11653 FREETMPS;
11654 LEAVE;
11655 SvUTF8_on(sv);
11656 return SvPVX(sv);
389edf32 11657 }
bd81e77b
NC
 /* nothing converted: hand back the existing PV, if there is one */
11658 return SvPOKp(sv) ? SvPVX(sv) : NULL;
11659}
1d7c1841 11660
bd81e77b
NC
11661/*
11662=for apidoc sv_cat_decode
1d7c1841 11663
bd81e77b
NC
11664The encoding is assumed to be an Encode object, the PV of the ssv is
11665assumed to be octets in that encoding and decoding the input starts
11666from the position which (PV + *offset) pointed to. The dsv will be
11667concatenated the decoded UTF-8 string from ssv. Decoding will terminate
11668when the string tstr appears in decoding output or the input ends on
11669the PV of the ssv. The value which the offset points will be modified
11670to the last input position on the ssv.
1d7c1841 11671
bd81e77b 11672Returns TRUE if the terminator was found, else returns FALSE.
1d7c1841 11673
bd81e77b
NC
11674=cut */
11675
11676bool
11677Perl_sv_cat_decode(pTHX_ SV *dsv, SV *encoding,
11678 SV *ssv, int *offset, char *tstr, int tlen)
11679{
11680 dVAR;
11681 bool ret = FALSE;
11682 if (SvPOK(ssv) && SvPOK(dsv) && SvROK(encoding) && offset) {
11683 SV *offsv;
11684 dSP;
11685 ENTER;
11686 SAVETMPS;
11687 save_re_context();
11688 PUSHMARK(sp);
11689 EXTEND(SP, 6);
11690 XPUSHs(encoding);
11691 XPUSHs(dsv);
11692 XPUSHs(ssv);
11693 XPUSHs(offsv = sv_2mortal(newSViv(*offset)));
11694 XPUSHs(sv_2mortal(newSVpvn(tstr, tlen)));
11695 PUTBACK;
11696 call_method("cat_decode", G_SCALAR);
11697 SPAGAIN;
11698 ret = SvTRUE(TOPs);
11699 *offset = SvIV(offsv);
11700 PUTBACK;
11701 FREETMPS;
11702 LEAVE;
389edf32 11703 }
bd81e77b
NC
11704 else
11705 Perl_croak(aTHX_ "Invalid argument to sv_cat_decode");
11706 return ret;
1d7c1841 11707
bd81e77b 11708}
1d7c1841 11709
bd81e77b
NC
11710/* ---------------------------------------------------------------------
11711 *
11712 * support functions for report_uninit()
11713 */
1d7c1841 11714
bd81e77b
NC
/* the maximum size of array or hash where we will scan looking
 * for the undefined element that triggered the warning */
1d7c1841 11717
bd81e77b 11718#define FUV_MAX_SEARCH_SIZE 1000
1d7c1841 11719
bd81e77b
NC
11720/* Look for an entry in the hash whose value has the same SV as val;
11721 * If so, return a mortal copy of the key. */
1d7c1841 11722
bd81e77b
NC
11723STATIC SV*
11724S_find_hash_subscript(pTHX_ HV *hv, SV* val)
11725{
11726 dVAR;
11727 register HE **array;
11728 I32 i;
6c3182a5 11729
bd81e77b
NC
11730 if (!hv || SvMAGICAL(hv) || !HvARRAY(hv) ||
11731 (HvTOTALKEYS(hv) > FUV_MAX_SEARCH_SIZE))
a0714e2c 11732 return NULL;
6c3182a5 11733
bd81e77b 11734 array = HvARRAY(hv);
6c3182a5 11735
bd81e77b
NC
11736 for (i=HvMAX(hv); i>0; i--) {
11737 register HE *entry;
11738 for (entry = array[i]; entry; entry = HeNEXT(entry)) {
11739 if (HeVAL(entry) != val)
11740 continue;
11741 if ( HeVAL(entry) == &PL_sv_undef ||
11742 HeVAL(entry) == &PL_sv_placeholder)
11743 continue;
11744 if (!HeKEY(entry))
a0714e2c 11745 return NULL;
bd81e77b
NC
11746 if (HeKLEN(entry) == HEf_SVKEY)
11747 return sv_mortalcopy(HeKEY_sv(entry));
11748 return sv_2mortal(newSVpvn(HeKEY(entry), HeKLEN(entry)));
11749 }
11750 }
a0714e2c 11751 return NULL;
bd81e77b 11752}
6c3182a5 11753
bd81e77b
NC
11754/* Look for an entry in the array whose value has the same SV as val;
11755 * If so, return the index, otherwise return -1. */
6c3182a5 11756
bd81e77b
NC
11757STATIC I32
11758S_find_array_subscript(pTHX_ AV *av, SV* val)
11759{
97aff369 11760 dVAR;
bd81e77b
NC
11761 if (!av || SvMAGICAL(av) || !AvARRAY(av) ||
11762 (AvFILLp(av) > FUV_MAX_SEARCH_SIZE))
11763 return -1;
57c6e6d2 11764
4a021917
AL
11765 if (val != &PL_sv_undef) {
11766 SV ** const svp = AvARRAY(av);
11767 I32 i;
11768
11769 for (i=AvFILLp(av); i>=0; i--)
11770 if (svp[i] == val)
11771 return i;
bd81e77b
NC
11772 }
11773 return -1;
11774}
15a5279a 11775
bd81e77b
NC
11776/* S_varname(): return the name of a variable, optionally with a subscript.
11777 * If gv is non-zero, use the name of that global, along with gvtype (one
11778 * of "$", "@", "%"); otherwise use the name of the lexical at pad offset
11779 * targ. Depending on the value of the subscript_type flag, return:
11780 */
bce260cd 11781
bd81e77b
NC
11782#define FUV_SUBSCRIPT_NONE 1 /* "@foo" */
11783#define FUV_SUBSCRIPT_ARRAY 2 /* "$foo[aindex]" */
11784#define FUV_SUBSCRIPT_HASH 3 /* "$foo{keyname}" */
11785#define FUV_SUBSCRIPT_WITHIN 4 /* "within @foo" */
bce260cd 11786
bd81e77b
NC
11787STATIC SV*
11788S_varname(pTHX_ GV *gv, const char gvtype, PADOFFSET targ,
11789 SV* keyname, I32 aindex, int subscript_type)
11790{
1d7c1841 11791
bd81e77b
NC
11792 SV * const name = sv_newmortal();
11793 if (gv) {
11794 char buffer[2];
11795 buffer[0] = gvtype;
11796 buffer[1] = 0;
1d7c1841 11797
bd81e77b 11798 /* as gv_fullname4(), but add literal '^' for $^FOO names */
66fe0623 11799
bd81e77b 11800 gv_fullname4(name, gv, buffer, 0);
1d7c1841 11801
bd81e77b
NC
11802 if ((unsigned int)SvPVX(name)[1] <= 26) {
11803 buffer[0] = '^';
11804 buffer[1] = SvPVX(name)[1] + 'A' - 1;
1d7c1841 11805
bd81e77b
NC
11806 /* Swap the 1 unprintable control character for the 2 byte pretty
11807 version - ie substr($name, 1, 1) = $buffer; */
11808 sv_insert(name, 1, 1, buffer, 2);
1d7c1841 11809 }
bd81e77b
NC
11810 }
11811 else {
11812 U32 unused;
11813 CV * const cv = find_runcv(&unused);
11814 SV *sv;
11815 AV *av;
1d7c1841 11816
bd81e77b 11817 if (!cv || !CvPADLIST(cv))
a0714e2c 11818 return NULL;
bd81e77b
NC
11819 av = (AV*)(*av_fetch(CvPADLIST(cv), 0, FALSE));
11820 sv = *av_fetch(av, targ, FALSE);
11821 /* SvLEN in a pad name is not to be trusted */
11822 sv_setpv(name, SvPV_nolen_const(sv));
11823 }
1d7c1841 11824
bd81e77b 11825 if (subscript_type == FUV_SUBSCRIPT_HASH) {
561b68a9 11826 SV * const sv = newSV(0);
bd81e77b
NC
11827 *SvPVX(name) = '$';
11828 Perl_sv_catpvf(aTHX_ name, "{%s}",
11829 pv_display(sv,SvPVX_const(keyname), SvCUR(keyname), 0, 32));
11830 SvREFCNT_dec(sv);
11831 }
11832 else if (subscript_type == FUV_SUBSCRIPT_ARRAY) {
11833 *SvPVX(name) = '$';
11834 Perl_sv_catpvf(aTHX_ name, "[%"IVdf"]", (IV)aindex);
11835 }
11836 else if (subscript_type == FUV_SUBSCRIPT_WITHIN)
89529cee 11837 Perl_sv_insert(aTHX_ name, 0, 0, STR_WITH_LEN("within "));
1d7c1841 11838
bd81e77b
NC
11839 return name;
11840}
1d7c1841 11841
1d7c1841 11842
bd81e77b
NC
11843/*
11844=for apidoc find_uninit_var
1d7c1841 11845
bd81e77b
NC
11846Find the name of the undefined variable (if any) that caused the operator o
11847to issue a "Use of uninitialized value" warning.
11848If match is true, only return a name if it's value matches uninit_sv.
11849So roughly speaking, if a unary operator (such as OP_COS) generates a
11850warning, then following the direct child of the op may yield an
11851OP_PADSV or OP_GV that gives the name of the undefined variable. On the
11852other hand, with OP_ADD there are two branches to follow, so we only print
11853the variable name if we get an exact match.
1d7c1841 11854
bd81e77b 11855The name is returned as a mortal SV.
1d7c1841 11856
bd81e77b
NC
11857Assumes that PL_op is the op that originally triggered the error, and that
11858PL_comppad/PL_curpad points to the currently executing pad.
1d7c1841 11859
bd81e77b
NC
11860=cut
11861*/
1d7c1841 11862
bd81e77b
NC
11863STATIC SV *
11864S_find_uninit_var(pTHX_ OP* obase, SV* uninit_sv, bool match)
11865{
11866 dVAR;
11867 SV *sv;
11868 AV *av;
11869 GV *gv;
11870 OP *o, *o2, *kid;
1d7c1841 11871
bd81e77b
NC
11872 if (!obase || (match && (!uninit_sv || uninit_sv == &PL_sv_undef ||
11873 uninit_sv == &PL_sv_placeholder)))
a0714e2c 11874 return NULL;
1d7c1841 11875
bd81e77b 11876 switch (obase->op_type) {
1d7c1841 11877
bd81e77b
NC
11878 case OP_RV2AV:
11879 case OP_RV2HV:
11880 case OP_PADAV:
11881 case OP_PADHV:
11882 {
11883 const bool pad = (obase->op_type == OP_PADAV || obase->op_type == OP_PADHV);
11884 const bool hash = (obase->op_type == OP_PADHV || obase->op_type == OP_RV2HV);
11885 I32 index = 0;
a0714e2c 11886 SV *keysv = NULL;
bd81e77b 11887 int subscript_type = FUV_SUBSCRIPT_WITHIN;
1d7c1841 11888
bd81e77b
NC
11889 if (pad) { /* @lex, %lex */
11890 sv = PAD_SVl(obase->op_targ);
a0714e2c 11891 gv = NULL;
bd81e77b
NC
11892 }
11893 else {
11894 if (cUNOPx(obase)->op_first->op_type == OP_GV) {
11895 /* @global, %global */
11896 gv = cGVOPx_gv(cUNOPx(obase)->op_first);
11897 if (!gv)
11898 break;
11899 sv = hash ? (SV*)GvHV(gv): (SV*)GvAV(gv);
11900 }
11901 else /* @{expr}, %{expr} */
11902 return find_uninit_var(cUNOPx(obase)->op_first,
11903 uninit_sv, match);
11904 }
1d7c1841 11905
bd81e77b
NC
11906 /* attempt to find a match within the aggregate */
11907 if (hash) {
d4c19fe8 11908 keysv = find_hash_subscript((HV*)sv, uninit_sv);
bd81e77b
NC
11909 if (keysv)
11910 subscript_type = FUV_SUBSCRIPT_HASH;
11911 }
11912 else {
e15d5972 11913 index = find_array_subscript((AV*)sv, uninit_sv);
bd81e77b
NC
11914 if (index >= 0)
11915 subscript_type = FUV_SUBSCRIPT_ARRAY;
11916 }
1d7c1841 11917
bd81e77b
NC
11918 if (match && subscript_type == FUV_SUBSCRIPT_WITHIN)
11919 break;
1d7c1841 11920
bd81e77b
NC
11921 return varname(gv, hash ? '%' : '@', obase->op_targ,
11922 keysv, index, subscript_type);
11923 }
1d7c1841 11924
bd81e77b
NC
11925 case OP_PADSV:
11926 if (match && PAD_SVl(obase->op_targ) != uninit_sv)
11927 break;
a0714e2c
SS
11928 return varname(NULL, '$', obase->op_targ,
11929 NULL, 0, FUV_SUBSCRIPT_NONE);
1d7c1841 11930
bd81e77b
NC
11931 case OP_GVSV:
11932 gv = cGVOPx_gv(obase);
11933 if (!gv || (match && GvSV(gv) != uninit_sv))
11934 break;
a0714e2c 11935 return varname(gv, '$', 0, NULL, 0, FUV_SUBSCRIPT_NONE);
1d7c1841 11936
bd81e77b
NC
11937 case OP_AELEMFAST:
11938 if (obase->op_flags & OPf_SPECIAL) { /* lexical array */
11939 if (match) {
11940 SV **svp;
11941 av = (AV*)PAD_SV(obase->op_targ);
11942 if (!av || SvRMAGICAL(av))
11943 break;
11944 svp = av_fetch(av, (I32)obase->op_private, FALSE);
11945 if (!svp || *svp != uninit_sv)
11946 break;
11947 }
a0714e2c
SS
11948 return varname(NULL, '$', obase->op_targ,
11949 NULL, (I32)obase->op_private, FUV_SUBSCRIPT_ARRAY);
bd81e77b
NC
11950 }
11951 else {
11952 gv = cGVOPx_gv(obase);
11953 if (!gv)
11954 break;
11955 if (match) {
11956 SV **svp;
11957 av = GvAV(gv);
11958 if (!av || SvRMAGICAL(av))
11959 break;
11960 svp = av_fetch(av, (I32)obase->op_private, FALSE);
11961 if (!svp || *svp != uninit_sv)
11962 break;
11963 }
11964 return varname(gv, '$', 0,
a0714e2c 11965 NULL, (I32)obase->op_private, FUV_SUBSCRIPT_ARRAY);
bd81e77b
NC
11966 }
11967 break;
1d7c1841 11968
bd81e77b
NC
11969 case OP_EXISTS:
11970 o = cUNOPx(obase)->op_first;
11971 if (!o || o->op_type != OP_NULL ||
11972 ! (o->op_targ == OP_AELEM || o->op_targ == OP_HELEM))
11973 break;
11974 return find_uninit_var(cBINOPo->op_last, uninit_sv, match);
a2efc822 11975
bd81e77b
NC
11976 case OP_AELEM:
11977 case OP_HELEM:
11978 if (PL_op == obase)
11979 /* $a[uninit_expr] or $h{uninit_expr} */
11980 return find_uninit_var(cBINOPx(obase)->op_last, uninit_sv, match);
081fc587 11981
a0714e2c 11982 gv = NULL;
bd81e77b
NC
11983 o = cBINOPx(obase)->op_first;
11984 kid = cBINOPx(obase)->op_last;
8cf8f3d1 11985
bd81e77b 11986 /* get the av or hv, and optionally the gv */
a0714e2c 11987 sv = NULL;
bd81e77b
NC
11988 if (o->op_type == OP_PADAV || o->op_type == OP_PADHV) {
11989 sv = PAD_SV(o->op_targ);
11990 }
11991 else if ((o->op_type == OP_RV2AV || o->op_type == OP_RV2HV)
11992 && cUNOPo->op_first->op_type == OP_GV)
11993 {
11994 gv = cGVOPx_gv(cUNOPo->op_first);
11995 if (!gv)
11996 break;
11997 sv = o->op_type == OP_RV2HV ? (SV*)GvHV(gv) : (SV*)GvAV(gv);
11998 }
11999 if (!sv)
12000 break;
12001
12002 if (kid && kid->op_type == OP_CONST && SvOK(cSVOPx_sv(kid))) {
12003 /* index is constant */
12004 if (match) {
12005 if (SvMAGICAL(sv))
12006 break;
12007 if (obase->op_type == OP_HELEM) {
12008 HE* he = hv_fetch_ent((HV*)sv, cSVOPx_sv(kid), 0, 0);
12009 if (!he || HeVAL(he) != uninit_sv)
12010 break;
12011 }
12012 else {
00b6aa41 12013 SV * const * const svp = av_fetch((AV*)sv, SvIV(cSVOPx_sv(kid)), FALSE);
bd81e77b
NC
12014 if (!svp || *svp != uninit_sv)
12015 break;
12016 }
12017 }
12018 if (obase->op_type == OP_HELEM)
12019 return varname(gv, '%', o->op_targ,
12020 cSVOPx_sv(kid), 0, FUV_SUBSCRIPT_HASH);
12021 else
a0714e2c 12022 return varname(gv, '@', o->op_targ, NULL,
bd81e77b 12023 SvIV(cSVOPx_sv(kid)), FUV_SUBSCRIPT_ARRAY);
bd81e77b
NC
12024 }
12025 else {
12026 /* index is an expression;
12027 * attempt to find a match within the aggregate */
12028 if (obase->op_type == OP_HELEM) {
d4c19fe8 12029 SV * const keysv = find_hash_subscript((HV*)sv, uninit_sv);
bd81e77b
NC
12030 if (keysv)
12031 return varname(gv, '%', o->op_targ,
12032 keysv, 0, FUV_SUBSCRIPT_HASH);
12033 }
12034 else {
d4c19fe8 12035 const I32 index = find_array_subscript((AV*)sv, uninit_sv);
bd81e77b
NC
12036 if (index >= 0)
12037 return varname(gv, '@', o->op_targ,
a0714e2c 12038 NULL, index, FUV_SUBSCRIPT_ARRAY);
bd81e77b
NC
12039 }
12040 if (match)
12041 break;
12042 return varname(gv,
12043 (o->op_type == OP_PADAV || o->op_type == OP_RV2AV)
12044 ? '@' : '%',
a0714e2c 12045 o->op_targ, NULL, 0, FUV_SUBSCRIPT_WITHIN);
f284b03f 12046 }
bd81e77b 12047 break;
dc507217 12048
bd81e77b
NC
12049 case OP_AASSIGN:
12050 /* only examine RHS */
12051 return find_uninit_var(cBINOPx(obase)->op_first, uninit_sv, match);
6d26897e 12052
bd81e77b
NC
12053 case OP_OPEN:
12054 o = cUNOPx(obase)->op_first;
12055 if (o->op_type == OP_PUSHMARK)
12056 o = o->op_sibling;
1d7c1841 12057
bd81e77b
NC
12058 if (!o->op_sibling) {
12059 /* one-arg version of open is highly magical */
a0ae6670 12060
bd81e77b
NC
12061 if (o->op_type == OP_GV) { /* open FOO; */
12062 gv = cGVOPx_gv(o);
12063 if (match && GvSV(gv) != uninit_sv)
12064 break;
12065 return varname(gv, '$', 0,
a0714e2c 12066 NULL, 0, FUV_SUBSCRIPT_NONE);
bd81e77b
NC
12067 }
12068 /* other possibilities not handled are:
12069 * open $x; or open my $x; should return '${*$x}'
12070 * open expr; should return '$'.expr ideally
12071 */
12072 break;
12073 }
12074 goto do_op;
ccfc67b7 12075
bd81e77b
NC
12076 /* ops where $_ may be an implicit arg */
12077 case OP_TRANS:
12078 case OP_SUBST:
12079 case OP_MATCH:
12080 if ( !(obase->op_flags & OPf_STACKED)) {
12081 if (uninit_sv == ((obase->op_private & OPpTARGET_MY)
12082 ? PAD_SVl(obase->op_targ)
12083 : DEFSV))
12084 {
12085 sv = sv_newmortal();
12086 sv_setpvn(sv, "$_", 2);
12087 return sv;
12088 }
12089 }
12090 goto do_op;
9f4817db 12091
bd81e77b
NC
12092 case OP_PRTF:
12093 case OP_PRINT:
12094 /* skip filehandle as it can't produce 'undef' warning */
12095 o = cUNOPx(obase)->op_first;
12096 if ((obase->op_flags & OPf_STACKED) && o->op_type == OP_PUSHMARK)
12097 o = o->op_sibling->op_sibling;
12098 goto do_op2;
9f4817db 12099
9f4817db 12100
bd81e77b
NC
12101 case OP_RV2SV:
12102 case OP_CUSTOM:
12103 case OP_ENTERSUB:
12104 match = 1; /* XS or custom code could trigger random warnings */
12105 goto do_op;
9f4817db 12106
bd81e77b
NC
12107 case OP_SCHOMP:
12108 case OP_CHOMP:
12109 if (SvROK(PL_rs) && uninit_sv == SvRV(PL_rs))
396482e1 12110 return sv_2mortal(newSVpvs("${$/}"));
5f66b61c 12111 /*FALLTHROUGH*/
5d170f3a 12112
bd81e77b
NC
12113 default:
12114 do_op:
12115 if (!(obase->op_flags & OPf_KIDS))
12116 break;
12117 o = cUNOPx(obase)->op_first;
12118
12119 do_op2:
12120 if (!o)
12121 break;
f9893866 12122
bd81e77b
NC
12123 /* if all except one arg are constant, or have no side-effects,
12124 * or are optimized away, then it's unambiguous */
5f66b61c 12125 o2 = NULL;
bd81e77b 12126 for (kid=o; kid; kid = kid->op_sibling) {
e15d5972
AL
12127 if (kid) {
12128 const OPCODE type = kid->op_type;
12129 if ( (type == OP_CONST && SvOK(cSVOPx_sv(kid)))
12130 || (type == OP_NULL && ! (kid->op_flags & OPf_KIDS))
12131 || (type == OP_PUSHMARK)
bd81e77b 12132 )
bd81e77b 12133 continue;
e15d5972 12134 }
bd81e77b 12135 if (o2) { /* more than one found */
5f66b61c 12136 o2 = NULL;
bd81e77b
NC
12137 break;
12138 }
12139 o2 = kid;
12140 }
12141 if (o2)
12142 return find_uninit_var(o2, uninit_sv, match);
7a5fa8a2 12143
bd81e77b
NC
12144 /* scan all args */
12145 while (o) {
12146 sv = find_uninit_var(o, uninit_sv, 1);
12147 if (sv)
12148 return sv;
12149 o = o->op_sibling;
d0063567 12150 }
bd81e77b 12151 break;
f9893866 12152 }
a0714e2c 12153 return NULL;
9f4817db
JH
12154}
12155
220e2d4e 12156
bd81e77b
NC
12157/*
12158=for apidoc report_uninit
68795e93 12159
bd81e77b 12160Print appropriate "Use of uninitialized variable" warning
220e2d4e 12161
bd81e77b
NC
12162=cut
12163*/
220e2d4e 12164
bd81e77b
NC
12165void
12166Perl_report_uninit(pTHX_ SV* uninit_sv)
220e2d4e 12167{
97aff369 12168 dVAR;
bd81e77b 12169 if (PL_op) {
a0714e2c 12170 SV* varname = NULL;
bd81e77b
NC
12171 if (uninit_sv) {
12172 varname = find_uninit_var(PL_op, uninit_sv,0);
12173 if (varname)
12174 sv_insert(varname, 0, 0, " ", 1);
12175 }
12176 Perl_warner(aTHX_ packWARN(WARN_UNINITIALIZED), PL_warn_uninit,
12177 varname ? SvPV_nolen_const(varname) : "",
12178 " in ", OP_DESC(PL_op));
220e2d4e 12179 }
a73e8557 12180 else
bd81e77b
NC
12181 Perl_warner(aTHX_ packWARN(WARN_UNINITIALIZED), PL_warn_uninit,
12182 "", "", "");
220e2d4e 12183}
f9893866 12184
241d1a3b
NC
12185/*
12186 * Local variables:
12187 * c-indentation-style: bsd
12188 * c-basic-offset: 4
12189 * indent-tabs-mode: t
12190 * End:
12191 *
37442d52
RGS
12192 * ex: set ts=8 sts=4 sw=4 noet:
12193 */